doxygen-c/html/ideep_2operators_2concat__split__op_8cc_source.html

 #include <caffe2/ideep/ideep_utils.h>
 #include <caffe2/ideep/operators/operator_fallback_ideep.h>
 #include <caffe2/operators/concat_split_op.h>

 namespace caffe2 {

 class IDEEPConcatOp final : public IDEEPOperator {
  public:
   USE_IDEEP_DEF_ALIASES();
   USE_IDEEP_OPERATOR_FUNCTIONS();
   using FALLBACK_OP = IDEEPFallbackOp<ConcatOp<CPUContext>, SkipIndices<0>>;

   IDEEPConcatOp(const OperatorDef& operator_def, Workspace* ws)
       : IDEEPOperator(operator_def, ws),
         fallback_(operator_def, ws) {
     CAFFE_ENFORCE(
       !(OperatorBase::HasArgument("axis") && OperatorBase::HasArgument("order")),
         "You shouldn't specify both the dim to concat, and the order "
         "in the case of 4-D images.");
     if (OperatorBase::HasArgument("axis")) {
       axis_ = OperatorBase::GetSingleArgument<int>("axis", -1);
       add_axis_ = OperatorBase::GetSingleArgument<int>("add_axis", 0);
     } else {
       axis_ = 1;
       add_axis_ = 0;
     }
     CAFFE_ENFORCE_GE(axis_, 0);
   }
   ~IDEEPConcatOp() override {}

   bool RunOnDevice() override {
     bool fallback_to_cpu = false;
     vector<itensor> inputs_itensor;

     for (int i = 0; i < InputSize(); ++i) {
       if (OperatorBase::InputBlob(i).template IsType<itensor>()) {
         auto& tensor_ideep = Input(i);
         if (tensor_ideep.ndims() == 0 || tensor_ideep.get_nelems() == 0)
           continue;
         inputs_itensor.emplace_back(tensor_ideep);
       } else {
         CAFFE_ENFORCE(
             BlobIsTensorType(OperatorBase::InputBlob(i), CPU),
             "Expect cpu tensor if not itensor");
         auto& tensor_cpu = OperatorBase::Input<Tensor>(i, CPU);
         if (tensor_cpu.sizes().size() == 0 || tensor_cpu.numel() == 0)
           continue;
         fallback_to_cpu = true;
         break;
       }
     }

     if (!fallback_to_cpu) {
       auto* output = Output(OUTPUT);
       Tensor* axis_info = OutputTensor(AXIS_INFO,
         vector<int64_t>(1, InputSize()), at::dtype<int>().device(CPU));
       auto* axis_data = axis_info->template mutable_data<int>();
       auto axis_vdata =
         ideep::concat::compute(inputs_itensor, axis_, add_axis_, *output);
       for (int i = 0; i < axis_vdata.size(); i++) {
         axis_data[i] = axis_vdata[i];
       }
       return true;
     }

     return fallback_.Run(0);
   }

  private:
   int axis_;
   int add_axis_;
   FALLBACK_OP fallback_;

   INPUT_TAGS(INPUT0);
   OUTPUT_TAGS(OUTPUT, AXIS_INFO);
 };

 class IDEEPSplitOp final : public IDEEPOperator {
  public:
   USE_IDEEP_DEF_ALIASES();
   USE_IDEEP_OPERATOR_FUNCTIONS();

   IDEEPSplitOp(const OperatorDef& operator_def, Workspace* ws)
       : IDEEPOperator(operator_def, ws),
         axis_offset_(OperatorBase::GetRepeatedArgument<int>("split")) {
     CAFFE_ENFORCE(
       !(OperatorBase::HasArgument("axis") && OperatorBase::HasArgument("order")),
         "You shouldn't specify both the dim to split, and the order "
         "in the case of 4-D images.");
     if (OperatorBase::HasArgument("axis")) {
       axis_ = OperatorBase::GetSingleArgument<int>("axis", -1);
       // only exists for computing the gradient of a Concat with 'add_axis'
       add_axis_ = OperatorBase::GetSingleArgument<int>("add_axis", 0);
     } else {
       axis_ = 1;
       add_axis_ = 0;
     }
     CAFFE_ENFORCE_GE(axis_, 0);
   }
   ~IDEEPSplitOp() override {}

   bool RunOnDevice() override {
     const auto& input = Input(INPUT);
     CAFFE_ENFORCE_LT(axis_, input.ndims(), "Axis not in input ndim range.");
     const int input_channels = input.get_dim(axis_);
     vector<int> axis_vdata(OutputSize(), 0);
     if (InputSize() == 2) {
       // We obtain split from the input tensor.
       CAFFE_ENFORCE_EQ(
           axis_offset_.size(),
           0,
           "If you set split with an input blob, do not pass in "
           "split in the argument.");
       auto& axis_info = OperatorBase::Input<Tensor>(AXIS_INFO, CPU);
       CAFFE_ENFORCE_EQ(axis_info.numel(), OutputSize());
       auto* axis_data = axis_info.template data<int>();
       axis_vdata.assign(axis_data, axis_data + OutputSize());
     } else if (axis_offset_.size() == 0) {
       CAFFE_ENFORCE_EQ(
           input_channels % OutputSize(),
           0,
           "If you did not specify split explicitly, the number of "
           "input channels should be divisible by the output size.");
       axis_vdata.assign(OutputSize(), input_channels / OutputSize());
     } else {
       // We obtain split from the parameters.
       CAFFE_ENFORCE_EQ(
           axis_offset_.size(),
           OutputSize(),
           "The number of splits specified should be equal to the "
           "number of outputs.");
       axis_vdata = axis_offset_;
     }

     CAFFE_ENFORCE_EQ(
         add_axis_ ? OutputSize()
                   : std::accumulate(
                     axis_vdata.data(), axis_vdata.data() + OutputSize(), 0),
         input_channels,
         "Sum of split dimensions do not match: should be ",
         input_channels);

     auto iten_vector = ideep::spliter::compute(
         input, axis_vdata, axis_, add_axis_);
     CAFFE_ENFORCE_EQ(
         iten_vector.size(),
         OutputSize(),
         "Output size does not match: should be ",
         OutputSize());

     for (int i = 0; i < OutputSize(); i++) {
       auto* output = Output(i);
       *output = iten_vector[i];
     }

     return true;
   }

  private:
   int axis_;
   int add_axis_;
   vector<int> axis_offset_;

   INPUT_TAGS(INPUT, AXIS_INFO);
 };


 REGISTER_IDEEP_OPERATOR(Concat, IDEEPConcatOp);
 REGISTER_IDEEP_OPERATOR(Split, IDEEPSplitOp);

 } // namespace caffe2
caffe2::SkipIndices
Definition: common.h:132

nom::repr::Tensor
Definition: NeuralNet.h:158

caffe2::Workspace
Workspace is a class that holds all the related objects created during runtime: (1) all blobs...
Definition: workspace.h:47

caffe2::IDEEPConcatOp
Definition: concat_split_op.cc:7

c10::ArrayRef::size
constexpr size_t size() const
size - Get the array size.
Definition: ArrayRef.h:138

caffe2::IDEEPOperator
Definition: ideep_operator.h:35

caffe2
A global dictionary that holds information about what Caffe2 modules have been loaded in the current ...
Definition: blob.h:13

caffe2::IDEEPSplitOp
Definition: concat_split_op.cc:78

Concat
Definition: OpClasses.h:607

caffe2::IDEEPFallbackOp
A templated class to allow one to wrap a CPU operator as an IDEEP operator.
Definition: operator_fallback_ideep.h:39

caffe2::OperatorBase::HasArgument
bool HasArgument(const string &name) const
Checks if the operator has an argument of the given name.
Definition: operator.h:70