doxygen-c/html/lengths__reducer__fused__8bit__rowwise__ops_8h_source.html

 #ifndef CAFFE2_OPERATORS_LENGTHS_REDUCER_FUSED_8BIT_ROWWISE_OPS_H_
 #define CAFFE2_OPERATORS_LENGTHS_REDUCER_FUSED_8BIT_ROWWISE_OPS_H_

 #include "caffe2/core/context.h"
 #include "caffe2/core/logging.h"
 #include "caffe2/core/operator.h"
 #include "caffe2/operators/fused_rowwise_8bit_conversion_ops.h"
 #include "caffe2/operators/reducer_functors.h"
 #include "caffe2/perfkernels/fused_8bit_rowwise_embedding_lookup.h"
 #include "caffe2/utils/math.h"

 namespace caffe2 {

 // Operator that runs Fused8BitRowwiseEmbeddingLookup over a DATA matrix stored
 // in the fused 8-bit rowwise representation, where every row carries 8 extra
 // bytes (4 for scale, 4 for bias) in addition to its quantized values.
 //
 // Template parameters:
 //   Context      - device context forwarded to Operator<Context>.
 //   with_weights - when true, an additional WEIGHTS input (one float per
 //                  entry of INDICES) is read and handed to the lookup kernel.
 //   is_mean      - when true, the kernel is asked to normalize by lengths.
 //                  Mutually exclusive with with_weights.
 //
 // Inputs, in order: DATA, [WEIGHTS if with_weights], INDICES, LENGTHS.
 // Output 0: float tensor of shape {LENGTHS.size(0), DATA.size(1) - 8}.
 template <class Context, bool with_weights = false, bool is_mean = false>
 class SparseLengthsFused8BitRowwiseOp : public Operator<Context> {
  public:
   static_assert(
       !(with_weights && is_mean),
       "Cannot have with_weights and is_mean at the same time");

   USE_OPERATOR_CONTEXT_FUNCTIONS;
   USE_SIMPLE_CTOR_DTOR(SparseLengthsFused8BitRowwiseOp)

   // Dispatches to DoRunWithType<IndexType>() according to the element type of
   // INDICES; only int32_t and int64_t are listed as supported.
   bool RunOnDevice() override {
     return DispatchHelper<TensorTypes<int32_t, int64_t>>::call(
         this, Input(INDICES));
   }

   // Validates the inputs, allocates the output and invokes the lookup kernel.
   // IndexType is the element type of INDICES selected by RunOnDevice().
   // Returns true; validation failures are reported through CAFFE_ENFORCE_*.
   template <typename IndexType>
   bool DoRunWithType() {
     const auto& data = Input(DATA);
     const auto& indices = Input(INDICES);
     const auto& lengths = Input(LENGTHS);

     // DATA is indexed below via size(0) (rows) and size(1) (bytes per row),
     // so it has to be exactly two-dimensional. Without this check a tensor of
     // another rank would either fail with an unrelated dimension error or be
     // handed to the kernel with a block size that does not match its rows.
     CAFFE_ENFORCE_EQ(data.dim(), 2, "DATA must be a matrix");
     CAFFE_ENFORCE_EQ(indices.dim(), 1, "INDICES must be a vector");
     CAFFE_ENFORCE_EQ(lengths.dim(), 1, "LENGTHS must be a vector");

     // Stays null when the operator is instantiated without weights.
     const float* weights = nullptr;
     if (with_weights) {
       const auto& weights_input = Input(WEIGHTS);
       CAFFE_ENFORCE_EQ(weights_input.dim(), 1, "WEIGHTS must be a vector");
       CAFFE_ENFORCE_EQ(
           weights_input.numel(),
           indices.numel(),
           "WEIGHTS should have the same length as INDICES.");
       weights = weights_input.template data<float>();
     }

     CAFFE_ENFORCE_GT(data.size(1), 8, "DATA must have more than 8 columns");
     // Subtract 8 from the #columns of data for the 4 bytes for scale and 4
     // bytes for bias that we use in the fused representation (per row).
     const std::vector<int64_t> shape = {lengths.size(0), data.size(1) - 8};
     auto* output = Output(0, shape, at::dtype<float>());

     // Note: LENGTHS is read as `int` regardless of IndexType.
     Fused8BitRowwiseEmbeddingLookup(
         /*block_size=*/output->size(1),
         /*output_size=*/output->size(0),
         /*index_size=*/indices.numel(),
         /*data_size=*/data.size(0),
         /*input=*/data.template data<uint8_t>(),
         /*indices=*/indices.template data<IndexType>(),
         /*lengths=*/lengths.template data<int>(),
         /*weights=*/weights,
         /*normalize_by_lengths=*/is_mean,
         /*out=*/output->template mutable_data<float>());

     return true;
   }

   // Input positions. WEIGHTS is only meaningful when with_weights is true;
   // otherwise it shares the value 1 with INDICES and is never read.
   enum {
     DATA = 0,
     WEIGHTS = 1,
     INDICES = 1 + with_weights,
     LENGTHS = 2 + with_weights,
   };
 };

 } // namespace caffe2

 #endif // CAFFE2_OPERATORS_LENGTHS_REDUCER_FUSED_8BIT_ROWWISE_OPS_H_
caffe2::SparseLengthsFused8BitRowwiseOp
Definition: lengths_reducer_fused_8bit_rowwise_ops.h:15

caffe2::Operator::Input
const Tensor & Input(int idx, DeviceType type=Context::GetDeviceType())
Retrieve a non-owning reference to the input at position 'idx' for this operator. ...
Definition: operator.h:702

caffe2
A global dictionary that holds information about what Caffe2 modules have been loaded in the current ...
Definition: blob.h:13

caffe2::DispatchHelper
Definition: operator.h:1052

caffe2::Operator
Definition: operator.h:677

caffe2::Fused8BitRowwiseEmbeddingLookup
void Fused8BitRowwiseEmbeddingLookup(const std::int64_t block_size, const std::int64_t output_size, const std::int64_t index_size, const std::int64_t data_size, const InType *input, const IndexType *indices, const int *lengths, const float *weights, bool normalize_by_lengths, OutType *out)
Embedding lookup with reduction.