Caffe2 - C++ API
A deep learning, cross-platform ML framework
argument_spec.h
1 #pragma once
2 
3 #include <torch/csrc/autograd/variable.h>
4 #include <torch/csrc/jit/ir.h>
5 #include <ATen/core/stack.h>
6 #include <ATen/core/jit_type.h>
7 #include <torch/csrc/jit/variable_tensor_list.h>
8 #include <torch/csrc/utils/hash.h>
9 #include <iostream>
10 #include <vector>
11 
12 namespace torch {
13 namespace jit {
14 
15 // GraphExecutor creates specializations of Graphs for different
16 // dimensionalities and types of inputs.
17 
18 inline static at::Device ConvertIntToCPUOrCUDA(int device) {
19  return device < 0 ? at::kCPU : at::Device(at::DeviceType::CUDA, device);
20 }
21 struct ArgumentInfo {
22  friend struct ArgumentSpec;
23  using plain_data_type = uint32_t;
24 
25  bool isTensor() const {
26  return is_tensor_;
27  }
28  bool defined() const {
29  return defined_;
30  }
31  int device() const {
32  return device_;
33  }
34  // XXX: It is guaranteed that this will return false when called on non-tensor
35  // arguments
36  bool requires_grad() const {
37  return requires_grad_;
38  }
39  int dim() const {
40  return dim_;
41  }
42  at::ScalarType type() const {
43  return at::ScalarType(type_);
44  }
45  operator TypePtr() const {
46  if (!defined())
47  return TensorType::get();
48  return DimensionedTensorType::create(type(), ConvertIntToCPUOrCUDA(device()), dim());
49  }
50 
51  private:
52  unsigned is_tensor_ : 1;
53  unsigned defined_ : 1;
54  unsigned requires_grad_ : 1;
55  unsigned : 5;
56  unsigned dim_ : 8;
57  int device_ : 8; // NOTE: this needs to be signed because we use -1 to
58  // represent CPU
59  unsigned type_ : 8;
60 };
61 
62 static_assert(
63  std::is_pod<ArgumentInfo>::value,
64  "ArgumentInfo is to be a POD struct");
65 static_assert(
66  sizeof(ArgumentInfo) == sizeof(ArgumentInfo::plain_data_type),
67  "ArgumentInfo is expected to be a 32-bit struct");
68 
69 struct ArgumentSpec {
70  ArgumentSpec(
71  bool with_grad,
72  at::ArrayRef<IValue> inputs,
73  size_t num_flat_inputs) {
74  hash_code = num_flat_inputs;
75  args.resize(num_flat_inputs);
76  size_t offset = 0;
77  for (const auto& i : inputs) {
78  addInput(i, offset, with_grad);
79  }
80  AT_ASSERT(offset <= num_flat_inputs);
81  }
82 
83  void addInput(const IValue& input, size_t& offset, bool with_grad) {
84  auto& arg = args.at(offset);
85  // Initialize all fields to 0. This is convenient, because e.g.
86  // requires_grad() can be checked even on non-tensor arguments AND
87  // will make padding bits all 0s.
88  std::memset(&arg, 0, sizeof(ArgumentInfo));
89 
90  if (input.isTensor()) {
91  at::Tensor t = input.toTensor();
92  if ((arg.defined_ = t.defined())) {
93  arg.requires_grad_ = with_grad && autograd::Variable(t).requires_grad();
94  arg.dim_ = t.dim();
95  arg.device_ = t.is_cuda() ? t.get_device() : -1;
96  arg.type_ = static_cast<unsigned>(t.scalar_type());
97  }
98 
99  arg.is_tensor_ = true;
100  combineHash(arg);
101  offset++;
102  } else if (input.isTuple()) {
103  for (const IValue& elem : input.toTuple()->elements()) {
104  addInput(elem, offset, with_grad);
105  }
106  } else {
107  // NB: no need to set is_tensor to false, because we memset the struct to
108  // 0 above
109  combineHash(arg);
110  offset++;
111  }
112  }
113 
114  void combineHash(const ArgumentInfo& arg) {
115  ArgumentInfo::plain_data_type arg_data;
116  std::memcpy(&arg_data, &arg, sizeof(ArgumentInfo));
117  hash_code = hash_combine(hash_code, arg_data);
118  }
119 
120  // equality is fast: check the number of args and then compare the raw
121  // array data; there are no size/stride indirections
122  bool operator==(const ArgumentSpec& spec) const {
123  if (args.size() != spec.args.size())
124  return false;
125  // NB: we need to break out early when there are no elements, because
126  // passing a nullptr to memcmp is UB.
127  if (args.size() == 0)
128  return true;
129  return std::memcmp(
130  args.data(),
131  spec.args.data(),
132  args.size() * sizeof(ArgumentInfo)) == 0;
133  }
134  bool operator!=(const ArgumentSpec& spec) const {
135  return !(*this == spec);
136  }
137  size_t size() const {
138  return args.size();
139  }
140  const ArgumentInfo& at(size_t i) const {
141  return args[i];
142  }
143  size_t hashCode() const {
144  return hash_code;
145  }
146  // For every input of a given graph, returns the most detailed type that can be
147  // inferred for it based on this ArgumentSpec.
148  std::vector<TypePtr> getTypes(Graph& graph) const {
149  size_t offset = 0;
150  return fmap(
151  graph.inputs(), [&](Value* v) { return fillType(v->type(), offset); });
152  }
153 
154  private:
155  TypePtr fillType(TypePtr original, size_t& offset) const {
156  if (original->isSubtypeOf(TensorType::get())) {
157  auto& arg = args.at(offset++);
158  if (!arg.defined())
159  return AutogradZeroTensorType::get();
160  return DimensionedTensorType::create(
161  arg.type(),
162  ConvertIntToCPUOrCUDA(arg.device()),
163  arg.dim(),
164  arg.requires_grad());
165  } else if (auto tuple_type = original->cast<TupleType>()) {
166  return TupleType::create(fmap(
167  tuple_type->elements(),
168  [&](const TypePtr& subtype) { return fillType(subtype, offset); }));
169  } else {
170  offset++;
171  return original;
172  }
173  }
174  size_t hash_code; // precomputed on construction
175  std::vector<ArgumentInfo> args;
176 };
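// --- Usage sketch (not part of the original header) -----------------------
// How a caller might use the ArgumentSpec API declared above to decide
// whether two calls can share one compiled specialization. Only names
// defined in this header and its includes are used; `same_specialization`
// itself is a hypothetical helper.
inline bool same_specialization(
    const std::vector<IValue>& a,
    const std::vector<IValue>& b,
    size_t num_flat_inputs) {
  ArgumentSpec spec_a(/*with_grad=*/true, a, num_flat_inputs);
  ArgumentSpec spec_b(/*with_grad=*/true, b, num_flat_inputs);
  // operator== is a memcmp over the packed ArgumentInfo words; the hash was
  // precomputed in the constructor.
  return spec_a.hashCode() == spec_b.hashCode() && spec_a == spec_b;
}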
177 
178 // CompleteArgumentSpec represents one particular specialization.
179 // It is designed so that it can be created, hashed, and compared quickly
180 // since it is used along the hot-path of the JIT to check if the code
181 // we have created is valid for the given inputs.
182 
183 // CompleteArgumentInfoPOD is only used internally in CompleteArgumentSpec;
184 // API users should use ArgumentInfo
185 struct CompleteArgumentInfoPOD {
186  // total size is 64-bit
187  unsigned is_tensor : 8; // all other fields are invalid if this is false
188  unsigned type : 8; // scalar type
189  unsigned defined : 1;
190  unsigned requires_grad : 1;
191  signed device : 14;
192  uint32_t total_dims; // all CompleteArgumentInfoPODs are in CompleteArgumentSpec's
193  // tensor_info() array. total_dims is the total number of
194  // dimensions seen so far in all previous members of
195  // tensor_info(), including this tensor. 2*total_dims
196  // becomes the offset into the sizes_strides list for the
197  // _next_ tensor in the tensor_info array; for tensor 0,
198  // the offset is always 0.
199 };
200 
201 static_assert(
202  sizeof(CompleteArgumentInfoPOD) == sizeof(int64_t),
203  "CompleteArgumentInfoPOD must be 64-bit struct for CompleteArgumentSpec encoding to work");
204 
205 struct CompleteArgumentInfo;
206 
207 struct CompleteArgumentSpec {
208  CompleteArgumentSpec(bool with_grad, at::ArrayRef<IValue> inputs)
209  : hash_code(0), ninputs(inputs.size()) {
210  int32_t all_dims = 0;
211  const int32_t num_inputs = inputs.size();
212  for (int32_t i = 0; i < num_inputs; i++) {
213  if (!inputs[i].isTensor())
214  continue;
215  auto tensor = inputs[i].toTensor();
216  all_dims += tensor.defined() ? tensor.ndimension() : 0;
217  }
218  // allocate enough room for all TensorPODs and dimensions
219  data.resize(ninputs + all_dims * 2);
220 
221  // and reinterpret our data array as these structs
222  auto* pods = reinterpret_cast<CompleteArgumentInfoPOD*>(data.data());
223  int64_t* next_dim = sizes_strides();
224  int32_t total_dims = 0;
225  for (int32_t i = 0; i < num_inputs; i++) {
226  auto& pod = pods[i];
227  pod.is_tensor = static_cast<uint32_t>(inputs[i].isTensor());
228  if (pod.is_tensor) {
229  at::Tensor t = inputs[i].toTensor();
230  pod.defined = t.defined();
231  if (pod.defined) {
232  pod.type = static_cast<int>(t.scalar_type());
233  pod.device = (!t.is_cuda()) ? -1 : t.get_device();
234  pod.requires_grad =
235  with_grad && autograd::as_variable_ref(t).requires_grad();
236  total_dims += t.ndimension();
237  auto sizes = t.sizes();
238  std::copy(sizes.begin(), sizes.end(), next_dim);
239  next_dim += sizes.size();
240  auto strides = t.strides();
241  std::copy(strides.begin(), strides.end(), next_dim);
242  next_dim += strides.size();
243  }
244  }
245  // each POD has a running tally of all dimensions including its own
246  pod.total_dims = total_dims;
247  }
248  // we precompute the hash_code to minimize the time inside of hash
249  // table operations where we may need to hold a compiler cache lock.
250  hash_code = hash_combine(0, ninputs);
251  for (auto d : data) {
252  hash_code = hash_combine(hash_code, d);
253  }
254  }
255 
256  // equality is fast: check ninputs and then compare the raw array data;
257  // there are no size/stride indirections
258  bool operator==(const CompleteArgumentSpec& spec) const {
259  return ninputs == spec.ninputs && data == spec.data;
260  }
261  bool operator!=(const CompleteArgumentSpec& spec) const {
262  return !(*this == spec);
263  }
264  friend struct CompleteArgumentInfo;
265  CompleteArgumentInfo at(size_t i) const;
266  size_t size() const {
267  return ninputs;
268  }
269  size_t hashCode() const {
270  return hash_code;
271  }
272 
273  private:
274  ArrayRef<CompleteArgumentInfoPOD> tensor_info() const {
275  return ArrayRef<CompleteArgumentInfoPOD>(
276  reinterpret_cast<const CompleteArgumentInfoPOD*>(data.data()), ninputs);
277  }
278  // the start of the sizes_strides information, which comes after the
279  // CompleteArgumentInfoPOD list.
280  const int64_t* sizes_strides() const {
281  return data.data() + ninputs;
282  }
283  int64_t* sizes_strides() {
284  return data.data() + ninputs;
285  }
286  size_t hash_code; // precomputed on construction
287  int32_t ninputs;
288  // layout is ninputs of CompleteArgumentInfoPOD (each 64-bit) followed by
289  // their size and stride info; e.g. for 3 tensors:
290  // [t0POD][t1POD][t2POD]...
291  // [t0 sizes][t0 strides][t1 sizes][t1 strides][t2 sizes][t2 strides]
292  std::vector<int64_t> data;
293 };
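// --- Usage sketch (not part of the original header) -----------------------
// CompleteArgumentSpec folds the concrete sizes and strides into data (and
// hence into hash_code), so two tensors of equal rank/type/device but
// different shapes still produce different specs, unlike ArgumentSpec above.
// `same_complete_specialization` is a hypothetical helper.
inline bool same_complete_specialization(
    const std::vector<IValue>& a,
    const std::vector<IValue>& b) {
  CompleteArgumentSpec spec_a(/*with_grad=*/false, a);
  CompleteArgumentSpec spec_b(/*with_grad=*/false, b);
  return spec_a == spec_b; // ninputs check plus raw data comparison
}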
294 
295 // public view of compressed CompleteArgumentInfo
296 struct CompleteArgumentInfo {
297  CompleteArgumentInfo(const CompleteArgumentSpec& spec, const int i)
298  : spec(spec), i(i) {}
299  bool isTensor() const {
300  return pod(i).is_tensor;
301  }
302  at::ScalarType type() const {
303  return at::ScalarType(pod(i).type);
304  }
305  bool defined() const {
306  return pod(i).defined;
307  }
308  bool requires_grad() const {
309  return pod(i).requires_grad;
310  }
311  int device() const {
312  return pod(i).device;
313  }
314  int ndimension() const {
315  // See [valid range]; it is always valid to ask for the offset of (i + 1)
316  return (sizes_strides_offset(i + 1) - sizes_strides_offset(i)) / 2;
317  }
318  at::IntArrayRef sizes() const {
319  return at::IntArrayRef(
320  spec.sizes_strides() + sizes_strides_offset(i), ndimension());
321  }
322  at::IntArrayRef strides() const {
323  int ndim = ndimension();
324  return at::IntArrayRef(
325  spec.sizes_strides() + sizes_strides_offset(i) + ndim, ndim);
326  }
327  operator TypePtr() const {
328  if (!defined())
329  return TensorType::get();
330  return CompleteTensorType::create(
331  type(), ConvertIntToCPUOrCUDA(device()), sizes(), strides());
332  }
333 
334  private:
335  // offset into sizes_strides() array where the sizes start for tensor j
336  // [valid range] valid range is [0, ninputs]
337  // (i.e. you can ask for the offset at ninputs, which would be the offset of
338  // the next tensor if it existed)
339  int sizes_strides_offset(int j) const {
340  if (j == 0)
341  return 0;
342  return 2 * pod(j - 1).total_dims;
343  }
344  const CompleteArgumentInfoPOD& pod(int j) const {
345  return spec.tensor_info().at(j);
346  }
347  const CompleteArgumentSpec& spec;
348  const int i;
349 };
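// --- Usage sketch (not part of the original header) -----------------------
// Reading shape information back through the CompleteArgumentInfo view.
// CompleteArgumentSpec::at(i) is declared above and defined near the end of
// this file; sizes()/strides() decode the packed sizes_strides area using
// the running total_dims tally. `print_complete_info` is a hypothetical
// helper.
inline void print_complete_info(const CompleteArgumentSpec& spec) {
  for (size_t i = 0; i < spec.size(); ++i) {
    CompleteArgumentInfo info = spec.at(i);
    if (!info.isTensor() || !info.defined())
      continue; // non-tensors and undefined tensors carry no sizes/strides
    std::cout << "arg " << i << ": dims=" << info.ndimension()
              << " sizes=" << info.sizes() << " strides=" << info.strides()
              << "\n";
  }
}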
350 
351 inline std::ostream& operator<<(std::ostream& out, const ArgumentInfo& info) {
352  if (!info.defined()) {
353  return out << "<undefined>";
354  }
355  out << "Tensor(device=" << info.device() << ", type=" << toString(info.type())
356  << ", requires_grad=" << info.requires_grad() << ", dims=" << info.dim()
357  << ")";
358  return out;
359 }
360 
361 inline std::ostream& operator<<(std::ostream& out, const ArgumentSpec& spec) {
362  out << "{";
363  for (size_t i = 0; i < spec.size(); ++i) {
364  if (i > 0)
365  out << ", ";
366  out << spec.at(i);
367  }
368  out << "}";
369  return out;
370 }
371 
372 inline std::ostream& operator<<(
373  std::ostream& out,
374  const CompleteArgumentInfo& info) {
375  if (!info.defined()) {
376  return out << "<undefined>";
377  }
378  out << "Tensor(device=" << info.device() << ", type=" << toString(info.type())
379  << ", requires_grad=" << info.requires_grad()
380  << ", sizes=" << info.sizes() << ", strides=" << info.strides() << ")";
381  return out;
382 }
383 
384 inline std::ostream& operator<<(
385  std::ostream& out,
386  const CompleteArgumentSpec& spec) {
387  out << "{";
388  for (size_t i = 0; i < spec.size(); ++i) {
389  if (i > 0)
390  out << ", ";
391  out << spec.at(i);
392  }
393  out << "}";
394  return out;
395 }
396 
397 inline CompleteArgumentInfo CompleteArgumentSpec::at(size_t i) const {
398  return CompleteArgumentInfo(*this, i);
399 }
400 
401 inline void setInputTypes(Graph& g, const ArgumentSpec& spec) {
402  auto input_types = spec.getTypes(g);
403  auto inputs = g.inputs();
404  for (size_t i = 0; i < inputs.size(); ++i) {
405  inputs[i]->setType(input_types[i]);
406  }
407 }
408 
409 } // namespace jit
410 } // namespace torch
411 
412 namespace std {
413 template <>
414 struct hash<torch::jit::ArgumentSpec> {
415  size_t operator()(const torch::jit::ArgumentSpec& spec) const {
416  return spec.hashCode();
417  }
418 };
419 template <>
420 struct hash<torch::jit::CompleteArgumentSpec> {
421  size_t operator()(const torch::jit::CompleteArgumentSpec& spec) const {
422  return spec.hashCode();
423  }
424 };
425 } // namespace std
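// --- Usage sketch (not part of the original header) -----------------------
// The std::hash specializations above exist so a compiled-plan cache can be
// keyed directly on the spec. `CachedPlan` and `lookup_or_compile` are
// hypothetical placeholders for whatever a GraphExecutor-style cache stores;
// <unordered_map> would need to be included.
struct CachedPlan {};

inline CachedPlan& lookup_or_compile(
    std::unordered_map<torch::jit::ArgumentSpec, CachedPlan>& cache,
    const torch::jit::ArgumentSpec& spec) {
  // hashCode() was precomputed when the spec was built, so the probe costs a
  // hash lookup plus a memcmp-based operator== on bucket collisions.
  return cache[spec]; // default-constructs a CachedPlan on a miss
}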