Caffe2 - C++ API
A deep learning, cross platform ML framework
module.cpp
1 #include <torch/nn/module.h>
2 
3 #include <torch/ordered_dict.h>
4 
5 #include <torch/csrc/autograd/generated/VariableType.h>
6 
7 #include <c10/util/Exception.h>
8 
9 #include <algorithm>
10 #include <functional>
11 #include <map>
12 #include <ostream>
13 #include <string>
14 #include <typeinfo>
15 
16 namespace torch {
17 namespace nn {
18 namespace {
/// Joins `name_prefix` and `name` with a dot ("prefix.name"); an empty
/// prefix yields `name` unchanged. Used to build hierarchical module keys.
std::string join_name(const std::string& name_prefix, const std::string& name) {
  if (name_prefix.empty()) {
    return name;
  }
  std::string joined;
  // Reserve exactly: prefix + '.' + name.
  joined.reserve(name_prefix.size() + 1 + name.size());
  joined += name_prefix;
  joined.push_back('.');
  joined += name;
  return joined;
}
35 
36 void extend(
37  std::vector<Tensor>& vector,
39  vector.reserve(vector.size() + dict.size());
40  for (const auto& item : dict) {
41  vector.push_back(item.value());
42  }
43 }
44 } // namespace
45 
47  : parameters_("Parameter"), buffers_("Buffer"), children_("Submodule") {}
48 
49 Module::Module(std::string name) : Module() {
50  name_ = std::move(name);
51 }
52 
53 const std::string& Module::name() const noexcept {
54  // If the name optional is empty at this point, we grab the name of the
55  // dynamic type via RTTI. Note that we cannot do this in the constructor,
56  // because in the constructor of a base class `this` always refers to the base
57  // type. Inheritance effectively does not work in constructors. Also this note
58  // from http://en.cppreference.com/w/cpp/language/typeid:
59  // If typeid is used on an object under construction or destruction (in a
60  // destructor or in a constructor, including constructor's initializer list
61  // or default member initializers), then the std::type_info object referred
62  // to by this typeid represents the class that is being constructed or
63  // destroyed even if it is not the most-derived class.
64  if (!name_.has_value()) {
65  name_ = c10::demangle(typeid(*this).name());
66 #if defined(_WIN32)
67  // Windows adds "struct" or "class" as a prefix.
68  if (name_->find("struct ") == 0) {
69  name_->erase(name_->begin(), name_->begin() + 7);
70  } else if (name_->find("class ") == 0) {
71  name_->erase(name_->begin(), name_->begin() + 6);
72  }
73 #endif // defined(_WIN32)
74  }
75  return *name_;
76 }
77 
78 std::shared_ptr<Module> Module::clone(const optional<Device>& device) const {
79  AT_ERROR(
80  "clone() has not been implemented for ",
81  name(),
82  ". Subclass torch::nn::Cloneable<",
83  name(),
84  "> instead of torch::nn::Module to inherit the ability to clone.");
85 }
86 
87 void Module::apply(const ModuleApplyFunction& function) {
88  function(*this);
89  apply_to_submodules(
90  [&function](const std::string&, const std::shared_ptr<Module>& module) {
91  function(*module);
92  });
93 }
94 
95 void Module::apply(const ConstModuleApplyFunction& function) const {
96  function(*this);
97  apply_to_submodules(
98  [&function](const std::string&, const std::shared_ptr<Module>& module) {
99  function(*module);
100  });
101 }
102 
104  const NamedModuleApplyFunction& function,
105  const std::string& name_prefix) {
106  function(/*name=*/name_prefix, *this);
107  apply_to_submodules(
108  [&function](
109  const std::string& name, const std::shared_ptr<Module>& module) {
110  function(name, *module);
111  },
112  name_prefix);
113 }
114 
116  const ConstNamedModuleApplyFunction& function,
117  const std::string& name_prefix) const {
118  function(/*name=*/name_prefix, *this);
119  apply_to_submodules(
120  [&function](
121  const std::string& name, const std::shared_ptr<Module>& module) {
122  function(name, *module);
123  },
124  name_prefix);
125 }
126 
127 void Module::apply(const ModulePointerApplyFunction& function) const {
128  function(shared_from_this_checked());
129  apply_to_submodules(
130  [&function](const std::string&, const std::shared_ptr<Module>& module) {
131  function(module);
132  });
133 }
134 
136  const NamedModulePointerApplyFunction& function,
137  const std::string& name_prefix) const {
138  function(
139  /*name=*/name_prefix, shared_from_this_checked());
140  apply_to_submodules(function, name_prefix);
141 }
142 
143 std::vector<Tensor> Module::parameters(bool recurse) const {
144  if (!recurse) {
145  return parameters_.values();
146  }
147  std::vector<Tensor> result;
148  apply(
149  [&result](const Module& module) { extend(result, module.parameters_); });
150  return result;
151 }
152 
154  if (!recurse) {
155  return parameters_;
156  }
158  apply([&result](const std::string& name, const Module& module) {
159  for (const auto& parameter : module.parameters_) {
160  result.insert(join_name(name, parameter.key()), parameter.value());
161  }
162  });
163  return result;
164 }
165 
166 std::vector<Tensor> Module::buffers(bool recurse) const {
167  if (!recurse) {
168  return buffers_.values();
169  }
170  std::vector<Tensor> result;
171  apply([&result](const Module& module) { extend(result, module.buffers_); });
172  return result;
173 }
175  if (!recurse) {
176  return buffers_;
177  }
179  apply([&result](const std::string& name, const Module& module) {
180  for (const auto& buffer : module.buffers_) {
181  result.insert(join_name(name, buffer.key()), buffer.value());
182  }
183  });
184  return result;
185 }
186 
187 std::vector<std::shared_ptr<Module>> Module::modules(bool include_self) const {
188  std::vector<std::shared_ptr<Module>> result;
189  if (include_self) {
190  apply([&result](const std::shared_ptr<Module>& module) {
191  result.push_back(module);
192  });
193  } else {
194  apply_to_submodules(
195  [&result](const std::string&, const std::shared_ptr<Module>& module) {
196  result.push_back(module);
197  });
198  }
199  return result;
200 }
201 
203  const std::string& name_prefix,
204  bool include_self) const {
206  if (include_self) {
207  apply(
208  [&result](
209  const std::string& key, const std::shared_ptr<Module>& module) {
210  result.insert(key, module);
211  },
212  name_prefix);
213  } else {
214  apply_to_submodules(
215  [&result](
216  const std::string& key, const std::shared_ptr<Module>& module) {
217  result.insert(key, module);
218  },
219  name_prefix);
220  }
221  return result;
222 }
223 
224 std::vector<std::shared_ptr<Module>> Module::children() const {
225  return children_.values();
226 }
227 
229  const {
230  return children_;
231 }
232 
233 void Module::train(bool on) {
234  for (auto& child : children_) {
235  child.value()->train(on);
236  }
237  is_training_ = on;
238 }
239 
240 void Module::eval() {
241  train(/*on=*/false);
242 }
243 
244 void Module::to(torch::Device device, torch::Dtype dtype, bool non_blocking) {
245  to_impl(device, dtype, non_blocking);
246 }
247 
248 void Module::to(torch::Dtype dtype, bool non_blocking) {
249  to_impl(dtype, non_blocking);
250 }
251 
252 void Module::to(torch::Device device, bool non_blocking) {
253  to_impl(device, non_blocking);
254 }
255 
256 bool Module::is_training() const noexcept {
257  return is_training_;
258 }
259 
261  for (auto& child : children_) {
262  child.value()->zero_grad();
263  }
264  for (auto& parameter : parameters_) {
265  auto& grad = parameter->grad();
266  if (grad.defined()) {
267  grad = grad.detach();
268  grad.zero_();
269  }
270  }
271 }
272 
274  for (const auto& parameter : parameters_) {
275  archive.write(parameter.key(), parameter.value());
276  }
277  for (const auto& buffer : buffers_) {
278  archive.write(buffer.key(), buffer.value(), /*is_buffer=*/true);
279  }
280  for (const auto& child : children_) {
281  serialize::OutputArchive child_archive;
282  child.value()->save(child_archive);
283  archive.write(child.key(), child_archive);
284  }
285 }
286 
288  for (auto& parameter : parameters_) {
289  archive.read(parameter.key(), parameter.value());
290  }
291  for (auto& buffer : buffers_) {
292  archive.read(buffer.key(), buffer.value(), /*is_buffer=*/true);
293  }
294  for (const auto& child : children_) {
295  serialize::InputArchive child_archive;
296  archive.read(child.key(), child_archive);
297  child.value()->load(child_archive);
298  }
299 }
300 
302  std::string name,
303  Tensor tensor,
304  bool requires_grad) {
305  AT_CHECK(!name.empty(), "Parameter name must not be empty");
306  AT_CHECK(
307  name.find('.') == std::string::npos,
308  "Parameter name must not contain a dot (got '",
309  name,
310  "')");
311  tensor.set_requires_grad(requires_grad);
312  return parameters_.insert(std::move(name), std::move(tensor));
313 }
314 
315 Tensor& Module::register_buffer(std::string name, Tensor tensor) {
316  AT_CHECK(!name.empty(), "Buffer name must not be empty");
317  AT_CHECK(
318  name.find('.') == std::string::npos,
319  "Buffer name must not contain a dot (got '",
320  name,
321  "')");
322  return buffers_.insert(std::move(name), std::move(tensor));
323 }
324 
325 void Module::pretty_print(std::ostream& stream) const {
326  stream << name();
327 }
328 
329 void Module::pretty_print_recursive(
330  std::ostream& stream,
331  const std::string& indentation) const {
332  pretty_print(stream);
333  if (!children_.is_empty()) {
334  stream << "(\n";
335  const std::string next_indentation = indentation + " ";
336  for (const auto& child : children_) {
337  stream << next_indentation << "(" << child.key() << "): ";
338  child.value()->pretty_print_recursive(stream, next_indentation);
339  stream << '\n';
340  }
341  stream << indentation << ")";
342  }
343 }
344 
345 void Module::clone_(Module& other, const optional<Device>& device) {}
346 
347 void Module::apply_to_submodules(
348  const NamedModulePointerApplyFunction& function,
349  const std::string& name_prefix) const {
350  for (const auto& child : children_) {
351  auto qualified_name = join_name(name_prefix, child.key());
352  function(qualified_name, child.value());
353  child.value()->apply_to_submodules(function, qualified_name);
354  }
355 }
356 
357 std::shared_ptr<Module> Module::shared_from_this_checked() const {
358  std::shared_ptr<const Module> ptr;
359  try {
360  ptr = shared_from_this();
361  } catch (const std::bad_weak_ptr& e) {
362  AT_ERROR(
363  "It looks like you attempted to retrieve your top-level module "
364  "as a shared_ptr, but it is not stored in a shared_ptr. "
365  "Use std::make_shared<",
366  name(),
367  "> instead of creating your module on "
368  "the stack, or alternatively do not try to access your top-level "
369  "module at all by passing /*include_self=*/false "
370  "to modules() or named_modules()");
371  }
372  return std::const_pointer_cast<Module>(ptr);
373 }
374 
375 std::ostream& operator<<(std::ostream& stream, const nn::Module& module) {
376  module.pretty_print_recursive(stream, "");
377  return stream;
378 }
379 
381  serialize::OutputArchive& archive,
382  const std::shared_ptr<nn::Module>& module) {
383  AT_CHECK(module != nullptr, "Cannot serialize empty module");
384  module->save(archive);
385  return archive;
386 }
387 
388 serialize::InputArchive& operator>>(
389  serialize::InputArchive& archive,
390  const std::shared_ptr<nn::Module>& module) {
391  AT_CHECK(module != nullptr, "Cannot deserialize empty module");
392  module->load(archive);
393  return archive;
394 }
395 } // namespace nn
396 } // namespace torch
virtual void pretty_print(std::ostream &stream) const
Streams a pretty representation of the Module into the given stream.
Definition: module.cpp:325
size_t size() const noexcept
Returns the number of items currently stored in the OrderedDict.
Definition: ordered_dict.h:419
virtual void save(serialize::OutputArchive &archive) const
Serializes the Module into the given OutputArchive.
Definition: module.cpp:273
std::vector< Tensor > buffers(bool recurse=true) const
Returns the buffers of this Module and if recurse is true, also recursively of every submodule...
Definition: module.cpp:166
Tensor & register_parameter(std::string name, Tensor tensor, bool requires_grad=true)
Registers a parameter with this Module.
Definition: module.cpp:301
OrderedDict< std::string, Tensor > named_parameters(bool recurse=true) const
Returns an OrderedDict with the parameters of this Module along with their keys, and if recurse is tr...
Definition: module.cpp:153
Value & insert(K &&key, V &&value)
Inserts a new (key, value) pair into the OrderedDict.
Definition: ordered_dict.h:357
virtual void load(serialize::InputArchive &archive)
Deserializes the Module from the given InputArchive.
Definition: module.cpp:287
const std::string & name() const noexcept
Returns the name of the Module.
Definition: module.cpp:53
virtual bool is_training() const noexcept
True if the module is in training mode.
Definition: module.cpp:256
std::vector< std::shared_ptr< Module > > children() const
Returns the direct submodules of this Module.
Definition: module.cpp:224
virtual void zero_grad()
Recursively zeros out the grad value of each registered parameter.
Definition: module.cpp:260
std::vector< std::shared_ptr< Module > > modules(bool include_self=true) const
Returns the submodules of this Module (the entire submodule hierarchy) and if include_self is true...
Definition: module.cpp:187
void read(const std::string &key, Tensor &tensor, bool is_buffer=false)
Reads a tensor associated with a given key.
Represents a compute device on which a tensor is located.
Definition: Device.h:30
std::vector< Tensor > parameters(bool recurse=true) const
Returns the parameters of this Module and if recurse is true, also recursively of every submodule...
Definition: module.cpp:143
virtual void train(bool on=true)
Enables "training" mode.
Definition: module.cpp:233
Tensor & register_buffer(std::string name, Tensor tensor)
Registers a buffer with this Module.
Definition: module.cpp:315
virtual std::shared_ptr< Module > clone(const optional< Device > &device=nullopt) const
Performs a recursive deep copy of the module and all its registered parameters, buffers and submodule...
Definition: module.cpp:78
TORCH_API friend std::ostream & operator<<(std::ostream &stream, const nn::Module &module)
Pretty prints the given Module into the ostream.
Definition: module.cpp:375
OrderedDict< std::string, std::shared_ptr< Module > > named_children() const
Returns an OrderedDict of the direct submodules of this Module and their keys.
Definition: module.cpp:228
virtual void to(torch::Device device, torch::Dtype dtype, bool non_blocking=false)
Recursively casts all parameters to the given dtype and device.
Definition: module.cpp:244
The base class for all modules in PyTorch.
Definition: module.h:62
Definition: jit_type.h:17
OrderedDict< std::string, Tensor > named_buffers(bool recurse=true) const
Returns an OrderedDict with the buffers of this Module along with their keys, and if recurse is true ...
Definition: module.cpp:174
void write(const std::string &key, const Tensor &tensor, bool is_buffer=false)
Writes a (key, tensor) pair to the OutputArchive, and marks it as being or not being a buffer (non-di...
std::string demangle(const char *name)
Utility to demangle a C++ symbol name.
Definition: Type.cpp:23
void apply(const ModuleApplyFunction &function)
Applies the function to the Module and recursively to every submodule.
Definition: module.cpp:87
A recursive representation of tensors that can be deserialized from a file or stream.
Definition: input-archive.h:32
Module()
Constructs the module without immediate knowledge of the submodule's name.
Definition: module.cpp:46
void eval()
Calls train(false) to enable "eval" mode.
Definition: module.cpp:240
An ordered dictionary implementation, akin to Python's OrderedDict.
Definition: ordered_dict.h:16
OrderedDict< std::string, std::shared_ptr< Module > > named_modules(const std::string &name_prefix=std::string(), bool include_self=true) const
Returns an OrderedDict of the submodules of this Module (the entire submodule hierarchy) and their keys...
Definition: module.cpp:202