// Caffe2 - C++ API
// A deep learning, cross platform ML framework
// rnn.h
1 #pragma once
2 
3 #include <torch/nn/cloneable.h>
4 #include <torch/nn/modules/dropout.h>
5 #include <torch/nn/pimpl.h>
6 #include <torch/types.h>
7 
8 #include <ATen/ATen.h>
9 #include <c10/util/Exception.h>
10 
11 #include <cstddef>
12 #include <functional>
13 #include <memory>
14 #include <vector>
15 
16 namespace torch {
17 namespace nn {
18 
20 struct TORCH_API RNNOutput {
27 };
28 
29 namespace detail {
30 
32 struct TORCH_API RNNOptionsBase {
33  RNNOptionsBase(int64_t input_size, int64_t hidden_size);
34  virtual ~RNNOptionsBase() = default;
36  TORCH_ARG(int64_t, input_size);
38  TORCH_ARG(int64_t, hidden_size);
40  TORCH_ARG(int64_t, layers) = 1;
42  TORCH_ARG(bool, with_bias) = true;
45  TORCH_ARG(double, dropout) = 0.0;
47  TORCH_ARG(bool, bidirectional) = false;
51  TORCH_ARG(bool, batch_first) = false;
52 };
53 
55 template <typename Derived>
56 class RNNImplBase : public torch::nn::Cloneable<Derived> {
57  public:
60  enum class CuDNNMode { RNN_RELU = 0, RNN_TANH = 1, LSTM = 2, GRU = 3 };
61 
62  explicit RNNImplBase(
63  const RNNOptionsBase& options_,
64  optional<CuDNNMode> cudnn_mode = nullopt,
65  int64_t number_of_gates = 1);
66 
68  void reset() override;
69 
72  void to(torch::Device device, torch::Dtype dtype, bool non_blocking = false)
73  override;
74  void to(torch::Dtype dtype, bool non_blocking = false) override;
75  void to(torch::Device device, bool non_blocking = false) override;
76 
78  void pretty_print(std::ostream& stream) const override;
79 
88  void flatten_parameters();
89 
92 
94  std::vector<Tensor> w_ih;
96  std::vector<Tensor> w_hh;
98  std::vector<Tensor> b_ih;
100  std::vector<Tensor> b_hh;
101 
102  protected:
104  using RNNFunctionSignature = std::tuple<Tensor, Tensor>(
105  /*input=*/const Tensor&,
106  /*state=*/const Tensor&,
107  /*params=*/TensorList,
108  /*has_biases=*/bool,
109  /*layers=*/int64_t,
110  /*dropout=*/double,
111  /*train=*/bool,
112  /*bidirectional=*/bool,
113  /*batch_first=*/bool);
114 
117  RNNOutput generic_forward(
118  std::function<RNNFunctionSignature> function,
119  const Tensor& input,
120  Tensor state);
121 
124  std::vector<Tensor> flat_weights() const;
125 
127  bool any_parameters_alias() const;
128 
131 
134 
136  std::vector<Tensor> flat_weights_;
137 };
138 } // namespace detail
139 
140 // ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ RNN ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
141 
/// Activation functions selectable for the `RNN` module
/// (see `RNNOptions::activation`).
enum class RNNActivation : uint32_t {ReLU, Tanh};
143 
145 struct TORCH_API RNNOptions {
146  RNNOptions(int64_t input_size, int64_t hidden_size);
147 
149  RNNOptions& tanh();
151  RNNOptions& relu();
152 
154  TORCH_ARG(int64_t, input_size);
156  TORCH_ARG(int64_t, hidden_size);
158  TORCH_ARG(int64_t, layers) = 1;
160  TORCH_ARG(bool, with_bias) = true;
163  TORCH_ARG(double, dropout) = 0.0;
165  TORCH_ARG(bool, bidirectional) = false;
169  TORCH_ARG(bool, batch_first) = false;
171  TORCH_ARG(RNNActivation, activation) = RNNActivation::ReLU;
172 };
173 
177 class TORCH_API RNNImpl : public detail::RNNImplBase<RNNImpl> {
178  public:
179  RNNImpl(int64_t input_size, int64_t hidden_size)
180  : RNNImpl(RNNOptions(input_size, hidden_size)) {}
181  explicit RNNImpl(const RNNOptions& options);
182 
184  void pretty_print(std::ostream& stream) const override;
185 
190  RNNOutput forward(const Tensor& input, Tensor state = {});
191 
192  RNNOptions options;
193 };
194 
199 TORCH_MODULE(RNN);
200 
201 // ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ LSTM ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
202 
204 
208 class TORCH_API LSTMImpl : public detail::RNNImplBase<LSTMImpl> {
209  public:
210  LSTMImpl(int64_t input_size, int64_t hidden_size)
211  : LSTMImpl(LSTMOptions(input_size, hidden_size)) {}
212  explicit LSTMImpl(const LSTMOptions& options);
213 
218  RNNOutput forward(const Tensor& input, Tensor state = {});
219 };
220 
225 TORCH_MODULE(LSTM);
226 
227 // ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ GRU ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
228 
230 
234 class TORCH_API GRUImpl : public detail::RNNImplBase<GRUImpl> {
235  public:
236  GRUImpl(int64_t input_size, int64_t hidden_size)
237  : GRUImpl(GRUOptions(input_size, hidden_size)) {}
238  explicit GRUImpl(const GRUOptions& options);
239 
244  RNNOutput forward(const Tensor& input, Tensor state = {});
245 };
246 
251 TORCH_MODULE(GRU);
252 
253 } // namespace nn
254 } // namespace torch
optional< CuDNNMode > cudnn_mode_
The cuDNN RNN mode, if this RNN subclass has any.
Definition: rnn.h:133
int64_t number_of_gates_
The number of gate weights/biases required by the RNN subclass.
Definition: rnn.h:130
Tensor state
The new, updated state that can be fed into the RNN in the next forward step.
Definition: rnn.h:26
The output of a single invocation of an RNN module's forward() method.
Definition: rnn.h:20
std::vector< Tensor > w_hh
The weights for hidden x hidden gates.
Definition: rnn.h:96
Common options for LSTM and GRU modules.
Definition: rnn.h:32
CuDNNMode
These must line up with the CUDNN mode codes: https://docs.nvidia.com/deeplearning/sdk/cudnn-developer-guide/index.html#cudnnRNNMode_t
Definition: rnn.h:60
Represents a compute device on which a tensor is located.
Definition: Device.h:30
std::vector< Tensor > b_ih
The biases for input x hidden gates.
Definition: rnn.h:98
A multi-layer gated recurrent unit (GRU) module.
Definition: rnn.h:234
Options for RNN modules.
Definition: rnn.h:145
A multi-layer Elman RNN module with Tanh or ReLU activation.
Definition: rnn.h:177
std::vector< Tensor > w_ih
The weights for input x hidden gates.
Definition: rnn.h:94
A multi-layer long-short-term-memory (LSTM) module.
Definition: rnn.h:208
The clone() method in the base Module class does not have knowledge of the concrete runtime type of i...
Definition: cloneable.h:23
Definition: jit_type.h:17
Tensor output
The result of applying the specific RNN algorithm to the input tensor and input state.
Definition: rnn.h:23
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory)...
Definition: ArrayRef.h:41
RNNOptionsBase options
The RNN's options.
Definition: rnn.h:91
std::tuple< Tensor, Tensor >(const Tensor &, const Tensor &, TensorList, bool, int64_t, double, bool, bool, bool) RNNFunctionSignature
The function signature of rnn_relu, rnn_tanh and gru.
Definition: rnn.h:113
Base class for all RNN implementations (intended for code sharing).
Definition: rnn.h:56
std::vector< Tensor > b_hh
The biases for hidden x hidden gates.
Definition: rnn.h:100
std::vector< Tensor > flat_weights_
The cached result of the latest flat_weights() call.
Definition: rnn.h:136