doxygen-c/html/elu__op__cudnn_8cc_source.html

 #include "caffe2/operators/elu_op.h"

 #include "caffe2/operators/activation_ops_cudnn.h"

 namespace caffe2 {

 template <>
 class CuDNNActivationOp<CUDNN_ACTIVATION_ELU> final
     : public CuDNNActivationOpBase {
  public:
   USE_OPERATOR_FUNCTIONS(CUDAContext);

   template <class... Args>
   explicit CuDNNActivationOp(Args&&... args)
       : CuDNNActivationOpBase(std::forward<Args>(args)...),
         OP_SINGLE_ARG(float, "alpha", alpha_, 1.0f) {
     CUDNN_ENFORCE(cudnnSetActivationDescriptor(
         act_desc_,
         CUDNN_ACTIVATION_ELU,
         CUDNN_PROPAGATE_NAN,
         static_cast<double>(alpha_)));
   }

   bool RunOnDevice() override {
     return DispatchHelper<TensorTypes<float, at::Half>>::call(this, Input(0));
   }

   template <typename T>
   bool DoRunWithType() {
     const auto& X = Input(0);

     auto* Y = Output(0, X.sizes(), at::dtype<T>());
     if (X.numel() == 0) {
       Y->template mutable_data<T>();
       return true;
     }
     this->SetTensorDescriptor(cudnnTypeWrapper<T>::type, X.numel());
     CUDNN_ENFORCE(cudnnActivationForward(
         this->cudnn_wrapper_.inline_cudnn_handle(),
         this->act_desc_,
         cudnnTypeWrapper<T>::kOne(),
         this->data_desc_,
         X.template data<T>(),
         cudnnTypeWrapper<T>::kZero(),
         this->data_desc_,
         Y->template mutable_data<T>()));
     return true;
   }

  private:
   const float alpha_;
 };

 template <>
 class CuDNNActivationGradientOp<CUDNN_ACTIVATION_ELU> final
     : public CuDNNActivationOpBase {
  public:
   USE_OPERATOR_FUNCTIONS(CUDAContext);

   template <class... Args>
   explicit CuDNNActivationGradientOp(Args&&... args)
       : CuDNNActivationOpBase(std::forward<Args>(args)...),
         OP_SINGLE_ARG(float, "alpha", alpha_, 1.0f) {
     CUDNN_ENFORCE(cudnnSetActivationDescriptor(
         act_desc_,
         CUDNN_ACTIVATION_ELU,
         CUDNN_PROPAGATE_NAN,
         static_cast<double>(alpha_)));
   }

   bool RunOnDevice() override {
     return DispatchHelper<TensorTypes<float, at::Half>>::call(this, Input(0));
   }

   template <typename T>
   bool DoRunWithType() {
     const auto& Y = Input(0);
     const auto& dY = Input(1);

     auto* dX = Output(0, Y.sizes(), at::dtype<T>());
     if (Y.numel() == 0) {
       dX->template mutable_data<T>();
       return true;
     }
     this->SetTensorDescriptor(cudnnTypeWrapper<T>::type, Y.numel());
     CUDNN_ENFORCE(cudnnActivationBackward(
         this->cudnn_wrapper_.inline_cudnn_handle(),
         this->act_desc_,
         cudnnTypeWrapper<T>::kOne(),
         this->data_desc_,
         Y.template data<T>(),
         this->data_desc_,
         dY.template data<T>(),
         this->data_desc_,
         Y.template data<T>(), // Use Y_data as placeholder here.
         cudnnTypeWrapper<T>::kZero(),
         this->data_desc_,
         dX->template mutable_data<T>()));
     return true;
   }

  private:
   const float alpha_;
 };

 // Register the ELU specialisations above under the operator names "Elu" and
 // "EluGradient" via the cuDNN operator registration macro.
 REGISTER_CUDNN_OPERATOR(Elu, CuDNNActivationOp<CUDNN_ACTIVATION_ELU>);
 REGISTER_CUDNN_OPERATOR(
     EluGradient,
     CuDNNActivationGradientOp<CUDNN_ACTIVATION_ELU>);

 } // namespace caffe2
caffe2::CuDNNActivationOp< CUDNN_ACTIVATION_ELU >
Definition: elu_op_cudnn.cc:8

caffe2::CuDNNActivationOpBase
Definition: activation_ops_cudnn.h:12

caffe2::Operator< CUDAContext >::Input
const Tensor & Input(int idx, DeviceType type=CUDAContext::GetDeviceType())
Retrieve a non-owning reference to the input at position 'idx' for this operator. ...
Definition: operator.h:702

caffe2
A global dictionary that holds information about what Caffe2 modules have been loaded in the current ...
Definition: blob.h:13

caffe2::DispatchHelper
Definition: operator.h:1052

caffe2::CuDNNActivationOp
Definition: activation_ops_cudnn.h:56

caffe2::CuDNNActivationGradientOp< CUDNN_ACTIVATION_ELU >
Definition: elu_op_cudnn.cc:55

caffe2::CuDNNActivationGradientOp
Definition: activation_ops_cudnn.h:95

caffe2::CuDNNWrapper::inline_cudnn_handle
cudnnHandle_t inline_cudnn_handle()
Returns the inline cudnn handle that executes on the current thread's cuda_stream.
Definition: cudnn_wrappers.h:154

caffe2::CUDAContext
Definition: context_gpu.h:164

caffe2::cudnnTypeWrapper
cudnnTypeWrapper is a wrapper class that allows us to refer to the cudnn type in a template function...
Definition: common_cudnn.h:120