da/d96/layers_2regularizers_2dropout_8hpp_source.html

 // Copyright (c) 2014-2023, Lawrence Livermore National Security, LLC.
 // Produced at the Lawrence Livermore National Laboratory.
 // Written by the LBANN Research Team (B. Van Essen, et al.) listed in
 // the CONTRIBUTORS file. <lbann-dev@llnl.gov>
 //
 // LLNL-CODE-697807.
 // All rights reserved.
 //
 // This file is part of LBANN: Livermore Big Artificial Neural Network
 // Toolkit. For details, see http://software.llnl.gov/LBANN or
 // https://github.com/LLNL/LBANN.
 //
 // Licensed under the Apache License, Version 2.0 (the "Licensee"); you
 // may not use this file except in compliance with the License.  You may
 // obtain a copy of the License at:
 //
 // http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
 // implied. See the License for the specific language governing
 // permissions and limitations under the license.

 #ifndef LBANN_LAYER_REGULARIZER_DROPOUT_HPP_INCLUDED
 #define LBANN_LAYER_REGULARIZER_DROPOUT_HPP_INCLUDED

 #include "lbann/layers/data_type_layer.hpp"
 #ifdef LBANN_HAS_DNN_LIB
 #include "lbann/utils/dnn_lib/dropout.hpp"
 #include "lbann/utils/dnn_lib/helpers.hpp"
 #endif // LBANN_HAS_DNN_LIB
 #include "lbann/utils/random_number_generators.hpp"

 namespace lbann {

 /** @brief Probabilistically drop layer outputs.
  *
  *  Each unit is kept with probability @c keep_prob. The CPU and GPU
  *  forward/backward kernels are declared here and defined elsewhere.
  *
  *  @tparam TensorDataType Element type of the layer's tensors.
  *  @tparam T_layout       Data layout reported by get_data_layout().
  *  @tparam Dev            Device reported by get_device_allocation().
  */
 template <typename TensorDataType, data_layout T_layout, El::Device Dev>
 class dropout : public data_type_layer<TensorDataType>
 {
 public:
   /** @brief The tensor type expected in this object. */
   using AbsDistMatrixType = El::AbstractDistMatrix<TensorDataType>;

   /** @brief Construct a dropout layer.
    *  @param keep_prob Probability of keeping each unit (default 0.5).
    */
   dropout(EvalType keep_prob = EvalType(0.5))
     : data_type_layer<TensorDataType>(nullptr),
       m_keep_prob(keep_prob)
 #ifdef LBANN_HAS_DNN_LIB
       ,
       m_tensors_dnn_desc(this)
 #endif // LBANN_HAS_DNN_LIB
   {}

   /** @brief Copy constructor.
    *
    *  The mask is deep-copied via @c Copy() when present. With a DNN
    *  library, the tensor descriptor manager is copied and re-pointed at
    *  this layer, the state and reserve-space buffers are copied, and, if
    *  @c other had a dropout descriptor, a new descriptor is built for
    *  this object with setup_dropout_dnn_desc().
    */
   dropout(const dropout& other)
     : data_type_layer<TensorDataType>(other),
       m_keep_prob(other.m_keep_prob),
       m_mask(other.m_mask ? other.m_mask->Copy() : nullptr)
 #ifdef LBANN_HAS_DNN_LIB
       ,
       m_tensors_dnn_desc(other.m_tensors_dnn_desc)
 #endif // LBANN_HAS_DNN_LIB
   {
 #ifdef LBANN_HAS_DNN_LIB
     // The copied manager still refers to `other`; bind it to this layer.
     m_tensors_dnn_desc.set_layer(this);
     m_states = other.m_states;
     m_reserve_space = other.m_reserve_space;
     if (other.m_dropout_dnn_desc != nullptr) {
       setup_dropout_dnn_desc();
     }
 #endif // LBANN_HAS_DNN_LIB
   }

   /** @brief Copy assignment.
    *
    *  Performs the same member-wise copy as the copy constructor.
    *  Self-assignment is a no-op: without the guard it would needlessly
    *  deep-copy the mask and rebuild the dropout descriptor, drawing a
    *  fresh value from the global generator.
    *
    *  @return Reference to this object.
    */
   dropout& operator=(const dropout& other)
   {
     if (this == &other) {
       return *this;
     }
     data_type_layer<TensorDataType>::operator=(other);
     m_keep_prob = other.m_keep_prob;
     m_mask = other.m_mask
                ? std::unique_ptr<AbsDistMatrixType>(other.m_mask->Copy())
                : nullptr;
 #ifdef LBANN_HAS_DNN_LIB
     m_tensors_dnn_desc = other.m_tensors_dnn_desc;
     // The copied manager still refers to `other`; bind it to this layer.
     m_tensors_dnn_desc.set_layer(this);
     m_states = other.m_states;
     m_reserve_space = other.m_reserve_space;
     if (other.m_dropout_dnn_desc != nullptr) {
       setup_dropout_dnn_desc();
     }
 #endif // LBANN_HAS_DNN_LIB
     return *this;
   }

   ~dropout() override = default;

   /** @brief Dynamically allocate a copy of this layer.
    *  @return Pointer to a new instance created with the copy constructor.
    */
   dropout* copy() const override { return new dropout(*this); }
   /** @brief Get the layer type's name ("dropout"). */
   std::string get_type() const override { return "dropout"; }
   /** @brief Get the data layout (the @c T_layout template argument). */
   data_layout get_data_layout() const override { return T_layout; }
   /** @brief Get the device allocation (the @c Dev template argument). */
   El::Device get_device_allocation() const override { return Dev; }
   /** @brief This layer reports that it can run in-place. */
   bool can_run_inplace() const override { return true; }
   /** @brief Tensors needed for backpropagation: only ERROR_SIGNALS. */
   int get_backprop_requirements() const override { return ERROR_SIGNALS; }

   /** @brief Human-readable description.
    *
    *  Extends the base-class description with a "Keep probability" entry.
    */
   description get_description() const override
   {
     auto desc = data_type_layer<TensorDataType>::get_description();
     desc.add("Keep probability", m_keep_prob);
     return desc;
   }
   /** @brief Get the probability of keeping each unit. */
   EvalType get_keep_prob() const { return m_keep_prob; }
   /** @brief Set the probability of keeping each unit.
    *
    *  Only the stored value is updated; a dropout descriptor that has
    *  already been built is not rebuilt by this call.
    */
   void set_keep_prob(EvalType keep_prob) { m_keep_prob = keep_prob; }

   /** @brief Serialize the layer with the given archive (defined elsewhere). */
   template <typename ArchiveT>
   void serialize(ArchiveT& ar);

 protected:
   /** @brief Write layer-specific fields to @c proto (defined elsewhere). */
   void write_specific_proto(lbann_data::Layer& proto) const final;

   /** @brief Setup tensor dimensions.
    *
    *  After the base-class setup, the output dimensions are set equal to
    *  the input dimensions.
    */
   void setup_dims() override
   {
     data_type_layer<TensorDataType>::setup_dims();
     this->set_output_dims(this->get_input_dims());
   }

   /** @brief Setup layer data.
    *
    *  After the base-class setup, the mask matrix is created from a
    *  @c Copy() of the activations matrix.
    *
    *  @param max_mini_batch_size Forwarded to the base-class setup.
    */
   void setup_data(size_t max_mini_batch_size) override
   {
     data_type_layer<TensorDataType>::setup_data(max_mini_batch_size);
     m_mask = std::unique_ptr<AbsDistMatrixType>(this->get_activations().Copy());
   }

   /** @brief Setup GPU objects.
    *
    *  Raises an LBANN error when built without a DNN library. Otherwise
    *  builds the dropout descriptor; in LBANN_DETERMINISTIC builds the
    *  trainer master additionally emits a warning that sequential
    *  consistency is not guaranteed.
    */
   void setup_gpu() override
   {
     data_type_layer<TensorDataType>::setup_gpu();
 #ifndef LBANN_HAS_DNN_LIB
     LBANN_ERROR("DNN library not detected");
 #else

 #ifdef LBANN_DETERMINISTIC
     if (this->get_comm()->am_trainer_master()) {
       LBANN_WARNING(this->get_type(),
                     " layer \"",
                     this->get_name(),
                     "\" ",
                     "does not guarantee sequential consistency");
     }
 #endif // LBANN_DETERMINISTIC

     // Initialize DNN library objects
     setup_dropout_dnn_desc();

 #endif // LBANN_HAS_DNN_LIB
   }

   /** @brief Forward prop: dispatch to the GPU or CPU implementation. */
   void fp_compute() override
   {
     if (this->using_gpus()) {
       fp_compute_gpu();
     }
     else {
       fp_compute_cpu();
     }
   }

   /** @brief Backward prop: dispatch to the GPU or CPU implementation. */
   void bp_compute() override
   {
     if (this->using_gpus()) {
       bp_compute_gpu();
     }
     else {
       bp_compute_cpu();
     }
   }

 private:
   /** @brief CPU forward prop (defined elsewhere). */
   void fp_compute_cpu();

   /** @brief CPU backward prop (defined elsewhere). */
   void bp_compute_cpu();

   /** @brief GPU forward prop (defined elsewhere). */
   void fp_compute_gpu();

   /** @brief GPU backward prop (defined elsewhere). */
   void bp_compute_gpu();

 #ifdef LBANN_HAS_DNN_LIB

   /** @brief (Re)build the DNN library dropout descriptor.
    *
    *  Resizes the state buffer to hold the size reported by
    *  dnn_lib::get_dropout_states_size(), then sets the descriptor with a
    *  drop probability of <tt>1 - keep_prob</tt>, that buffer, and a value
    *  drawn from get_generator() (NOTE(review): presumably the RNG seed --
    *  confirm against dnn_lib::DropoutDescriptor::set).
    */
   void setup_dropout_dnn_desc()
   {

     // Setup RNG state
     // The buffer is typed, so round the requested size up to a whole
     // number of TensorDataType elements (ceiling division).
     size_t size = dnn_lib::get_dropout_states_size();
     m_states.Resize((size + sizeof(TensorDataType) - 1) /
                       sizeof(TensorDataType),
                     1);

     // Setup dropout descriptor
     m_dropout_dnn_desc.set(static_cast<float>(1 - m_keep_prob),
                            m_states.Buffer(),
                            m_states.Height() * sizeof(TensorDataType),
                            get_generator()());
   }
 #endif // LBANN_HAS_DNN_LIB

   /** @brief Probability of keeping each unit. */
   EvalType m_keep_prob;
   /** @brief Mask matrix; null until setup_data() runs or a non-null mask
    *  is copied from another layer. */
   std::unique_ptr<AbsDistMatrixType> m_mask;

 #ifdef LBANN_HAS_DNN_LIB

   /** @brief DNN library dropout descriptor. */
   dnn_lib::DropoutDescriptor m_dropout_dnn_desc;
   /** @brief Tensor descriptor manager bound to this layer. */
   dnn_lib::entrywise_layer_tensor_manager<TensorDataType> m_tensors_dnn_desc;
   /** @brief Buffer handed to the dropout descriptor as its state storage. */
   El::Matrix<TensorDataType, El::Device::GPU> m_states;
   /** @brief Reserve-space buffer (not used in this header beyond copying). */
   El::Matrix<TensorDataType, El::Device::GPU> m_reserve_space;
 #endif // LBANN_HAS_DNN_LIB
 };

 template <typename T, data_layout L, El::Device D>
 using dropout_layer = dropout<T, L, D>;

 // Invoke the project's layer-builder macro for the dropout layer. The macro
 // is defined outside this header.
 // NOTE(review): presumably it declares the factory function used to build
 // this layer from its protobuf description -- confirm against the macro.
 LBANN_DEFINE_LAYER_BUILDER(dropout);

 // Unless the including translation unit defines
 // LBANN_DROPOUT_LAYER_INSTANTIATE, declare the explicit instantiations of
 // dropout as extern so they are not implicitly instantiated here.
 // PROTO_DEVICE covers both data layouts for one (type, device) pair and is
 // expanded by instantiate_device.hpp.
 // NOTE(review): presumably that header expands it once per supported
 // type/device combination -- confirm.
 #ifndef LBANN_DROPOUT_LAYER_INSTANTIATE
 #define PROTO_DEVICE(T, Device)                                                \
   extern template class dropout<T, data_layout::DATA_PARALLEL, Device>;        \
   extern template class dropout<T, data_layout::MODEL_PARALLEL, Device>

 #include "lbann/macros/instantiate_device.hpp"
 #undef PROTO_DEVICE
 #endif // LBANN_DROPOUT_LAYER_INSTANTIATE

 } // namespace lbann

 #endif // LBANN_LAYER_REGULARIZER_DROPOUT_HPP_INCLUDED
lbann::dropout::copy
dropout * copy() const override
Copy function. This function dynamically allocates memory for a layer instance and instantiates a cop...
Definition: layers/regularizers/dropout.hpp:113

lbann::dropout::get_description
description get_description() const override
Human-readable description.
Definition: layers/regularizers/dropout.hpp:120

lbann::Layer::setup_dims
virtual void setup_dims()
Setup tensor dimensions. Called by the 'setup' function. If there are any input tensors, the base method sets all uninitialized output tensor dimensions equal to the first input tensor dimensions.

lbann::ERROR_SIGNALS
Definition: base.hpp:207

lbann::dropout::get_device_allocation
El::Device get_device_allocation() const override
Get the device allocation for the data tensors. We assume that the device allocation of the previous ...
Definition: layers/regularizers/dropout.hpp:116

lbann::Layer::get_comm
lbann_comm * get_comm() const

lbann::dropout::fp_compute_cpu
void fp_compute_cpu()

LBANN_ERROR
#define LBANN_ERROR(...)
Definition: exception.hpp:37

lbann::dropout::bp_compute_gpu
void bp_compute_gpu()

lbann::dropout::get_data_layout
data_layout get_data_layout() const override
Get data layout of the data tensors. We assume that the data layouts of the previous activations...
Definition: layers/regularizers/dropout.hpp:115

lbann::dropout::serialize
void serialize(ArchiveT &ar)

lbann::Layer::get_input_dims
std::vector< int > get_input_dims(size_t input_index=0) const
Get input tensor dimensions.

lbann::description
Generates nicely formatted description messages.
Definition: description.hpp:49

lbann::dropout::get_backprop_requirements
int get_backprop_requirements() const override
Returns the necessary tensors for computing backpropagation.
Definition: layers/regularizers/dropout.hpp:118

lbann::Layer::get_description
virtual description get_description() const
Human-readable description.

lbann::dropout::dropout
dropout(const dropout &other)
Definition: layers/regularizers/dropout.hpp:73

lbann::Device
constexpr El::Device Device
Definition: OperatorTraits.hpp:62

lbann::dropout::write_specific_proto
void write_specific_proto(lbann_data::Layer &proto) const final

dropout.hpp

lbann::data_type_layer< TensorDataType >::get_activations
const OutputAbsDistMatrixType & get_activations(const Layer &child) const override

lbann::dropout::~dropout
~dropout() override=default

lbann::dropout::operator=
dropout & operator=(const dropout &other)
Definition: layers/regularizers/dropout.hpp:92

lbann::dropout::bp_compute_cpu
void bp_compute_cpu()

lbann::Layer::set_output_dims
void set_output_dims(std::vector< int > dims, size_t output_index=0)
Set output tensor dimensions.

lbann::Layer::setup_gpu
virtual void setup_gpu()
Setup GPU objects. Called by the 'setup' function if the layer is on GPUs.
Definition: layer.hpp:782

lbann::dnn_lib::entrywise_layer_tensor_manager
Definition: data_type_layer.hpp:54

helpers.hpp

lbann::data_type_layer
Definition: data_type_layer.hpp:69

lbann::dropout::can_run_inplace
bool can_run_inplace() const override
If True, the computation can run in-place (feeding each input activations tensor as the corresponding...
Definition: layers/regularizers/dropout.hpp:117

lbann::Layer::get_name
std::string get_name() const
Get the layer instance's name.
Definition: layer.hpp:332

lbann::dropout::set_keep_prob
void set_keep_prob(EvalType keep_prob)
Set the probability of keeping each unit.
Definition: layers/regularizers/dropout.hpp:129

random_number_generators.hpp

lbann::dropout::AbsDistMatrixType
El::AbstractDistMatrix< TensorDataType > AbsDistMatrixType
The tensor type expected in this object.
Definition: layers/regularizers/dropout.hpp:58

lbann::dropout::m_keep_prob
EvalType m_keep_prob
Definition: layers/regularizers/dropout.hpp:230

lbann::dropout::setup_dims
void setup_dims() override
Setup tensor dimensions. Called by the 'setup' function. If there are any input tensors, the base method sets all uninitialized output tensor dimensions equal to the first input tensor dimensions.
Definition: layers/regularizers/dropout.hpp:143

instantiate_device.hpp

lbann::dropout::get_type
std::string get_type() const override
Get the layer type's name.
Definition: layers/regularizers/dropout.hpp:114

lbann::dropout
Probabilistically drop layer outputs.
Definition: layers/regularizers/dropout.hpp:51

lbann::data_layout
data_layout
Data layout that is optimized for different modes of parallelism.
Definition: base.hpp:218

data_type_layer.hpp

LBANN_WARNING
#define LBANN_WARNING(...)
Definition: exception.hpp:53

lbann::Layer::using_gpus
bool using_gpus() const noexcept
Whether the layer is using a GPU implementation.
Definition: layer.hpp:417

lbann::dropout::m_mask
std::unique_ptr< AbsDistMatrixType > m_mask
Definition: layers/regularizers/dropout.hpp:232

lbann::data_type_layer::setup_data
void setup_data(size_t max_mini_batch_size) override

lbann::LBANN_DEFINE_LAYER_BUILDER
LBANN_DEFINE_LAYER_BUILDER(elu)

lbann::dropout::fp_compute_gpu
void fp_compute_gpu()

lbann::get_generator
rng_gen & get_generator()

lbann::dropout::setup_gpu
void setup_gpu() override
Setup GPU objects. Called by the 'setup' function if the layer is on GPUs.
Definition: layers/regularizers/dropout.hpp:155

lbann::dropout::get_keep_prob
EvalType get_keep_prob() const
Get the probability of keeping each unit.
Definition: layers/regularizers/dropout.hpp:127

lbann::dropout::fp_compute
void fp_compute() override
Apply layer operation. Called by the 'forward_prop' function. Given the input tensors, the output tensors are populated with computed values.
Definition: layers/regularizers/dropout.hpp:179

lbann::data_type_layer::operator=
data_type_layer & operator=(data_type_layer &&other)=default

lbann::dropout::dropout
dropout(EvalType keep_prob=EvalType(0.5))
Definition: layers/regularizers/dropout.hpp:64

lbann::EvalType
double EvalType
Definition: base.hpp:189

lbann
Definition: callback_helpers.hpp:32

lbann::dropout::setup_data
void setup_data(size_t max_mini_batch_size) override
Setup layer data. Called by the 'setup' function. Memory is allocated for distributed matrices...
Definition: layers/regularizers/dropout.hpp:149

lbann::dropout::bp_compute
void bp_compute() override
Compute objective function gradients. Called by the 'back_prop' function. Given the input...
Definition: layers/regularizers/dropout.hpp:189