d3/d02/layers_2transform_2pooling_8hpp_source.html

 // Copyright (c) 2014-2023, Lawrence Livermore National Security, LLC.
 // Produced at the Lawrence Livermore National Laboratory.
 // Written by the LBANN Research Team (B. Van Essen, et al.) listed in
 // the CONTRIBUTORS file. <lbann-dev@llnl.gov>
 //
 // LLNL-CODE-697807.
 // All rights reserved.
 //
 // This file is part of LBANN: Livermore Big Artificial Neural Network
 // Toolkit. For details, see http://software.llnl.gov/LBANN or
 // https://github.com/LLNL/LBANN.
 //
 // Licensed under the Apache License, Version 2.0 (the "License"); you
 // may not use this file except in compliance with the License.  You may
 // obtain a copy of the License at:
 //
 // http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
 // implied. See the License for the specific language governing
 // permissions and limitations under the license.

 #ifndef LBANN_LAYER_POOLING_HPP_INCLUDED
 #define LBANN_LAYER_POOLING_HPP_INCLUDED

 #include "lbann/layers/data_type_layer.hpp"
 #include "lbann/models/model.hpp"
 #include "lbann/utils/dim_helpers.hpp"
 #include "lbann/utils/dnn_enums.hpp"
 #ifdef LBANN_HAS_DNN_LIB
 #include "lbann/utils/dnn_lib/helpers.hpp"
 #include "lbann/utils/dnn_lib/pooling.hpp"
 #endif // LBANN_HAS_DNN_LIB
 #include "lbann/utils/exception.hpp"
 #include "lbann/utils/im2col.hpp"

 #include <utility>
 #include <vector>

 #ifdef LBANN_HAS_DISTCONV
 #include "distconv/dnn_backend/pooling.hpp"
 #include "lbann/utils/distconv.hpp"
 #endif // LBANN_HAS_DISTCONV

 namespace lbann {

 /** @brief Translate a pooling-mode name into the matching @c pooling_mode.
  *
  *  Recognized names are "max", "average" and "average_no_pad". When
  *  LBANN_DETERMINISTIC is defined, "max" maps to
  *  @c pooling_mode::MAX_DETERMINISTIC instead of @c pooling_mode::MAX.
  *  Any other name is reported through LBANN_ERROR.
  *
  *  @param m Name of the requested pooling mode.
  *  @return The pooling mode selected by @c m.
  */
 inline pooling_mode to_pool_mode(std::string m)
 {
   if (m == "max") {
 #ifdef LBANN_DETERMINISTIC
     return pooling_mode::MAX_DETERMINISTIC;
 #else
     return pooling_mode::MAX;
 #endif // LBANN_DETERMINISTIC
   }
   if (m == "average") {
     return pooling_mode::AVERAGE_COUNT_INCLUDE_PADDING;
   }
   if (m == "average_no_pad") {
     return pooling_mode::AVERAGE_COUNT_EXCLUDE_PADDING;
   }
   // None of the recognized names matched.
   LBANN_ERROR("Invalid pooling mode requested.");
 }

 #ifdef LBANN_HAS_DISTCONV

 // Distconv type aliases used by the pooling layer's distconv adapter.
 namespace dc {
 using Shape = ::distconv::tensor::Shape;
 using Backend = ::distconv::BackendDNNLib;
 // Distconv pooling operator specialized on the DNN-library backend alias
 // declared just above.
 template <typename TensorDataType>
 using Pooling = ::distconv::Pooling<Backend, TensorDataType>;
 } // namespace dc

 /** @brief Distconv adapter for the pooling layer.
  *
  *  Derives from @c data_type_distconv_adapter and owns the distconv pooling
  *  operator. Only the constructor and destructor are defined here; the
  *  remaining member functions are declared and defined elsewhere.
  */
 template <typename TensorDataType,
           data_layout T_layout = data_layout::DATA_PARALLEL,
           El::Device Dev = El::Device::CPU>
 class pooling_distconv_adapter
   : public data_type_distconv_adapter<TensorDataType>
 {
 public:
   using TensorDevType =
     typename data_type_distconv_adapter<TensorDataType>::TensorDevType;
   /** Construct the adapter; @c layer is forwarded to the base adapter. */
   pooling_distconv_adapter(Layer& layer)
     : data_type_distconv_adapter<TensorDataType>(layer)
   {}
   virtual ~pooling_distconv_adapter() = default;
   void setup_distributions(tensor_overlap_constraints& constraints) override;
   dc::Shape get_activations_local_shape(int index = 0) const override;
   void setup_layer(size_t workspace_capacity) override;
   // NOTE(review): fp_compute/bp_compute presumably are the forward- and
   // backward-propagation steps; unlike the functions above they are not
   // overrides of the base adapter.
   void
   fp_compute(bool training = true); // training=true for max back-compatibility.
   void bp_compute();
   /** Distconv pooling operator held by this adapter. */
   std::unique_ptr<dc::Pooling<TensorDataType>> m_pooling;
 };
 #endif // LBANN_HAS_DISTCONV

 // Forward declaration: unpooling_layer is named as a friend of pooling_layer
 // below, so it must be declared before the class definition.
 template <typename TensorDataType, data_layout T_layout, El::Device Dev>
 class unpooling_layer;

 template <typename TensorDataType,
           data_layout T_layout = data_layout::DATA_PARALLEL,
           El::Device Dev = El::Device::CPU>
 class pooling_layer : public data_type_layer<TensorDataType>
 {
   static_assert(T_layout == data_layout::DATA_PARALLEL,
                 "pooling only supports DATA_PARALLEL");

 private:
   /** Pooling mode (max, deterministic max, or one of the average modes). */
   pooling_mode m_pool_mode;

   /** Pooling window extent, one entry per pooled dimension. */
   std::vector<int> m_pool_dims;
   /** Linear size of the pooling window: get_linear_size(m_pool_dims). */
   int m_pool_size;
   /** Padding per pooled dimension; setup_dims() counts it twice per
    *  dimension when computing the output size. */
   std::vector<int> m_pads;
   /** Stride per pooled dimension. */
   std::vector<int> m_strides;

   /** NOTE(review): not touched by any code in this header; presumably filled
    *  by the forward pass for max pooling and read by unpooling_layer --
    *  confirm against the implementation file. */
   std::vector<int> m_max_pool_indices;

 #ifdef LBANN_HAS_DNN_LIB

   /** Pooling descriptor for the DNN library; configured in setup_gpu(). */
   dnn_lib::PoolingDescriptor m_pooling_dnn_desc;
   /** DNN-library tensor manager bound to this layer (see set_layer(this) in
    *  the copy operations). */
   dnn_lib::data_parallel_layer_tensor_manager<TensorDataType>
     m_tensors_dnn_desc;
 #endif // LBANN_HAS_DNN_LIB

   // unpooling_layer is granted access to the private pooling state above.
   friend class unpooling_layer<TensorDataType, T_layout, Dev>;

 public:
   /** @brief Construct a pooling layer with uniform parameters.
    *
    *  Replicates @c pool_dim, @c pad and @c stride across @c num_data_dims
    *  dimensions and delegates to the per-dimension constructor.
    *
    *  @param comm          Communicator forwarded to the base layer.
    *  @param num_data_dims Number of entries in each replicated vector.
    *  @param pool_dim      Pooling window extent used for every dimension.
    *  @param pad           Padding used for every dimension.
    *  @param stride        Stride used for every dimension.
    *  @param mode          Pooling mode.
    */
   pooling_layer(lbann_comm* comm,
                 int num_data_dims,
                 int pool_dim,
                 int pad,
                 int stride,
                 pooling_mode mode)
     : pooling_layer(comm,
                     num_data_dims,
                     std::vector<int>(num_data_dims, pool_dim),
                     std::vector<int>(num_data_dims, pad),
                     std::vector<int>(num_data_dims, stride),
                     mode)
   {}

   /** @brief Construct a pooling layer with per-dimension parameters.
    *
    *  The vectors are taken by value and moved into the members, so callers
    *  passing temporaries incur no extra copy.
    *
    *  @param comm          Communicator forwarded to the base layer.
    *  @param num_data_dims Not read by this constructor; kept for interface
    *                       compatibility with the uniform-parameter overload.
    *  @param pool_dims     Pooling window extent per dimension.
    *  @param pads          Padding per dimension.
    *  @param strides       Stride per dimension.
    *  @param mode          Pooling mode.
    */
   pooling_layer(lbann_comm* comm,
                 int num_data_dims,
                 std::vector<int> pool_dims,
                 std::vector<int> pads,
                 std::vector<int> strides,
                 pooling_mode mode)
     : data_type_layer<TensorDataType>(comm),
       m_pool_mode(mode),
       m_pool_dims(std::move(pool_dims)),
       m_pads(std::move(pads)),
       m_strides(std::move(strides))
 #ifdef LBANN_HAS_DNN_LIB
       ,
       m_tensors_dnn_desc(this)
 #endif // LBANN_HAS_DNN_LIB
   {
     // The parameters have been moved from, so the window size is computed
     // from the member, never from the (now unspecified) argument.
     m_pool_size = get_linear_size(m_pool_dims);
   }

   /** @brief Copy constructor.
    *
    *  Copies every member of @c other. When the DNN library is enabled, the
    *  copied tensor manager is re-pointed at this layer with set_layer(this)
    *  after it has been copy-constructed from @c other.
    */
   pooling_layer(const pooling_layer& other)
     : data_type_layer<TensorDataType>(other),
       m_pool_mode(other.m_pool_mode),
       m_pool_dims(other.m_pool_dims),
       m_pool_size(other.m_pool_size),
       m_pads(other.m_pads),
       m_strides(other.m_strides),
       m_max_pool_indices(other.m_max_pool_indices)
 #ifdef LBANN_HAS_DNN_LIB
       ,
       m_pooling_dnn_desc(other.m_pooling_dnn_desc),
       m_tensors_dnn_desc(other.m_tensors_dnn_desc)
 #endif // LBANN_HAS_DNN_LIB
   {
 #ifdef LBANN_HAS_DNN_LIB
     // The tensor manager was copied from `other`; bind it to this layer.
     m_tensors_dnn_desc.set_layer(this);
 #endif // LBANN_HAS_DNN_LIB
   }

   /** @brief Copy assignment.
    *
    *  Assigns the base-class state and then every member from @c other. When
    *  the DNN library is enabled, the tensor manager is re-pointed at this
    *  layer after it has been overwritten.
    *
    *  @return Reference to this layer.
    */
   pooling_layer& operator=(const pooling_layer& other)
   {
     data_type_layer<TensorDataType>::operator=(other);
     m_pool_mode = other.m_pool_mode;
     m_pool_dims = other.m_pool_dims;
     m_pool_size = other.m_pool_size;
     m_pads = other.m_pads;
     m_strides = other.m_strides;
     m_max_pool_indices = other.m_max_pool_indices;
 #ifdef LBANN_HAS_DNN_LIB
     m_pooling_dnn_desc = other.m_pooling_dnn_desc;
     m_tensors_dnn_desc = other.m_tensors_dnn_desc;
     // Must come after the assignment above, which copied the manager from
     // `other`.
     m_tensors_dnn_desc.set_layer(this);
 #endif // LBANN_HAS_DNN_LIB
     return *this;
   }

   ~pooling_layer() override = default;

   /** Copy function: dynamically allocates a new layer that is a copy of
    *  this one. The returned pointer comes from a plain `new`. */
   pooling_layer* copy() const override { return new pooling_layer(*this); }


   /** Serialization hook; declared here and defined elsewhere. */
   template <typename ArchiveT>
   void serialize(ArchiveT& ar);


   /** Get the layer type's name ("pooling"). */
   std::string get_type() const override { return "pooling"; }
   /** Get the data layout of the data tensors (the T_layout parameter). */
   data_layout get_data_layout() const override { return T_layout; }
   /** Get the device allocation of the data tensors (the Dev parameter). */
   El::Device get_device_allocation() const override { return Dev; }
   /** This layer never runs in-place. */
   bool can_run_inplace() const override { return false; }
   /** Returns the necessary tensors for computing backpropagation: error
    *  signals, previous activations and activations. */
   int get_backprop_requirements() const override
   {
     return ERROR_SIGNALS | PREV_ACTIVATIONS | ACTIVATIONS;
   }

 #ifdef LBANN_HAS_ONNX
   /** Add an ONNX node describing this layer to @c graph. */
   void fill_onnx_node(onnx::GraphProto& graph) const override;
 #endif // LBANN_HAS_ONNX

   /** @brief Human-readable description.
    *
    *  Extends the base-class description with the pooling mode and with the
    *  pool dimensions, strides and pads, each rendered as a comma-separated
    *  list.
    */
   description get_description() const override
   {
     auto desc = data_type_layer<TensorDataType>::get_description();

     // Display name of the configured pooling mode.
     const auto mode_name = [this]() -> std::string {
       switch (m_pool_mode) {
       case pooling_mode::MAX:
         return "max";
       case pooling_mode::MAX_DETERMINISTIC:
         return "max (deterministic)";
       case pooling_mode::AVERAGE_COUNT_INCLUDE_PADDING:
         return "average";
       case pooling_mode::AVERAGE_COUNT_EXCLUDE_PADDING:
         return "average (no pad)";
       default:
         return "invalid";
       }
     };

     // Render a list of integers as "a, b, c".
     const auto join = [](const std::vector<int>& values) -> std::string {
       std::stringstream out;
       const char* separator = "";
       for (const int value : values) {
         out << separator << value;
         separator = ", ";
       }
       return out.str();
     };

     desc.add("Pool mode", mode_name());
     desc.add("Pool dimensions", join(m_pool_dims));
     desc.add("Strides", join(m_strides));
     desc.add("Pads", join(m_pads));

     return desc;
   }

 protected:
   /** Write the layer-specific fields into @c proto; defined elsewhere. */
   void write_specific_proto(lbann_data::Layer& proto) const final;

   // cereal needs access to the protected default constructor below.
   friend class cereal::access;
   /** Default constructor: null communicator, one data dimension with pool
    *  size 1, pad 1 and stride 1, max pooling. */
   pooling_layer() : pooling_layer(nullptr, 1, 1, 1, 1, pooling_mode::MAX) {}

   void setup_dims() override
   {
     data_type_layer<TensorDataType>::setup_dims();
     const auto& input_dims = this->get_input_dims();
     auto output_dims = input_dims;
     for (size_t i = 0; i < output_dims.size() - 1; ++i) {
       const int effective_dim =
         (input_dims[i + 1] + 2 * m_pads[i] - m_pool_dims[i] + 1);
       output_dims[i + 1] = (effective_dim + m_strides[i] - 1) / m_strides[i];
     }
     this->set_output_dims(output_dims);
   }

   /** @brief Initialize GPU objects.
    *
    *  Runs the base-class GPU setup and then configures the DNN-library
    *  pooling descriptor. Without DNN-library support this reports an error
    *  through LBANN_ERROR.
    */
   void setup_gpu() override
   {
     data_type_layer<TensorDataType>::setup_gpu();
 #ifdef LBANN_HAS_DNN_LIB
     // Describe the pooling window, padding and strides to the DNN library.
     m_pooling_dnn_desc.set(m_pool_mode,
                            dnn_lib::DNN_PROPAGATE_NAN,
                            m_pool_dims.size(),
                            m_pool_dims.data(),
                            m_pads.data(),
                            m_strides.data());
 #else
     LBANN_ERROR("DNN library not detected");
 #endif // LBANN_HAS_DNN_LIB
   }

   // Compute entry points overridden from the base layer; declared here and
   // defined elsewhere.
   void fp_compute() override;

   void bp_compute() override;

 private:
   // NOTE(review): the _dnn and _im2col variants presumably are the
   // DNN-library and im2col-based implementations selected by
   // fp_compute()/bp_compute() -- confirm against the implementation file.
   void fp_compute_dnn();

   void bp_compute_dnn();

   void fp_compute_im2col();

   void bp_compute_im2col();

 #ifdef LBANN_HAS_DISTCONV
   // The adapter is granted access to the layer's private state.
   friend class pooling_distconv_adapter<TensorDataType, T_layout, Dev>;

 protected:
   /** Whether distconv can be used for this layer; defined elsewhere. */
   bool is_distconv_supported() const override;
   /** Create the pooling-specific distconv adapter and store it in the
    *  layer's adapter pointer. */
   void setup_distconv_adapter() override
   {
     this->get_distconv_adapter_ptr() =
       std::make_unique<pooling_distconv_adapter<TensorDataType, T_layout, Dev>>(
         *this);
   }
   /** Accessors returning the adapter as the pooling-specific type; defined
    *  elsewhere. */
   pooling_distconv_adapter<TensorDataType, T_layout, Dev>&
   get_distconv_adapter() override;
   const pooling_distconv_adapter<TensorDataType, T_layout, Dev>&
   get_distconv_adapter() const override;
 #endif // LBANN_HAS_DISTCONV
 };

 #ifdef LBANN_HAS_ONNX
 /** @brief Append an ONNX node describing this pooling layer to @c graph.
  *
  *  Emits the "kernel_shape", "strides" and "pads" attributes, wires the
  *  node's inputs and outputs from the parent layers, weights and child
  *  layers, and selects "MaxPool" or "AveragePool" from the pooling mode.
  *
  *  - "pads" follows the ONNX layout: all begin values, then all end values.
  *    The layer pads symmetrically, so the list of pads is written twice.
  *  - Average pooling that counts padded entries sets "count_include_pad" to
  *    1, because the ONNX default (0) excludes padding.
  *
  *  An unsupported pooling mode is reported through LBANN_ERROR.
  */
 template <typename T, data_layout L, El::Device D>
 void pooling_layer<T, L, D>::fill_onnx_node(onnx::GraphProto& graph) const
 {
   auto* pool = graph.add_node();

   // Get the attributes setup first
   {
     auto* kernel_shape = pool->add_attribute();
     kernel_shape->set_name("kernel_shape");
     kernel_shape->set_type(onnx::AttributeProto::INTS);
     for (auto const& k : this->m_pool_dims)
       kernel_shape->add_ints(k);
   }
   if (!this->m_strides.empty()) {
     auto* strides = pool->add_attribute();
     strides->set_name("strides");
     strides->set_type(onnx::AttributeProto::INTS);
     for (auto const& s : this->m_strides)
       strides->add_ints(s);
   }
   if (!this->m_pads.empty()) {
     auto* pads = pool->add_attribute();
     pads->set_name("pads");
     pads->set_type(onnx::AttributeProto::INTS);
     // ONNX expects [x1_begin, x2_begin, ..., x1_end, x2_end, ...]; emitting
     // each pad twice in a row would interleave begin/end per axis and swap
     // values whenever the axes use different pads.
     for (int side = 0; side < 2; ++side) {
       for (auto const& p : this->m_pads)
         pads->add_ints(p);
     }
   }
   // FIXME: This is missing "dilations". However, they're only a valid
   // attribute for MaxPool, not AveragePool.

   for (auto const* parent : this->get_parent_layers()) {
     size_t idx = parent->find_child_layer_index(*this);
     pool->add_input(parent->get_name() + "_" + std::to_string(idx));
   }
   for (size_t ii = 0; ii < this->num_weights(); ii++)
     pool->add_input(this->get_weights(ii).get_name());
   for (auto const* child : this->get_child_layers()) {
     size_t idx = this->find_child_layer_index(*child);
     pool->add_output(this->get_name() + "_" + std::to_string(idx));
   }
   pool->set_name(this->get_name());

   switch (m_pool_mode) {
   case pooling_mode::MAX:
   case pooling_mode::MAX_DETERMINISTIC:
     pool->set_op_type("MaxPool");
     break;
   case pooling_mode::AVERAGE_COUNT_INCLUDE_PADDING: {
     pool->set_op_type("AveragePool");
     // Without this attribute ONNX would exclude padded entries from the
     // average, which is the behavior of the EXCLUDE_PADDING mode.
     auto* count_include_pad = pool->add_attribute();
     count_include_pad->set_name("count_include_pad");
     count_include_pad->set_type(onnx::AttributeProto::INT);
     count_include_pad->set_i(1);
     break;
   }
   case pooling_mode::AVERAGE_COUNT_EXCLUDE_PADDING:
     pool->set_op_type("AveragePool");
     break;
   default:
     LBANN_ERROR("pooling_layer: no ONNX implementation for pooling mode");
   }

   pool->set_domain("");
   pool->set_doc_string(this->get_type());
 }
 #endif

 // Unless LBANN_POOLING_LAYER_INSTANTIATE is defined, declare the
 // DATA_PARALLEL pooling_layer instantiations as extern templates.
 // NOTE(review): instantiate_device.hpp presumably expands PROTO_DEVICE once
 // per supported (data type, device) pair -- confirm against that header.
 #ifndef LBANN_POOLING_LAYER_INSTANTIATE
 #define PROTO_DEVICE(T, Device)                                                \
   extern template class pooling_layer<T, data_layout::DATA_PARALLEL, Device>

 #include "lbann/macros/instantiate_device.hpp"
 #undef PROTO_DEVICE
 #endif // LBANN_POOLING_LAYER_INSTANTIATE

 } // namespace lbann

 #endif // LBANN_LAYER_POOLING_HPP_INCLUDED
lbann::data_type_distconv_adapter
Definition: data_type_distconv_adapter.hpp:56

lbann::pooling_layer::get_backprop_requirements
int get_backprop_requirements() const override
Returns the necessary tensors for computing backpropagation.
Definition: layers/transform/pooling.hpp:230

lbann::pooling_layer::get_device_allocation
El::Device get_device_allocation() const override
Get the device allocation for the data tensors. We assume that the device allocation of the previous ...
Definition: layers/transform/pooling.hpp:228

pooling.hpp

lbann::Layer::setup_dims
virtual void setup_dims()
Set up tensor dimensions. Called by the 'setup' function. If there are any input tensors, the base method sets all uninitialized output tensor dimensions equal to the first input tensor dimensions.

lbann::ERROR_SIGNALS
Definition: base.hpp:207

lbann::pooling_mode::AVERAGE_COUNT_EXCLUDE_PADDING

lbann::pad
std::basic_string< T > pad(const std::basic_string< T > &s, typename std::basic_string< T >::size_type n, T c)
Definition: file_utils.hpp:93

lbann::get_linear_size
auto get_linear_size(std::vector< T > const &dims)
Definition: dim_helpers.hpp:59

lbann::PREV_ACTIVATIONS
Definition: base.hpp:208

lbann::pooling_layer
Definition: layers/transform/pooling.hpp:108

LBANN_ERROR
#define LBANN_ERROR(...)
Definition: exception.hpp:37

lbann::pooling_layer::setup_gpu
void setup_gpu() override
Initialize GPU objects.
Definition: layers/transform/pooling.hpp:314

lbann::pooling_layer::pooling_layer
pooling_layer(lbann_comm *comm, int num_data_dims, std::vector< int > pool_dims, std::vector< int > pads, std::vector< int > strides, pooling_mode mode)
Definition: layers/transform/pooling.hpp:158

distconv.hpp

lbann::pooling_mode::MAX_DETERMINISTIC

lbann::lbann_comm
Definition: comm.hpp:105

lbann::protobuf::serialize
void serialize(std::ostream &os, google::protobuf::Message const &msg)
Serialize the protobuf message to a stream.

lbann::Layer
Neural network tensor operation.
Definition: layer.hpp:285

lbann::description
Generates nicely formatted description messages.
Definition: description.hpp:49

lbann::to_pool_mode
pooling_mode to_pool_mode(std::string m)
Definition: layers/transform/pooling.hpp:51

lbann::dnn_lib::data_parallel_layer_tensor_manager
Definition: data_type_layer.hpp:52

lbann::pooling_layer::m_pool_dims
std::vector< int > m_pool_dims
Definition: layers/transform/pooling.hpp:118

lbann::Layer::get_description
virtual description get_description() const
Human-readable description.

lbann::Device
constexpr El::Device Device
Definition: OperatorTraits.hpp:62

lbann::to_string
std::string to_string(El::Device const &d)

lbann::pooling_layer::can_run_inplace
bool can_run_inplace() const override
If True, the computation can run in-place (feeding each input activations tensor as the corresponding...
Definition: layers/transform/pooling.hpp:229

lbann::tensor_overlap_constraints
Definition: distconv_adapter.hpp:48

lbann::pooling_layer::pooling_layer
pooling_layer(const pooling_layer &other)
Definition: layers/transform/pooling.hpp:178

lbann::pooling_mode::MAX

lbann::ACTIVATIONS
Definition: base.hpp:209

lbann::Layer::setup_gpu
virtual void setup_gpu()
Set up GPU objects. Called by the 'setup' function if the layer is on GPUs.
Definition: layer.hpp:782

lbann::pooling_mode
pooling_mode
Which pooling mode to use.
Definition: dnn_enums.hpp:78

helpers.hpp

lbann::data_type_layer
Definition: data_type_layer.hpp:69

lbann::pooling_layer::get_data_layout
data_layout get_data_layout() const override
Get data layout of the data tensors. We assume that the data layouts of the previous activations...
Definition: layers/transform/pooling.hpp:227

lbann::pooling_mode::AVERAGE_COUNT_INCLUDE_PADDING

lbann::dc::Shape
::distconv::tensor::Shape Shape
Definition: data_type_distconv_adapter.hpp:40

lbann::data_layout::DATA_PARALLEL

lbann::pooling_layer::pooling_layer
pooling_layer()
Definition: layers/transform/pooling.hpp:298

exception.hpp

dnn_enums.hpp

instantiate_device.hpp

lbann::pooling_layer::m_pads
std::vector< int > m_pads
Definition: layers/transform/pooling.hpp:122

lbann::pooling_layer::setup_dims
void setup_dims() override
Set up tensor dimensions. Called by the 'setup' function. If there are any input tensors, the base method sets all uninitialized output tensor dimensions equal to the first input tensor dimensions.
Definition: layers/transform/pooling.hpp:300

lbann::pooling_layer::m_max_pool_indices
std::vector< int > m_max_pool_indices
Definition: layers/transform/pooling.hpp:131

lbann::execution_mode::training

lbann::data_layout
data_layout
Data layout that is optimized for different modes of parallelism.
Definition: base.hpp:218

data_type_layer.hpp

lbann::pooling_layer::operator=
pooling_layer & operator=(const pooling_layer &other)
Definition: layers/transform/pooling.hpp:197

lbann::pooling_layer::m_pool_mode
pooling_mode m_pool_mode
Definition: layers/transform/pooling.hpp:111

lbann::pooling_layer::m_pool_size
int m_pool_size
Definition: layers/transform/pooling.hpp:120

lbann::pooling_layer::m_strides
std::vector< int > m_strides
Definition: layers/transform/pooling.hpp:124

lbann::unpooling_layer
Transpose of pooling layer.
Definition: layers/transform/pooling.hpp:103

lbann::pooling_layer::get_description
description get_description() const override
Human-readable description.
Definition: layers/transform/pooling.hpp:239

im2col.hpp

lbann::pooling_layer::copy
pooling_layer * copy() const override
Copy function. This function dynamically allocates memory for a layer instance and instantiates a cop...
Definition: layers/transform/pooling.hpp:216

lbann::pooling_layer::get_type
std::string get_type() const override
Get the layer type's name.
Definition: layers/transform/pooling.hpp:226

dim_helpers.hpp

lbann::Layer::set_name
void set_name(const std::string name)
Set the layer instance's name. Each layer in a model should have a unique, preferably human-readable...
Definition: layer.hpp:319

model.hpp

lbann::data_type_layer::operator=
data_type_layer & operator=(data_type_layer &&other)=default

lbann
Definition: callback_helpers.hpp:32

lbann::data_type_distconv_adapter::TensorDevType
dc::TensorDev< OutputTensorDataType > TensorDevType
Definition: data_type_distconv_adapter.hpp:60

lbann::pooling_layer::pooling_layer
pooling_layer(lbann_comm *comm, int num_data_dims, int pool_dim, int pad, int stride, pooling_mode mode)
Definition: layers/transform/pooling.hpp:144