d2/dbf/tessellate_8hpp_source.html

 // Copyright (c) 2014-2023, Lawrence Livermore National Security, LLC.
 // Produced at the Lawrence Livermore National Laboratory.
 // Written by the LBANN Research Team (B. Van Essen, et al.) listed in
 // the CONTRIBUTORS file. <lbann-dev@llnl.gov>
 //
 // LLNL-CODE-697807.
 // All rights reserved.
 //
 // This file is part of LBANN: Livermore Big Artificial Neural Network
 // Toolkit. For details, see http://software.llnl.gov/LBANN or
 // https://github.com/LLNL/LBANN.
 //
 // Licensed under the Apache License, Version 2.0 (the "License"); you
 // may not use this file except in compliance with the License.  You may
 // obtain a copy of the License at:
 //
 // http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
 // implied. See the License for the specific language governing
 // permissions and limitations under the license.

 #ifndef LBANN_LAYERS_TRANSFORM_TESSELLATE_HPP_INCLUDED
 #define LBANN_LAYERS_TRANSFORM_TESSELLATE_HPP_INCLUDED

 #include "lbann/layers/data_type_layer.hpp"
 #include "lbann/layers/layer.hpp"
 #include "lbann/proto/datatype_helpers.hpp"
 #include "lbann/proto/layers.pb.h"
 #include "lbann/utils/protobuf.hpp"

 namespace lbann {

 /** @brief Repeat a tensor until it matches specified dimensions.
  *
  *  The output dimensions are supplied at construction. The input and
  *  output tensors must have the same number of dimensions, and at
  *  most 3 dimensions are supported. Tensors with fewer than 3
  *  dimensions are padded with leading unit dimensions before the
  *  3D compute kernels are invoked.
  *
  *  @tparam TensorDataType Element type of the tensors.
  *  @tparam Layout         Data layout reported by get_data_layout().
  *  @tparam Device         Device reported by get_device_allocation().
  */
 template <typename TensorDataType,
           data_layout Layout = data_layout::DATA_PARALLEL,
           El::Device Device = El::Device::CPU>
 class tessellate_layer : public data_type_layer<TensorDataType>
 {
 public:
   /** @brief The tensor type expected in this object. */
   using AbsDistMatrixType = El::AbstractDistMatrix<TensorDataType>;

   /** @brief The local tensor type expected in this object. */
   using AbsMatrixType = El::AbstractMatrix<TensorDataType>;

 public:
   /** @brief Construct a tessellate layer.
    *  @param comm Communicator forwarded to the base layer.
    *  @param dims Requested output tensor dimensions.
    */
   tessellate_layer(lbann_comm* comm, std::vector<int> dims = {})
     : data_type_layer<TensorDataType>(comm)
   {
     this->set_output_dims(dims);
   }

   /** @brief Copy constructor. Deep-copies the input workspace matrix,
    *  if the source layer has one.
    */
   tessellate_layer(const tessellate_layer& other)
     : data_type_layer<TensorDataType>(other),
       m_input_v(other.m_input_v ? other.m_input_v->Copy() : nullptr)
   {}

   /** @brief Copy assignment. Deep-copies the input workspace matrix,
    *  if the source layer has one.
    */
   tessellate_layer& operator=(const tessellate_layer& other)
   {
     data_type_layer<TensorDataType>::operator=(other);
     m_input_v.reset(other.m_input_v ? other.m_input_v->Copy() : nullptr);
     return *this;
   }

   /** @brief Allocate a copy of this layer on the heap.
    *  @return Raw pointer to the newly allocated copy.
    */
   tessellate_layer* copy() const override
   {
     return new tessellate_layer(*this);
   }

   /** @brief Serialize the layer with the given archive. Defined
    *  outside of this header section.
    */
   template <typename ArchiveT>
   void serialize(ArchiveT& ar);

   /** @brief Get the layer type's name. */
   std::string get_type() const override { return "tessellate"; }
   /** @brief Get the data layout (the @c Layout template argument). */
   data_layout get_data_layout() const override { return Layout; }
   /** @brief Get the device (the @c Device template argument). */
   El::Device get_device_allocation() const override { return Device; }
   /** @brief This layer never runs in-place. */
   bool can_run_inplace() const override { return false; }
   /** @brief Back prop only needs the error signals. */
   int get_backprop_requirements() const override { return ERROR_SIGNALS; }

   /** @brief Set up and validate tensor dimensions.
    *
    *  Raises an error via LBANN_ERROR if the input and output tensors
    *  have a different number of dimensions, or if the input tensor
    *  has more than 3 dimensions.
    */
   void setup_dims() override
   {
     data_type_layer<TensorDataType>::setup_dims();
     std::stringstream err;

     // Check input and output dimensions
     const auto input_dims = this->get_input_dims();
     const auto& output_dims = this->get_output_dims();
     if (input_dims.size() != output_dims.size()) {
       err << get_type() << " layer \"" << this->get_name() << "\" "
           << "attempted to tessellate a ";
       for (size_t i = 0; i < input_dims.size(); ++i) {
         err << (i > 0 ? "x" : "") << input_dims[i];
       }
       err << " tensor into a ";
       for (size_t i = 0; i < output_dims.size(); ++i) {
         err << (i > 0 ? "x" : "") << output_dims[i];
       }
       err << " tensor";
       LBANN_ERROR(err.str());
     }

     // Only tensors with at most 3 dimensions are supported
     if (input_dims.size() > 3) {
       err << get_type() << " layer \"" << this->get_name() << "\" "
           << "attempted to tessellate a ";
       for (size_t i = 0; i < input_dims.size(); ++i) {
         err << (i > 0 ? "x" : "") << input_dims[i];
       }
       err << " tensor, but tessellation is currently only supported "
           << "with 3 dimensions or less";
       // The message must actually be reported; without this call the
       // check silently passes.
       LBANN_ERROR(err.str());
     }
   }

   /** @brief Set up layer data.
    *
    *  Instantiates the input workspace matrix with the distribution of
    *  the previous activations, except that the column distribution
    *  is set to El::STAR.
    *
    *  @param max_mini_batch_size Forwarded to the base class.
    */
   void setup_data(size_t max_mini_batch_size) override
   {
     data_type_layer<TensorDataType>::setup_data(max_mini_batch_size);
     auto dist_data = this->get_prev_activations().DistData();
     dist_data.colDist = El::STAR;
     m_input_v.reset(AbsDistMatrixType::Instantiate(dist_data));
   }

 protected:
   /** @brief Write the layer-specific fields to a protobuf message. */
   void write_specific_proto(lbann_data::Layer& proto) const final;

   friend class cereal::access;
   /** @brief Default constructor, accessible to cereal. Delegates to
    *  the main constructor with a null communicator.
    */
   tessellate_layer() : tessellate_layer(nullptr) {}

   /** @brief Forward prop: populate the output tensor from the input
    *  tensor using the 3D tessellation kernel.
    */
   void fp_compute() override
   {

     // Get input and output dimensions, padded with leading 1's so
     // that both describe 3D tensors
     auto input_dims = this->get_input_dims();
     auto output_dims = this->get_output_dims();
     while (input_dims.size() < 3) {
       input_dims.insert(input_dims.begin(), 1);
     }
     while (output_dims.size() < 3) {
       output_dims.insert(output_dims.begin(), 1);
     }

     // Get input and output data
     // Note: The workspace is aligned with the output. If it then has
     // the same distribution as the input it is just a view of the
     // input, otherwise the input is copied into it.
     auto& output = this->get_activations();
     const auto& input = this->get_prev_activations();
     m_input_v->Empty(false);
     m_input_v->AlignWith(output);
     if (m_input_v->DistData() == input.DistData()) {
       El::LockedView(*m_input_v, input);
     }
     else {
       El::Copy(input, *m_input_v);
     }
     const auto& local_input = m_input_v->LockedMatrix();

     // Apply tessellation
     if (input_dims.size() > 3) {
       LBANN_ERROR("tessellate layer currently only supports 3D tensors");
     }
     fp_compute_3d(input_dims, output_dims, local_input, output);
   }

   /** @brief Back prop: compute the gradient w.r.t. the input from the
    *  gradient w.r.t. the output using the 3D kernel.
    */
   void bp_compute() override
   {

     // Get input and output dimensions, padded with leading 1's so
     // that both describe 3D tensors
     auto input_dims = this->get_input_dims();
     auto output_dims = this->get_output_dims();
     while (input_dims.size() < 3) {
       input_dims.insert(input_dims.begin(), 1);
     }
     while (output_dims.size() < 3) {
       output_dims.insert(output_dims.begin(), 1);
     }

     // Get input and output data
     // Note: The workspace is reused for the gradient w.r.t. the
     // input. It is either a view of the real error signal matrix or a
     // separately sized buffer that is reduced and copied back below.
     const auto& gradient_wrt_output = this->get_prev_error_signals();
     auto& gradient_wrt_input = this->get_error_signals();
     m_input_v->Empty(false);
     m_input_v->AlignWith(gradient_wrt_output);
     if (m_input_v->DistData() == gradient_wrt_input.DistData()) {
       El::View(*m_input_v, gradient_wrt_input);
     }
     else {
       m_input_v->Resize(gradient_wrt_input.Height(),
                         gradient_wrt_input.Width());
     }
     auto& local_gradient_wrt_input = m_input_v->Matrix();

     // Apply back prop with local data
     bp_compute_3d(input_dims,
                   output_dims,
                   gradient_wrt_output,
                   local_gradient_wrt_input);

     // Accumulate local error signals, if needed
     if (m_input_v->DistData() != gradient_wrt_input.DistData()) {
       this->get_comm()->allreduce(*m_input_v, m_input_v->RedundantComm());
       El::Copy(*m_input_v, gradient_wrt_input);
     }
   }

 private:
   /** @brief Workspace matrix. Holds (a view or copy of) the input
    *  during forward prop and the gradient w.r.t. the input during
    *  back prop. Instantiated in setup_data().
    */
   std::unique_ptr<AbsDistMatrixType> m_input_v;

   /** @brief Forward prop kernel for 3D tensors. Defined elsewhere.
    *  @param input_dims  Input dimensions (3 entries).
    *  @param output_dims Output dimensions (3 entries).
    *  @param input       Local input data.
    *  @param output      Distributed output tensor.
    */
   void fp_compute_3d(const std::vector<int>& input_dims,
                      const std::vector<int>& output_dims,
                      const AbsMatrixType& input,
                      AbsDistMatrixType& output);
   /** @brief Back prop kernel for 3D tensors. Defined elsewhere.
    *  @param input_dims          Input dimensions (3 entries).
    *  @param output_dims         Output dimensions (3 entries).
    *  @param gradient_wrt_output Distributed gradient w.r.t. output.
    *  @param gradient_wrt_input  Local gradient w.r.t. input.
    */
   void bp_compute_3d(const std::vector<int>& input_dims,
                      const std::vector<int>& output_dims,
                      const AbsDistMatrixType& gradient_wrt_output,
                      AbsMatrixType& gradient_wrt_input);
 };

 template <typename T, data_layout L, El::Device D>
 void tessellate_layer<T, L, D>::write_specific_proto(
   lbann_data::Layer& proto) const
 {
   proto.set_datatype(proto::ProtoDataType<T>);
   auto* msg = proto.mutable_tessellate();
   protobuf::assign_to_repeated(*msg->mutable_dims(), this->get_output_dims());
 }

 // Unless LBANN_TESSELLATE_LAYER_INSTANTIATE is defined, declare the
 // data-parallel and model-parallel tessellate_layer specializations as
 // extern templates so that including this header does not implicitly
 // instantiate them. PROTO_DEVICE is consumed by instantiate_device.hpp
 // (presumably expanded once per supported data type and device --
 // confirm in that header) and is undefined again afterwards.
 #ifndef LBANN_TESSELLATE_LAYER_INSTANTIATE
 #define PROTO_DEVICE(T, Device)                                                \
   extern template class tessellate_layer<T,                                    \
                                          data_layout::DATA_PARALLEL,           \
                                          Device>;                              \
   extern template class tessellate_layer<T, data_layout::MODEL_PARALLEL, Device>

 #include "lbann/macros/instantiate_device.hpp"
 #undef PROTO_DEVICE
 #endif // LBANN_TESSELLATE_LAYER_INSTANTIATE

 } // namespace lbann

 #endif // LBANN_LAYERS_TRANSFORM_TESSELLATE_HPP_INCLUDED
lbann::tessellate_layer::copy
tessellate_layer * copy() const override
Copy function. This function dynamically allocates memory for a layer instance and instantiates a cop...
Definition: tessellate.hpp:93

lbann::tessellate_layer::serialize
void serialize(ArchiveT &ar)

lbann::Layer::setup_dims
virtual void setup_dims()
Setup tensor dimensions. Called by the 'setup' function. If there are any input tensors, the base method sets all uninitialized output tensor dimensions equal to the first input tensor dimensions.

lbann::tessellate_layer::setup_data
void setup_data(size_t max_mini_batch_size) override
Setup layer data. Called by the 'setup' function. Memory is allocated for distributed matrices...
Definition: tessellate.hpp:146

lbann::ERROR_SIGNALS
Definition: base.hpp:207

lbann::tessellate_layer::operator=
tessellate_layer & operator=(const tessellate_layer &other)
Definition: tessellate.hpp:86

lbann::tessellate_layer::write_specific_proto
void write_specific_proto(lbann_data::Layer &proto) const final
Definition: tessellate.hpp:260

lbann::tessellate_layer::AbsDistMatrixType
El::AbstractDistMatrix< TensorDataType > AbsDistMatrixType
The tensor type expected in this object.
Definition: tessellate.hpp:68

lbann::tessellate_layer
Repeat a tensor until it matches specified dimensions.
Definition: tessellate.hpp:61

lbann::Layer::get_comm
lbann_comm * get_comm() const

lbann::tessellate_layer::get_type
std::string get_type() const override
Get the layer type's name.
Definition: tessellate.hpp:106

lbann::tessellate_layer::bp_compute_3d
void bp_compute_3d(const std::vector< int > &input_dims, const std::vector< int > &output_dims, const AbsDistMatrixType &gradient_wrt_output, AbsMatrixType &gradient_wrt_input)

lbann::tessellate_layer::m_input_v
std::unique_ptr< AbsDistMatrixType > m_input_v
Definition: tessellate.hpp:238

LBANN_ERROR
#define LBANN_ERROR(...)
Definition: exception.hpp:37

lbann::lbann_comm
Definition: comm.hpp:105

lbann::tessellate_layer::AbsMatrixType
El::AbstractMatrix< TensorDataType > AbsMatrixType
The local tensor type expected in this object.
Definition: tessellate.hpp:71

lbann::Layer::get_input_dims
std::vector< int > get_input_dims(size_t input_index=0) const
Get input tensor dimensions.

lbann::tessellate_layer::get_device_allocation
El::Device get_device_allocation() const override
Get the device allocation for the data tensors. We assume that the device allocation of the previous ...
Definition: tessellate.hpp:108

lbann::Device
constexpr El::Device Device
Definition: OperatorTraits.hpp:62

lbann::data_type_layer< TensorDataType >::get_prev_error_signals
OutputAbsDistMatrixType & get_prev_error_signals(int child_index=0)

lbann::data_type_layer< TensorDataType >::get_prev_activations
InputAbsDistMatrixType & get_prev_activations(int parent_index=0)

lbann::data_type_layer< TensorDataType >::get_activations
const OutputAbsDistMatrixType & get_activations(const Layer &child) const override

lbann::tessellate_layer::can_run_inplace
bool can_run_inplace() const override
If True, the computation can run in-place (feeding each input activations tensor as the corresponding...
Definition: tessellate.hpp:109

lbann::Layer::set_output_dims
void set_output_dims(std::vector< int > dims, size_t output_index=0)
Set output tensor dimensions.

lbann::protobuf::assign_to_repeated
void assign_to_repeated(google::protobuf::RepeatedField< T > &field, ContainerT const &values)
Assign a range of values to a repeated protobuf field.
Definition: impl.hpp:125

lbann::tessellate_layer::tessellate_layer
tessellate_layer(lbann_comm *comm, std::vector< int > dims={})
Definition: tessellate.hpp:76

lbann::tessellate_layer::setup_dims
void setup_dims() override
Setup tensor dimensions. Called by the 'setup' function. If there are any input tensors, the base method sets all uninitialized output tensor dimensions equal to the first input tensor dimensions.
Definition: tessellate.hpp:112

lbann::tessellate_layer::access
friend class cereal::access
Definition: tessellate.hpp:158

lbann::tessellate_layer::get_backprop_requirements
int get_backprop_requirements() const override
Returns the necessary tensors for computing backpropagation.
Definition: tessellate.hpp:110

lbann::data_type_layer
Definition: data_type_layer.hpp:69

lbann::tessellate_layer::tessellate_layer
tessellate_layer(const tessellate_layer &other)
Definition: tessellate.hpp:82

lbann::lbann_comm::allreduce
T allreduce(T snd, const El::mpi::Comm &c, El::mpi::Op op=El::mpi::SUM) const
Definition: comm_impl.hpp:643

layer.hpp

lbann::data_layout::DATA_PARALLEL

lbann::Layer::get_name
std::string get_name() const
Get the layer instance's name.
Definition: layer.hpp:332

instantiate_device.hpp

lbann::tessellate_layer::get_data_layout
data_layout get_data_layout() const override
Get data layout of the data tensors. We assume that the data layouts of the previous activations...
Definition: tessellate.hpp:107

lbann::data_layout
data_layout
Data layout that is optimized for different modes of parallelism.
Definition: base.hpp:218

lbann::tessellate_layer::tessellate_layer
tessellate_layer()
Definition: tessellate.hpp:159

data_type_layer.hpp

lbann::tessellate_layer::fp_compute_3d
void fp_compute_3d(const std::vector< int > &input_dims, const std::vector< int > &output_dims, const AbsMatrixType &input, AbsDistMatrixType &output)

lbann::tessellate_layer::fp_compute
void fp_compute() override
Apply layer operation. Called by the 'forward_prop' function. Given the input tensors, the output tensors are populated with computed values.
Definition: tessellate.hpp:161

lbann::data_type_layer::setup_data
void setup_data(size_t max_mini_batch_size) override

lbann::tessellate_layer::bp_compute
void bp_compute() override
Compute objective function gradients. Called by the 'back_prop' function. Given the input...
Definition: tessellate.hpp:195

lbann::Layer::get_output_dims
std::vector< int > get_output_dims(size_t output_index=0) const
Get output tensor dimensions.

lbann::data_type_layer::operator=
data_type_layer & operator=(data_type_layer &&other)=default

lbann::data_type_layer< TensorDataType >::get_error_signals
const InputAbsDistMatrixType & get_error_signals(const Layer &parent) const override

lbann
Definition: callback_helpers.hpp:32

protobuf.hpp

datatype_helpers.hpp