d8/da1/weighted__sum_8hpp_source.html

 // Copyright (c) 2014-2023, Lawrence Livermore National Security, LLC.
 // Produced at the Lawrence Livermore National Laboratory.
 // Written by the LBANN Research Team (B. Van Essen, et al.) listed in
 // the CONTRIBUTORS file. <lbann-dev@llnl.gov>
 //
 // LLNL-CODE-697807.
 // All rights reserved.
 //
 // This file is part of LBANN: Livermore Big Artificial Neural Network
 // Toolkit. For details, see http://software.llnl.gov/LBANN or
 // https://github.com/LLNL/LBANN.
 //
 // Licensed under the Apache License, Version 2.0 (the "License"); you
 // may not use this file except in compliance with the License.  You may
 // obtain a copy of the License at:
 //
 // http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
 // implied. See the License for the specific language governing
 // permissions and limitations under the license.

 #ifndef LBANN_LAYER_WEIGHTED_SUM_HPP_INCLUDED
 #define LBANN_LAYER_WEIGHTED_SUM_HPP_INCLUDED

 #include "lbann/layers/data_type_layer.hpp"
 #include "lbann/utils/exception.hpp"
 #include <sstream>
 #include <string>
 #include <utility>
 #include <vector>

 namespace lbann {

 /** @brief Add tensors with scaling factors.
  *
  *  The output tensor is the sum, over all parent layers, of each
  *  parent's output multiplied by the scaling factor with the same
  *  index. There must be exactly one scaling factor per parent layer
  *  and all input tensors must have identical dimensions; both
  *  conditions are checked during setup and reported with LBANN_ERROR.
  *
  *  @tparam TensorDataType Element type of the layer's tensors.
  *  @tparam T_layout       Value returned by get_data_layout().
  *  @tparam Dev            Value returned by get_device_allocation().
  */
 template <typename TensorDataType,
           data_layout T_layout = data_layout::DATA_PARALLEL,
           El::Device Dev = El::Device::CPU>
 class weighted_sum_layer : public data_type_layer<TensorDataType>
 {
 private:
   /** @brief Scaling factor for each parent layer, indexed by parent. */
   std::vector<DataType> m_scaling_factors;

 public:
   /** @brief Construct a weighted sum layer.
    *
    *  @param comm            Forwarded to the data_type_layer base class.
    *  @param scaling_factors One factor per parent layer. The count is
    *                         validated against the number of parents in
    *                         setup_pointers(), not here.
    */
   weighted_sum_layer(lbann_comm* comm, std::vector<DataType> scaling_factors)
     : data_type_layer<TensorDataType>(comm),
       // The parameter is a by-value sink; move it to avoid a second copy.
       m_scaling_factors(std::move(scaling_factors))
   {
     this->m_expected_num_parent_layers = -1; // No limit on parents
   }

   /** @brief Return a heap-allocated copy of this layer.
    *
    *  The copy is created with `new`; the caller receives the raw pointer.
    */
   weighted_sum_layer* copy() const override
   {
     return new weighted_sum_layer(*this);
   }

   /** @brief Serialization hook (declared here, defined elsewhere). */
   template <typename ArchiveT>
   void serialize(ArchiveT& ar);

   /** @brief Get the layer type's name ("weighted sum"). */
   std::string get_type() const override { return "weighted sum"; }
   /** @brief Data layout, fixed by the T_layout template argument. */
   data_layout get_data_layout() const override { return T_layout; }
   /** @brief Device allocation, fixed by the Dev template argument. */
   El::Device get_device_allocation() const override { return Dev; }
   /** @brief This layer's computation supports running in-place. */
   bool can_run_inplace() const override { return true; }
   /** @brief Backpropagation only requires the error signals. */
   int get_backprop_requirements() const override { return ERROR_SIGNALS; }

   /** @brief Human-readable description.
    *
    *  Extends the base class description with a "Scaling factors" entry
    *  that lists the factors separated by ", ".
    */
   description get_description() const override
   {
     auto desc = data_type_layer<TensorDataType>::get_description();
     std::stringstream ss;
     for (size_t i = 0; i < m_scaling_factors.size(); ++i) {
       ss << (i > 0 ? ", " : "") << m_scaling_factors[i];
     }
     desc.add("Scaling factors", ss.str());
     return desc;
   }

 protected:
   /** @brief Write layer-specific fields to the protobuf message
    *  (declared here, defined elsewhere).
    */
   void write_specific_proto(lbann_data::Layer& proto) const final;

   friend class cereal::access;
   /** @brief Default constructor, accessible to cereal::access.
    *
    *  Delegates to the main constructor with a null communicator and a
    *  single scaling factor of 1.
    */
   weighted_sum_layer() : weighted_sum_layer(nullptr, {1}) {}

   /** @brief Setup layer pointers and validate the parent count.
    *
    *  After the base class setup, reports an error through LBANN_ERROR if
    *  the layer has no parents or if the number of scaling factors does
    *  not equal the number of parents.
    */
   void setup_pointers() override
   {
     data_type_layer<TensorDataType>::setup_pointers();

     const int num_parents = this->get_num_parents();
     if (num_parents < 1) {
       std::stringstream err;
       err << get_type() << " layer \"" << this->get_name() << "\" "
           << "has no parent layers";
       LBANN_ERROR(err.str());
     }
     if (static_cast<int>(m_scaling_factors.size()) != num_parents) {
       std::stringstream err;
       err << get_type() << " layer \"" << this->get_name() << "\" "
           << "has an invalid number of scaling factors "
           << "(found " << m_scaling_factors.size() << ", "
           << "but there are " << num_parents << " parent layers)";
       LBANN_ERROR(err.str());
     }
   }

   /** @brief Setup tensor dimensions.
    *
    *  The output dimensions are set to the first input's dimensions.
    *  Every input must then match the output dimensions; on a mismatch
    *  an error listing each parent's name and output dimensions is
    *  reported through LBANN_ERROR.
    */
   void setup_dims() override
   {
     data_type_layer<TensorDataType>::setup_dims();
     this->set_output_dims(this->get_input_dims());

     // Check that input dimensions match
     const auto& output_dims = this->get_output_dims();
     const int num_parents = this->get_num_parents();
     for (int i = 0; i < num_parents; ++i) {
       if (this->get_input_dims(i) != output_dims) {
         // Build a message describing every parent so the offending
         // tensor can be identified from the error alone.
         const auto& parents = this->get_parent_layers();
         std::stringstream err;
         err << get_type() << " layer \"" << this->get_name() << "\" "
             << "has input tensors with incompatible dimensions (";
         for (int j = 0; j < num_parents; ++j) {
           const auto& dims = this->get_input_dims(j);
           err << (j > 0 ? ", " : "") << "layer \"" << parents[j]->get_name()
               << "\" outputs ";
           for (size_t k = 0; k < dims.size(); ++k) {
             err << (k > 0 ? " x " : "") << dims[k];
           }
         }
         err << ")";
         LBANN_ERROR(err.str());
       }
     }
   }

   /** @brief Forward prop: output = sum_i scaling_factors[i] * input_i. */
   void fp_compute() override
   {
     auto& output = this->get_activations();

     // Special case for the first input so that in-place operation works:
     // the copy is skipped when running in-place, and the output is then
     // scaled where it is.
     if (!this->m_runs_inplace) {
       El::Copy(this->get_prev_activations(0), output);
     }
     El::Scale(m_scaling_factors[0], output);

     // Accumulate the remaining scaled inputs into the output.
     const int num_parents = this->get_num_parents();
     for (int i = 1; i < num_parents; ++i) {
       El::Axpy(m_scaling_factors[i], this->get_prev_activations(i), output);
     }
   }

   /** @brief Back prop: gradient w.r.t. input_i is
    *  scaling_factors[i] * gradient w.r.t. output.
    */
   void bp_compute() override
   {
     const auto& gradient_wrt_output = this->get_prev_error_signals();

     // Parents 1..N-1 are handled before parent 0, i.e. before anything
     // below scales a tensor in place.
     // NOTE(review): presumably parent 0's error signal aliases
     // gradient_wrt_output when running in-place - confirm against
     // data_type_layer before reordering.
     const int num_parents = this->get_num_parents();
     for (int i = 1; i < num_parents; ++i) {
       auto& gradient_wrt_input = this->get_error_signals(i);
       El::Zero(gradient_wrt_input);
       El::Axpy(m_scaling_factors[i], gradient_wrt_output, gradient_wrt_input);
     }

     // Special case for the first input so that in-place operation works
     if (!this->m_runs_inplace) {
       El::Copy(gradient_wrt_output, this->get_error_signals(0));
     }
     El::Scale(m_scaling_factors[0], this->get_error_signals(0));
   }
 };

 // Explicit instantiation declarations. Unless
 // LBANN_WEIGHTED_SUM_LAYER_INSTANTIATE is defined, PROTO_DEVICE(T, Device)
 // expands to `extern template` declarations of weighted_sum_layer for
 // both the DATA_PARALLEL and MODEL_PARALLEL layouts, which suppress
 // implicit instantiation of those specializations in the including
 // translation unit.
 // NOTE(review): presumably the translation unit that provides the
 // explicit instantiations defines LBANN_WEIGHTED_SUM_LAYER_INSTANTIATE
 // before including this header - confirm.
 #ifndef LBANN_WEIGHTED_SUM_LAYER_INSTANTIATE
 #define PROTO_DEVICE(T, Device)                                                \
   extern template class weighted_sum_layer<T,                                  \
                                            data_layout::DATA_PARALLEL,         \
                                            Device>;                            \
   extern template class weighted_sum_layer<T,                                  \
                                            data_layout::MODEL_PARALLEL,        \
                                            Device>

 // NOTE(review): instantiate_device.hpp is assumed to invoke PROTO_DEVICE
 // for each supported data type / device combination - verify in that
 // header.
 #include "lbann/macros/instantiate_device.hpp"
 #undef PROTO_DEVICE
 #endif // LBANN_WEIGHTED_SUM_LAYER_INSTANTIATE

 } // namespace lbann

 #endif // LBANN_LAYER_WEIGHTED_SUM_HPP_INCLUDED
lbann::weighted_sum_layer::write_specific_proto
void write_specific_proto(lbann_data::Layer &proto) const final

lbann::weighted_sum_layer::bp_compute
void bp_compute() override
Compute objective function gradients. Called by the 'back_prop' function. Given the input...
Definition: weighted_sum.hpp:149

lbann::Layer::setup_dims
virtual void setup_dims()
Setup tensor dimensions. Called by the 'setup' function. If there are any input tensors, the base method sets all uninitialized output tensor dimensions equal to the first input tensor dimensions.

lbann::ERROR_SIGNALS
Definition: base.hpp:207

lbann::weighted_sum_layer::weighted_sum_layer
weighted_sum_layer(lbann_comm *comm, std::vector< DataType > scaling_factors)
Definition: weighted_sum.hpp:47

lbann::weighted_sum_layer::setup_dims
void setup_dims() override
Setup tensor dimensions. Called by the 'setup' function. If there are any input tensors, the base method sets all uninitialized output tensor dimensions equal to the first input tensor dimensions.
Definition: weighted_sum.hpp:108

lbann::weighted_sum_layer
Add tensors with scaling factors.
Definition: weighted_sum.hpp:40

lbann::Layer::m_runs_inplace
bool m_runs_inplace
If true, the layer will run in-place (the input and output activations point to the same tensor)...
Definition: layer.hpp:872

LBANN_ERROR
#define LBANN_ERROR(...)
Definition: exception.hpp:37

lbann::Layer::get_num_parents
int get_num_parents() const noexcept
Get number of parent layers.
Definition: layer.hpp:574

lbann::weighted_sum_layer::get_backprop_requirements
int get_backprop_requirements() const override
Returns the necessary tensors for computing backpropagation.
Definition: weighted_sum.hpp:70

lbann::lbann_comm
Definition: comm.hpp:105

lbann::Layer::get_input_dims
std::vector< int > get_input_dims(size_t input_index=0) const
Get input tensor dimensions.

lbann::description
Generates nicely formatted description messages.
Definition: description.hpp:49

lbann::weighted_sum_layer::access
friend class cereal::access
Definition: weighted_sum.hpp:87

lbann::Layer::get_description
virtual description get_description() const
Human-readable description.

lbann::weighted_sum_layer::serialize
void serialize(ArchiveT &ar)

lbann::Device
constexpr El::Device Device
Definition: OperatorTraits.hpp:62

lbann::data_type_layer< TensorDataType >::get_prev_error_signals
OutputAbsDistMatrixType & get_prev_error_signals(int child_index=0)

lbann::data_type_layer< TensorDataType >::get_prev_activations
InputAbsDistMatrixType & get_prev_activations(int parent_index=0)

lbann::weighted_sum_layer::get_description
description get_description() const override
Human-readable description.
Definition: weighted_sum.hpp:72

lbann::data_type_layer< TensorDataType >::get_activations
const OutputAbsDistMatrixType & get_activations(const Layer &child) const override

lbann::weighted_sum_layer::can_run_inplace
bool can_run_inplace() const override
If True, the computation can run in-place (feeding each input activations tensor as the corresponding...
Definition: weighted_sum.hpp:69

lbann::weighted_sum_layer::fp_compute
void fp_compute() override
Apply layer operation. Called by the 'forward_prop' function. Given the input tensors, the output tensors are populated with computed values.
Definition: weighted_sum.hpp:135

lbann::Layer::set_output_dims
void set_output_dims(std::vector< int > dims, size_t output_index=0)
Set output tensor dimensions.

lbann::Layer::get_parent_layers
std::vector< const Layer * > get_parent_layers() const

lbann::data_type_layer
Definition: data_type_layer.hpp:69

lbann::data_layout::DATA_PARALLEL

lbann::Layer::get_name
std::string get_name() const
Get the layer instance's name.
Definition: layer.hpp:332

lbann::weighted_sum_layer::get_device_allocation
El::Device get_device_allocation() const override
Get the device allocation for the data tensors. We assume that the device allocation of the previous ...
Definition: weighted_sum.hpp:68

exception.hpp

instantiate_device.hpp

lbann::data_layout
data_layout
Data layout that is optimized for different modes of parallelism.
Definition: base.hpp:218

lbann::weighted_sum_layer::setup_pointers
void setup_pointers() override
Setup layer pointers. Called by the 'setup' function. Pointers to parent/child layers are assumed to ...
Definition: weighted_sum.hpp:90

data_type_layer.hpp

lbann::weighted_sum_layer::copy
weighted_sum_layer * copy() const override
Copy function. This function dynamically allocates memory for a layer instance and instantiates a cop...
Definition: weighted_sum.hpp:53

lbann::weighted_sum_layer::weighted_sum_layer
weighted_sum_layer()
Definition: weighted_sum.hpp:88

lbann::weighted_sum_layer::get_type
std::string get_type() const override
Get the layer type's name.
Definition: weighted_sum.hpp:66

lbann::Layer::setup_pointers
virtual void setup_pointers()
Setup layer pointers. Called by the 'setup' function. Pointers to parent/child layers are assumed to ...

lbann::Layer::get_output_dims
std::vector< int > get_output_dims(size_t output_index=0) const
Get output tensor dimensions.

lbann::weighted_sum_layer::get_data_layout
data_layout get_data_layout() const override
Get data layout of the data tensors. We assume that the data layouts of the previous activations...
Definition: weighted_sum.hpp:67

lbann::weighted_sum_layer::m_scaling_factors
std::vector< DataType > m_scaling_factors
Definition: weighted_sum.hpp:44

lbann::Layer::m_expected_num_parent_layers
int m_expected_num_parent_layers
Definition: layer.hpp:838

lbann::data_type_layer< TensorDataType >::get_error_signals
const InputAbsDistMatrixType & get_error_signals(const Layer &parent) const override

lbann
Definition: callback_helpers.hpp:32