doc/v618/GeneralLayer_8h_source.html

// @(#)root/tmva/tmva/dnn:$Id$

// Author: Vladimir Ilievski


/**********************************************************************************

 * Project: TMVA - a Root-integrated toolkit for multivariate data analysis       *

 * Package: TMVA                                                                  *

 * Class  : TGeneralLayer                                                         *

 * Web    : http://tmva.sourceforge.net                                           *

 *                                                                                *

 * Description:                                                                   *

 *      General Deep Neural Network Layer                                         *

 *                                                                                *

 * Authors (alphabetical):                                                        *

 *      Vladimir Ilievski      <ilievski.vladimir@live.com>  - CERN, Switzerland  *

 *                                                                                *

 * Copyright (c) 2005-2015:                                                       *

 *      CERN, Switzerland                                                         *

 *      U. of Victoria, Canada                                                    *

 *      MPI-K Heidelberg, Germany                                                 *

 *      U. of Bonn, Germany                                                       *

 *                                                                                *

 * Redistribution and use in source and binary forms, with or without             *

 * modification, are permitted according to the terms listed in LICENSE           *

 * (http://tmva.sourceforge.net/LICENSE)                                          *

 **********************************************************************************/


#ifndef TMVA_DNN_GENERALLAYER

#define TMVA_DNN_GENERALLAYER


#include <iostream>

#include <limits>


// for xml

#include "TMVA/Tools.h"


namespace TMVA {

namespace DNN {


/** \class VGeneralLayer

    Generic General Layer class.


    This class represents the general class for all layers in the Deep Learning

    Module. It stores the batch size, the input and layer dimensions, the

    weights and biases together with their gradients, and the output

    activations together with their gradients. It is abstract: derived layers

    must implement Forward, Backward, Print, AddWeightsXMLTo and

    ReadWeightsFromXML.

 */

template <typename Architecture_t>

class VGeneralLayer {

   using Matrix_t = typename Architecture_t::Matrix_t;

   using Scalar_t = typename Architecture_t::Scalar_t;


protected:

   size_t fBatchSize; ///< Batch size used for training and evaluation


   size_t fInputDepth;  ///< The depth of the previous layer or input.

   size_t fInputHeight; ///< The height of the previous layer or input.

   size_t fInputWidth;  ///< The width of the previous layer or input.


   size_t fDepth;  ///< The depth of the layer.

   size_t fHeight; ///< The height of the layer.

   size_t fWidth;  ///< The width of this layer.


   bool fIsTraining; ///< Flag indicating the mode (set to true by the dimension-based constructors)


   std::vector<Matrix_t> fWeights; ///< The weights associated to the layer.

   std::vector<Matrix_t> fBiases;  ///< The biases associated to the layer.


   std::vector<Matrix_t> fWeightGradients; ///< Gradients w.r.t. the weights of the layer.

   std::vector<Matrix_t> fBiasGradients;   ///< Gradients w.r.t. the bias values of the layer.


   std::vector<Matrix_t> fOutput;              ///< Activations of this layer.

   std::vector<Matrix_t> fActivationGradients; ///< Gradients w.r.t. the activations of this layer.


   EInitialization fInit; ///< The initialization method.


public:

   /*! Constructor. Every weight slice has the same shape, and likewise every bias slice and every output slice. */

   VGeneralLayer(size_t BatchSize, size_t InputDepth, size_t InputHeight, size_t InputWidth, size_t Depth,

                 size_t Height, size_t Width, size_t WeightsNSlices, size_t WeightsNRows, size_t WeightsNCols,

                 size_t BiasesNSlices, size_t BiasesNRows, size_t BiasesNCols, size_t OutputNSlices, size_t OutputNRows,

                 size_t OutputNCols, EInitialization Init);


   /*! General Constructor with different weights dimension: the shape of the i-th weight (bias) slice is read from the i-th entry of the corresponding vectors. */

   VGeneralLayer(size_t BatchSize, size_t InputDepth, size_t InputHeight, size_t InputWidth, size_t Depth,

                 size_t Height, size_t Width, size_t WeightsNSlices, std::vector<size_t> WeightsNRows,

                 std::vector<size_t> WeightsNCols, size_t BiasesNSlices, std::vector<size_t> BiasesNRows,

                 std::vector<size_t> BiasesNCols, size_t OutputNSlices, size_t OutputNRows, size_t OutputNCols,

                 EInitialization Init);


   /*! Copy the layer provided as a pointer. Weight and bias values are copied; the gradient,

    *  output and activation-gradient matrices are only created with matching shapes. */

   VGeneralLayer(VGeneralLayer<Architecture_t> *layer);


   /*! Copy Constructor. Weight and bias values are copied; the gradient, output and

    *  activation-gradient matrices are only created with matching shapes. */

   VGeneralLayer(const VGeneralLayer &);


   /*! Virtual Destructor. */

   virtual ~VGeneralLayer();


   /*! Initialize the weights and biases according to the given initialization method. */

   void Initialize();


   /*! Computes activation of the layer for the given input. The input

    * must be in 3D tensor form with the different matrices corresponding to

    * different events in the batch.  */

   virtual void Forward(std::vector<Matrix_t> &input, bool applyDropout = false) = 0;


   /*! Backpropagates the error. Must only be called directly after the corresponding

    *  call to Forward(...). The meaning of inp1 and inp2 is defined by the derived layer. */

   virtual void Backward(std::vector<Matrix_t> &gradients_backward, const std::vector<Matrix_t> &activations_backward,

                         std::vector<Matrix_t> &inp1, std::vector<Matrix_t> &inp2) = 0;


   /*! Updates the weights and biases with the layer's own stored gradients, given the learning rate */

   void Update(const Scalar_t learningRate);


   /*! Updates the weights, given the gradients and the learning rate. */

   void UpdateWeights(const std::vector<Matrix_t> &weightGradients, const Scalar_t learningRate);


   /*! Updates the biases, given the gradients and the learning rate. */

   void UpdateBiases(const std::vector<Matrix_t> &biasGradients, const Scalar_t learningRate);


   /*! Updates the weight gradients, given some other weight gradients and learning rate. */

   void UpdateWeightGradients(const std::vector<Matrix_t> &weightGradients, const Scalar_t learningRate);


   /*! Updates the bias gradients, given some other bias gradients and learning rate. */

   void UpdateBiasGradients(const std::vector<Matrix_t> &biasGradients, const Scalar_t learningRate);


   /*! Copies the weights provided as an input.  */

   void CopyWeights(const std::vector<Matrix_t> &otherWeights);


   /*! Copies the biases provided as an input. */

   void CopyBiases(const std::vector<Matrix_t> &otherBiases);


   /*! Prints the info about the layer. */

   virtual void Print() const = 0;


   /*! Writes the information and the weights about the layer in an XML node. */

   virtual void AddWeightsXMLTo(void *parent) = 0;


   /*! Read the information and the weights about the layer from XML node. */

   virtual void ReadWeightsFromXML(void *parent) = 0;


   /*! Set Dropout probability. Reimplemented for layers supporting dropout; the default does nothing. */

   virtual void SetDropoutProbability(Scalar_t ) {}


   /*! Getters. The ...At(i) accessors index the underlying vector directly, without bounds checking. */

   size_t GetBatchSize() const { return fBatchSize; }

   size_t GetInputDepth() const { return fInputDepth; }

   size_t GetInputHeight() const { return fInputHeight; }

   size_t GetInputWidth() const { return fInputWidth; }

   size_t GetDepth() const { return fDepth; }

   size_t GetHeight() const { return fHeight; }

   size_t GetWidth() const { return fWidth; }

   bool IsTraining() const { return fIsTraining; }


   const std::vector<Matrix_t> &GetWeights() const { return fWeights; }

   std::vector<Matrix_t> &GetWeights() { return fWeights; }


   const Matrix_t &GetWeightsAt(size_t i) const { return fWeights[i]; }

   Matrix_t &GetWeightsAt(size_t i) { return fWeights[i]; }


   const std::vector<Matrix_t> &GetBiases() const { return fBiases; }

   std::vector<Matrix_t> &GetBiases() { return fBiases; }


   const Matrix_t &GetBiasesAt(size_t i) const { return fBiases[i]; }

   Matrix_t &GetBiasesAt(size_t i) { return fBiases[i]; }


   const std::vector<Matrix_t> &GetWeightGradients() const { return fWeightGradients; }

   std::vector<Matrix_t> &GetWeightGradients() { return fWeightGradients; }


   const Matrix_t &GetWeightGradientsAt(size_t i) const { return fWeightGradients[i]; }

   Matrix_t &GetWeightGradientsAt(size_t i) { return fWeightGradients[i]; }


   const std::vector<Matrix_t> &GetBiasGradients() const { return fBiasGradients; }

   std::vector<Matrix_t> &GetBiasGradients() { return fBiasGradients; }


   const Matrix_t &GetBiasGradientsAt(size_t i) const { return fBiasGradients[i]; }

   Matrix_t &GetBiasGradientsAt(size_t i) { return fBiasGradients[i]; }


   const std::vector<Matrix_t> &GetOutput() const { return fOutput; }

   std::vector<Matrix_t> &GetOutput() { return fOutput; }


   const std::vector<Matrix_t> &GetActivationGradients() const { return fActivationGradients; }

   std::vector<Matrix_t> &GetActivationGradients() { return fActivationGradients; }


   Matrix_t &GetOutputAt(size_t i) { return fOutput[i]; }

   const Matrix_t &GetOutputAt(size_t i) const { return fOutput[i]; }


   Matrix_t &GetActivationGradientsAt(size_t i) { return fActivationGradients[i]; }

   const Matrix_t &GetActivationGradientsAt(size_t i) const { return fActivationGradients[i]; }


   EInitialization GetInitialization() const { return fInit; }


   /*! Setters. These only overwrite the stored value; no matrix is resized. */

   void SetBatchSize(size_t batchSize) { fBatchSize = batchSize; }

   void SetInputDepth(size_t inputDepth) { fInputDepth = inputDepth; }

   void SetInputHeight(size_t inputHeight) { fInputHeight = inputHeight; }

   void SetInputWidth(size_t inputWidth) { fInputWidth = inputWidth; }

   void SetDepth(size_t depth) { fDepth = depth; }

   void SetHeight(size_t height) { fHeight = height; }

   void SetWidth(size_t width) { fWidth = width; }

   void SetIsTraining(bool isTraining) { fIsTraining = isTraining; }


   /// helper functions for XML

   /// Write a tensor (vector of matrices) as a child node called name under node.

   void WriteTensorToXML( void * node, const char * name, const std::vector<Matrix_t> & tensor);

   /// Write a single matrix as a child node called name under node.

   void WriteMatrixToXML( void * node, const char * name, const Matrix_t & matrix);


   /// Fill matrix from the child node called name under node; the stored shape must match the matrix.

   void ReadMatrixXML( void * node, const char * name, Matrix_t & matrix);


};


//

//

//  The General Layer Class - Implementation

//_________________________________________________________________________________________________

/// Construct a layer in which all weight slices share one shape, all bias
/// slices share one shape and all output slices share one shape.
///
/// \param batchSize, inputDepth, inputHeight, inputWidth, depth, height, width
///        Stored verbatim in the corresponding data members.
/// \param weightsNSlices, weightsNRows, weightsNCols
///        Number and shape of the weight matrices; a weight-gradient matrix
///        of the same shape is created for each of them.
/// \param biasesNSlices, biasesNRows, biasesNCols
///        Number and shape of the bias matrices; a bias-gradient matrix of
///        the same shape is created for each of them.
/// \param outputNSlices, outputNRows, outputNCols
///        Number and shape of the output matrices; an activation-gradient
///        matrix of the same shape is created for each of them.
/// \param init Initialization method remembered for Initialize().
///
/// The layer starts in training mode (fIsTraining is set to true). The
/// matrices are only constructed here; Initialize() assigns their values.
template <typename Architecture_t>
VGeneralLayer<Architecture_t>::VGeneralLayer(size_t batchSize, size_t inputDepth, size_t inputHeight, size_t inputWidth,
                                             size_t depth, size_t height, size_t width, size_t weightsNSlices,
                                             size_t weightsNRows, size_t weightsNCols, size_t biasesNSlices,
                                             size_t biasesNRows, size_t biasesNCols, size_t outputNSlices,
                                             size_t outputNRows, size_t outputNCols, EInitialization init)
   : fBatchSize(batchSize), fInputDepth(inputDepth), fInputHeight(inputHeight), fInputWidth(inputWidth), fDepth(depth),
     fHeight(height), fWidth(width), fIsTraining(true), fWeights(), fBiases(), fWeightGradients(), fBiasGradients(),
     fOutput(), fActivationGradients(), fInit(init)
{
   // The slice counts are known up front: reserve once so that growing the
   // vectors never has to relocate already constructed matrices.
   fWeights.reserve(weightsNSlices);
   fWeightGradients.reserve(weightsNSlices);
   for (size_t i = 0; i < weightsNSlices; ++i) {
      fWeights.emplace_back(weightsNRows, weightsNCols);
      fWeightGradients.emplace_back(weightsNRows, weightsNCols);
   }

   fBiases.reserve(biasesNSlices);
   fBiasGradients.reserve(biasesNSlices);
   for (size_t i = 0; i < biasesNSlices; ++i) {
      fBiases.emplace_back(biasesNRows, biasesNCols);
      fBiasGradients.emplace_back(biasesNRows, biasesNCols);
   }

   fOutput.reserve(outputNSlices);
   fActivationGradients.reserve(outputNSlices);
   for (size_t i = 0; i < outputNSlices; ++i) {
      fOutput.emplace_back(outputNRows, outputNCols);
      fActivationGradients.emplace_back(outputNRows, outputNCols);
   }
}


//_________________________________________________________________________________________________

/// Construct a layer whose weight and bias slices may each have a different
/// shape.
///
/// \param batchSize, inputDepth, inputHeight, inputWidth, depth, height, width
///        Stored verbatim in the corresponding data members.
/// \param weightsNSlices Number of weight matrices to create.
/// \param weightsNRows, weightsNCols
///        Shape of the i-th weight matrix is (weightsNRows[i], weightsNCols[i]).
///        Both vectors are indexed for every i < weightsNSlices without a
///        bounds check, so they must hold at least weightsNSlices entries.
/// \param biasesNSlices Number of bias matrices to create.
/// \param biasesNRows, biasesNCols
///        Shape of the i-th bias matrix; same size requirement with respect
///        to biasesNSlices.
/// \param outputNSlices, outputNRows, outputNCols
///        Number and (common) shape of the output matrices.
/// \param init Initialization method remembered for Initialize().
///
/// A gradient matrix of matching shape is created next to every weight, bias
/// and output matrix. The layer starts in training mode.
template <typename Architecture_t>
VGeneralLayer<Architecture_t>::VGeneralLayer(size_t batchSize, size_t inputDepth, size_t inputHeight, size_t inputWidth,
                                             size_t depth, size_t height, size_t width, size_t weightsNSlices,
                                             std::vector<size_t> weightsNRows, std::vector<size_t> weightsNCols,
                                             size_t biasesNSlices, std::vector<size_t> biasesNRows,
                                             std::vector<size_t> biasesNCols, size_t outputNSlices, size_t outputNRows,
                                             size_t outputNCols, EInitialization init)
   : fBatchSize(batchSize), fInputDepth(inputDepth), fInputHeight(inputHeight), fInputWidth(inputWidth), fDepth(depth),
     fHeight(height), fWidth(width), fIsTraining(true), fWeights(), fBiases(), fWeightGradients(), fBiasGradients(),
     fOutput(), fActivationGradients(), fInit(init)
{
   // The slice counts are known up front: reserve once so that growing the
   // vectors never has to relocate already constructed matrices.
   fWeights.reserve(weightsNSlices);
   fWeightGradients.reserve(weightsNSlices);
   for (size_t i = 0; i < weightsNSlices; ++i) {
      fWeights.emplace_back(weightsNRows[i], weightsNCols[i]);
      fWeightGradients.emplace_back(weightsNRows[i], weightsNCols[i]);
   }

   fBiases.reserve(biasesNSlices);
   fBiasGradients.reserve(biasesNSlices);
   for (size_t i = 0; i < biasesNSlices; ++i) {
      fBiases.emplace_back(biasesNRows[i], biasesNCols[i]);
      fBiasGradients.emplace_back(biasesNRows[i], biasesNCols[i]);
   }

   fOutput.reserve(outputNSlices);
   fActivationGradients.reserve(outputNSlices);
   for (size_t i = 0; i < outputNSlices; ++i) {
      fOutput.emplace_back(outputNRows, outputNCols);
      fActivationGradients.emplace_back(outputNRows, outputNCols);
   }
}


//_________________________________________________________________________________________________

/// Construct a layer as a copy of the layer pointed to by \p layer.
///
/// The scalar settings (batch size, dimensions, training flag, initialization
/// method) are taken from the source layer through its getters. Weight and
/// bias matrices are recreated with the source shapes and their contents are
/// copied with Architecture_t::Copy. Weight gradients, bias gradients,
/// outputs and activation gradients are only recreated with matching shapes;
/// their contents are not copied.
///
/// \param layer Source layer. It is dereferenced unconditionally, so it must
///              not be null.
template <typename Architecture_t>
VGeneralLayer<Architecture_t>::VGeneralLayer(VGeneralLayer<Architecture_t> *layer)
   : fBatchSize(layer->GetBatchSize()), fInputDepth(layer->GetInputDepth()), fInputHeight(layer->GetInputHeight()),
     fInputWidth(layer->GetInputWidth()), fDepth(layer->GetDepth()), fHeight(layer->GetHeight()),
     fWidth(layer->GetWidth()), fIsTraining(layer->IsTraining()), fWeights(), fBiases(), fWeightGradients(),
     fBiasGradients(), fOutput(), fActivationGradients(), fInit(layer->GetInitialization())
{
   // Reserve once per vector: the slice counts are known from the source layer.
   const size_t weightsNSlices = layer->GetWeights().size();
   fWeights.reserve(weightsNSlices);
   fWeightGradients.reserve(weightsNSlices);
   for (size_t i = 0; i < weightsNSlices; ++i) {
      auto &source = layer->GetWeightsAt(i);
      const size_t nRows = source.GetNrows();
      const size_t nCols = source.GetNcols();

      fWeights.emplace_back(nRows, nCols);
      fWeightGradients.emplace_back(nRows, nCols);

      Architecture_t::Copy(fWeights[i], source);
   }

   const size_t biasesNSlices = layer->GetBiases().size();
   fBiases.reserve(biasesNSlices);
   fBiasGradients.reserve(biasesNSlices);
   for (size_t i = 0; i < biasesNSlices; ++i) {
      auto &source = layer->GetBiasesAt(i);
      const size_t nRows = source.GetNrows();
      const size_t nCols = source.GetNcols();

      fBiases.emplace_back(nRows, nCols);
      fBiasGradients.emplace_back(nRows, nCols);

      Architecture_t::Copy(fBiases[i], source);
   }

   // Outputs and activation gradients: shapes only, no values are copied.
   const size_t outputNSlices = layer->GetOutput().size();
   fOutput.reserve(outputNSlices);
   fActivationGradients.reserve(outputNSlices);
   for (size_t i = 0; i < outputNSlices; ++i) {
      auto &source = layer->GetOutputAt(i);
      const size_t nRows = source.GetNrows();
      const size_t nCols = source.GetNcols();

      fOutput.emplace_back(nRows, nCols);
      fActivationGradients.emplace_back(nRows, nCols);
   }
}


//_________________________________________________________________________________________________

/// Copy constructor.
///
/// The scalar settings (batch size, dimensions, training flag, initialization
/// method) are taken from \p layer. Weight and bias matrices are recreated
/// with the source shapes and their contents are copied with
/// Architecture_t::Copy. Weight gradients, bias gradients, outputs and
/// activation gradients are only recreated with matching shapes; their
/// contents are not copied.
///
/// \param layer Layer to copy from.
template <typename Architecture_t>
VGeneralLayer<Architecture_t>::VGeneralLayer(const VGeneralLayer &layer)
   : fBatchSize(layer.fBatchSize), fInputDepth(layer.fInputDepth), fInputHeight(layer.fInputHeight),
     fInputWidth(layer.fInputWidth), fDepth(layer.fDepth), fHeight(layer.fHeight), fWidth(layer.fWidth),
     fIsTraining(layer.fIsTraining), fWeights(), fBiases(), fWeightGradients(), fBiasGradients(), fOutput(),
     fActivationGradients(), fInit(layer.fInit)
{
   // Reserve once per vector: the slice counts are known from the source layer.
   const size_t weightsNSlices = layer.fWeights.size();
   fWeights.reserve(weightsNSlices);
   fWeightGradients.reserve(weightsNSlices);
   for (size_t i = 0; i < weightsNSlices; ++i) {
      const auto &source = layer.fWeights[i];
      const size_t nRows = source.GetNrows();
      const size_t nCols = source.GetNcols();

      fWeights.emplace_back(nRows, nCols);
      fWeightGradients.emplace_back(nRows, nCols);

      Architecture_t::Copy(fWeights[i], source);
   }

   const size_t biasesNSlices = layer.fBiases.size();
   fBiases.reserve(biasesNSlices);
   fBiasGradients.reserve(biasesNSlices);
   for (size_t i = 0; i < biasesNSlices; ++i) {
      const auto &source = layer.fBiases[i];
      const size_t nRows = source.GetNrows();
      const size_t nCols = source.GetNcols();

      fBiases.emplace_back(nRows, nCols);
      fBiasGradients.emplace_back(nRows, nCols);

      Architecture_t::Copy(fBiases[i], source);
   }

   // Outputs and activation gradients: shapes only, no values are copied.
   const size_t outputNSlices = layer.fOutput.size();
   fOutput.reserve(outputNSlices);
   fActivationGradients.reserve(outputNSlices);
   for (size_t i = 0; i < outputNSlices; ++i) {
      const auto &source = layer.fOutput[i];
      const size_t nRows = source.GetNrows();
      const size_t nCols = source.GetNcols();

      fOutput.emplace_back(nRows, nCols);
      fActivationGradients.emplace_back(nRows, nCols);
   }
}


//_________________________________________________________________________________________________

/// Destructor. The layer holds no resources beyond its data members, which
/// release themselves, so the compiler-generated body is sufficient.
template <typename Architecture_t>
VGeneralLayer<Architecture_t>::~VGeneralLayer() = default;


//_________________________________________________________________________________________________

/// Initialize every weight matrix with the layer's initialization method
/// (fInit) and set every weight-gradient, bias and bias-gradient matrix up
/// with EInitialization::kZero.
template <typename Architecture_t>
void VGeneralLayer<Architecture_t>::Initialize()
{
   const size_t nWeightSlices = fWeights.size();
   for (size_t w = 0; w != nWeightSlices; ++w) {
      initialize<Architecture_t>(fWeights[w], fInit);
      initialize<Architecture_t>(fWeightGradients[w], EInitialization::kZero);
   }

   const size_t nBiasSlices = fBiases.size();
   for (size_t b = 0; b != nBiasSlices; ++b) {
      initialize<Architecture_t>(fBiases[b], EInitialization::kZero);
      initialize<Architecture_t>(fBiasGradients[b], EInitialization::kZero);
   }
}


//_________________________________________________________________________________________________

/// Apply one update step to the weights and then to the biases, using the
/// gradients currently stored in this layer.
///
/// \param learningRate Forwarded unchanged to UpdateWeights and UpdateBiases.
template <typename Architecture_t>
void VGeneralLayer<Architecture_t>::Update(const Scalar_t learningRate)
{
   UpdateWeights(fWeightGradients, learningRate);
   UpdateBiases(fBiasGradients, learningRate);
}


//_________________________________________________________________________________________________

/// Update every weight matrix by calling Architecture_t::ScaleAdd with the
/// matching gradient slice and the negated learning rate.
///
/// \param weightGradients One gradient matrix per weight slice; it must hold
///                        at least as many entries as the layer has weight
///                        matrices (no size check is performed).
/// \param learningRate    Its negation is passed as the ScaleAdd factor.
template <typename Architecture_t>
void VGeneralLayer<Architecture_t>::UpdateWeights(const std::vector<Matrix_t> &weightGradients,
                                                  const Scalar_t learningRate)
{
   // Walk the gradients in lock-step with the weight slices.
   auto gradient = weightGradients.begin();
   for (auto &weights : fWeights) {
      Architecture_t::ScaleAdd(weights, *gradient, -learningRate);
      ++gradient;
   }
}


//_________________________________________________________________________________________________

/// Update every bias matrix by calling Architecture_t::ScaleAdd with the
/// matching gradient slice and the negated learning rate.
///
/// \param biasGradients One gradient matrix per bias slice; it must hold at
///                      least as many entries as the layer has bias matrices
///                      (no size check is performed).
/// \param learningRate  Its negation is passed as the ScaleAdd factor.
template <typename Architecture_t>
void VGeneralLayer<Architecture_t>::UpdateBiases(const std::vector<Matrix_t> &biasGradients,
                                                 const Scalar_t learningRate)
{
   // Walk the gradients in lock-step with the bias slices.
   auto gradient = biasGradients.begin();
   for (auto &biases : fBiases) {
      Architecture_t::ScaleAdd(biases, *gradient, -learningRate);
      ++gradient;
   }
}


//_________________________________________________________________________________________________

/// Update the stored weight gradients by calling Architecture_t::ScaleAdd on
/// each of them with the matching entry of \p weightGradients and the negated
/// learning rate.
///
/// \param weightGradients One matrix per stored weight-gradient slice; it
///                        must hold at least that many entries (no size
///                        check is performed).
/// \param learningRate    Its negation is passed as the ScaleAdd factor.
template <typename Architecture_t>
void VGeneralLayer<Architecture_t>::UpdateWeightGradients(const std::vector<Matrix_t> &weightGradients,
                                                          const Scalar_t learningRate)
{
   const size_t nSlices = fWeightGradients.size();
   for (size_t slice = 0; slice != nSlices; ++slice) {
      Matrix_t &target = fWeightGradients[slice];
      Architecture_t::ScaleAdd(target, weightGradients[slice], -learningRate);
   }
}


//_________________________________________________________________________________________________

/// Update the stored bias gradients by calling Architecture_t::ScaleAdd on
/// each of them with the matching entry of \p biasGradients and the negated
/// learning rate.
///
/// \param biasGradients One matrix per stored bias-gradient slice; it must
///                      hold at least that many entries (no size check is
///                      performed).
/// \param learningRate  Its negation is passed as the ScaleAdd factor.
template <typename Architecture_t>
void VGeneralLayer<Architecture_t>::UpdateBiasGradients(const std::vector<Matrix_t> &biasGradients,
                                                        const Scalar_t learningRate)
{
   const size_t nSlices = fBiasGradients.size();
   for (size_t slice = 0; slice != nSlices; ++slice) {
      Matrix_t &target = fBiasGradients[slice];
      Architecture_t::ScaleAdd(target, biasGradients[slice], -learningRate);
   }
}


//_________________________________________________________________________________________________

/// Overwrite this layer's weights, slice by slice, with Architecture_t::Copy.
///
/// \param otherWeights Source matrices; it must hold at least as many entries
///                     as this layer has weight matrices (no size check is
///                     performed).
template <typename Architecture_t>
void VGeneralLayer<Architecture_t>::CopyWeights(const std::vector<Matrix_t> &otherWeights)
{
   const size_t nSlices = fWeights.size();
   for (size_t slice = 0; slice != nSlices; ++slice) {
      Architecture_t::Copy(fWeights[slice], otherWeights[slice]);
   }
}


//_________________________________________________________________________________________________

/// Overwrite this layer's biases, slice by slice, with Architecture_t::Copy.
///
/// \param otherBiases Source matrices; it must hold at least as many entries
///                    as this layer has bias matrices (no size check is
///                    performed).
template <typename Architecture_t>
void VGeneralLayer<Architecture_t>::CopyBiases(const std::vector<Matrix_t> &otherBiases)
{
   const size_t nSlices = fBiases.size();
   for (size_t slice = 0; slice != nSlices; ++slice) {
      Architecture_t::Copy(fBiases[slice], otherBiases[slice]);
   }
}


//_________________________________________________________________________________________________

/// Write a tensor (vector of matrices) as a new child of \p node.
///
/// A child node called \p name is always created. For a non-empty tensor it
/// receives the attributes "Depth" (number of matrices), "Rows" and "Columns"
/// (taken from the first matrix) and one raw line with all elements, matrix
/// after matrix in row-major order, each formatted with "%5.15e ". For an
/// empty tensor the child is left without attributes or content.
///
/// \param node   Parent XML node.
/// \param name   Name of the child node to create.
/// \param tensor Matrices to serialize; all are assumed to share the shape of
///               the first one, since only that shape is recorded.
template <typename Architecture_t>
auto VGeneralLayer<Architecture_t>::WriteTensorToXML(void * node, const char * name, const std::vector<Matrix_t> & tensor) -> void
{
   // Bind to the engine object handed out by gTools() rather than
   // copy-constructing a second engine from it.
   auto &&xmlengine = gTools().xmlengine();
   void *matnode = xmlengine.NewChild(node, 0, name);
   if (tensor.empty()) return;

   xmlengine.NewAttr(matnode, 0, "Depth", gTools().StringFromInt(tensor.size()));
   // assume same number of rows and columns for every matrix in std::vector
   xmlengine.NewAttr(matnode, 0, "Rows", gTools().StringFromInt(tensor[0].GetNrows()));
   xmlengine.NewAttr(matnode, 0, "Columns", gTools().StringFromInt(tensor[0].GetNcols()));

   std::stringstream s;
   for (const auto &mat : tensor) {
      const size_t nrows = mat.GetNrows();
      const size_t ncols = mat.GetNcols();
      for (size_t row = 0; row < nrows; ++row) {
         for (size_t col = 0; col < ncols; ++col) {
            // "%e" consumes a double: convert explicitly so the variadic call
            // is well defined whatever type the element accessor returns.
            TString tmp = TString::Format("%5.15e ", static_cast<double>(mat(row, col)));
            s << tmp.Data();
         }
      }
   }
   xmlengine.AddRawLine(matnode, s.str().c_str());
}


//_________________________________________________________________________________________________

/// Write a single matrix as a new child of \p node.
///
/// The child node called \p name receives the attributes "Rows" and "Columns"
/// and one raw line holding all elements in row-major order, written in
/// scientific notation and separated by two blanks.
///
/// \param node   Parent XML node.
/// \param name   Name of the child node to create.
/// \param matrix Matrix to serialize.
template <typename Architecture_t>
auto VGeneralLayer<Architecture_t>::WriteMatrixToXML(void * node, const char * name, const Matrix_t & matrix) -> void
{
   // Bind to the engine object handed out by gTools() rather than
   // copy-constructing a second engine from it.
   auto &&xmlengine = gTools().xmlengine();
   void *matnode = xmlengine.NewChild(node, 0, name);

   xmlengine.NewAttr(matnode, 0, "Rows", gTools().StringFromInt(matrix.GetNrows()));
   xmlengine.NewAttr(matnode, 0, "Columns", gTools().StringFromInt(matrix.GetNcols()));

   std::stringstream s;
   // NOTE(review): digits10 is not enough digits to guarantee an exact
   // round-trip of a floating-point value (max_digits10 would be); left
   // unchanged here because it determines the bytes written to the file.
   s.precision(std::numeric_limits<Scalar_t>::digits10);
   // The notation flag is sticky, so it only has to be set once.
   s << std::scientific;

   const size_t nrows = matrix.GetNrows();
   const size_t ncols = matrix.GetNcols();
   for (size_t row = 0; row < nrows; ++row) {
      for (size_t col = 0; col < ncols; ++col) {
         s << matrix(row, col) << "  ";
      }
   }

   xmlengine.AddRawLine(matnode, s.str().c_str());
}


//_________________________________________________________________________________________________

/// Fill \p matrix from the child node called \p name under \p node.
///
/// The "Rows" and "Columns" attributes of the child must equal the current
/// shape of \p matrix (checked with R__ASSERT); the matrix is not resized.
/// The node content is then parsed as whitespace-separated numbers and
/// assigned in row-major order.
///
/// \param node   Parent XML node.
/// \param name   Name of the child node to read.
/// \param matrix Destination matrix, already sized to the stored shape.
template <typename Architecture_t>
auto VGeneralLayer<Architecture_t>::ReadMatrixXML(void * node, const char * name, Matrix_t & matrix) -> void
{
   void *matrixXML = gTools().GetChild(node, name);
   size_t rows = 0;
   size_t cols = 0;
   gTools().ReadAttr(matrixXML, "Rows", rows);
   gTools().ReadAttr(matrixXML, "Columns", cols);

   R__ASSERT(static_cast<size_t>(matrix.GetNrows()) == rows);
   R__ASSERT(static_cast<size_t>(matrix.GetNcols()) == cols);

   // The content pointer may be null (presumably when the node carries no
   // text, e.g. for an empty matrix); building a std::string from a null
   // pointer is undefined behaviour, so fall back to an empty string.
   const char *matrixString = gTools().xmlengine().GetNodeContent(matrixXML);
   std::stringstream matrixStringStream(matrixString != nullptr ? matrixString : "");

   for (size_t i = 0; i < rows; i++)
   {
      for (size_t j = 0; j < cols; j++)
      {
#ifndef R__HAS_TMVAGPU
         matrixStringStream >> matrix(i,j);
#else
         // In GPU builds the value is read into a plain scalar first and
         // then assigned to the matrix element.
         Scalar_t value = 0;
         matrixStringStream >> value;
         matrix(i,j) = value;
#endif

      }
   }
}


} // namespace DNN

} // namespace TMVA


#endif

init
static Int_t init()
Definition: RooClassFactory.cxx:52

Int_t
int Int_t
Definition: RtypesCore.h:41

width
include TDocParser_001 C image html pict1_TDocParser_001 png width
Definition: TDocParser.cxx:121

R__ASSERT
#define R__ASSERT(e)
Definition: TError.h:96

name
char name[80]
Definition: TGX11.cxx:109

Tools.h

TMVA::DNN::VGeneralLayer
Generic General Layer class.
Definition: GeneralLayer.h:46

TMVA::DNN::VGeneralLayer::fWeightGradients
std::vector< Matrix_t > fWeightGradients
Gradients w.r.t. the weights of the layer.
Definition: GeneralLayer.h:66

TMVA::DNN::VGeneralLayer::GetWeightGradients
const std::vector< Matrix_t > & GetWeightGradients() const
Definition: GeneralLayer.h:165

TMVA::DNN::VGeneralLayer::SetDropoutProbability
virtual void SetDropoutProbability(Scalar_t)
Set Dropout probability.
Definition: GeneralLayer.h:141

TMVA::DNN::VGeneralLayer::GetWeightsAt
const Matrix_t & GetWeightsAt(size_t i) const
Definition: GeneralLayer.h:156

TMVA::DNN::VGeneralLayer::SetHeight
void SetHeight(size_t height)
Definition: GeneralLayer.h:197

TMVA::DNN::VGeneralLayer::UpdateWeightGradients
void UpdateWeightGradients(const std::vector< Matrix_t > &weightGradients, const Scalar_t learningRate)
Updates the weight gradients, given some other weight gradients and learning rate.
Definition: GeneralLayer.h:419

TMVA::DNN::VGeneralLayer::Initialize
void Initialize()
Initialize the weights and biases according to the given initialization method.
Definition: GeneralLayer.h:376

TMVA::DNN::VGeneralLayer::GetBiasesAt
Matrix_t & GetBiasesAt(size_t i)
Definition: GeneralLayer.h:163

TMVA::DNN::VGeneralLayer::SetInputHeight
void SetInputHeight(size_t inputHeight)
Definition: GeneralLayer.h:194

TMVA::DNN::VGeneralLayer::fBiasGradients
std::vector< Matrix_t > fBiasGradients
Gradients w.r.t. the bias values of the layer.
Definition: GeneralLayer.h:67

TMVA::DNN::VGeneralLayer::SetDepth
void SetDepth(size_t depth)
Definition: GeneralLayer.h:196

TMVA::DNN::VGeneralLayer::ReadWeightsFromXML
virtual void ReadWeightsFromXML(void *parent)=0
Read the information and the weights about the layer from XML node.

TMVA::DNN::VGeneralLayer::Backward
virtual void Backward(std::vector< Matrix_t > &gradients_backward, const std::vector< Matrix_t > &activations_backward, std::vector< Matrix_t > &inp1, std::vector< Matrix_t > &inp2)=0
Backpropagates the error.

TMVA::DNN::VGeneralLayer::UpdateBiasGradients
void UpdateBiasGradients(const std::vector< Matrix_t > &biasGradients, const Scalar_t learningRate)
Updates the bias gradients, given some other bias gradients and learning rate.
Definition: GeneralLayer.h:429

TMVA::DNN::VGeneralLayer::SetBatchSize
void SetBatchSize(size_t batchSize)
Setters.
Definition: GeneralLayer.h:192

TMVA::DNN::VGeneralLayer::CopyWeights
void CopyWeights(const std::vector< Matrix_t > &otherWeights)
Copies the weights provided as an input.
Definition: GeneralLayer.h:439

TMVA::DNN::VGeneralLayer::fBatchSize
size_t fBatchSize
Batch size used for training and evaluation.
Definition: GeneralLayer.h:51

TMVA::DNN::VGeneralLayer::AddWeightsXMLTo
virtual void AddWeightsXMLTo(void *parent)=0
Writes the information and the weights about the layer in an XML node.

TMVA::DNN::VGeneralLayer::fActivationGradients
std::vector< Matrix_t > fActivationGradients
Gradients w.r.t. the activations of this layer.
Definition: GeneralLayer.h:70

TMVA::DNN::VGeneralLayer::UpdateWeights
void UpdateWeights(const std::vector< Matrix_t > &weightGradients, const Scalar_t learningRate)
Updates the weights, given the gradients and the learning rate.
Definition: GeneralLayer.h:399

TMVA::DNN::VGeneralLayer::Matrix_t
typename Architecture_t::Matrix_t Matrix_t
Definition: GeneralLayer.h:47

TMVA::DNN::VGeneralLayer::GetBiasGradients
const std::vector< Matrix_t > & GetBiasGradients() const
Definition: GeneralLayer.h:171

TMVA::DNN::VGeneralLayer::SetInputDepth
void SetInputDepth(size_t inputDepth)
Definition: GeneralLayer.h:193

TMVA::DNN::VGeneralLayer::GetWeights
const std::vector< Matrix_t > & GetWeights() const
Definition: GeneralLayer.h:153

TMVA::DNN::VGeneralLayer::GetDepth
size_t GetDepth() const
Definition: GeneralLayer.h:148

TMVA::DNN::VGeneralLayer::GetWeights
std::vector< Matrix_t > & GetWeights()
Definition: GeneralLayer.h:154

TMVA::DNN::VGeneralLayer::fWidth
size_t fWidth
The width of this layer.
Definition: GeneralLayer.h:59

TMVA::DNN::VGeneralLayer::fInit
EInitialization fInit
The initialization method.
Definition: GeneralLayer.h:72

TMVA::DNN::VGeneralLayer::fBiases
std::vector< Matrix_t > fBiases
The biases associated to the layer.
Definition: GeneralLayer.h:64

TMVA::DNN::VGeneralLayer::SetIsTraining
void SetIsTraining(bool isTraining)
Definition: GeneralLayer.h:199

TMVA::DNN::VGeneralLayer::fInputWidth
size_t fInputWidth
The width of the previous layer or input.
Definition: GeneralLayer.h:55

TMVA::DNN::VGeneralLayer::fHeight
size_t fHeight
The height of the layer.
Definition: GeneralLayer.h:58

TMVA::DNN::VGeneralLayer::Print
virtual void Print() const =0
Prints the info about the layer.

TMVA::DNN::VGeneralLayer::fOutput
std::vector< Matrix_t > fOutput
Activations of this layer.
Definition: GeneralLayer.h:69

TMVA::DNN::VGeneralLayer::fInputDepth
size_t fInputDepth
The depth of the previous layer or input.
Definition: GeneralLayer.h:53

TMVA::DNN::VGeneralLayer::SetWidth
void SetWidth(size_t width)
Definition: GeneralLayer.h:198

TMVA::DNN::VGeneralLayer::fIsTraining
bool fIsTraining
Flag indicating the mode.
Definition: GeneralLayer.h:61

TMVA::DNN::VGeneralLayer::GetOutputAt
Matrix_t & GetOutputAt(size_t i)
Definition: GeneralLayer.h:183

TMVA::DNN::VGeneralLayer::GetBiases
const std::vector< Matrix_t > & GetBiases() const
Definition: GeneralLayer.h:159

TMVA::DNN::VGeneralLayer::Scalar_t
typename Architecture_t::Scalar_t Scalar_t
Definition: GeneralLayer.h:48

TMVA::DNN::VGeneralLayer::GetBiasGradients
std::vector< Matrix_t > & GetBiasGradients()
Definition: GeneralLayer.h:172

TMVA::DNN::VGeneralLayer::fWeights
std::vector< Matrix_t > fWeights
The weights associated to the layer.
Definition: GeneralLayer.h:63

TMVA::DNN::VGeneralLayer::GetInitialization
EInitialization GetInitialization() const
Definition: GeneralLayer.h:189

TMVA::DNN::VGeneralLayer::GetWeightsAt
Matrix_t & GetWeightsAt(size_t i)
Definition: GeneralLayer.h:157

TMVA::DNN::VGeneralLayer::GetBiasGradientsAt
Matrix_t & GetBiasGradientsAt(size_t i)
Definition: GeneralLayer.h:175

TMVA::DNN::VGeneralLayer::GetActivationGradients
std::vector< Matrix_t > & GetActivationGradients()
Definition: GeneralLayer.h:181

TMVA::DNN::VGeneralLayer::GetInputDepth
size_t GetInputDepth() const
Definition: GeneralLayer.h:145

TMVA::DNN::VGeneralLayer::GetActivationGradientsAt
const Matrix_t & GetActivationGradientsAt(size_t i) const
Definition: GeneralLayer.h:187

TMVA::DNN::VGeneralLayer::GetBiases
std::vector< Matrix_t > & GetBiases()
Definition: GeneralLayer.h:160

TMVA::DNN::VGeneralLayer::WriteMatrixToXML
void WriteMatrixToXML(void *node, const char *name, const Matrix_t &matrix)
Definition: GeneralLayer.h:483

TMVA::DNN::VGeneralLayer::GetWeightGradients
std::vector< Matrix_t > & GetWeightGradients()
Definition: GeneralLayer.h:166

TMVA::DNN::VGeneralLayer::GetActivationGradients
const std::vector< Matrix_t > & GetActivationGradients() const
Definition: GeneralLayer.h:180

TMVA::DNN::VGeneralLayer::fInputHeight
size_t fInputHeight
The height of the previous layer or input.
Definition: GeneralLayer.h:54

TMVA::DNN::VGeneralLayer::fDepth
size_t fDepth
The depth of the layer.
Definition: GeneralLayer.h:57

TMVA::DNN::VGeneralLayer::GetOutput
const std::vector< Matrix_t > & GetOutput() const
Definition: GeneralLayer.h:177

TMVA::DNN::VGeneralLayer::CopyBiases
void CopyBiases(const std::vector< Matrix_t > &otherBiases)
Copies the biases provided as an input.
Definition: GeneralLayer.h:449

TMVA::DNN::VGeneralLayer::GetOutput
std::vector< Matrix_t > & GetOutput()
Definition: GeneralLayer.h:178

TMVA::DNN::VGeneralLayer::Update
void Update(const Scalar_t learningRate)
Updates the weights and biases, given the learning rate.
Definition: GeneralLayer.h:391

TMVA::DNN::VGeneralLayer::GetBiasesAt
const Matrix_t & GetBiasesAt(size_t i) const
Definition: GeneralLayer.h:162

TMVA::DNN::VGeneralLayer::Forward
virtual void Forward(std::vector< Matrix_t > &input, bool applyDropout=false)=0
Computes activation of the layer for the given input.

TMVA::DNN::VGeneralLayer::GetInputHeight
size_t GetInputHeight() const
Definition: GeneralLayer.h:146

TMVA::DNN::VGeneralLayer::SetInputWidth
void SetInputWidth(size_t inputWidth)
Definition: GeneralLayer.h:195

TMVA::DNN::VGeneralLayer::GetBiasGradientsAt
const Matrix_t & GetBiasGradientsAt(size_t i) const
Definition: GeneralLayer.h:174

TMVA::DNN::VGeneralLayer::WriteTensorToXML
void WriteTensorToXML(void *node, const char *name, const std::vector< Matrix_t > &tensor)
Helper functions for XML.
Definition: GeneralLayer.h:459

TMVA::DNN::VGeneralLayer::GetBatchSize
size_t GetBatchSize() const
Getters.
Definition: GeneralLayer.h:144

TMVA::DNN::VGeneralLayer::GetWeightGradientsAt
Matrix_t & GetWeightGradientsAt(size_t i)
Definition: GeneralLayer.h:169

TMVA::DNN::VGeneralLayer::ReadMatrixXML
void ReadMatrixXML(void *node, const char *name, Matrix_t &matrix)
Definition: GeneralLayer.h:506

TMVA::DNN::VGeneralLayer::GetWidth
size_t GetWidth() const
Definition: GeneralLayer.h:150

TMVA::DNN::VGeneralLayer::GetHeight
size_t GetHeight() const
Definition: GeneralLayer.h:149

TMVA::DNN::VGeneralLayer::GetWeightGradientsAt
const Matrix_t & GetWeightGradientsAt(size_t i) const
Definition: GeneralLayer.h:168

TMVA::DNN::VGeneralLayer::UpdateBiases
void UpdateBiases(const std::vector< Matrix_t > &biasGradients, const Scalar_t learningRate)
Updates the biases, given the gradients and the learning rate.
Definition: GeneralLayer.h:409

TMVA::DNN::VGeneralLayer::IsTraining
bool IsTraining() const
Definition: GeneralLayer.h:151

TMVA::DNN::VGeneralLayer::~VGeneralLayer
virtual ~VGeneralLayer()
Virtual Destructor.
Definition: GeneralLayer.h:369

TMVA::DNN::VGeneralLayer::GetOutputAt
const Matrix_t & GetOutputAt(size_t i) const
Definition: GeneralLayer.h:184

TMVA::DNN::VGeneralLayer::GetActivationGradientsAt
Matrix_t & GetActivationGradientsAt(size_t i)
Definition: GeneralLayer.h:186

TMVA::DNN::VGeneralLayer::VGeneralLayer
VGeneralLayer(size_t BatchSize, size_t InputDepth, size_t InputHeight, size_t InputWidth, size_t Depth, size_t Height, size_t Width, size_t WeightsNSlices, size_t WeightsNRows, size_t WeightsNCols, size_t BiasesNSlices, size_t BiasesNRows, size_t BiasesNCols, size_t OutputNSlices, size_t OutputNRows, size_t OutputNCols, EInitialization Init)
Constructor.
Definition: GeneralLayer.h:214

TMVA::DNN::VGeneralLayer::GetInputWidth
size_t GetInputWidth() const
Definition: GeneralLayer.h:147

TMVA::Tools::GetChild
void * GetChild(void *parent, const char *childname=0)
Get child node.
Definition: Tools.cxx:1162

TMVA::Tools::xmlengine
TXMLEngine & xmlengine()
Definition: Tools.h:270

TMVA::Tools::ReadAttr
void ReadAttr(void *node, const char *, T &value)
Read attribute from XML.
Definition: Tools.h:337

TString
Basic string class.
Definition: TString.h:131

TString::Data
const char * Data() const
Definition: TString.h:364

TString::Format
static TString Format(const char *fmt,...)
Static method which formats a string using a printf-style format descriptor and returns a TString.
Definition: TString.cxx:2311

TXMLEngine::NewChild
XMLNodePointer_t NewChild(XMLNodePointer_t parent, XMLNsPointer_t ns, const char *name, const char *content=0)
Create new child element for parent node.
Definition: TXMLEngine.cxx:709

TXMLEngine::GetNodeContent
const char * GetNodeContent(XMLNodePointer_t xmlnode)
Get contents (if any) of xmlnode.
Definition: TXMLEngine.cxx:1077

ROOT::Math::GSLSimAn::Copy
void Copy(void *source, void *dest)
Definition: GSLSimAnnealing.cxx:149

TClassEdit::Init
void Init(TClassEdit::TInterpreterLookupHelper *helper)
Definition: TClassEdit.cxx:144

TGeant4Unit::s
static constexpr double s
Definition: TGeant4SystemOfUnits.h:162

TMVA::DNN::EInitialization
EInitialization
Definition: Functions.h:70

TMVA::DNN::EInitialization::kZero
@ kZero

TMVA::kNN::Depth
UInt_t Depth(const Node< T > *node)
Definition: NodekNN.h:213

TMVA
create variable transformations
Definition: GeneticMinimizer.h:21

TMVA::gTools
Tools & gTools()