doc/hackathon/ConvLayer_8h_source.html

// @(#)root/tmva/tmva/dnn:$Id$

// Author: Vladimir Ilievski


/**********************************************************************************

 * Project: TMVA - a Root-integrated toolkit for multivariate data analysis       *

 * Package: TMVA                                                                  *

 * Class  : TConvLayer                                                            *

 *                                             *

 *                                                                                *

 * Description:                                                                   *

 *      Convolutional Deep Neural Network Layer                                   *

 *                                                                                *

 * Authors (alphabetical):                                                        *

 *      Vladimir Ilievski      <ilievski.vladimir@live.com>  - CERN, Switzerland  *

 *                                                                                *

 * Copyright (c) 2005-2015:                                                       *

 *      CERN, Switzerland                                                         *

 *      U. of Victoria, Canada                                                    *

 *      MPI-K Heidelberg, Germany                                                 *

 *      U. of Bonn, Germany                                                       *

 *                                                                                *

 * Redistribution and use in source and binary forms, with or without             *

 * modification, are permitted according to the terms listed in LICENSE           *

 * (see tmva/doc/LICENSE)                                          *

 **********************************************************************************/


#ifndef TMVA_CNN_CONVLAYER

#define TMVA_CNN_CONVLAYER


#include "TMatrix.h"


#include "TMVA/DNN/GeneralLayer.h"

#include "TMVA/DNN/Functions.h"

#include "TMVA/DNN/CNN/ContextHandles.h"


#include <vector>

#include <iostream>

#include <string>


namespace TMVA {

namespace DNN {

namespace CNN {


/// Plain parameter bundle describing one convolution: batch size, input
/// geometry, filter geometry, strides and zero-padding. All fields are public
/// and are set once by the constructor.
struct TConvParams {
   size_t batchSize; ///< Batch size used for training and evaluation.

   size_t inputDepth;  ///< Depth of the previous layer or of the input.
   size_t inputHeight; ///< Height of the previous layer or of the input.
   size_t inputWidth;  ///< Width of the previous layer or of the input.

   size_t numberFilters; ///< Number of filters; equal to the depth of the output.
   size_t filterHeight;  ///< Height of the filter.
   size_t filterWidth;   ///< Width of the filter.

   size_t strideRows;    ///< Number of row pixels to slide the filter at each step.
   size_t strideCols;    ///< Number of column pixels to slide the filter at each step.
   size_t paddingHeight; ///< Number of zero layers added at the top and bottom of the input.
   size_t paddingWidth;  ///< Number of zero layers added at the left and right of the input.

   /// Stores every argument in the field of the same name (without the leading underscore).
   TConvParams(size_t _batchSize, size_t _inputDepth, size_t _inputHeight, size_t _inputWidth,
               size_t _numberFilters, size_t _filterHeight, size_t _filterWidth, size_t _strideRows,
               size_t _strideCols, size_t _paddingHeight, size_t _paddingWidth)
      : batchSize(_batchSize),
        inputDepth(_inputDepth),
        inputHeight(_inputHeight),
        inputWidth(_inputWidth),
        numberFilters(_numberFilters),
        filterHeight(_filterHeight),
        filterWidth(_filterWidth),
        strideRows(_strideRows),
        strideCols(_strideCols),
        paddingHeight(_paddingHeight),
        paddingWidth(_paddingWidth)
   {
   }
};


/// Convolutional layer of a deep neural network, parameterised on the
/// architecture back-end that supplies the tensor types and the numerical
/// kernels (Architecture_t::ConvLayerForward / ConvLayerBackward, ...).
template <typename Architecture_t>
class TConvLayer : public VGeneralLayer<Architecture_t> {
public:
   // Numeric types supplied by the architecture back-end.
   using Tensor_t = typename Architecture_t::Tensor_t;
   using Matrix_t = typename Architecture_t::Matrix_t;
   using Scalar_t = typename Architecture_t::Scalar_t;

   // Descriptor types supplied by the architecture back-end.
   using LayerDescriptor_t = typename Architecture_t::ConvolutionDescriptor_t;
   using WeightsDescriptor_t = typename Architecture_t::FilterDescriptor_t;
   using HelperDescriptor_t = typename Architecture_t::ActivationDescriptor_t;

   // Algorithm types supplied by the architecture back-end.
   using AlgorithmForward_t = typename Architecture_t::AlgorithmForward_t;   ///< Forward layer operation.
   using AlgorithmBackward_t = typename Architecture_t::AlgorithmBackward_t; ///< Backward layer operation.
   using AlgorithmHelper_t = typename Architecture_t::AlgorithmHelper_t;     ///< Used for the weight-gradient backward pass.
   using ReduceTensorDescriptor_t =
      typename Architecture_t::ReduceTensorDescriptor_t; ///< Used for the reduction of a tensor (bias gradient).

   // FIXME: Add other cudnn types (algorithm preference etc.)
   using AlgorithmDataType_t = typename Architecture_t::AlgorithmDataType_t;

   /*! Output extent of the convolution along one dimension, given the input
    *  extent, filter extent, padding and stride along that dimension. */
   static size_t calculateDimension(size_t imgDim, size_t fltDim, size_t padding, size_t stride);

   /*! Number of pixels in a single receptive field: depth * height * width. */
   static size_t calculateNLocalViewPixels(size_t depth, size_t height, size_t width)
   {
      return depth * height * width;
   }

   /*! Number of receptive fields in one image: the product of the output
    *  height and the output width as given by calculateDimension(). */
   static size_t calculateNLocalViews(size_t inputHeight, size_t filterHeight, size_t paddingHeight,
                                      size_t strideRows, size_t inputWidth, size_t filterWidth,
                                      size_t paddingWidth, size_t strideCols);

protected:
   size_t fFilterDepth;  ///< Depth of the filter.
   size_t fFilterHeight; ///< Height of the filter.
   size_t fFilterWidth;  ///< Width of the filter.

   size_t fStrideRows; ///< Number of row pixels to slide the filter at each step.
   size_t fStrideCols; ///< Number of column pixels to slide the filter at each step.

   size_t fNLocalViewPixels; ///< Number of pixels in one local image view.
   size_t fNLocalViews;      ///< Number of local views in one image.

   Scalar_t fDropoutProbability; ///< Probability that an input is active.

   TDescriptors *fDescriptors = nullptr; ///< Keeps the convolution, activation and filter descriptors.

   TWorkspace *fWorkspace = nullptr; ///< Workspace handed to the architecture's convolution routines.

private:
   size_t fPaddingHeight; ///< Number of zero layers added at the top and bottom of the input.
   size_t fPaddingWidth;  ///< Number of zero layers added at the left and right of the input.

   Tensor_t fInputActivation; ///< First output of this layer: after the convolution, before the activation.

   std::vector<int> fBackwardIndices; ///< Vector of indices used for a fast Im2Col in the backward pass.

   EActivationFunction fF; ///< Activation function of the layer.
   ERegularization fReg;   ///< Regularization method.
   Scalar_t fWeightDecay;  ///< Weight decay.

   Tensor_t fForwardTensor; ///< Cache tensor used to speed up the forward pass.

   // Set-up / tear-down of fDescriptors and fWorkspace; each one forwards to
   // the corresponding static function of Architecture_t.
   void InitializeDescriptors();
   void ReleaseDescriptors();
   void InitializeWorkspace();
   void FreeWorkspace();

public:
   /*! Builds a layer from its hyper-parameters. */
   TConvLayer(size_t BatchSize, size_t InputDepth, size_t InputHeight, size_t InputWidth, size_t Depth,
              EInitialization Init, size_t FilterHeight, size_t FilterWidth, size_t StrideRows,
              size_t StrideCols, size_t PaddingHeight, size_t PaddingWidth, Scalar_t DropoutProbability,
              EActivationFunction f, ERegularization Reg, Scalar_t WeightDecay);

   /*! Builds a layer from another conv layer given as a pointer. */
   TConvLayer(TConvLayer<Architecture_t> *layer);

   /*! Copy constructor. */
   TConvLayer(const TConvLayer &);

   /*! Destructor. */
   virtual ~TConvLayer();

   /*! Computes the activation of the layer for the given input. The input
    *  must be in 3D tensor form, with the different matrices corresponding
    *  to the different events in the batch. Computes the activations as well
    *  as the first partial derivative of the activation function at those
    *  activations. The applyDropout argument is not used by the
    *  implementation in this file. */
   void Forward(Tensor_t &input, bool applyDropout = false) override;

   /*! Computes the weight, bias and activation gradients. Uses the first
    *  partial derivatives of the activation function that were computed
    *  during forward propagation, and modifies them. Must only be called
    *  directly after the corresponding call to Forward(...). */
   void Backward(Tensor_t &gradients_backward, const Tensor_t &activations_backward) override;

   /*! Prints the info about the layer. */
   void Print() const override;

   /*! Writes the information and the weights of the layer into an XML node. */
   void AddWeightsXMLTo(void *parent) override;

   /*! Reads the weights and biases of the layer from an XML node. */
   void ReadWeightsFromXML(void *parent) override;

   // --- Filter geometry ---
   size_t GetFilterDepth() const { return fFilterDepth; }
   size_t GetFilterHeight() const { return fFilterHeight; }
   size_t GetFilterWidth() const { return fFilterWidth; }

   // --- Strides ---
   size_t GetStrideRows() const { return fStrideRows; }
   size_t GetStrideCols() const { return fStrideCols; }

   // --- Zero-padding ---
   size_t GetPaddingHeight() const { return fPaddingHeight; }
   size_t GetPaddingWidth() const { return fPaddingWidth; }

   // --- Local-view bookkeeping ---
   size_t GetNLocalViewPixels() const { return fNLocalViewPixels; }
   size_t GetNLocalViews() const { return fNLocalViews; }

   Scalar_t GetDropoutProbability() const { return fDropoutProbability; }

   // --- Pre-activation output, as a whole tensor or indexed with operator[] ---
   const Tensor_t &GetInputActivation() const { return fInputActivation; }
   Tensor_t &GetInputActivation() { return fInputActivation; }

   Matrix_t &GetInputActivationAt(size_t i) { return fInputActivation[i]; }
   const Matrix_t &GetInputActivationAt(size_t i) const { return fInputActivation[i]; }

   // --- Forward-pass cache tensor ---
   const Tensor_t &GetForwardMatrices() const { return fForwardTensor; }
   Tensor_t &GetForwardMatrices() { return fForwardTensor; }

   // --- Activation and regularization settings ---
   EActivationFunction GetActivationFunction() const { return fF; }
   ERegularization GetRegularization() const { return fReg; }
   Scalar_t GetWeightDecay() const { return fWeightDecay; }

   // The following getters are used for testing.
   TDescriptors *GetDescriptors() { return fDescriptors; }
   const TDescriptors *GetDescriptors() const { return fDescriptors; }

   TWorkspace *GetWorkspace() { return fWorkspace; }
   const TWorkspace *GetWorkspace() const { return fWorkspace; }
};


//

//

//  Conv Layer Class - Implementation

//______________________________________________________________________________

/// Main constructor. Forwards the input geometry, the output geometry
/// (computed with calculateDimension / calculateNLocalViews) and the
/// initialization method to VGeneralLayer, stores the convolution
/// hyper-parameters, allocates the two helper tensors and finally asks the
/// architecture to set up its descriptors and workspace.
template <typename Architecture_t>
TConvLayer<Architecture_t>::TConvLayer(size_t batchSize, size_t inputDepth, size_t inputHeight, size_t inputWidth,
                                       size_t depth, EInitialization init, size_t filterHeight, size_t filterWidth,
                                       size_t strideRows, size_t strideCols, size_t paddingHeight, size_t paddingWidth,
                                       Scalar_t dropoutProbability, EActivationFunction f, ERegularization reg,
                                       Scalar_t weightDecay)
   : VGeneralLayer<Architecture_t>(
        batchSize, inputDepth, inputHeight, inputWidth,
        depth,
        calculateDimension(inputHeight, filterHeight, paddingHeight, strideRows),
        calculateDimension(inputWidth, filterWidth, paddingWidth, strideCols),
        1, depth, calculateNLocalViewPixels(inputDepth, filterHeight, filterWidth),
        1, depth, 1,
        batchSize, depth,
        calculateNLocalViews(inputHeight, filterHeight, paddingHeight, strideRows,
                             inputWidth, filterWidth, paddingWidth, strideCols),
        init),
     fFilterDepth(inputDepth),
     fFilterHeight(filterHeight),
     fFilterWidth(filterWidth),
     fStrideRows(strideRows),
     fStrideCols(strideCols),
     fNLocalViewPixels(calculateNLocalViewPixels(inputDepth, filterHeight, filterWidth)),
     fNLocalViews(calculateNLocalViews(inputHeight, filterHeight, paddingHeight, strideRows,
                                       inputWidth, filterWidth, paddingWidth, strideCols)),
     fDropoutProbability(dropoutProbability),
     fPaddingHeight(paddingHeight),
     fPaddingWidth(paddingWidth),
     fInputActivation(),
     fF(f),
     fReg(reg),
     fWeightDecay(weightDecay)
{
   // Pre-activation output: one slice per event in the batch. Within a slice
   // every row is one feature map (nRows == depth) and every column is one
   // pixel of that feature map (nCols == nLocalViews), i.e. shape B x C x LV.
   fInputActivation = Tensor_t(batchSize, depth, fNLocalViews);

   // Forward-pass cache: batchSize x nLocalViews x nLocalViewPixels.
   fForwardTensor = Tensor_t(batchSize, fNLocalViews, fNLocalViewPixels);

   InitializeDescriptors();
   InitializeWorkspace();
}


//______________________________________________________________________________

/// Builds a layer from another one given by pointer. The hyper-parameters are
/// read through the source layer's getters; the two helper tensors are
/// constructed from the shapes of the source layer's tensors. Descriptors and
/// workspace are set up afresh for the new layer.
template <typename Architecture_t>
TConvLayer<Architecture_t>::TConvLayer(TConvLayer<Architecture_t> *layer)
   : VGeneralLayer<Architecture_t>(layer),
     fFilterDepth(layer->GetFilterDepth()),
     fFilterHeight(layer->GetFilterHeight()),
     fFilterWidth(layer->GetFilterWidth()),
     fStrideRows(layer->GetStrideRows()),
     fStrideCols(layer->GetStrideCols()),
     fNLocalViewPixels(layer->GetNLocalViewPixels()),
     fNLocalViews(layer->GetNLocalViews()),
     fDropoutProbability(layer->GetDropoutProbability()),
     fPaddingHeight(layer->GetPaddingHeight()),
     fPaddingWidth(layer->GetPaddingWidth()),
     fInputActivation(layer->GetInputActivation().GetShape()),
     fF(layer->GetActivationFunction()),
     fReg(layer->GetRegularization()),
     fWeightDecay(layer->GetWeightDecay()),
     fForwardTensor(layer->GetForwardMatrices().GetShape())
{
   InitializeDescriptors();
   InitializeWorkspace();
}


//______________________________________________________________________________

/// Copy constructor. The hyper-parameters are copied member by member; the
/// two helper tensors are constructed from the shapes of the source layer's
/// tensors. The descriptor and workspace pointers are not copied: both are
/// set up afresh for the new layer.
template <typename Architecture_t>
TConvLayer<Architecture_t>::TConvLayer(const TConvLayer &convLayer)
   : VGeneralLayer<Architecture_t>(convLayer),
     fFilterDepth(convLayer.fFilterDepth),
     fFilterHeight(convLayer.fFilterHeight),
     fFilterWidth(convLayer.fFilterWidth),
     fStrideRows(convLayer.fStrideRows),
     fStrideCols(convLayer.fStrideCols),
     fNLocalViewPixels(convLayer.fNLocalViewPixels),
     fNLocalViews(convLayer.fNLocalViews),
     fDropoutProbability(convLayer.fDropoutProbability),
     fPaddingHeight(convLayer.fPaddingHeight),
     fPaddingWidth(convLayer.fPaddingWidth),
     fInputActivation(convLayer.GetInputActivation().GetShape()),
     fF(convLayer.fF),
     fReg(convLayer.fReg),
     fWeightDecay(convLayer.fWeightDecay),
     fForwardTensor(convLayer.GetForwardMatrices().GetShape())
{
   InitializeDescriptors();
   InitializeWorkspace();
}


//______________________________________________________________________________

//FIXME: Add function for cudaFree

/// Destructor. For each of the two handles that is non-null, lets the
/// architecture release what it holds and then deletes the object itself:
/// first the descriptors, then the workspace.
template <typename Architecture_t>
TConvLayer<Architecture_t>::~TConvLayer()
{
   if (fDescriptors != nullptr) {
      ReleaseDescriptors();
      delete fDescriptors;
   }

   if (fWorkspace != nullptr) {
      FreeWorkspace();
      delete fWorkspace;
   }
}


//______________________________________________________________________________

/// Forward pass. Packs the layer geometry into a TConvParams and hands it,
/// together with the output tensor, the pre-activation tensor, the input, the
/// first weight and bias matrices, the activation function, the forward cache
/// tensor, the descriptors and the workspace, to
/// Architecture_t::ConvLayerForward. The dropout flag is ignored here.
template <typename Architecture_t>
void TConvLayer<Architecture_t>::Forward(Tensor_t &input, bool /*applyDropout*/)
{
   // Concrete descriptor / workspace types that the architecture call expects.
   using ConvDescriptors_t = TCNNDescriptors<TConvLayer<Architecture_t>>;
   using ConvWorkspace_t = TCNNWorkspace<TConvLayer<Architecture_t>>;

   TConvParams params(this->GetBatchSize(), this->GetInputDepth(), this->GetInputHeight(),
                      this->GetInputWidth(), this->GetDepth(), fFilterHeight, fFilterWidth, fStrideRows,
                      fStrideCols, fPaddingHeight, fPaddingWidth);

   Architecture_t::ConvLayerForward(this->GetOutput(), fInputActivation, input, this->GetWeightsAt(0),
                                    this->GetBiasesAt(0), params, this->GetActivationFunction(),
                                    fForwardTensor,
                                    static_cast<ConvDescriptors_t &>(*fDescriptors),
                                    static_cast<ConvWorkspace_t &>(*fWorkspace));
}


//______________________________________________________________________________

/// Backward pass. Delegates the gradient computation to
/// Architecture_t::ConvLayerBackward and afterwards adds the regularization
/// term to the gradients of the first weight matrix through
/// addRegularizationGradients.
template <typename Architecture_t>
void TConvLayer<Architecture_t>::Backward(Tensor_t &gradients_backward, const Tensor_t &activations_backward)
{
   // Concrete descriptor / workspace types that the architecture call expects.
   using ConvDescriptors_t = TCNNDescriptors<TConvLayer<Architecture_t>>;
   using ConvWorkspace_t = TCNNWorkspace<TConvLayer<Architecture_t>>;

   Architecture_t::ConvLayerBackward(gradients_backward,
                                     this->GetWeightGradientsAt(0),
                                     this->GetBiasGradientsAt(0),
                                     this->GetInputActivation(),
                                     this->GetActivationGradients(),
                                     this->GetWeightsAt(0),
                                     activations_backward,
                                     this->GetOutput(),
                                     this->GetActivationFunction(),
                                     static_cast<ConvDescriptors_t &>(*fDescriptors),
                                     static_cast<ConvWorkspace_t &>(*fWorkspace),
                                     this->GetBatchSize(),
                                     this->GetInputHeight(),
                                     this->GetInputWidth(),
                                     this->GetDepth(),
                                     this->GetHeight(),
                                     this->GetWidth(),
                                     this->GetFilterDepth(),
                                     this->GetFilterHeight(),
                                     this->GetFilterWidth(),
                                     this->GetNLocalViews());

   addRegularizationGradients<Architecture_t>(this->GetWeightGradientsAt(0), this->GetWeightsAt(0),
                                              this->GetWeightDecay(), this->GetRegularization());
}


//______________________________________________________________________________

/// Prints a one-line summary of the layer to std::cout: output width, height
/// and depth, filter width and height, the shape of the output tensor (only
/// when that tensor is non-empty) and the name of the activation function.
///
/// The activation name is looked up in a fixed table indexed by the numeric
/// value of the activation enum. A value that has no entry in the table is
/// printed as "Unknown(<value>)" instead of reading past the end of the table.
template <typename Architecture_t>
auto TConvLayer<Architecture_t>::Print() const -> void
{
   std::cout << " CONV LAYER: \t";
   std::cout << "( W = " << this->GetWidth() << " , ";
   std::cout << " H = " << this->GetHeight() << " , ";
   std::cout << " D = " << this->GetDepth() << " ) ";

   std::cout << "\t Filter ( W = " << this->GetFilterWidth() << " , ";
   std::cout << " H = " << this->GetFilterHeight() << " ) ";

   if (this->GetOutput().GetSize() > 0) {
      std::cout << "\tOutput = ( " << this->GetOutput().GetFirstSize() << " , "
                << this->GetOutput().GetCSize() << " , " << this->GetOutput().GetHSize() << " , "
                << this->GetOutput().GetWSize() << " ) ";
   }

   // Names in the order of the numeric values of the activation enum.
   const char *const activationNames[] = {"Identity", "Relu", "Sigmoid", "Tanh", "SymmRelu", "SoftSign", "Gauss"};
   const size_t nActivationNames = sizeof(activationNames) / sizeof(activationNames[0]);

   // A negative enum value converts to a huge size_t and therefore also fails the range check.
   const size_t activationIndex = static_cast<size_t>(fF);

   std::cout << "\t Activation Function = ";
   if (activationIndex < nActivationNames) {
      std::cout << activationNames[activationIndex] << std::endl;
   } else {
      std::cout << "Unknown(" << static_cast<int>(fF) << ")" << std::endl;
   }
}


//______________________________________________________________________________

/// Serialises the layer into a new "ConvLayer" child of the given XML node.
/// Written attributes, in this order: Depth, FilterHeight, FilterWidth,
/// StrideRows, StrideCols, PaddingHeight, PaddingWidth, ActivationFunction
/// (numeric value of the enum, base 10). The first weight matrix and the
/// first bias matrix follow as "Weights" and "Biases".
template <typename Architecture_t>
void TConvLayer<Architecture_t>::AddWeightsXMLTo(void *parent)
{
   auto layerxml = gTools().xmlengine().NewChild(parent, nullptr, "ConvLayer");

   // Adds one size-valued attribute to the layer node.
   auto addSizeAttr = [layerxml](const char *attrName, size_t attrValue) {
      gTools().xmlengine().NewAttr(layerxml, nullptr, attrName, gTools().StringFromInt(attrValue));
   };

   addSizeAttr("Depth", this->GetDepth());
   addSizeAttr("FilterHeight", this->GetFilterHeight());
   addSizeAttr("FilterWidth", this->GetFilterWidth());
   addSizeAttr("StrideRows", this->GetStrideRows());
   addSizeAttr("StrideCols", this->GetStrideCols());
   addSizeAttr("PaddingHeight", this->GetPaddingHeight());
   addSizeAttr("PaddingWidth", this->GetPaddingWidth());

   const int activationFunction = static_cast<int>(this->GetActivationFunction());
   gTools().xmlengine().NewAttr(layerxml, nullptr, "ActivationFunction", TString::Itoa(activationFunction, 10));

   // Weight and bias matrices.
   this->WriteMatrixToXML(layerxml, "Weights", this->GetWeightsAt(0));
   this->WriteMatrixToXML(layerxml, "Biases", this->GetBiasesAt(0));
}


//______________________________________________________________________________

/// Fills the first weight matrix and the first bias matrix from the "Weights"
/// and "Biases" entries of the given XML node. Only the matrices are read
/// here: the layer's meta information is needed to construct the layer in the
/// first place and is therefore read before this function is called.
template <typename Architecture_t>
void TConvLayer<Architecture_t>::ReadWeightsFromXML(void *parent)
{
   Matrix_t &weights = this->GetWeightsAt(0);
   this->ReadMatrixXML(parent, "Weights", weights);

   Matrix_t &biases = this->GetBiasesAt(0);
   this->ReadMatrixXML(parent, "Biases", biases);
}


/// Computes the output extent of the convolution along one dimension:
///
///    (imgDim + 2 * padding - fltDim) / stride + 1
///
/// \param imgDim  extent of the input along this dimension
/// \param fltDim  extent of the filter along this dimension
/// \param padding number of zero layers added on each side of the input
/// \param stride  step of the filter along this dimension
/// \return the output extent
///
/// Fatal() is called when the hyper-parameters are incompatible: the stride
/// is zero, the filter is larger than the padded input, or the stride does
/// not evenly divide the distance the filter can travel. All arguments are
/// unsigned, so these conditions are tested explicitly before any subtraction
/// or division is carried out; otherwise the subtraction would wrap around
/// and a zero stride would divide by zero.
template <typename Architecture_t>
size_t TConvLayer<Architecture_t>::calculateDimension(size_t imgDim, size_t fltDim, size_t padding, size_t stride)
{
   const size_t paddedDim = imgDim + 2 * padding;
   const bool notComputable = (stride == 0) || (fltDim > paddedDim);

   if (notComputable || (paddedDim - fltDim) % stride != 0) {
      Fatal("calculateDimension", "Not compatible hyper parameters for layer - (imageDim, filterDim, padding, stride) "
            "%zu, %zu, %zu, %zu", imgDim, fltDim, padding, stride);
      // Fatal() is expected to abort. Should it ever return, do not fall
      // through to an unsigned wrap-around or a division by zero.
      if (notComputable) {
         return 0;
      }
   }

   return (paddedDim - fltDim) / stride + 1;
}


/// Computes the number of receptive fields (local views) in one image: the
/// output height times the output width, each obtained from
/// calculateDimension() with the parameters of the respective dimension.
///
/// The arithmetic stays in size_t throughout, so the values returned by
/// calculateDimension() are neither narrowed to int nor multiplied as signed
/// integers.
template <typename Architecture_t>
size_t TConvLayer<Architecture_t>::calculateNLocalViews(size_t inputHeight, size_t filterHeight, size_t paddingHeight,
                                                        size_t strideRows, size_t inputWidth, size_t filterWidth,
                                                        size_t paddingWidth, size_t strideCols)
{
   const size_t height = calculateDimension(inputHeight, filterHeight, paddingHeight, strideRows);
   const size_t width = calculateDimension(inputWidth, filterWidth, paddingWidth, strideCols);

   return height * width;
}


//______________________________________________________________________________

/// Lets the architecture set up the descriptors of this layer: forwards
/// fDescriptors and this layer to Architecture_t::InitializeConvDescriptors.
template <typename Architecture_t>
void TConvLayer<Architecture_t>::InitializeDescriptors()
{
   Architecture_t::InitializeConvDescriptors(fDescriptors, this);
}


/// Lets the architecture release the descriptors of this layer: forwards
/// fDescriptors to Architecture_t::ReleaseConvDescriptors. The fDescriptors
/// object itself is deleted by the destructor, not here.
template <typename Architecture_t>
void TConvLayer<Architecture_t>::ReleaseDescriptors()
{
   Architecture_t::ReleaseConvDescriptors(fDescriptors);
}


//______________________________________________________________________________

/// Lets the architecture set up the workspace of this layer. The layer
/// geometry is packed into a TConvParams and passed, together with
/// fWorkspace, fDescriptors and this layer, to
/// Architecture_t::InitializeConvWorkspace.
template <typename Architecture_t>
void TConvLayer<Architecture_t>::InitializeWorkspace()
{
   TConvParams params(this->GetBatchSize(), this->GetInputDepth(), this->GetInputHeight(),
                      this->GetInputWidth(), this->GetDepth(), fFilterHeight, fFilterWidth, fStrideRows,
                      fStrideCols, fPaddingHeight, fPaddingWidth);

   Architecture_t::InitializeConvWorkspace(fWorkspace, fDescriptors, params, this);
}


/// Lets the architecture free the workspace of this layer: forwards
/// fWorkspace to Architecture_t::FreeConvWorkspace. The fWorkspace object
/// itself is deleted by the destructor, not here.
template <typename Architecture_t>
void TConvLayer<Architecture_t>::FreeWorkspace()
{
   Architecture_t::FreeConvWorkspace(fWorkspace);
}


//______________________________________________________________________________


} // namespace CNN

} // namespace DNN

} // namespace TMVA


#endif

ContextHandles.h

GeneralLayer.h

f
#define f(i)
Definition RSha256.hxx:104

Fatal
void Fatal(const char *location, const char *msgfmt,...)
Use this function in case of a fatal error. It will abort the program.
Definition TError.cxx:267

TMatrix.h

TMVA::DNN::CNN::TConvLayer::Print
void Print() const override
Prints the info about the layer.
Definition ConvLayer.h:347

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fNLocalViews
size_t fNLocalViews
Definition ConvLayer.h:112

TMVA::DNN::CNN::TConvLayer::calculateNLocalViews
static size_t calculateNLocalViews(size_t inputHeight, size_t filterHeight, size_t paddingHeight, size_t strideRows, size_t inputWidth, size_t filterWidth, size_t paddingWidth, size_t strideCols)
Definition ConvLayer.h:413

TMVA::DNN::CNN::TConvLayer::GetForwardMatrices
const Tensor_t & GetForwardMatrices() const
Definition ConvLayer.h:201

TMVA::DNN::CNN::TConvLayer::GetNLocalViewPixels
size_t GetNLocalViewPixels() const
Definition ConvLayer.h:190

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fInputActivation
Tensor_t fInputActivation
Definition ConvLayer.h:123

TMVA::DNN::CNN::TConvLayer::GetDescriptors
const TDescriptors * GetDescriptors() const
Definition ConvLayer.h:210

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::HelperDescriptor_t
typename TCpu< AReal >::ActivationDescriptor_t HelperDescriptor_t
Definition ConvLayer.h:83

TMVA::DNN::CNN::TConvLayer::GetStrideRows
size_t GetStrideRows() const
Definition ConvLayer.h:184

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::Tensor_t
typename TCpu< AReal >::Tensor_t Tensor_t
Definition ConvLayer.h:77

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fPaddingWidth
size_t fPaddingWidth
Definition ConvLayer.h:121

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fWorkspace
TWorkspace * fWorkspace
Definition ConvLayer.h:118

TMVA::DNN::CNN::TConvLayer::GetWeightDecay
Scalar_t GetWeightDecay() const
Definition ConvLayer.h:206

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fWeightDecay
Scalar_t fWeightDecay
Definition ConvLayer.h:129

TMVA::DNN::CNN::TConvLayer::GetInputActivation
Tensor_t & GetInputActivation()
Definition ConvLayer.h:196

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fFilterWidth
size_t fFilterWidth
Definition ConvLayer.h:106

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fBackwardIndices
std::vector< int > fBackwardIndices
Definition ConvLayer.h:125

TMVA::DNN::CNN::TConvLayer::GetFilterWidth
size_t GetFilterWidth() const
Definition ConvLayer.h:182

TMVA::DNN::CNN::TConvLayer::TConvLayer
TConvLayer(size_t BatchSize, size_t InputDepth, size_t InputHeight, size_t InputWidth, size_t Depth, EInitialization Init, size_t FilterHeight, size_t FilterWidth, size_t StrideRows, size_t StrideCols, size_t PaddingHeight, size_t PaddingWidth, Scalar_t DropoutProbability, EActivationFunction f, ERegularization Reg, Scalar_t WeightDecay)
Constructor.
Definition ConvLayer.h:222

TMVA::DNN::CNN::TConvLayer::calculateDimension
static size_t calculateDimension(size_t imgDim, size_t fltDim, size_t padding, size_t stride)
Definition ConvLayer.h:402

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fForwardTensor
Tensor_t fForwardTensor
Definition ConvLayer.h:131

TMVA::DNN::CNN::TConvLayer::TConvLayer
TConvLayer(TConvLayer< Architecture_t > *layer)
Copy the conv layer provided as a pointer.
Definition ConvLayer.h:257

TMVA::DNN::CNN::TConvLayer::GetDescriptors
TDescriptors * GetDescriptors()
Definition ConvLayer.h:209

TMVA::DNN::CNN::TConvLayer::TConvLayer
TConvLayer(const TConvLayer &)
Copy constructor.
Definition ConvLayer.h:276

TMVA::DNN::CNN::TConvLayer::ReleaseDescriptors
void ReleaseDescriptors()
Definition ConvLayer.h:430

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::LayerDescriptor_t
typename TCpu< AReal >::ConvolutionDescriptor_t LayerDescriptor_t
Definition ConvLayer.h:81

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fFilterDepth
size_t fFilterDepth
Definition ConvLayer.h:104

TMVA::DNN::CNN::TConvLayer::Forward
void Forward(Tensor_t &input, bool applyDropout=false) override
Computes activation of the layer for the given input.
Definition ConvLayer.h:311

TMVA::DNN::CNN::TConvLayer::GetPaddingWidth
size_t GetPaddingWidth() const
Definition ConvLayer.h:188

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fNLocalViewPixels
size_t fNLocalViewPixels
Definition ConvLayer.h:111

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::AlgorithmForward_t
typename TCpu< AReal >::AlgorithmForward_t AlgorithmForward_t
Definition ConvLayer.h:85

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fDropoutProbability
Scalar_t fDropoutProbability
Definition ConvLayer.h:114

TMVA::DNN::CNN::TConvLayer::calculateNLocalViewPixels
static size_t calculateNLocalViewPixels(size_t depth, size_t height, size_t width)
Definition ConvLayer.h:97

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fStrideCols
size_t fStrideCols
Definition ConvLayer.h:109

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::AlgorithmDataType_t
typename TCpu< AReal >::AlgorithmDataType_t AlgorithmDataType_t
Definition ConvLayer.h:91

TMVA::DNN::CNN::TConvLayer::~TConvLayer
virtual ~TConvLayer()
Destructor.
Definition ConvLayer.h:294

TMVA::DNN::CNN::TConvLayer::GetForwardMatrices
Tensor_t & GetForwardMatrices()
Definition ConvLayer.h:202

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::AlgorithmBackward_t
typename TCpu< AReal >::AlgorithmBackward_t AlgorithmBackward_t
Definition ConvLayer.h:86

TMVA::DNN::CNN::TConvLayer::FreeWorkspace
void FreeWorkspace()
Definition ConvLayer.h:445

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fStrideRows
size_t fStrideRows
Definition ConvLayer.h:108

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fReg
ERegularization fReg
Definition ConvLayer.h:128

TMVA::DNN::CNN::TConvLayer::GetWorkspace
const TWorkspace * GetWorkspace() const
Definition ConvLayer.h:213

TMVA::DNN::CNN::TConvLayer::GetInputActivationAt
const Matrix_t & GetInputActivationAt(size_t i) const
Definition ConvLayer.h:199

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::Matrix_t
typename TCpu< AReal >::Matrix_t Matrix_t
Definition ConvLayer.h:78

TMVA::DNN::CNN::TConvLayer::GetActivationFunction
EActivationFunction GetActivationFunction() const
Definition ConvLayer.h:204

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fDescriptors
TDescriptors * fDescriptors
Definition ConvLayer.h:116

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fPaddingHeight
size_t fPaddingHeight
Definition ConvLayer.h:120

TMVA::DNN::CNN::TConvLayer::GetInputActivationAt
Matrix_t & GetInputActivationAt(size_t i)
Definition ConvLayer.h:198

TMVA::DNN::CNN::TConvLayer::GetWorkspace
TWorkspace * GetWorkspace()
Definition ConvLayer.h:212

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fFilterHeight
size_t fFilterHeight
Definition ConvLayer.h:105

TMVA::DNN::CNN::TConvLayer::GetStrideCols
size_t GetStrideCols() const
Definition ConvLayer.h:185

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::WeightsDescriptor_t
typename TCpu< AReal >::FilterDescriptor_t WeightsDescriptor_t
Definition ConvLayer.h:82

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::fF
EActivationFunction fF
Definition ConvLayer.h:127

TMVA::DNN::CNN::TConvLayer::GetFilterDepth
size_t GetFilterDepth() const
Getters.
Definition ConvLayer.h:180

TMVA::DNN::CNN::TConvLayer::GetPaddingHeight
size_t GetPaddingHeight() const
Definition ConvLayer.h:187

TMVA::DNN::CNN::TConvLayer::GetFilterHeight
size_t GetFilterHeight() const
Definition ConvLayer.h:181

TMVA::DNN::CNN::TConvLayer::GetInputActivation
const Tensor_t & GetInputActivation() const
Definition ConvLayer.h:195

TMVA::DNN::CNN::TConvLayer::Backward
void Backward(Tensor_t &gradients_backward, const Tensor_t &activations_backward) override
Compute weight, bias and activation gradients.
Definition ConvLayer.h:326

TMVA::DNN::CNN::TConvLayer::InitializeWorkspace
void InitializeWorkspace()
Definition ConvLayer.h:436

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::ReduceTensorDescriptor_t
typename TCpu< AReal >::ReduceTensorDescriptor_t ReduceTensorDescriptor_t
Definition ConvLayer.h:88

TMVA::DNN::CNN::TConvLayer::GetNLocalViews
size_t GetNLocalViews() const
Definition ConvLayer.h:191

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::AlgorithmHelper_t
typename TCpu< AReal >::AlgorithmHelper_t AlgorithmHelper_t
Definition ConvLayer.h:87

TMVA::DNN::CNN::TConvLayer::GetDropoutProbability
Scalar_t GetDropoutProbability() const
Definition ConvLayer.h:193

TMVA::DNN::CNN::TConvLayer< TCpu< AReal > >::Scalar_t
typename TCpu< AReal >::Scalar_t Scalar_t
Definition ConvLayer.h:79

TMVA::DNN::CNN::TConvLayer::AddWeightsXMLTo
void AddWeightsXMLTo(void *parent) override
Writes the information and the weights about the layer in an XML node.
Definition ConvLayer.h:369

TMVA::DNN::CNN::TConvLayer::GetRegularization
ERegularization GetRegularization() const
Definition ConvLayer.h:205

TMVA::DNN::CNN::TConvLayer::InitializeDescriptors
void InitializeDescriptors()
Definition ConvLayer.h:425

TMVA::DNN::CNN::TConvLayer::ReadWeightsFromXML
void ReadWeightsFromXML(void *parent) override
Read the information and the weights about the layer from XML node.
Definition ConvLayer.h:393

TMVA::DNN::VGeneralLayer::GetWeightsAt
const Matrix_t & GetWeightsAt(size_t i) const
Definition GeneralLayer.h:175

TMVA::DNN::VGeneralLayer::GetDepth
size_t GetDepth() const
Definition GeneralLayer.h:167

TMVA::DNN::VGeneralLayer::GetOutput
const Tensor_t & GetOutput() const
Definition GeneralLayer.h:196

TMVA::DNN::VGeneralLayer::GetInputDepth
size_t GetInputDepth() const
Definition GeneralLayer.h:164

TMVA::DNN::VGeneralLayer::WriteMatrixToXML
void WriteMatrixToXML(void *node, const char *name, const Matrix_t &matrix)
Definition GeneralLayer.h:521

TMVA::DNN::VGeneralLayer::GetActivationGradients
const Tensor_t & GetActivationGradients() const
Definition GeneralLayer.h:199

TMVA::DNN::VGeneralLayer::GetBiasesAt
const Matrix_t & GetBiasesAt(size_t i) const
Definition GeneralLayer.h:181

TMVA::DNN::VGeneralLayer::GetInputHeight
size_t GetInputHeight() const
Definition GeneralLayer.h:165

TMVA::DNN::VGeneralLayer::GetBiasGradientsAt
const Matrix_t & GetBiasGradientsAt(size_t i) const
Definition GeneralLayer.h:193

TMVA::DNN::VGeneralLayer::GetBatchSize
size_t GetBatchSize() const
Getters.
Definition GeneralLayer.h:163

TMVA::DNN::VGeneralLayer::ReadMatrixXML
void ReadMatrixXML(void *node, const char *name, Matrix_t &matrix)
Definition GeneralLayer.h:544

TMVA::DNN::VGeneralLayer::GetWidth
size_t GetWidth() const
Definition GeneralLayer.h:169

TMVA::DNN::VGeneralLayer::GetHeight
size_t GetHeight() const
Definition GeneralLayer.h:168

TMVA::DNN::VGeneralLayer::GetWeightGradientsAt
const Matrix_t & GetWeightGradientsAt(size_t i) const
Definition GeneralLayer.h:187

TMVA::DNN::VGeneralLayer::VGeneralLayer
VGeneralLayer(size_t BatchSize, size_t InputDepth, size_t InputHeight, size_t InputWidth, size_t Depth, size_t Height, size_t Width, size_t WeightsNSlices, size_t WeightsNRows, size_t WeightsNCols, size_t BiasesNSlices, size_t BiasesNRows, size_t BiasesNCols, size_t OutputNSlices, size_t OutputNRows, size_t OutputNCols, EInitialization Init)
Constructor.
Definition GeneralLayer.h:239

TMVA::DNN::VGeneralLayer::GetInputWidth
size_t GetInputWidth() const
Definition GeneralLayer.h:166

TMVA::Tools::xmlengine
TXMLEngine & xmlengine()
Definition Tools.h:262

TString::Itoa
static TString Itoa(Int_t value, Int_t base)
Converts an Int_t to a TString with respect to the base specified (2-36).
Definition TString.cxx:2098

TXMLEngine::NewChild
XMLNodePointer_t NewChild(XMLNodePointer_t parent, XMLNsPointer_t ns, const char *name, const char *content=nullptr)
create new child element for parent node
Definition TXMLEngine.cxx:725

TXMLEngine::NewAttr
XMLAttrPointer_t NewAttr(XMLNodePointer_t xmlnode, XMLNsPointer_t, const char *name, const char *value)
creates new attribute for xmlnode, namespaces are not supported for attributes
Definition TXMLEngine.cxx:596

TMVA::DNN::CNN
Definition ContextHandles.h:43

TMVA::DNN
Definition Adadelta.h:36

TMVA::DNN::EInitialization
EInitialization
Definition Functions.h:72

TMVA::DNN::addRegularizationGradients
void addRegularizationGradients(typename Architecture_t::Matrix_t &A, const typename Architecture_t::Matrix_t &W, typename Architecture_t::Scalar_t weightDecay, ERegularization R)
Add the regularization gradient corresponding to weight matrix W, to the matrix A.
Definition Functions.h:258

TMVA::DNN::weightDecay
double weightDecay(double error, ItWeight itWeight, ItWeight itWeightEnd, double factorWeightDecay, EnumRegularization eRegularization)
compute the weight decay for regularization (L1 or L2)
Definition NeuralNet.icc:498

TMVA::DNN::ERegularization
ERegularization
Enum representing the regularization type applied for a given layer.
Definition Functions.h:65

TMVA::DNN::EActivationFunction
EActivationFunction
Enum that represents layer activation functions.
Definition Functions.h:32

TMVA
create variable transformations
Definition GeneticMinimizer.h:22

TMVA::gTools
Tools & gTools()

TMVA::DNN::CNN::TCNNDescriptors
Definition ContextHandles.h:51

TMVA::DNN::CNN::TCNNWorkspace
Definition ContextHandles.h:62

TMVA::DNN::CNN::TConvParams
Definition ConvLayer.h:44

TMVA::DNN::CNN::TConvParams::strideRows
size_t strideRows
The number of row pixels to slide the filter each step.
Definition ConvLayer.h:57

TMVA::DNN::CNN::TConvParams::filterHeight
size_t filterHeight
The height of the filter.
Definition ConvLayer.h:54

TMVA::DNN::CNN::TConvParams::inputHeight
size_t inputHeight
The height of the previous layer or input.
Definition ConvLayer.h:50

TMVA::DNN::CNN::TConvParams::batchSize
size_t batchSize
Batch size used for training and evaluation.
Definition ConvLayer.h:47

TMVA::DNN::CNN::TConvParams::paddingWidth
size_t paddingWidth
The number of zero layers added left and right of the input.
Definition ConvLayer.h:60

TMVA::DNN::CNN::TConvParams::filterWidth
size_t filterWidth
The width of the filter.
Definition ConvLayer.h:55

TMVA::DNN::CNN::TConvParams::paddingHeight
size_t paddingHeight
The number of zero layers added top and bottom of the input.
Definition ConvLayer.h:59

TMVA::DNN::CNN::TConvParams::inputWidth
size_t inputWidth
The width of the previous layer or input.
Definition ConvLayer.h:51

TMVA::DNN::CNN::TConvParams::TConvParams
TConvParams(size_t _batchSize, size_t _inputDepth, size_t _inputHeight, size_t _inputWidth, size_t _numberFilters, size_t _filterHeight, size_t _filterWidth, size_t _strideRows, size_t _strideCols, size_t _paddingHeight, size_t _paddingWidth)
Definition ConvLayer.h:62

TMVA::DNN::CNN::TConvParams::numberFilters
size_t numberFilters
The number of the filters, which is equal to the output's depth.
Definition ConvLayer.h:53

TMVA::DNN::CNN::TConvParams::inputDepth
size_t inputDepth
The depth of the previous layer or input.
Definition ConvLayer.h:49

TMVA::DNN::CNN::TConvParams::strideCols
size_t strideCols
The number of column pixels to slide the filter each step.
Definition ConvLayer.h:58

TMVA::DNN::TDescriptors
Definition ContextHandles.h:29

TMVA::DNN::TWorkspace
Definition ContextHandles.h:32

Functions.h