template<typename Architecture_t>
class TLayer
{
public:
   using Scalar_t = typename Architecture_t::Scalar_t;
   using Matrix_t = typename Architecture_t::Matrix_t;
   using Tensor_t = typename Architecture_t::Tensor_t;

   // ... constructors and accessors; see the member reference below ...

   void Backward(Matrix_t & gradients_backward,
                 const Matrix_t & activations_backward,
                 ERegularization r,
                 Scalar_t weightDecay);
};

template<typename Architecture_t>
class TSharedLayer
{
public:
   using Scalar_t = typename Architecture_t::Scalar_t;
   using Matrix_t = typename Architecture_t::Matrix_t;
   using Tensor_t = typename Architecture_t::Tensor_t;

   // ... constructors and accessors; see the member reference below ...

   void Backward(Matrix_t & gradients_backward,
                 const Matrix_t & activations_backward,
                 ERegularization r,
                 Scalar_t weightDecay);
};

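Both classes are parametrized by a low-level architecture backend. The following compile-only sketch, inferred from the calls made in this header, shows the interface such a backend is expected to expose; the struct name and its toy Matrix_t are illustrative assumptions, not an actual ROOT backend.

#include <cstddef>
#include <vector>

struct SketchBackend {
   using Scalar_t = double;
   struct Matrix_t {
      std::size_t fNRows = 0, fNCols = 0;
      std::vector<Scalar_t> fData;
      Matrix_t(std::size_t rows, std::size_t cols)
         : fNRows(rows), fNCols(cols), fData(rows * cols) {}
      std::size_t GetNrows() const { return fNRows; }
   };
   using Tensor_t = Matrix_t;   // toy: rank-2 tensors only

   // Kernels this header calls on the backend:
   static void MultiplyTranspose(Matrix_t &output, const Matrix_t &input,
                                 const Matrix_t &weights);
   static void AddRowWise(Matrix_t &output, const Matrix_t &biases);
   static void DropoutForward(Matrix_t &input, Scalar_t p);
   static void Hadamard(Tensor_t &A, const Tensor_t &B);
   static void Backward(Tensor_t &gradientsBackward, Matrix_t &weightGradients,
                        Matrix_t &biasGradients, const Tensor_t &df,
                        const Tensor_t &activationGradients, const Matrix_t &weights,
                        const Tensor_t &activationsBackward);
   static void Copy(Matrix_t &dst, const Matrix_t &src);
};
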
template<typename Architecture_t>
TLayer<Architecture_t>::TLayer(size_t batchSize,
                               size_t inputWidth,
                               size_t width,
                               EActivationFunction f,
                               Scalar_t dropoutProbability)
   : fBatchSize(batchSize), fInputWidth(inputWidth), fWidth(width),
     fDropoutProbability(dropoutProbability), fWeights(width, fInputWidth),
     fBiases(width, 1), fOutput(fBatchSize, width), fDerivatives(fBatchSize, width),
     fWeightGradients(width, fInputWidth), fBiasGradients(width, 1),
     fActivationGradients(fBatchSize, width), fF(f)
{
   // Nothing to do here.
}

template<typename Architecture_t>
TLayer<Architecture_t>::TLayer(const TLayer &layer)
   : fBatchSize(layer.fBatchSize), fInputWidth(layer.fInputWidth),
     fWidth(layer.fWidth), fDropoutProbability(layer.fDropoutProbability),
     fWeights(layer.fWidth, layer.fInputWidth), fBiases(layer.fWidth, 1),
     fOutput(layer.fBatchSize, layer.fWidth),
     fDerivatives(layer.fBatchSize, layer.fWidth),
     fWeightGradients(layer.fWidth, layer.fInputWidth),
     fBiasGradients(layer.fWidth, 1),
     fActivationGradients(layer.fBatchSize, layer.fWidth),
     fF(layer.fF)
{
   // Deep-copy the parameter values of the other layer.
   Architecture_t::Copy(fWeights, layer.GetWeights());
   Architecture_t::Copy(fBiases, layer.GetBiases());
}

template<typename Architecture_t>
void TLayer<Architecture_t>::Initialize(EInitialization m)
{
   initialize<Architecture_t>(fWeights, m);
   initialize<Architecture_t>(fBiases, EInitialization::kZero);
}

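For illustration, a self-contained toy version of Gaussian weight initialization, independent of the real initialize<Architecture_t> helper; the 1/sqrt(fan-in) scaling is an assumption here, not necessarily what a given EInitialization mode does.

#include <cmath>
#include <cstddef>
#include <random>
#include <vector>

// Fill a flat weight buffer with N(0, 1/sqrt(inputWidth)) draws.
void gaussInitSketch(std::vector<double> &weights, std::size_t inputWidth)
{
   std::mt19937 gen{std::random_device{}()};
   std::normal_distribution<double> dist(0.0, 1.0 / std::sqrt(double(inputWidth)));
   for (auto &w : weights)
      w = dist(gen);
}
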
template<typename Architecture_t>
inline void TLayer<Architecture_t>::Forward(Matrix_t & input, bool applyDropout)
{
   if (applyDropout && (fDropoutProbability != 1.0)) {
      Architecture_t::DropoutForward(input, fDropoutProbability);
   }
   Architecture_t::MultiplyTranspose(fOutput, input, fWeights);
   Architecture_t::AddRowWise(fOutput, fBiases);
   Tensor_t tOutput(fOutput);
   Tensor_t tDerivatives(fDerivatives);
   evaluateDerivative<Architecture_t>(tDerivatives, fF, tOutput);
   evaluate<Architecture_t>(tOutput, fF);
}

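Independent of the backend, the computation Forward performs is output = f(input * W^T + b), with the bias broadcast across the rows of the batch. A minimal self-contained sketch with plain std::vector, assuming tanh as the activation (fF selects the actual function) and omitting dropout; note that fDropoutProbability is the probability that an input stays active.

#include <cmath>
#include <cstddef>
#include <vector>

// input: batchSize x inputWidth, weights: width x inputWidth, biases: width.
// Returns the activated output, batchSize x width.
std::vector<std::vector<double>>
forwardSketch(const std::vector<std::vector<double>> &input,
              const std::vector<std::vector<double>> &weights,
              const std::vector<double> &biases)
{
   std::vector<std::vector<double>> output(input.size(),
                                           std::vector<double>(weights.size()));
   for (std::size_t i = 0; i < input.size(); i++) {
      for (std::size_t j = 0; j < weights.size(); j++) {
         double z = biases[j];                        // AddRowWise
         for (std::size_t k = 0; k < input[i].size(); k++)
            z += input[i][k] * weights[j][k];         // MultiplyTranspose
         output[i][j] = std::tanh(z);                 // evaluate(tOutput, fF)
      }
   }
   return output;
}
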
template<typename Architecture_t>
inline void TLayer<Architecture_t>::Backward(Matrix_t & gradients_backward,
                                             const Matrix_t & activations_backward,
                                             ERegularization r,
                                             Scalar_t weightDecay)
{
   Tensor_t tGradBw(gradients_backward);
   Tensor_t tActBw(activations_backward);
   Tensor_t tActGrad(fActivationGradients);
   Tensor_t tDeriv(fDerivatives);

   Architecture_t::Hadamard(tDeriv, tActGrad);
   Architecture_t::Backward(tGradBw, fWeightGradients, fBiasGradients,
                            tDeriv, tActGrad, fWeights, tActBw);
   addRegularizationGradients<Architecture_t>(fWeightGradients, fWeights,
                                              weightDecay, r);
}

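The heavy lifting is delegated to Architecture_t::Backward. For reference, a self-contained sketch of the standard fully connected backpropagation it implements, where df denotes the elementwise (Hadamard) product of the activation derivatives with the incoming activation gradients, as computed above: the weight gradients are df^T * activations_backward, the bias gradients are the column sums of df, and the gradients passed to the previous layer are df * W.

#include <cstddef>
#include <vector>

using Mat = std::vector<std::vector<double>>;

// df:      batchSize x width (activation derivatives x incoming gradients)
// actBw:   batchSize x inputWidth (activations of the previous layer)
// weights: width x inputWidth
void backwardSketch(const Mat &df, const Mat &actBw, const Mat &weights,
                    Mat &weightGrads,               // width x inputWidth
                    std::vector<double> &biasGrads, // width
                    Mat &gradsBw)                   // batchSize x inputWidth
{
   const std::size_t batch = df.size(), width = weights.size(),
                     inW = weights[0].size();
   for (std::size_t j = 0; j < width; j++) {
      biasGrads[j] = 0.0;
      for (std::size_t i = 0; i < batch; i++)
         biasGrads[j] += df[i][j];                        // column sums of df
      for (std::size_t k = 0; k < inW; k++) {
         weightGrads[j][k] = 0.0;
         for (std::size_t i = 0; i < batch; i++)
            weightGrads[j][k] += df[i][j] * actBw[i][k];  // df^T * actBw
      }
   }
   for (std::size_t i = 0; i < batch; i++)
      for (std::size_t k = 0; k < inW; k++) {
         gradsBw[i][k] = 0.0;
         for (std::size_t j = 0; j < width; j++)
            gradsBw[i][k] += df[i][j] * weights[j][k];    // df * W
      }
}
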
template<typename Architecture_t>
void TLayer<Architecture_t>::Print() const
{
   std::cout << "Width = " << fWeights.GetNrows();
   std::cout << ", Activation Function = ";
   std::cout << static_cast<int>(fF) << std::endl;
}

template<typename Architecture_t>
TSharedLayer<Architecture_t>::TSharedLayer(size_t BatchSize,
                                           TLayer<Architecture_t> &layer)
   : fBatchSize(BatchSize),
     fInputWidth(layer.GetInputWidth()), fWidth(layer.GetWidth()),
     fDropoutProbability(layer.GetDropoutProbability()),
     fWeights(layer.GetWeights()), fBiases(layer.GetBiases()),
     fOutput(fBatchSize, fWidth), fDerivatives(fBatchSize, fWidth),
     fWeightGradients(fWidth, fInputWidth), fBiasGradients(fWidth, 1),
     fActivationGradients(fBatchSize, fWidth), fF(layer.GetActivationFunction())
{
   // Nothing to do here.
}

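Since fWeights and fBiases are reference members, a TSharedLayer aliases the master layer's parameters rather than copying them, which is what makes it suitable for sharing one set of weights across worker threads. A usage sketch, assuming a ROOT build with the reference backend TMVA::DNN::TReference:

#include "TMVA/DNN/Architectures/Reference.h"
#include "TMVA/DNN/Layer.h"

using Arch_t = TMVA::DNN::TReference<double>;

void shareExample()
{
   TMVA::DNN::TLayer<Arch_t> master(/*BatchSize=*/32, /*InputWidth=*/10,
                                    /*Width=*/5,
                                    TMVA::DNN::EActivationFunction::kTanh,
                                    /*dropoutProbability=*/1.0);
   // The shared layer aliases master's weight and bias matrices through its
   // Matrix_t & members, so parameter updates on master are visible here.
   TMVA::DNN::TSharedLayer<Arch_t> worker(/*BatchSize=*/32, master);
}
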
template<typename Architecture_t>
TSharedLayer<Architecture_t>::TSharedLayer(const TSharedLayer &layer)
   : fBatchSize(layer.fBatchSize),
     fInputWidth(layer.GetInputWidth()), fWidth(layer.GetWidth()),
     fDropoutProbability(layer.fDropoutProbability), fWeights(layer.fWeights),
     fBiases(layer.fBiases), fOutput(layer.fBatchSize, fWidth),
     fDerivatives(layer.fBatchSize, fWidth), fWeightGradients(fWidth, fInputWidth),
     fBiasGradients(fWidth, 1), fActivationGradients(layer.fBatchSize, fWidth),
     fF(layer.fF)
{
   // Nothing to do here.
}

template<typename Architecture_t>
inline void TSharedLayer<Architecture_t>::Forward(Matrix_t & input, bool applyDropout)
{
   if (applyDropout && (fDropoutProbability != 1.0)) {
      Architecture_t::DropoutForward(input, fDropoutProbability);
   }
   Architecture_t::MultiplyTranspose(fOutput, input, fWeights);
   Architecture_t::AddRowWise(fOutput, fBiases);
   Tensor_t tOutput(fOutput);
   Tensor_t tDerivatives(fDerivatives);
   evaluateDerivative<Architecture_t>(tDerivatives, fF, tOutput);
   evaluate<Architecture_t>(tOutput, fF);
}

template<typename Architecture_t>
inline void TSharedLayer<Architecture_t>::Backward(Matrix_t & gradients_backward,
                                                   const Matrix_t & activations_backward,
                                                   ERegularization r,
                                                   Scalar_t weightDecay)
{
   Architecture_t::Backward(gradients_backward, fWeightGradients, fBiasGradients,
                            fDerivatives, fActivationGradients,
                            fWeights, activations_backward);
   addRegularizationGradients<Architecture_t>(fWeightGradients, fWeights,
                                              weightDecay, r);
}

template<typename Architecture_t>
void TSharedLayer<Architecture_t>::Print() const
{
   std::cout << "Width = " << fWeights.GetNrows();
   std::cout << ", Activation Function = ";
   std::cout << static_cast<int>(fF) << std::endl;
}

TLayer< Architecture_t > member reference:
void Backward(Matrix_t &gradients_backward, const Matrix_t &activations_backward, ERegularization r, Scalar_t weightDecay)
Compute weight, bias and activation gradients.
const Matrix_t & GetBiasGradients() const
void SetDropoutProbability(Scalar_t p)
const Matrix_t & GetActivationGradients() const
EActivationFunction fF
Activation function of the layer.
Matrix_t fActivationGradients
Gradients w.r.t. the activations of this layer.
TLayer(size_t BatchSize, size_t InputWidth, size_t Width, EActivationFunction f, Scalar_t dropoutProbability)
size_t fInputWidth
Number of neurons of the previous layer.
Matrix_t fBiasGradients
Gradients w.r.t. the bias values of this layer.
const Matrix_t & GetBiases() const
const Matrix_t & GetOutput() const
Matrix_t fOutput
Activations of this layer.
EActivationFunction GetActivationFunction() const
const Matrix_t & GetWeightGradients() const
size_t GetBatchSize() const
size_t GetInputWidth() const
Matrix_t & GetBiasGradients()
Scalar_t fDropoutProbability
Probability that an input is active.
Matrix_t fBiases
The bias values of this layer.
Matrix_t & GetActivationGradients()
size_t fWidth
Number of neurons of this layer.
typename Architecture_t::Matrix_t Matrix_t
typename Architecture_t::Scalar_t Scalar_t
Scalar_t GetDropoutProbability() const
typename Architecture_t::Tensor_t Tensor_t
Matrix_t fWeightGradients
Gradients w.r.t. the weights of this layer.
size_t fBatchSize
Batch size used for training and evaluation.
void Initialize(EInitialization m)
Initialize fWeights according to the given initialization method.
Matrix_t fWeights
The weights of this layer.
Matrix_t fDerivatives
First derivatives of the activations of this layer.
Matrix_t & GetWeightGradients()
const Matrix_t & GetWeights() const
void Forward(Matrix_t &input, bool applyDropout=false)
Compute activation of the layer for the given input.
TSharedLayer< Architecture_t > member reference (a layer whose weight and bias matrices are shared with another layer):
Matrix_t & fBiases
Reference to the bias vectors of this layer.
Matrix_t fOutput
Activations of this layer.
TSharedLayer(size_t BatchSize, TLayer< Architecture_t > &layer)
Matrix_t & fWeights
Reference to the weight matrix of this layer.
Matrix_t & GetActivationGradients()
const Matrix_t & GetBiasGradients() const
Matrix_t fBiasGradients
Gradients w.r.t. the bias values of this layer.
Matrix_t & GetWeightGradients()
typename Architecture_t::Tensor_t Tensor_t
Matrix_t fDerivatives
First derivatives of the activations of this layer.
const Matrix_t & GetBiases() const
typename Architecture_t::Matrix_t Matrix_t
size_t fInputWidth
Number of neurons of the previous layer.
size_t fWidth
Number of neurons of this layer.
const Matrix_t & GetWeightGradients() const
size_t fBatchSize
Batch size used for training and evaluation.
Matrix_t fWeightGradients
Gradients w.r.t. the weights of this layer.
EActivationFunction GetActivationFunction() const
Matrix_t fActivationGradients
Gradients w.r.t. the activations of this layer.
Scalar_t GetDropoutProbability() const
size_t GetInputWidth() const
size_t GetBatchSize() const
void Forward(Matrix_t &input, bool applyDropout=false)
Compute activation of the layer for the given input.
typename Architecture_t::Scalar_t Scalar_t
EActivationFunction fF
Activation function of the layer.
Scalar_t fDropoutProbability
Probability that an input is active.
Matrix_t & GetWeights() const
const Matrix_t & GetOutput() const
const Matrix_t & GetActivationGradients() const
Matrix_t & GetBiasGradients()
void SetDropoutProbability(Scalar_t p)
void Backward(Matrix_t &gradients_backward, const Matrix_t &activations_backward, ERegularization r, Scalar_t weightDecay)
Compute weight, bias and activation gradients.
Related free functions and enums:
double weightDecay(double error, ItWeight itWeight, ItWeight itWeightEnd, double factorWeightDecay, EnumRegularization eRegularization)
Compute the weight decay term for regularization (L1 or L2).
ERegularization
Enum representing the regularization type applied for a given layer.
EActivationFunction
Enum that represents layer activation functions.
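addRegularizationGradients, called at the end of both Backward implementations above, adds the derivative of the regularization term to the weight gradients. A self-contained sketch assuming the conventional L1/L2 derivatives; the enum is a stand-in for ERegularization, and the exact constant factors (e.g. the 2 on the L2 term) are implementation conventions.

#include <cstddef>
#include <vector>

// Stand-in for TMVA::DNN::ERegularization.
enum class RegSketch { kNone, kL1, kL2 };

void addRegGradientsSketch(std::vector<double> &weightGrads,
                           const std::vector<double> &weights,
                           double weightDecay, RegSketch r)
{
   for (std::size_t i = 0; i < weights.size(); i++) {
      if (r == RegSketch::kL1)        // d|w|/dw = sign(w)
         weightGrads[i] += weightDecay * (weights[i] >= 0.0 ? 1.0 : -1.0);
      else if (r == RegSketch::kL2)   // d(w*w)/dw = 2w
         weightGrads[i] += 2.0 * weightDecay * weights[i];
   }
}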