Layer.h (ROOT 6.16/01 Reference Guide)
// @(#)root/tmva/tmva/dnn:$Id$
// Author: Simon Pfreundschuh 20/06/16

/*************************************************************************
 * Copyright (C) 2016, Simon Pfreundschuh                                *
 * All rights reserved.                                                  *
 *                                                                       *
 * For the licensing terms see $ROOTSYS/LICENSE.                         *
 * For the list of contributors see $ROOTSYS/README/CREDITS.             *
 *************************************************************************/

//////////////////////////////////////////////////////////////////////
// Contains the TLayer and TSharedLayer classes, which represent    //
// layers in neural networks.                                       //
//////////////////////////////////////////////////////////////////////

#ifndef TMVA_DNN_LAYER
#define TMVA_DNN_LAYER

#include <iostream>

#include "TMatrix.h"
#include "Functions.h"

namespace TMVA
{
namespace DNN
{

//______________________________________________________________________________
//
// The Layer Class
//______________________________________________________________________________

/** \class TLayer

    Generic layer class.

    This generic layer class represents a layer of a neural network with
    a given width n and activation function f. The activation of the layer
    is computed as \f$\mathbf{u} = \mathbf{W}\mathbf{x} +
    \boldsymbol{\theta}\f$, to which the activation function \f$f\f$ is
    then applied elementwise.

    In addition to the weight and bias matrices, each layer allocates memory
    for its activations and the corresponding first partial derivatives of
    the activation function, as well as for the gradients of the weights and
    biases.

    The layer provides member functions for the forward propagation of
    activations through the given layer.
*/
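// A minimal usage sketch (editorial illustration, not part of the original
// file). It assumes the reference architecture TReference<double> from
// "TMVA/DNN/Architectures/Reference.h"; `batchSize`, `nInputs` and
// `nNeurons` are placeholder values.
//
//     using Architecture_t = TReference<double>;
//     using Matrix_t       = typename Architecture_t::Matrix_t;
//
//     size_t batchSize = 32, nInputs = 16, nNeurons = 8;
//     TLayer<Architecture_t> layer(batchSize, nInputs, nNeurons,
//                                  EActivationFunction::kTanh,
//                                  1.0);              // dropout disabled
//     layer.Initialize(EInitialization::kGauss);
//
//     Matrix_t input(batchSize, nInputs);             // one event per row
//     layer.Forward(input);                           // fills GetOutput()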
template<typename Architecture_t>
class TLayer
{

public:
   using Scalar_t = typename Architecture_t::Scalar_t;
   using Matrix_t = typename Architecture_t::Matrix_t;

private:

   size_t fBatchSize;  ///< Batch size used for training and evaluation.
   size_t fInputWidth; ///< Number of neurons of the previous layer.
   size_t fWidth;      ///< Number of neurons of this layer.

   Scalar_t fDropoutProbability; ///< Probability that an input is active.

   Matrix_t fWeights;             ///< The weights of this layer.
   Matrix_t fBiases;              ///< The bias values of this layer.
   Matrix_t fOutput;              ///< Activations of this layer.
   Matrix_t fDerivatives;         ///< First derivatives of the activations of this layer.
   Matrix_t fWeightGradients;     ///< Gradients w.r.t. the weights of this layer.
   Matrix_t fBiasGradients;       ///< Gradients w.r.t. the bias values of this layer.
   Matrix_t fActivationGradients; ///< Gradients w.r.t. the activations of this layer.

   EActivationFunction fF; ///< Activation function of the layer.

public:

   TLayer(size_t BatchSize,
          size_t InputWidth,
          size_t Width,
          EActivationFunction f,
          Scalar_t dropoutProbability);
   TLayer(const TLayer &);

   /*! Initialize the weights according to the given initialization
    *  method. */
   void Initialize(EInitialization m);
   /*! Compute activation of the layer for the given input. The input
    *  must be in matrix form with the different rows corresponding to
    *  different events in the batch. Computes the activations as well as
    *  the first partial derivatives of the activation function, evaluated
    *  at the pre-activations. */
   void inline Forward(Matrix_t & input, bool applyDropout = false);
   /*! Compute weight, bias and activation gradients. Uses the precomputed
    *  first partial derivatives of the activation function computed during
    *  forward propagation and modifies them. Must only be called directly
    *  after the corresponding call to Forward(...). */
   void inline Backward(Matrix_t & gradients_backward,
                        const Matrix_t & activations_backward,
                        ERegularization r,
                        Scalar_t weightDecay);

   void Print() const;

   size_t GetBatchSize() const {return fBatchSize;}
   size_t GetInputWidth() const {return fInputWidth;}
   size_t GetWidth() const {return fWidth;}
   Scalar_t GetDropoutProbability() const {return fDropoutProbability;}

   void SetDropoutProbability(Scalar_t p) {fDropoutProbability = p;}

   EActivationFunction GetActivationFunction() const {return fF;}

   Matrix_t & GetOutput() {return fOutput;}
   const Matrix_t & GetOutput() const {return fOutput;}
   Matrix_t & GetWeights() {return fWeights;}
   const Matrix_t & GetWeights() const {return fWeights;}
   Matrix_t & GetBiases() {return fBiases;}
   const Matrix_t & GetBiases() const {return fBiases;}
   Matrix_t & GetActivationGradients() {return fActivationGradients;}
   const Matrix_t & GetActivationGradients() const {return fActivationGradients;}
   Matrix_t & GetBiasGradients() {return fBiasGradients;}
   const Matrix_t & GetBiasGradients() const {return fBiasGradients;}
   Matrix_t & GetWeightGradients() {return fWeightGradients;}
   const Matrix_t & GetWeightGradients() const {return fWeightGradients;}

};

//______________________________________________________________________________
//
// The Shared Layer Class
//______________________________________________________________________________

/** \class TSharedLayer

    Layer class with shared weight and bias matrices.

    Like the TLayer class, except that the weight and bias matrices are
    references to the matrices of another layer. Weights can thus be shared
    between different instances of a net, which can be used to implement
    multithreaded 'Hogwild'-style training.
*/
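// Editorial sketch (not part of the original file) of the intended use:
// each worker thread wraps a master layer in a TSharedLayer, so all threads
// read and update the same weight and bias matrices without locking
// ('Hogwild' style) while keeping private output and gradient buffers.
// `master`, `batch` and the surrounding names are placeholders.
//
//     TLayer<Architecture_t> master(batchSize, nInputs, nNeurons,
//                                   EActivationFunction::kRelu, 1.0);
//     master.Initialize(EInitialization::kGauss);
//
//     auto worker = [&master](Matrix_t &batch) {
//        TSharedLayer<Architecture_t> shared(batch.GetNrows(), master);
//        shared.Forward(batch);   // reads the shared weights
//        // ... a Backward(...) pass writes to the private gradient buffers
//     };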

template<typename Architecture_t>
class TSharedLayer
{

public:
   using Scalar_t = typename Architecture_t::Scalar_t;
   using Matrix_t = typename Architecture_t::Matrix_t;

private:

   size_t fBatchSize;  ///< Batch size used for training and evaluation.
   size_t fInputWidth; ///< Number of neurons of the previous layer.
   size_t fWidth;      ///< Number of neurons of this layer.

   Scalar_t fDropoutProbability; ///< Probability that an input is active.

   Matrix_t & fWeights;           ///< Reference to the weight matrix of this layer.
   Matrix_t & fBiases;            ///< Reference to the bias vectors of this layer.
   Matrix_t fOutput;              ///< Activations of this layer.
   Matrix_t fDerivatives;         ///< First derivatives of the activations of this layer.
   Matrix_t fWeightGradients;     ///< Gradients w.r.t. the weights of this layer.
   Matrix_t fBiasGradients;       ///< Gradients w.r.t. the bias values of this layer.
   Matrix_t fActivationGradients; ///< Gradients w.r.t. the activations of this layer.

   EActivationFunction fF; ///< Activation function of the layer.

public:

   TSharedLayer(size_t BatchSize,
                TLayer<Architecture_t> & layer);
   TSharedLayer(const TSharedLayer & layer);

   /*! Compute activation of the layer for the given input. The input
    *  must be in matrix form with the different rows corresponding to
    *  different events in the batch. Computes the activations as well as
    *  the first partial derivatives of the activation function, evaluated
    *  at the pre-activations. */
   void inline Forward(Matrix_t & input, bool applyDropout = false);
   /*! Compute weight, bias and activation gradients. Uses the precomputed
    *  first partial derivatives of the activation function computed during
    *  forward propagation and modifies them. Must only be called directly
    *  after the corresponding call to Forward(...). */
   void inline Backward(Matrix_t & gradients_backward,
                        const Matrix_t & activations_backward,
                        ERegularization r,
                        Scalar_t weightDecay);

   void Print() const;

   size_t GetBatchSize() const {return fBatchSize;}
   size_t GetInputWidth() const {return fInputWidth;}
   size_t GetWidth() const {return fWidth;}
   Scalar_t GetDropoutProbability() const {return fDropoutProbability;}

   void SetDropoutProbability(Scalar_t p) {fDropoutProbability = p;}

   EActivationFunction GetActivationFunction() const {return fF;}

   Matrix_t & GetOutput() {return fOutput;}
   const Matrix_t & GetOutput() const {return fOutput;}
   Matrix_t & GetWeights() const {return fWeights;}
   Matrix_t & GetBiases() {return fBiases;}
   const Matrix_t & GetBiases() const {return fBiases;}
   Matrix_t & GetActivationGradients() {return fActivationGradients;}
   const Matrix_t & GetActivationGradients() const {return fActivationGradients;}
   Matrix_t & GetBiasGradients() {return fBiasGradients;}
   const Matrix_t & GetBiasGradients() const {return fBiasGradients;}
   Matrix_t & GetWeightGradients() {return fWeightGradients;}
   const Matrix_t & GetWeightGradients() const {return fWeightGradients;}

};

//______________________________________________________________________________
//
// The Layer Class - Implementation
//______________________________________________________________________________

template<typename Architecture_t>
TLayer<Architecture_t>::TLayer(size_t batchSize,
                               size_t inputWidth,
                               size_t width,
                               EActivationFunction f,
                               Scalar_t dropoutProbability)
   : fBatchSize(batchSize), fInputWidth(inputWidth), fWidth(width),
     fDropoutProbability(dropoutProbability), fWeights(width, fInputWidth),
     fBiases(width, 1), fOutput(fBatchSize, width), fDerivatives(fBatchSize, width),
     fWeightGradients(width, fInputWidth), fBiasGradients(width, 1),
     fActivationGradients(fBatchSize, width), fF(f)
{
   // Nothing to do here.
}

//______________________________________________________________________________
template<typename Architecture_t>
TLayer<Architecture_t>::TLayer(const TLayer &layer)
   : fBatchSize(layer.fBatchSize), fInputWidth(layer.fInputWidth),
     fWidth(layer.fWidth), fDropoutProbability(layer.fDropoutProbability),
     fWeights(layer.fWidth, layer.fInputWidth), fBiases(layer.fWidth, 1),
     fOutput(layer.fBatchSize, layer.fWidth),
     fDerivatives(layer.fBatchSize, layer.fWidth),
     fWeightGradients(layer.fWidth, layer.fInputWidth),
     fBiasGradients(layer.fWidth, 1),
     fActivationGradients(layer.fBatchSize, layer.fWidth),
     fF(layer.fF)
{
   // Copy the weight and bias values from the original layer.
   Architecture_t::Copy(fWeights, layer.GetWeights());
   Architecture_t::Copy(fBiases, layer.GetBiases());
}

//______________________________________________________________________________
template<typename Architecture_t>
auto TLayer<Architecture_t>::Initialize(EInitialization m)
-> void
{
   initialize<Architecture_t>(fWeights, m);
   initialize<Architecture_t>(fBiases, EInitialization::kZero);
}
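// Note that only the weights use the requested scheme; the biases are always
// zero-initialized. A typical call (illustrative):
//
//     layer.Initialize(EInitialization::kGauss);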

//______________________________________________________________________________
template<typename Architecture_t>
auto inline TLayer<Architecture_t>::Forward(Matrix_t & input,
                                            bool applyDropout)
-> void
{
   if (applyDropout && (fDropoutProbability != 1.0)) {
      Architecture_t::Dropout(input, fDropoutProbability);
   }
   Architecture_t::MultiplyTranspose(fOutput, input, fWeights);
   Architecture_t::AddRowWise(fOutput, fBiases);
   evaluateDerivative<Architecture_t>(fDerivatives, fF, fOutput);
   evaluate<Architecture_t>(fOutput, fF);
}
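// Editorial note: with the batch X stored row-wise, the calls above compute
// the standard dense forward pass
//
//     U = X * W^T                // MultiplyTranspose
//     U = U + theta^T            // AddRowWise: bias row added to every row
//     fDerivatives = f'(U)       // evaluated while fOutput still holds U
//     fOutput      = f(U)
//
// evaluateDerivative must run before evaluate, because evaluate applies f
// to fOutput in place and would otherwise destroy the pre-activations U.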

//______________________________________________________________________________
template<typename Architecture_t>
auto inline TLayer<Architecture_t>::Backward(Matrix_t & gradients_backward,
                                             const Matrix_t & activations_backward,
                                             ERegularization r,
                                             Scalar_t weightDecay)
-> void
{
   Architecture_t::Backward(gradients_backward,
                            fWeightGradients,
                            fBiasGradients,
                            fDerivatives,
                            fActivationGradients,
                            fWeights,
                            activations_backward);
   addRegularizationGradients<Architecture_t>(fWeightGradients,
                                              fWeights,
                                              weightDecay, r);
}
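// Editorial note: the architecture kernel implements standard dense-layer
// backpropagation. In matrix form (a sketch; the exact kernels live in
// Architecture_t):
//
//     delta              = fActivationGradients .* f'(U)   // elementwise product
//     fWeightGradients   = delta^T * activations_backward
//     fBiasGradients     = column-wise sums of delta
//     gradients_backward = delta * W    // passed on to the previous layer
//
// addRegularizationGradients then adds the regularization term, e.g.
// 2 * weightDecay * W for L2 regularization.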

//______________________________________________________________________________
template<typename Architecture_t>
auto TLayer<Architecture_t>::Print() const
-> void
{
   std::cout << "Width = " << fWeights.GetNrows();
   std::cout << ", Activation Function = ";
   std::cout << static_cast<int>(fF) << std::endl;
}

//______________________________________________________________________________
//
// The Shared Layer Class - Implementation
//______________________________________________________________________________

//______________________________________________________________________________
template<typename Architecture_t>
TSharedLayer<Architecture_t>::TSharedLayer(size_t BatchSize,
                                           TLayer<Architecture_t> & layer)
: fBatchSize(BatchSize),
  fInputWidth(layer.GetInputWidth()), fWidth(layer.GetWidth()),
  fDropoutProbability(layer.GetDropoutProbability()),
  fWeights(layer.GetWeights()), fBiases(layer.GetBiases()),
  fOutput(fBatchSize, fWidth), fDerivatives(fBatchSize, fWidth),
  fWeightGradients(fWidth, fInputWidth), fBiasGradients(fWidth, 1),
  fActivationGradients(fBatchSize, fWidth), fF(layer.GetActivationFunction())
{
   // Nothing to do here.
}

//______________________________________________________________________________
template<typename Architecture_t>
TSharedLayer<Architecture_t>::TSharedLayer(const TSharedLayer &layer)
   : fBatchSize(layer.fBatchSize),
     fInputWidth(layer.GetInputWidth()), fWidth(layer.GetWidth()),
     fDropoutProbability(layer.fDropoutProbability), fWeights(layer.fWeights),
     fBiases(layer.fBiases), fOutput(layer.fBatchSize, fWidth),
     fDerivatives(layer.fBatchSize, fWidth), fWeightGradients(fWidth, fInputWidth),
     fBiasGradients(fWidth, 1), fActivationGradients(layer.fBatchSize, fWidth),
     fF(layer.fF)
{
   // Nothing to do here.
}

//______________________________________________________________________________
template<typename Architecture_t>
auto inline TSharedLayer<Architecture_t>::Forward(Matrix_t & input,
                                                  bool applyDropout)
-> void
{
   if (applyDropout && (fDropoutProbability != 1.0)) {
      Architecture_t::Dropout(input, fDropoutProbability);
   }
   Architecture_t::MultiplyTranspose(fOutput, input, fWeights);
   Architecture_t::AddRowWise(fOutput, fBiases);
   evaluateDerivative<Architecture_t>(fDerivatives, fF, fOutput);
   evaluate<Architecture_t>(fOutput, fF);
}

//______________________________________________________________________________
template<typename Architecture_t>
auto inline TSharedLayer<Architecture_t>::Backward(Matrix_t & gradients_backward,
                                                   const Matrix_t & activations_backward,
                                                   ERegularization r,
                                                   Scalar_t weightDecay)
-> void
{
   Architecture_t::Backward(gradients_backward,
                            fWeightGradients,
                            fBiasGradients,
                            fDerivatives,
                            fActivationGradients,
                            fWeights,
                            activations_backward);
   addRegularizationGradients<Architecture_t>(fWeightGradients,
                                              fWeights,
                                              weightDecay, r);
}

//______________________________________________________________________________
template<typename Architecture_t>
auto TSharedLayer<Architecture_t>::Print() const
-> void
{
   std::cout << "Width = " << fWeights.GetNrows();
   std::cout << ", Activation Function = ";
   std::cout << static_cast<int>(fF) << std::endl;
}

} // namespace DNN
} // namespace TMVA

#endif