doc/v610/Layer_8h_source.html

 // @(#)root/tmva/tmva/dnn:$Id$
 // Author: Simon Pfreundschuh 20/06/16

 /*************************************************************************
  * Copyright (C) 2016, Simon Pfreundschuh                                *
  * All rights reserved.                                                  *
  *                                                                       *
  * For the licensing terms see $ROOTSYS/LICENSE.                         *
  * For the list of contributors see $ROOTSYS/README/CREDITS.             *
  *************************************************************************/

 //////////////////////////////////////////////////////////////////////
 // Contains Layer and SharedLayer classes, that represent layers in //
 // neural networks.                                                 //
 //////////////////////////////////////////////////////////////////////

 #ifndef TMVA_DNN_LAYER
 #define TMVA_DNN_LAYER

 #include <iostream>

 #include "TMatrix.h"
 #include "Functions.h"

 namespace TMVA
 {
 namespace DNN
 {

 //______________________________________________________________________________
 //
 //  The Layer Class
 //______________________________________________________________________________

 /** \class TLayer

     Generic layer class.

     This generic layer class represents a layer of a neural network with
     a given width n and activation function f. The activation
     function of each layer is given by \f$\mathbf{u} =
     \mathbf{W}\mathbf{x} + \boldsymbol{\theta}\f$.

     In addition to the weight and bias matrices, each layer allocates memory
     for its activations and the corresponding first partial fDerivatives of
     the activation function as well as the gradients of the fWeights and fBiases.

     The layer provides member functions for the forward propagation of
     activations through the given layer.
 */
 template<typename Architecture_t>
    class TLayer
 {

 public:
    using Scalar_t = typename Architecture_t::Scalar_t;
    using Matrix_t = typename Architecture_t::Matrix_t;

 private:

    size_t fBatchSize;  ///< Batch size used for training and evaluation.
    size_t fInputWidth; ///< Number of neurons of the previous layer.
    size_t fWidth;      ///< Number of neurons of this layer.

    Scalar_t fDropoutProbability;  ///< Probability that an input is active.

    Matrix_t fWeights;             ///< The fWeights of this layer.
    Matrix_t fBiases;              ///< The bias values of this layer.
    Matrix_t fOutput;              ///< Activations of this layer.
    Matrix_t fDerivatives;         ///< First fDerivatives of the activations of this layer.
    Matrix_t fWeightGradients;     ///< Gradients w.r.t. the weigths of this layer.
    Matrix_t fBiasGradients;       ///< Gradients w.r.t. the bias values of this layer.
    Matrix_t fActivationGradients; ///< Gradients w.r.t. the activations of this layer.

    EActivationFunction fF; ///< Activation function of the layer.

 public:

    TLayer(size_t             BatchSize,
           size_t             InputWidth,
           size_t             Width,
           EActivationFunction f,
           Scalar_t           dropoutProbability);
    TLayer(const TLayer &);

    /*! Initialize fWeights according to the given initialization
     *  method. */
    void Initialize(EInitialization m);
    /*! Compute activation of the layer for the given input. The input
     * must be in matrix form with the different rows corresponding to
     * different events in the batch. Computes activations as well as
     * the first partial derivative of the activation function at those
     * activations. */
    void inline Forward(Matrix_t & input, bool applyDropout = false);
    /*! Compute weight, bias and activation gradients. Uses the precomputed
     *  first partial derviatives of the activation function computed during
     *  forward propagation and modifies them. Must only be called directly
     *  a the corresponding call to Forward(...). */
    void inline Backward(Matrix_t & gradients_backward,
                         const Matrix_t & activations_backward,
                         ERegularization r,
                         Scalar_t weightDecay);

    void Print() const;

    size_t GetBatchSize()          const {return fBatchSize;}
    size_t GetInputWidth()         const {return fInputWidth;}
    size_t GetWidth()              const {return fWidth;}
    size_t GetDropoutProbability() const {return fDropoutProbability;}

    void SetDropoutProbability(Scalar_t p) {fDropoutProbability = p;}

    EActivationFunction GetActivationFunction() const {return fF;}

    Matrix_t       & GetOutput()        {return fOutput;}
    const Matrix_t & GetOutput() const  {return fOutput;}
    Matrix_t       & GetWeights()       {return fWeights;}
    const Matrix_t & GetWeights() const {return fWeights;}
    Matrix_t       & GetBiases()       {return fBiases;}
    const Matrix_t & GetBiases() const {return fBiases;}
    Matrix_t       & GetActivationGradients()       {return fActivationGradients;}
    const Matrix_t & GetActivationGradients() const {return fActivationGradients;}
    Matrix_t       & GetBiasGradients()       {return fBiasGradients;}
    const Matrix_t & GetBiasGradients() const {return fBiasGradients;}
    Matrix_t       & GetWeightGradients()       {return fWeightGradients;}
    const Matrix_t & GetWeightGradients() const {return fWeightGradients;}

 };

 //______________________________________________________________________________
 //
 //  The Shared Layer Class
 //______________________________________________________________________________

 /** \class TSharedLayer

     Layer class width shared weight and bias layers.

     Like the Layer class only that weight matrices are shared between
     different instances of the net, which can be used to implement
     multithreading 'Hogwild' style.
 */

 template<typename Architecture_t>
 class TSharedLayer
 {

 public:

    using Scalar_t = typename Architecture_t::Scalar_t;
    using Matrix_t = typename Architecture_t::Matrix_t;

 private:

    size_t fBatchSize;  ///< Batch size used for training and evaluation.
    size_t fInputWidth; ///< Number of neurons of the previous layer.
    size_t fWidth;      ///< Number of neurons of this layer.

    Scalar_t fDropoutProbability;  ///< Probability that an input is active.

    Matrix_t & fWeights;           ///< Reference to the weight matrix of this layer.
    Matrix_t & fBiases;            ///< Reference to the bias vectors of this layer.
    Matrix_t fOutput;              ///< Activations of this layer.
    Matrix_t fDerivatives;         ///< First fDerivatives of the activations of this layer.
    Matrix_t fWeightGradients;     ///< Gradients w.r.t. the weigths of this layer.
    Matrix_t fBiasGradients;       ///< Gradients w.r.t. the bias values of this layer.
    Matrix_t fActivationGradients; ///< Gradients w.r.t. the activations of this layer.

    EActivationFunction fF; ///< Activation function of the layer.

 public:

    TSharedLayer(size_t fBatchSize,
                 TLayer<Architecture_t> & layer);
    TSharedLayer(const TSharedLayer & layer);

    /*! Compute activation of the layer for the given input. The input
     * must be in matrix form with the different rows corresponding to
     * different events in the batch. Computes activations as well as
     * the first partial derivative of the activation function at those
     * activations. */
    void inline Forward(Matrix_t & input, bool applyDropout = false);
    /*! Compute weight, bias and activation gradients. Uses the precomputed
     *  first partial derviatives of the activation function computed during
     *  forward propagation and modifies them. Must only be called directly
     *  a the corresponding call to Forward(...). */
    void inline Backward(Matrix_t & gradients_backward,
                         const Matrix_t & activations_backward,
                         ERegularization r,
                         Scalar_t weightDecay);

    void Print() const;

    size_t GetBatchSize()          const {return fBatchSize;}
    size_t GetInputWidth()         const {return fInputWidth;}
    size_t GetWidth()              const {return fWidth;}
    size_t GetDropoutProbability() const {return fDropoutProbability;}

    void SetDropoutProbability(Scalar_t p) {fDropoutProbability = p;}

    EActivationFunction GetActivationFunction() const {return fF;}

    Matrix_t       & GetOutput()        {return fOutput;}
    const Matrix_t & GetOutput() const  {return fOutput;}
    Matrix_t       & GetWeights() const {return fWeights;}
    Matrix_t       & GetBiases()       {return fBiases;}
    const Matrix_t & GetBiases() const {return fBiases;}
    Matrix_t       & GetActivationGradients()       {return fActivationGradients;}
    const Matrix_t & GetActivationGradients() const {return fActivationGradients;}
    Matrix_t       & GetBiasGradients()       {return fBiasGradients;}
    const Matrix_t & GetBiasGradients() const {return fBiasGradients;}
    Matrix_t       & GetWeightGradients()       {return fWeightGradients;}
    const Matrix_t & GetWeightGradients() const {return fWeightGradients;}

 };

 //______________________________________________________________________________
 //
 //  The Layer Class - Implementation
 //______________________________________________________________________________

 template<typename Architecture_t>
    TLayer<Architecture_t>::TLayer(size_t batchSize,
                                   size_t inputWidth,
                                   size_t width,
                                   EActivationFunction f,
                                   Scalar_t dropoutProbability)
    : fBatchSize(batchSize), fInputWidth(inputWidth), fWidth(width),
      fDropoutProbability(dropoutProbability), fWeights(width, fInputWidth),
      fBiases(width, 1), fOutput(fBatchSize, width), fDerivatives(fBatchSize, width),
      fWeightGradients(width, fInputWidth), fBiasGradients(width, 1),
      fActivationGradients(fBatchSize, width), fF(f)
 {
    // Nothing to do here.
 }

 //______________________________________________________________________________
 template<typename Architecture_t>
 TLayer<Architecture_t>::TLayer(const TLayer &layer)
     : fBatchSize(layer.fBatchSize), fInputWidth(layer.fInputWidth),
     fWidth(layer.fWidth), fDropoutProbability(layer.fDropoutProbability),
     fWeights(layer.fWidth, layer.fInputWidth), fBiases(layer.fWidth, 1),
     fOutput(layer.fBatchSize, layer.fWidth),
     fDerivatives(layer.fBatchSize, layer.fWidth),
     fWeightGradients(layer.fWidth, layer.fInputWidth),
     fBiasGradients(layer.fWidth, 1),
     fActivationGradients(layer.fBatchSize, layer.fWidth),
     fF(layer.fF)
 {
    Architecture_t::Copy(fWeights, layer.GetWeights());
    Architecture_t::Copy(fBiases,  layer.GetBiases());
 }

 //______________________________________________________________________________
 template<typename Architecture_t>
 auto TLayer<Architecture_t>::Initialize(EInitialization m)
 -> void
 {
    initialize<Architecture_t>(fWeights, m);
    initialize<Architecture_t>(fBiases,  EInitialization::kZero);
 }

 //______________________________________________________________________________
 template<typename Architecture_t>
 auto inline TLayer<Architecture_t>::Forward(Matrix_t & input,
                                             bool applyDropout)
 -> void
 {
    if (applyDropout && (fDropoutProbability != 1.0)) {
       Architecture_t::Dropout(input, fDropoutProbability);
    }
    Architecture_t::MultiplyTranspose(fOutput, input, fWeights);
    Architecture_t::AddRowWise(fOutput, fBiases);
    evaluateDerivative<Architecture_t>(fDerivatives, fF, fOutput);
    evaluate<Architecture_t>(fOutput, fF);
 }

 //______________________________________________________________________________
 template<typename Architecture_t>
 auto TLayer<Architecture_t>::Backward(Matrix_t & gradients_backward,
                                     const Matrix_t & activations_backward,
                                     ERegularization r,
                                     Scalar_t weightDecay)
 -> void
 {
    Architecture_t::Backward(gradients_backward,
                             fWeightGradients,
                             fBiasGradients,
                             fDerivatives,
                             fActivationGradients,
                             fWeights,
                             activations_backward);
    addRegularizationGradients<Architecture_t>(fWeightGradients,
                                               fWeights,
                                               weightDecay, r);
 }

 //______________________________________________________________________________
 template<typename Architecture_t>
    void TLayer<Architecture_t>::Print() const
 {
    std::cout << "Width = " << fWeights.GetNrows();
    std::cout << ", Activation Function = ";
    std::cout << static_cast<int>(fF) << std::endl;
 }

 //______________________________________________________________________________
 //
 //  The Shared Layer Class - Implementation
 //______________________________________________________________________________

 //______________________________________________________________________________
 template<typename Architecture_t>
 TSharedLayer<Architecture_t>::TSharedLayer(size_t BatchSize,
                                          TLayer<Architecture_t> &layer)
 : fBatchSize(BatchSize),
 fInputWidth(layer.GetInputWidth()), fWidth(layer.GetWidth()),
 fDropoutProbability(layer.GetDropoutProbability()),
 fWeights(layer.GetWeights()), fBiases(layer.GetBiases()),
 fOutput(fBatchSize, fWidth), fDerivatives(fBatchSize, fWidth),
 fWeightGradients(fWidth, fInputWidth), fBiasGradients(fWidth, 1),
 fActivationGradients(fBatchSize, fWidth), fF(layer.GetActivationFunction())
 {
    // Nothing to do here.
 }

 //______________________________________________________________________________
 template<typename Architecture_t>
 TSharedLayer<Architecture_t>::TSharedLayer(const TSharedLayer &layer)
     : fBatchSize(layer.fBatchSize),
     fInputWidth(layer.GetInputWidth()), fWidth(layer.GetWidth()),
     fDropoutProbability(layer.fDropoutProbability), fWeights(layer.fWeights),
     fBiases(layer.fBiases), fOutput(layer.fBatchSize, fWidth),
     fDerivatives(layer.fBatchSize, fWidth), fWeightGradients(fWidth, fInputWidth),
     fBiasGradients(fWidth, 1), fActivationGradients(layer.fBatchSize, fWidth),
     fF(layer.fF)
 {
 }

 //______________________________________________________________________________
 template<typename Architecture_t>
 auto inline TSharedLayer<Architecture_t>::Forward(Matrix_t & input,
                                                   bool applyDropout)
 -> void
 {
    if (applyDropout && (fDropoutProbability != 1.0)) {
       Architecture_t::Dropout(input, fDropoutProbability);
    }
    Architecture_t::MultiplyTranspose(fOutput, input, fWeights);
    Architecture_t::AddRowWise(fOutput, fBiases);
    evaluateDerivative<Architecture_t>(fDerivatives, fF, fOutput);
    evaluate<Architecture_t>(fOutput, fF);
 }

 //______________________________________________________________________________
 template<typename Architecture_t>
 auto inline TSharedLayer<Architecture_t>::Backward(Matrix_t & gradients_backward,
                                                  const Matrix_t & activations_backward,
                                                  ERegularization r,
                                                  Scalar_t weightDecay)
 -> void
 {
    Architecture_t::Backward(gradients_backward,
                             fWeightGradients,
                             fBiasGradients,
                             fDerivatives,
                             fActivationGradients,
                             fWeights,
                             activations_backward);
    addRegularizationGradients<Architecture_t>(fWeightGradients,
                                               fWeights,
                                               weightDecay, r);
 }

 //______________________________________________________________________________
 template<typename Architecture_t>
 void TSharedLayer<Architecture_t>::Print() const
 {
    std::cout << "Width = " << fWeights.GetNrows();
    std::cout << ", Activation Function = ";
    std::cout << static_cast<int>(fF) << std::endl;
 }

 } // namespace DNN
 } // namespace TMVA

 #endif
TMVA::DNN::TLayer::Forward
void Forward(Matrix_t &input, bool applyDropout=false)
Compute activation of the layer for the given input.
Definition: Layer.h:265

TMVA::DNN::TSharedLayer::fF
EActivationFunction fF
Activation function of the layer.
Definition: Layer.h:169

TMVA::DNN::TLayer::fWeightGradients
Matrix_t fWeightGradients
Gradients w.r.t. the weigths of this layer.
Definition: Layer.h:71

TMVA::DNN::TSharedLayer::Print
void Print() const
Definition: Layer.h:377

TMVA::DNN::TSharedLayer::SetDropoutProbability
void SetDropoutProbability(Scalar_t p)
Definition: Layer.h:199

TMVA::DNN::TLayer::GetWeights
Matrix_t & GetWeights()
Definition: Layer.h:117

TMVA::DNN::TSharedLayer::GetOutput
Matrix_t & GetOutput()
Definition: Layer.h:203

TMVA::DNN::TLayer::TLayer
TLayer(size_t BatchSize, size_t InputWidth, size_t Width, EActivationFunction f, Scalar_t dropoutProbability)
Definition: Layer.h:223

TMVA::DNN::TSharedLayer::GetActivationFunction
EActivationFunction GetActivationFunction() const
Definition: Layer.h:201

TMVA::DNN::TLayer::fInputWidth
size_t fInputWidth
Number of neurons of the previous layer.
Definition: Layer.h:62

TMVA::DNN::TLayer::fBatchSize
size_t fBatchSize
Batch size used for training and evaluation.
Definition: Layer.h:61

TMVA::DNN::TLayer::Backward
void Backward(Matrix_t &gradients_backward, const Matrix_t &activations_backward, ERegularization r, Scalar_t weightDecay)
Compute weight, bias and activation gradients.
Definition: Layer.h:280

Functions.h

TMVA::DNN::TSharedLayer::TSharedLayer
TSharedLayer(size_t fBatchSize, TLayer< Architecture_t > &layer)
Definition: Layer.h:314

TMVA::DNN::TLayer::GetDropoutProbability
size_t GetDropoutProbability() const
Definition: Layer.h:109

TMVA::DNN::TSharedLayer::GetWeights
Matrix_t & GetWeights() const
Definition: Layer.h:205

TMVA::DNN::TSharedLayer::GetDropoutProbability
size_t GetDropoutProbability() const
Definition: Layer.h:197

TMVA::DNN::TSharedLayer::fOutput
Matrix_t fOutput
Activations of this layer.
Definition: Layer.h:163

TMVA::DNN::TSharedLayer::GetOutput
const Matrix_t & GetOutput() const
Definition: Layer.h:204

TMVA::DNN::TSharedLayer::GetBiasGradients
const Matrix_t & GetBiasGradients() const
Definition: Layer.h:211

TMVA::DNN::TLayer::GetWeightGradients
Matrix_t & GetWeightGradients()
Definition: Layer.h:125

TMVA::DNN::TLayer::fF
EActivationFunction fF
Activation function of the layer.
Definition: Layer.h:75

TMVA::DNN::TSharedLayer::fDerivatives
Matrix_t fDerivatives
First fDerivatives of the activations of this layer.
Definition: Layer.h:164

TMVA::DNN::TSharedLayer::GetBiases
const Matrix_t & GetBiases() const
Definition: Layer.h:207

TMVA::DNN::TLayer::GetBiases
const Matrix_t & GetBiases() const
Definition: Layer.h:120

TMVA::DNN::EInitialization
EInitialization
Definition: Functions.h:70

TMVA::DNN::TLayer::fBiasGradients
Matrix_t fBiasGradients
Gradients w.r.t. the bias values of this layer.
Definition: Layer.h:72

TMVA::DNN::TSharedLayer::fBiases
Matrix_t & fBiases
Reference to the bias vectors of this layer.
Definition: Layer.h:162

TMVA::DNN::TSharedLayer::fWeightGradients
Matrix_t fWeightGradients
Gradients w.r.t. the weigths of this layer.
Definition: Layer.h:165

TMVA::DNN::TLayer
Generic layer class.
Definition: Layer.h:52

TMVA::DNN::TLayer::fWeights
Matrix_t fWeights
The fWeights of this layer.
Definition: Layer.h:67

TMVA::DNN::weightDecay
double weightDecay(double error, ItWeight itWeight, ItWeight itWeightEnd, double factorWeightDecay, EnumRegularization eRegularization)
compute the weight decay for regularization (L1 or L2)
Definition: NeuralNet.icc:496

TMVA::DNN::TSharedLayer::fInputWidth
size_t fInputWidth
Number of neurons of the previous layer.
Definition: Layer.h:156

TMVA::DNN::TLayer::GetBiasGradients
Matrix_t & GetBiasGradients()
Definition: Layer.h:123

TMVA::DNN::TSharedLayer::GetWeightGradients
Matrix_t & GetWeightGradients()
Definition: Layer.h:212

TMVA::DNN::TLayer::GetActivationGradients
const Matrix_t & GetActivationGradients() const
Definition: Layer.h:122

TMVA::DNN::TSharedLayer::Scalar_t
typename Architecture_t::Scalar_t Scalar_t
Definition: Layer.h:150

TMVA::DNN::TLayer::Scalar_t
typename Architecture_t::Scalar_t Scalar_t
Definition: Layer.h:56

TMVA::DNN::TLayer::fBiases
Matrix_t fBiases
The bias values of this layer.
Definition: Layer.h:68

TMVA::DNN::TLayer::GetWidth
size_t GetWidth() const
Definition: Layer.h:108

TMVA::DNN::TSharedLayer::fBiasGradients
Matrix_t fBiasGradients
Gradients w.r.t. the bias values of this layer.
Definition: Layer.h:166

TMVA::DNN::TLayer::GetInputWidth
size_t GetInputWidth() const
Definition: Layer.h:107

TMVA::DNN::TLayer::GetOutput
Matrix_t & GetOutput()
Definition: Layer.h:115

TMVA::DNN::TSharedLayer::GetActivationGradients
Matrix_t & GetActivationGradients()
Definition: Layer.h:208

TMVA::DNN::TLayer::GetActivationFunction
EActivationFunction GetActivationFunction() const
Definition: Layer.h:113

r
TRandom2 r(17)

TMVA::DNN::TLayer::GetActivationGradients
Matrix_t & GetActivationGradients()
Definition: Layer.h:121

TMVA::DNN::TSharedLayer::Matrix_t
typename Architecture_t::Matrix_t Matrix_t
Definition: Layer.h:151

TMVA::DNN::TSharedLayer::GetInputWidth
size_t GetInputWidth() const
Definition: Layer.h:195

TMVA::DNN::TLayer::GetBatchSize
size_t GetBatchSize() const
Definition: Layer.h:106

m
TMarker * m
Definition: textangle.C:8

TMVA::DNN::TLayer::fOutput
Matrix_t fOutput
Activations of this layer.
Definition: Layer.h:69

TMVA::DNN::TSharedLayer::fDropoutProbability
Scalar_t fDropoutProbability
Probability that an input is active.
Definition: Layer.h:159

TMVA::DNN::TSharedLayer::fWeights
Matrix_t & fWeights
Reference to the weight matrix of this layer.
Definition: Layer.h:161

TMVA::DNN::TSharedLayer::GetBiasGradients
Matrix_t & GetBiasGradients()
Definition: Layer.h:210

TMVA::DNN::TLayer::GetOutput
const Matrix_t & GetOutput() const
Definition: Layer.h:116

TMVA::DNN::TSharedLayer::GetWeightGradients
const Matrix_t & GetWeightGradients() const
Definition: Layer.h:213

TMVA::DNN::TSharedLayer::fBatchSize
size_t fBatchSize
Batch size used for training and evaluation.
Definition: Layer.h:155

TMVA::DNN::TSharedLayer::Forward
void Forward(Matrix_t &input, bool applyDropout=false)
Compute activation of the layer for the given input.
Definition: Layer.h:342

TMVA::DNN::TLayer::Initialize
void Initialize(EInitialization m)
Initialize fWeights according to the given initialization method.
Definition: Layer.h:256

TMVA::DNN::TLayer::SetDropoutProbability
void SetDropoutProbability(Scalar_t p)
Definition: Layer.h:111

ROOT::Math::GSLSimAn::Copy
void Copy(void *source, void *dest)
Definition: GSLSimAnnealing.cxx:149

f
double f(double x)
Definition: testIntegration.cxx:12

TMVA::DNN::TLayer::GetBiases
Matrix_t & GetBiases()
Definition: Layer.h:119

TMVA::DNN::EInitialization::kZero

TMVA::DNN::TSharedLayer
Layer class width shared weight and bias layers.
Definition: Layer.h:145

TMVA::DNN::TLayer::fDerivatives
Matrix_t fDerivatives
First fDerivatives of the activations of this layer.
Definition: Layer.h:70

TMVA::DNN::TSharedLayer::GetActivationGradients
const Matrix_t & GetActivationGradients() const
Definition: Layer.h:209

TMVA::DNN::TLayer::fWidth
size_t fWidth
Number of neurons of this layer.
Definition: Layer.h:63

TMVA::DNN::TSharedLayer::GetBiases
Matrix_t & GetBiases()
Definition: Layer.h:206

TMVA::DNN::TLayer::fActivationGradients
Matrix_t fActivationGradients
Gradients w.r.t. the activations of this layer.
Definition: Layer.h:73

TMVA::DNN::TLayer::fDropoutProbability
Scalar_t fDropoutProbability
Probability that an input is active.
Definition: Layer.h:65

TMVA::DNN::TLayer::Matrix_t
typename Architecture_t::Matrix_t Matrix_t
Definition: Layer.h:57

TMVA
Abstract ClassifierFactory template that handles arbitrary types.
Definition: GeneticMinimizer.h:21

TMVA::DNN::TSharedLayer::fActivationGradients
Matrix_t fActivationGradients
Gradients w.r.t. the activations of this layer.
Definition: Layer.h:167

TMVA::DNN::TSharedLayer::GetBatchSize
size_t GetBatchSize() const
Definition: Layer.h:194

TMVA::DNN::ERegularization
ERegularization
Enum representing the regularization type applied for a given layer.
Definition: Functions.h:62

TMVA::DNN::TLayer::GetWeights
const Matrix_t & GetWeights() const
Definition: Layer.h:118

TMatrix.h

TMVA::DNN::TLayer::GetBiasGradients
const Matrix_t & GetBiasGradients() const
Definition: Layer.h:124

TMVA::DNN::EActivationFunction
EActivationFunction
Enum that represents layer activation functions.
Definition: Functions.h:31

TMVA::DNN::TSharedLayer::Backward
void Backward(Matrix_t &gradients_backward, const Matrix_t &activations_backward, ERegularization r, Scalar_t weightDecay)
Compute weight, bias and activation gradients.
Definition: Layer.h:357

TMVA::DNN::TSharedLayer::fWidth
size_t fWidth
Number of neurons of this layer.
Definition: Layer.h:157

TMVA::DNN::TLayer::GetWeightGradients
const Matrix_t & GetWeightGradients() const
Definition: Layer.h:126

TMVA::DNN::TSharedLayer::GetWidth
size_t GetWidth() const
Definition: Layer.h:196

TMVA::DNN::TLayer::Print
void Print() const
Definition: Layer.h:300