doc/v614/Reference_8h_source.html

 // @(#)root/tmva/tmva/dnn:$Id$
 // Author: Simon Pfreundschuh 20/06/16

 /*************************************************************************
  * Copyright (C) 2016, Simon Pfreundschuh                                *
  * All rights reserved.                                                  *
  *                                                                       *
  * For the licensing terms see $ROOTSYS/LICENSE.                         *
  * For the list of contributors see $ROOTSYS/README/CREDITS.             *
  *************************************************************************/

 ///////////////////////////////////////////////////////////////////////
 // Declaration of the TReference architecture, which provides a      //
 // reference implementation of the low-level interface for the DNN   //
 // implementation based on ROOT's TMatrixT matrix type.              //
 ///////////////////////////////////////////////////////////////////////

 #ifndef TMVA_DNN_ARCHITECTURES_REFERENCE
 #define TMVA_DNN_ARCHITECTURES_REFERENCE

 #include "TMatrix.h"
 #include "TMVA/DNN/Functions.h"
 #include "TMVA/DNN/Architectures/Reference/DataLoader.h"
 #include "TMVA/DNN/Architectures/Reference/TensorDataLoader.h"
 #include <vector>

 class TRandom;

 namespace TMVA
 {
 namespace DNN
 {

 /*! The reference architecture class.
 *
 * Class template that contains the reference implementation of the low-level
 * interface for the DNN implementation. The reference implementation uses the
 * TMatrixT class template to represent matrices. All operations are exposed
 * as static member functions.
 *
 * \tparam AReal The floating point type used to represent scalars.
 */
 template<typename AReal>
 class TReference
 {
 private:
    static TRandom * fgRandomGen; ///< Static random number generator instance.
 public:

    using Scalar_t     = AReal;           ///< Scalar type used by this architecture.
    using Matrix_t     = TMatrixT<AReal>; ///< Matrix type used by this architecture.

    //____________________________________________________________________________
    //
    // Propagation
    //____________________________________________________________________________

    /** @name Forward Propagation
     * Low-level functions required for the forward propagation of activations
     * through the network.
     */
    ///@{
    /** Matrix-multiply \p input with the transpose of \p weights and
     *  write the results into \p output. */
    static void MultiplyTranspose(TMatrixT<Scalar_t> &output,
                                  const TMatrixT<Scalar_t> &input,
                                  const TMatrixT<Scalar_t> &weights);
    /** Add the vector \p biases row-wise to the matrix \p output. */
    static void AddRowWise(TMatrixT<Scalar_t> &output,
                           const TMatrixT<Scalar_t> &biases);
    ///@}

    /** @name Backward Propagation
     * Low-level functions required for the backward propagation of gradients
     * through the network.
     */
    ///@{
    /** Perform the complete backward propagation step. If the provided
     *  \p activationGradientsBackward matrix is not empty, compute the
     *  gradients of the objective function with respect to the activations
     *  of the previous layer (backward direction).
     *  Also compute the weight and the bias gradients. Modifies the values
     *  in \p df and thus produces only a valid result, if it is applied the
     *  first time after the corresponding forward propagation has been per-
     *  formed. */
    static void Backward(TMatrixT<Scalar_t> & activationGradientsBackward,
                         TMatrixT<Scalar_t> & weightGradients,
                         TMatrixT<Scalar_t> & biasGradients,
                         TMatrixT<Scalar_t> & df,
                         const TMatrixT<Scalar_t> & activationGradients,
                         const TMatrixT<Scalar_t> & weights,
                         const TMatrixT<Scalar_t> & activationBackward);
    /** Backpropagation step for a Recurrent Neural Network.
     *  The trailing comments on the parameters give the matrix dimensions as
     *  noted by the original author. */
    static Matrix_t & RecurrentLayerBackward(TMatrixT<Scalar_t> & state_gradients_backward, // BxH
                                             TMatrixT<Scalar_t> & input_weight_gradients,
                                             TMatrixT<Scalar_t> & state_weight_gradients,
                                             TMatrixT<Scalar_t> & bias_gradients,
                                             TMatrixT<Scalar_t> & df, //DxH
                                             const TMatrixT<Scalar_t> & state, // BxH
                                             const TMatrixT<Scalar_t> & weights_input, // HxD
                                             const TMatrixT<Scalar_t> & weights_state, // HxH
                                             const TMatrixT<Scalar_t> & input,  // BxD
                                             TMatrixT<Scalar_t> & input_gradient);
    /** Adds the elements in matrix \p B scaled by \p beta to the elements in
     *  the matrix \p A. This is required for the weight update in the gradient
     *  descent step. */
    static void ScaleAdd(TMatrixT<Scalar_t> & A,
                         const TMatrixT<Scalar_t> & B,
                         Scalar_t beta = 1.0);

    static void Copy(TMatrixT<Scalar_t> & A,
                     const TMatrixT<Scalar_t> & B);

    /** Copy from another type of matrix: \p B is converted to a
     *  TMatrixT<Scalar_t> and the result is assigned to \p A. */
    template<typename AMatrix_t>
    static void CopyDiffArch(TMatrixT<Scalar_t> & A, const AMatrix_t & B);


    /** Above functions extended to vectors of matrices. */
    static void ScaleAdd(std::vector<TMatrixT<Scalar_t>> & A,
                         const std::vector<TMatrixT<Scalar_t>> & B,
                         Scalar_t beta = 1.0);

    static void Copy(std::vector<TMatrixT<Scalar_t>> & A, const std::vector<TMatrixT<Scalar_t>> & B);

    /** Copy from another architecture: applies the matrix version of
     *  CopyDiffArch element by element. */
    template<typename AMatrix_t>
    static void CopyDiffArch(std::vector<TMatrixT<Scalar_t> > & A, const std::vector<AMatrix_t> & B);


    ///@}

    //____________________________________________________________________________
    //
    // Activation Functions
    //____________________________________________________________________________

    /** @name Activation Functions
     * For each activation function, the low-level interface contains two routines.
     * One that applies the activation function to a matrix and one that evaluates
     * the derivatives of the activation function at the elements of a given matrix
     * and writes the results into the result matrix.
     */
    ///@{
    static void Identity(TMatrixT<AReal> & B);
    static void IdentityDerivative(TMatrixT<AReal> & B,
                                   const TMatrixT<AReal> & A);

    static void Relu(TMatrixT<AReal> & B);
    static void ReluDerivative(TMatrixT<AReal> & B,
                               const TMatrixT<AReal> & A);

    static void Sigmoid(TMatrixT<AReal> & B);
    static void SigmoidDerivative(TMatrixT<AReal> & B,
                                  const TMatrixT<AReal> & A);

    static void Tanh(TMatrixT<AReal> & B);
    static void TanhDerivative(TMatrixT<AReal> & B,
                               const TMatrixT<AReal> & A);

    static void SymmetricRelu(TMatrixT<AReal> & B);
    static void SymmetricReluDerivative(TMatrixT<AReal> & B,
                                        const TMatrixT<AReal> & A);

    static void SoftSign(TMatrixT<AReal> & B);
    static void SoftSignDerivative(TMatrixT<AReal> & B,
                                   const TMatrixT<AReal> & A);

    static void Gauss(TMatrixT<AReal> & B);
    static void GaussDerivative(TMatrixT<AReal> & B,
                                const TMatrixT<AReal> & A);

    ///@}

    //____________________________________________________________________________
    //
    // Loss Functions
    //____________________________________________________________________________

    /** @name Loss Functions
     * Loss functions compute a scalar value given the \p output of the network
     * for a given training input and the expected network prediction \p Y that
     * quantifies the quality of the prediction. For each function also a routine
     * that computes the gradients (suffixed by Gradients) must be provided for
     * the starting of the backpropagation algorithm.
     */
    ///@{

    static AReal MeanSquaredError(const TMatrixT<AReal> &Y, const TMatrixT<AReal> &output,
                                  const TMatrixT<AReal> &weights);
    static void MeanSquaredErrorGradients(TMatrixT<AReal> &dY, const TMatrixT<AReal> &Y, const TMatrixT<AReal> &output,
                                          const TMatrixT<AReal> &weights);

    /** Sigmoid transformation is implicitly applied, thus \p output should
     *  hold the linear activations of the last layer in the net. */
    static AReal CrossEntropy(const TMatrixT<AReal> &Y, const TMatrixT<AReal> &output, const TMatrixT<AReal> &weights);

    static void CrossEntropyGradients(TMatrixT<AReal> &dY, const TMatrixT<AReal> &Y, const TMatrixT<AReal> &output,
                                      const TMatrixT<AReal> &weights);

    /** Softmax transformation is implicitly applied, thus \p output should
     *  hold the linear activations of the last layer in the net. */
    static AReal SoftmaxCrossEntropy(const TMatrixT<AReal> &Y, const TMatrixT<AReal> &output,
                                     const TMatrixT<AReal> &weights);
    static void SoftmaxCrossEntropyGradients(TMatrixT<AReal> &dY, const TMatrixT<AReal> &Y,
                                             const TMatrixT<AReal> &output, const TMatrixT<AReal> &weights);
    ///@}

    //____________________________________________________________________________
    //
    // Output Functions
    //____________________________________________________________________________

    /** @name Output Functions
     * Output functions transform the activations \p output of the
     * output layer in the network to a valid prediction \p YHat for
     * the desired usage of the network, e.g.  the identity function
     * for regression or the sigmoid transformation for two-class
     * classification.
     */
    ///@{
    static void Sigmoid(TMatrixT<AReal> &YHat,
                        const TMatrixT<AReal> & );
    static void Softmax(TMatrixT<AReal> &YHat,
                        const TMatrixT<AReal> & );
    ///@}

    //____________________________________________________________________________
    //
    // Regularization
    //____________________________________________________________________________

    /** @name Regularization
     * For each regularization type two functions are required, one named
     * <tt><Type>Regularization</tt> that evaluates the corresponding
     * regularization functional for a given weight matrix and the
     * <tt>Add<Type>RegularizationGradients</tt>, that adds the regularization
     * component in the gradients to the provided matrix.
     */
    ///@{

    static AReal L1Regularization(const TMatrixT<AReal> & W);
    static void AddL1RegularizationGradients(TMatrixT<AReal> & A,
                                             const TMatrixT<AReal> & W,
                                             AReal weightDecay);

    static AReal L2Regularization(const TMatrixT<AReal> & W);
    static void AddL2RegularizationGradients(TMatrixT<AReal> & A,
                                             const TMatrixT<AReal> & W,
                                             AReal weightDecay);
    ///@}

    //____________________________________________________________________________
    //
    // Initialization
    //____________________________________________________________________________

    /** @name Initialization
     * For each initialization method, one function in the low-level interface
     * is provided. The naming scheme is <tt>Initialize<Type></tt> for a given
     * initialization method Type.
     */
    ///@{

    static void InitializeGauss(TMatrixT<AReal> & A);

    static void InitializeUniform(TMatrixT<AReal> & A);

    static void InitializeIdentity(TMatrixT<AReal> & A);

    static void InitializeZero(TMatrixT<AReal> & A);

    static void InitializeGlorotUniform(TMatrixT<AReal> & A);

    static void InitializeGlorotNormal(TMatrixT<AReal> & A);

    // Return the static instance of the random generator used for initialization.
    // If the generator does not exist it is created the first time with a random seed (e.g. seed = 0).
    static TRandom & GetRandomGenerator();
    // Set the random seed for the static generator.
    // If the static generator does not exist it is created.
    static void SetRandomSeed(size_t seed);


    ///@}

    //____________________________________________________________________________
    //
    // Dropout
    //____________________________________________________________________________

    /** @name Dropout
     */
    ///@{

    /** Apply dropout with activation probability \p dropoutProbability to the
     *  given matrix \p A and scale the result by the reciprocal of
     *  \p dropoutProbability. */
    static void Dropout(TMatrixT<AReal> & A, AReal dropoutProbability);

    ///@}


    //____________________________________________________________________________
    //
    //  Convolutional Layer Propagation
    //____________________________________________________________________________

    /** @name Forward Propagation in Convolutional Layer
     */
    ///@{

    /** Transform the matrix \p B in local view format, suitable for
     *  convolution, and store it in matrix \p A. */
    static void Im2col(TMatrixT<AReal> &A, TMatrixT<AReal> &B, size_t imgHeight, size_t imgWidth, size_t fltHeight,
                       size_t fltWidth, size_t strideRows, size_t strideCols, size_t zeroPaddingHeight,
                       size_t zeroPaddingWidth);
    /** Not implemented for the reference architecture: the body only calls
     *  Fatal(). All parameters are unnamed and unused. */
    static void Im2colIndices(std::vector<int> &, const TMatrixT<AReal> &, size_t, size_t, size_t, size_t ,
                       size_t , size_t , size_t , size_t ,size_t ) {
       Fatal("Im2ColIndices","This function is not implemented for ref architectures");
    }
    /** Not implemented for the reference architecture: the body only calls
     *  Fatal(). All parameters are unnamed and unused. */
    static void Im2colFast(TMatrixT<AReal> &, const TMatrixT<AReal> &, const std::vector<int> & ) {
        Fatal("Im2ColFast","This function is not implemented for ref architectures");
    }

    /** Rotates the matrix \p B, which represents the weights,
     *  and stores the result in the matrix \p A. */
    static void RotateWeights(TMatrixT<AReal> &A, const TMatrixT<AReal> &B, size_t filterDepth, size_t filterHeight,
                              size_t filterWidth, size_t numFilters);

    /** Add the biases in the Convolutional Layer.  */
    static void AddConvBiases(TMatrixT<AReal> &output, const TMatrixT<AReal> &biases);
    ///@}

    /** Forward propagation in the Convolutional layer.
     *  Not implemented for the reference architecture: the body only calls
     *  Fatal(). The commented-out prototype below lists the parameter names. */
    // static void ConvLayerForward(std::vector<TMatrixT<AReal>> & output, std::vector<TMatrixT<AReal>> & derivatives,
    //                              const std::vector<TMatrixT<AReal>> &input,
    //                              const TMatrixT<AReal> & weights, const TMatrixT<AReal> & biases,
    //                              EActivationFunction func, const std::vector<int> & vIndices,
    //                              size_t nlocalViews, size_t nlocalViewPixels,
    //                              AReal dropoutProbability, bool applyDropout) {
    static void ConvLayerForward(std::vector<TMatrixT<AReal>> & , std::vector<TMatrixT<AReal>> &,
                                 const std::vector<TMatrixT<AReal>> &,
                                 const TMatrixT<AReal> & , const TMatrixT<AReal> & ,
                                 EActivationFunction , const std::vector<int> &,
                                 size_t , size_t,
                                 AReal , bool ) {
       Fatal("ConvLayerForward","This function is not implemented for ref architectures");
    }


    /** @name Backward Propagation in Convolutional Layer
     */
    ///@{

    /** Perform the complete backward propagation step in a Convolutional Layer.
     *  If the provided \p activationGradientsBackward matrix is not empty, compute the
     *  gradients of the objective function with respect to the activations
     *  of the previous layer (backward direction).
     *  Also compute the weight and the bias gradients. Modifies the values
     *  in \p df and thus produces only a valid result, if it is applied the
     *  first time after the corresponding forward propagation has been per-
     *  formed.
     *
     *  Not implemented for the reference architecture: the body below only
     *  calls Fatal(). The commented-out prototype lists the parameter names. */
    // static void ConvLayerBackward(std::vector<TMatrixT<AReal>> &activationGradientsBackward,
    //                               TMatrixT<AReal> &weightGradients, TMatrixT<AReal> &biasGradients,
    //                               std::vector<TMatrixT<AReal>> &df,
    //                               const std::vector<TMatrixT<AReal>> &activationGradients,
    //                               const TMatrixT<AReal> &weights, const std::vector<TMatrixT<AReal>> &activationBackward,
    //                               size_t batchSize, size_t inputHeight, size_t inputWidth, size_t depth, size_t height,
    //                               size_t width, size_t filterDepth, size_t filterHeight, size_t filterWidth,
    //                               size_t nLocalViews) {
    static void ConvLayerBackward(std::vector<TMatrixT<AReal>> &,
                                  TMatrixT<AReal> &, TMatrixT<AReal> &,
                                  std::vector<TMatrixT<AReal>> &,
                                  const std::vector<TMatrixT<AReal>> &,
                                  const TMatrixT<AReal> &, const std::vector<TMatrixT<AReal>> &,
                                  size_t , size_t , size_t , size_t , size_t,
                                  size_t , size_t , size_t , size_t ,
                                  size_t ) {
       Fatal("ConvLayerBackward","This function is not implemented for ref architectures");

    }

 #ifdef HAVE_CNN_REFERENCE
    /** Utility function for calculating the activation gradients of the layer
     *  before the convolutional layer. */
    static void CalculateConvActivationGradients(std::vector<TMatrixT<AReal>> &activationGradientsBackward,
                                                 const std::vector<TMatrixT<AReal>> &df, const TMatrixT<AReal> &weights,
                                                 size_t batchSize, size_t inputHeight, size_t inputWidth, size_t depth,
                                                 size_t height, size_t width, size_t filterDepth, size_t filterHeight,
                                                 size_t filterWidth);

    /** Utility function for calculating the weight gradients of the convolutional
     *  layer. */
    static void CalculateConvWeightGradients(TMatrixT<AReal> &weightGradients, const std::vector<TMatrixT<AReal>> &df,
                                             const std::vector<TMatrixT<AReal>> &activationBackward, size_t batchSize,
                                             size_t inputHeight, size_t inputWidth, size_t depth, size_t height,
                                             size_t width, size_t filterDepth, size_t filterHeight, size_t filterWidth,
                                             size_t nLocalViews);

    /** Utility function for calculating the bias gradients of the convolutional
     *  layer. */
    static void CalculateConvBiasGradients(TMatrixT<AReal> &biasGradients, const std::vector<TMatrixT<AReal>> &df,
                                           size_t batchSize, size_t depth, size_t nLocalViews);

 #endif
    // The group is closed outside the #ifdef so that it is terminated even
    // when HAVE_CNN_REFERENCE is not defined.
    ///@}

    //____________________________________________________________________________
    //
    //  Max Pooling Layer Propagation
    //____________________________________________________________________________
    /** @name Forward Propagation in Max Pooling Layer
     */
    ///@{

    /** Downsample the matrix \p C to the matrix \p A, using max
     *  operation, such that the winning indices are stored in matrix
     *  \p B. */
    static void Downsample(TMatrixT<AReal> &A, TMatrixT<AReal> &B, const TMatrixT<AReal> &C, size_t imgHeight,
                           size_t imgWidth, size_t fltHeight, size_t fltWidth, size_t strideRows, size_t strideCols);

    ///@}

    /** @name Backward Propagation in Max Pooling Layer
     */
    ///@{

    /** Perform the complete backward propagation step in a Max Pooling Layer. Based on the
     *  winning indices stored in the index matrix, it just forwards the activation
     *  gradients to the previous layer. */
    static void MaxPoolLayerBackward(std::vector<TMatrixT<AReal>> &activationGradientsBackward,
                                     const std::vector<TMatrixT<AReal>> &activationGradients,
                                     const std::vector<TMatrixT<AReal>> &indexMatrix, size_t batchSize, size_t depth,
                                     size_t nLocalViews);
    ///@}
    //____________________________________________________________________________
    //
    //  Reshape Layer Propagation
    //____________________________________________________________________________
    /** @name Forward and Backward Propagation in Reshape Layer
     */
    ///@{

    /** Transform the matrix \p B to a matrix with different dimensions \p A */
    static void Reshape(TMatrixT<AReal> &A, const TMatrixT<AReal> &B);

    /** Flattens the tensor \p B, such that each matrix is stretched into one row, resulting in a matrix \p A. */
    static void Flatten(TMatrixT<AReal> &A, const std::vector<TMatrixT<AReal>> &B, size_t size, size_t nRows,
                        size_t nCols);

    /** Transforms each row of \p B to a matrix and stores it in the tensor \p A. */
    static void Deflatten(std::vector<TMatrixT<AReal>> &A, const TMatrixT<Scalar_t> &B, size_t index, size_t nRows,
                          size_t nCols);
    /** Rearrange data according to time: fill the B x T x D tensor \p out from the T x B x D tensor \p in. */
    static void Rearrange(std::vector<TMatrixT<AReal>> &out, const std::vector<TMatrixT<AReal>> &in);

    ///@}

    //____________________________________________________________________________
    //
    // Additional Arithmetic Functions
    //____________________________________________________________________________

    /** Sum columns of (m x n) matrix \p A and write the results into the first
     * m elements in \p B.
     */
    static void SumColumns(TMatrixT<AReal> &B, const TMatrixT<AReal> &A);

    //____________________________________________________________________________
    //
    // AutoEncoder Propagation
    //____________________________________________________________________________

    // Add the biases to the output.
    static void AddBiases(TMatrixT<AReal> &A,
                          const TMatrixT<AReal> &biases);

    // Update the parameters after every backward pass. Weights and biases are
    // updated.
    static void
    UpdateParams(TMatrixT<AReal> &x, TMatrixT<AReal> &tildeX, TMatrixT<AReal> &y,
                 TMatrixT<AReal> &z, TMatrixT<AReal> &fVBiases,
                 TMatrixT<AReal> &fHBiases, TMatrixT<AReal> &fWeights,
                 TMatrixT<AReal> &VBiasError, TMatrixT<AReal> &HBiasError,
                 AReal learningRate, size_t fBatchSize);

    // Softmax function redefined for the auto-encoder.
    static void SoftmaxAE(TMatrixT<AReal> & A);


    // Corrupt the input values randomly, based on the corruption level.
    // Basically, inputs are currently masked.
    static void CorruptInput(TMatrixT<AReal> & input,
                             TMatrixT<AReal> & corruptedInput,
                             AReal corruptionLevel);

    // Encodes the input values in the compressed form.
    static void EncodeInput(TMatrixT<AReal> &input,
                            TMatrixT<AReal> &compressedInput,
                            TMatrixT<AReal> &Weights);

    // Reconstructs the input. The reconstructed input has the same dimensions
    // as the input.
    static void ReconstructInput(TMatrixT<AReal> & compressedInput,
                                 TMatrixT<AReal> & reconstructedInput,
                                 TMatrixT<AReal> &fWeights);


    static void ForwardLogReg(TMatrixT<AReal> &input,
                              TMatrixT<AReal> &p,
                              TMatrixT<AReal> &fWeights);

    static void UpdateParamsLogReg(TMatrixT<AReal> &input,
                                   TMatrixT<AReal> &output,
                                   TMatrixT<AReal> &difference,
                                   TMatrixT<AReal> &p,
                                   TMatrixT<AReal> &fWeights,
                                   TMatrixT<AReal> &fBiases,
                                   AReal learningRate,
                                   size_t fBatchSize);

 };


 // implement the templated member functions
 /// Copy a matrix of a different architecture into a reference matrix.
 ///
 /// \p B is first converted to a TMatrixT<AReal> through copy-initialization
 /// (so AMatrix_t must be implicitly convertible to that type), and the
 /// converted matrix is then assigned to \p A.
 ///
 /// \tparam AMatrix_t Matrix type of the source architecture.
 /// \param A Destination matrix.
 /// \param B Source matrix.
 template <typename AReal>
 template <typename AMatrix_t>
 void TReference<AReal>::CopyDiffArch(TMatrixT<AReal> &A, const AMatrix_t &B)
 {
    const TMatrixT<AReal> converted = B;
    A = converted;
 }

 /// Copy a vector of matrices of a different architecture into a vector of
 /// reference matrices, element by element.
 ///
 /// Only the elements present in both vectors are copied: the loop is bounded
 /// by the shorter of the two vectors, so a \p B with fewer elements than
 /// \p A is never indexed past its end. Neither vector is resized; elements
 /// of \p A beyond the size of \p B are left untouched.
 ///
 /// \tparam AMatrix_t Matrix type of the source architecture.
 /// \param A Destination matrices.
 /// \param B Source matrices.
 template <typename AReal>
 template <typename AMatrix_t>
 void TReference<AReal>::CopyDiffArch(std::vector<TMatrixT<AReal>> &A, const std::vector<AMatrix_t> &B)
 {
    // std::vector::operator[] performs no bounds checking, so clamp the loop
    // to the common length instead of trusting A.size() alone.
    const size_t nCommon = (A.size() < B.size()) ? A.size() : B.size();
    for (size_t i = 0; i < nCommon; ++i) {
       CopyDiffArch(A[i], B[i]);
    }
 }


 } // namespace DNN
 } // namespace TMVA

 #endif
ROOT::Math::Cephes::B
static double B[]
Definition: SpecFuncCephes.cxx:178

TMVA::DNN::TReference::SetRandomSeed
static void SetRandomSeed(size_t seed)
Definition: Initialization.cxx:29

TMVA::DNN::TReference::MaxPoolLayerBackward
static void MaxPoolLayerBackward(std::vector< TMatrixT< AReal >> &activationGradientsBackward, const std::vector< TMatrixT< AReal >> &activationGradients, const std::vector< TMatrixT< AReal >> &indexMatrix, size_t batchSize, size_t depth, size_t nLocalViews)
Perform the complete backward propagation step in a Max Pooling Layer.
Definition: Propagation.cxx:378

TMVA::DNN::TReference::InitializeGlorotUniform
static void InitializeGlorotUniform(TMatrixT< AReal > &A)
Sample from a uniform distribution in range [ -lim,+lim] where lim = sqrt(6/(N_in+N_out)).
Definition: Initialization.cxx:110

TMVA::DNN::TReference::TanhDerivative
static void TanhDerivative(TMatrixT< AReal > &B, const TMatrixT< AReal > &A)
Definition: ActivationFunctions.cxx:125

TMVA::DNN::TReference::IdentityDerivative
static void IdentityDerivative(TMatrixT< AReal > &B, const TMatrixT< AReal > &A)
Definition: ActivationFunctions.cxx:27

TMVA::DNN::TReference::AddConvBiases
static void AddConvBiases(TMatrixT< AReal > &output, const TMatrixT< AReal > &biases)
Add the biases in the Convolutional Layer.
Definition: Propagation.cxx:170

TMVA::DNN::TReference::Im2col
static void Im2col(TMatrixT< AReal > &A, TMatrixT< AReal > &B, size_t imgHeight, size_t imgWidth, size_t fltHeight, size_t fltWidth, size_t strideRows, size_t strideCols, size_t zeroPaddingHeight, size_t zeroPaddingWidth)
Transform the matrix B in local view format, suitable for convolution, and store it in matrix A...
Definition: Propagation.cxx:120

TMVA::DNN::TReference::Tanh
static void Tanh(TMatrixT< AReal > &B)
Definition: ActivationFunctions.cxx:109

TMVA::DNN::TReference::ForwardLogReg
static void ForwardLogReg(TMatrixT< AReal > &input, TMatrixT< AReal > &p, TMatrixT< AReal > &fWeights)
Definition: DenoisePropagation.cxx:171

TMVA::DNN::TReference::ConvLayerForward
static void ConvLayerForward(std::vector< TMatrixT< AReal >> &, std::vector< TMatrixT< AReal >> &, const std::vector< TMatrixT< AReal >> &, const TMatrixT< AReal > &, const TMatrixT< AReal > &, EActivationFunction, const std::vector< int > &, size_t, size_t, AReal, bool)
Forward propagation in the Convolutional layer.
Definition: Reference.h:340

Fatal
void Fatal(const char *location, const char *msgfmt,...)

TMVA::DNN::TReference::RecurrentLayerBackward
static Matrix_t & RecurrentLayerBackward(TMatrixT< Scalar_t > &state_gradients_backward, TMatrixT< Scalar_t > &input_weight_gradients, TMatrixT< Scalar_t > &state_weight_gradients, TMatrixT< Scalar_t > &bias_gradients, TMatrixT< Scalar_t > &df, const TMatrixT< Scalar_t > &state, const TMatrixT< Scalar_t > &weights_input, const TMatrixT< Scalar_t > &weights_state, const TMatrixT< Scalar_t > &input, TMatrixT< Scalar_t > &input_gradient)
Backpropagation step for a Recurrent Neural Network.
Definition: RecurrentPropagation.cxx:26

width
image html pict1_TGaxis_012 png width
Define new text attributes for the label number "labNum".
Definition: TGaxis.cxx:2551

TMVA::DNN::TReference::Im2colIndices
static void Im2colIndices(std::vector< int > &, const TMatrixT< AReal > &, size_t, size_t, size_t, size_t, size_t, size_t, size_t, size_t, size_t)
Definition: Reference.h:316

Functions.h

TMVA::DNN::TReference::SoftmaxCrossEntropy
static AReal SoftmaxCrossEntropy(const TMatrixT< AReal > &Y, const TMatrixT< AReal > &output, const TMatrixT< AReal > &weights)
Softmax transformation is implicitly applied, thus output should hold the linear activations of the l...
Definition: LossFunctions.cxx:107

TMVA::DNN::TReference::Sigmoid
static void Sigmoid(TMatrixT< AReal > &B)

TMVA::DNN::TReference::CrossEntropy
static AReal CrossEntropy(const TMatrixT< AReal > &Y, const TMatrixT< AReal > &output, const TMatrixT< AReal > &weights)
Sigmoid transformation is implicitly applied, thus output should hold the linear activations of the l...
Definition: LossFunctions.cxx:64

TMVA::DNN::TReference::SigmoidDerivative
static void SigmoidDerivative(TMatrixT< AReal > &B, const TMatrixT< AReal > &A)
Definition: ActivationFunctions.cxx:92

TMVA::DNN::TReference::SoftSign
static void SoftSign(TMatrixT< AReal > &B)
Definition: ActivationFunctions.cxx:173

TMVA::DNN::TReference::Identity
static void Identity(TMatrixT< AReal > &B)

TMVA::DNN::TReference::SymmetricReluDerivative
static void SymmetricReluDerivative(TMatrixT< AReal > &B, const TMatrixT< AReal > &A)
Definition: ActivationFunctions.cxx:157

ROOT::Math::Cephes::A
static double A[]
Definition: SpecFuncCephes.cxx:170

ROOT::Math::beta
double beta(double x, double y)
Calculates the beta function.
Definition: SpecFuncMathCore.cxx:111

TMatrixT< AReal >

TMVA::DNN::TReference::Im2colFast
static void Im2colFast(TMatrixT< AReal > &, const TMatrixT< AReal > &, const std::vector< int > &)
Definition: Reference.h:320

TMVA::DNN::TReference::AddL2RegularizationGradients
static void AddL2RegularizationGradients(TMatrixT< AReal > &A, const TMatrixT< AReal > &W, AReal weightDecay)
Definition: Regularization.cxx:82

x
Double_t x[n]
Definition: legend1.C:17

TMVA::DNN::weightDecay
double weightDecay(double error, ItWeight itWeight, ItWeight itWeightEnd, double factorWeightDecay, EnumRegularization eRegularization)
compute the weight decay for regularization (L1 or L2)
Definition: NeuralNet.icc:496

TRandom
This is the base class for the ROOT Random number generators.
Definition: TRandom.h:27

TMVA::DNN::TReference::SoftmaxAE
static void SoftmaxAE(TMatrixT< AReal > &A)
Definition: DenoisePropagation.cxx:85

TMVA::DNN::TReference::Flatten
static void Flatten(TMatrixT< AReal > &A, const std::vector< TMatrixT< AReal >> &B, size_t size, size_t nRows, size_t nCols)
Flattens the tensor B, such that each matrix, is stretched in one row, resulting with a matrix A...
Definition: Propagation.cxx:418

TMVA::DNN::TReference::Copy
static void Copy(TMatrixT< Scalar_t > &A, const TMatrixT< Scalar_t > &B)
Definition: Propagation.cxx:86

DataLoader.h

TMVA::DNN::TReference::GetRandomGenerator
static TRandom & GetRandomGenerator()
Definition: Initialization.cxx:35

TMVA::DNN::TReference::SoftmaxCrossEntropyGradients
static void SoftmaxCrossEntropyGradients(TMatrixT< AReal > &dY, const TMatrixT< AReal > &Y, const TMatrixT< AReal > &output, const TMatrixT< AReal > &weights)
Definition: LossFunctions.cxx:131

TMVA::DNN::TReference::ReconstructInput
static void ReconstructInput(TMatrixT< AReal > &compressedInput, TMatrixT< AReal > &reconstructedInput, TMatrixT< AReal > &fWeights)
Definition: DenoisePropagation.cxx:152

TMVA::DNN::TReference::ConvLayerBackward
static void ConvLayerBackward(std::vector< TMatrixT< AReal >> &, TMatrixT< AReal > &, TMatrixT< AReal > &, std::vector< TMatrixT< AReal >> &, const std::vector< TMatrixT< AReal >> &, const TMatrixT< AReal > &, const std::vector< TMatrixT< AReal >> &, size_t, size_t, size_t, size_t, size_t, size_t, size_t, size_t, size_t, size_t)
Perform the complete backward propagation step in a Convolutional Layer.
Definition: Reference.h:370

TMVA::DNN::TReference::Scalar_t
AReal Scalar_t
Definition: Reference.h:49

TMVA::DNN::TReference::Reshape
static void Reshape(TMatrixT< AReal > &A, const TMatrixT< AReal > &B)
Transform the matrix B to a matrix with different dimensions A.
Definition: Propagation.cxx:403

TMVA::DNN::TReference::RotateWeights
static void RotateWeights(TMatrixT< AReal > &A, const TMatrixT< AReal > &B, size_t filterDepth, size_t filterHeight, size_t filterWidth, size_t numFilters)
Rotates the matrix B, which represents the weights, and stores the result in the matrix A...
Definition: Propagation.cxx:155

TMVA::DNN::TReference::L1Regularization
static AReal L1Regularization(const TMatrixT< AReal > &W)
Definition: Regularization.cxx:26

TMVA::DNN::TReference::InitializeUniform
static void InitializeUniform(TMatrixT< AReal > &A)
Definition: Initialization.cxx:62

TMVA::DNN::TReference::AddL1RegularizationGradients
static void AddL1RegularizationGradients(TMatrixT< AReal > &A, const TMatrixT< AReal > &W, AReal weightDecay)
Definition: Regularization.cxx:44

TMVA::DNN::TReference::InitializeGlorotNormal
static void InitializeGlorotNormal(TMatrixT< AReal > &A)
Truncated normal initialization (Glorot, also called Xavier normal). The values are sampled with a norm...
Definition: Initialization.cxx:85

TMVA::DNN::TReference::Backward
static void Backward(TMatrixT< Scalar_t > &activationGradientsBackward, TMatrixT< Scalar_t > &weightGradients, TMatrixT< Scalar_t > &biasGradients, TMatrixT< Scalar_t > &df, const TMatrixT< Scalar_t > &activationGradients, const TMatrixT< Scalar_t > &weights, const TMatrixT< Scalar_t > &activationBackward)
Perform the complete backward propagation step.
Definition: Propagation.cxx:40

TMVA::DNN::TReference::Relu
static void Relu(TMatrixT< AReal > &B)
Definition: ActivationFunctions.cxx:43

TensorDataLoader.h

TMVA::DNN::TReference::SymmetricRelu
static void SymmetricRelu(TMatrixT< AReal > &B)
Definition: ActivationFunctions.cxx:142

ROOT::Math::Cephes::C
static double C[]
Definition: SpecFuncCephes.cxx:187

TMVA::DNN::TReference::InitializeZero
static void InitializeZero(TMatrixT< AReal > &A)
Definition: Initialization.cxx:148

ClassificationKeras.output
output
Definition: ClassificationKeras.py:16

TMVA::DNN::TReference::Deflatten
static void Deflatten(std::vector< TMatrixT< AReal >> &A, const TMatrixT< Scalar_t > &B, size_t index, size_t nRows, size_t nCols)
Transforms each row of B to a matrix and stores it in the tensor A.
Definition: Propagation.cxx:432

TMVA::DNN::TReference::CorruptInput
static void CorruptInput(TMatrixT< AReal > &input, TMatrixT< AReal > &corruptedInput, AReal corruptionLevel)
Definition: DenoisePropagation.cxx:108

TMVA::DNN::TReference::L2Regularization
static AReal L2Regularization(const TMatrixT< AReal > &W)
Definition: Regularization.cxx:64

TMVA::DNN::TReference::ReluDerivative
static void ReluDerivative(TMatrixT< AReal > &B, const TMatrixT< AReal > &A)
Definition: ActivationFunctions.cxx:58

TMVA::DNN::TReference::AddBiases
static void AddBiases(TMatrixT< AReal > &A, const TMatrixT< AReal > &biases)
Definition: DenoisePropagation.cxx:30

TMVA::DNN::TReference::SumColumns
static void SumColumns(TMatrixT< AReal > &B, const TMatrixT< AReal > &A)
Sum columns of (m x n) matrix A and write the results into the first m elements in B...
Definition: Propagation.cxx:108

TMVA::DNN::TReference::CrossEntropyGradients
static void CrossEntropyGradients(TMatrixT< AReal > &dY, const TMatrixT< AReal > &Y, const TMatrixT< AReal > &output, const TMatrixT< AReal > &weights)
Definition: LossFunctions.cxx:85

TMVA::DNN::TReference::UpdateParamsLogReg
static void UpdateParamsLogReg(TMatrixT< AReal > &input, TMatrixT< AReal > &output, TMatrixT< AReal > &difference, TMatrixT< AReal > &p, TMatrixT< AReal > &fWeights, TMatrixT< AReal > &fBiases, AReal learningRate, size_t fBatchSize)
Definition: DenoisePropagation.cxx:191

TMVA::DNN::TReference::GaussDerivative
static void GaussDerivative(TMatrixT< AReal > &B, const TMatrixT< AReal > &A)
Definition: ActivationFunctions.cxx:222

TMVA::DNN::TReference::Softmax
static void Softmax(TMatrixT< AReal > &YHat, const TMatrixT< AReal > &)
Definition: OutputFunctions.cxx:37

TMVA::DNN::TReference::fgRandomGen
static TRandom * fgRandomGen
Definition: Reference.h:46

TMVA::DNN::TReference::Downsample
static void Downsample(TMatrixT< AReal > &A, TMatrixT< AReal > &B, const TMatrixT< AReal > &C, size_t imgHeight, size_t imgWidth, size_t fltHeight, size_t fltWidth, size_t strideRows, size_t strideCols)
Downsample the matrix C to the matrix A, using max operation, such that the winning indices are store...
Definition: Propagation.cxx:345

y
Double_t y[n]
Definition: legend1.C:17

TMVA::DNN::TReference::ScaleAdd
static void ScaleAdd(TMatrixT< Scalar_t > &A, const TMatrixT< Scalar_t > &B, Scalar_t beta=1.0)
Adds the elements in matrix B scaled by beta to the elements in the matrix A.
Definition: Propagation.cxx:76

TMVA::DNN::TReference::EncodeInput
static void EncodeInput(TMatrixT< AReal > &input, TMatrixT< AReal > &compressedInput, TMatrixT< AReal > &Weights)
Definition: DenoisePropagation.cxx:134

TMVA::DNN::TReference::InitializeIdentity
static void InitializeIdentity(TMatrixT< AReal > &A)
Definition: Initialization.cxx:129

z
you should not use this method at all Int_t Int_t z
Definition: TRolke.cxx:630

TMVA::DNN::TReference::SoftSignDerivative
static void SoftSignDerivative(TMatrixT< AReal > &B, const TMatrixT< AReal > &A)
Definition: ActivationFunctions.cxx:189

TMVA
Abstract ClassifierFactory template that handles arbitrary types.
Definition: GeneticMinimizer.h:21

TMVA::DNN::TReference::InitializeGauss
static void InitializeGauss(TMatrixT< AReal > &A)
Definition: Initialization.cxx:43

TMatrix.h

TMVA::DNN::EActivationFunction
EActivationFunction
Enum that represents layer activation functions.
Definition: Functions.h:31

TMVA::DNN::TReference::CopyDiffArch
static void CopyDiffArch(TMatrixT< Scalar_t > &A, const AMatrix_t &B)
Definition: Reference.h:527

TMVA::DNN::TReference::Rearrange
static void Rearrange(std::vector< TMatrixT< AReal >> &out, const std::vector< TMatrixT< AReal >> &in)
Rearrange data according to time: fill the B x T x D tensor out with the T x B x D tensor in.
Definition: Propagation.cxx:446

TMVA::DNN::TReference::MultiplyTranspose
static void MultiplyTranspose(TMatrixT< Scalar_t > &output, const TMatrixT< Scalar_t > &input, const TMatrixT< Scalar_t > &weights)
Matrix-multiply input with the transpose of weights and write the results into output.
Definition: Propagation.cxx:23

TMVA::DNN::TReference::MeanSquaredErrorGradients
static void MeanSquaredErrorGradients(TMatrixT< AReal > &dY, const TMatrixT< AReal > &Y, const TMatrixT< AReal > &output, const TMatrixT< AReal > &weights)
Definition: LossFunctions.cxx:45

TMVA::DNN::TReference::AddRowWise
static void AddRowWise(TMatrixT< Scalar_t > &output, const TMatrixT< Scalar_t > &biases)
Add the vector biases row-wise to the matrix output.
Definition: Propagation.cxx:30

TMVA::DNN::TReference::Gauss
static void Gauss(TMatrixT< AReal > &B)
Definition: ActivationFunctions.cxx:206

TMVA::DNN::TReference::MeanSquaredError
static AReal MeanSquaredError(const TMatrixT< AReal > &Y, const TMatrixT< AReal > &output, const TMatrixT< AReal > &weights)
Definition: LossFunctions.cxx:25

TMVA::DNN::TReference::Dropout
static void Dropout(TMatrixT< AReal > &A, AReal dropoutProbability)
Apply dropout with activation probability p to the given matrix A and scale the result by reciprocal ...
Definition: Dropout.cxx:29

TMVA::DNN::TReference::UpdateParams
static void UpdateParams(TMatrixT< AReal > &x, TMatrixT< AReal > &tildeX, TMatrixT< AReal > &y, TMatrixT< AReal > &z, TMatrixT< AReal > &fVBiases, TMatrixT< AReal > &fHBiases, TMatrixT< AReal > &fWeights, TMatrixT< AReal > &VBiasError, TMatrixT< AReal > &HBiasError, AReal learningRate, size_t fBatchSize)
Definition: DenoisePropagation.cxx:48