doc/v616/Cuda_8h_source.html

// @(#)root/tmva/tmva/dnn:$Id$

// Author: Simon Pfreundschuh 05/07/16


/*************************************************************************

 * Copyright (C) 2016, Simon Pfreundschuh                                *

 * All rights reserved.                                                  *

 *                                                                       *

 * For the licensing terms see $ROOTSYS/LICENSE.                         *

 * For the list of contributors see $ROOTSYS/README/CREDITS.             *

 *************************************************************************/


///////////////////////////////////////////////////////////////////

// Definition of the TCuda architecture class, which provides an //

// implementation of the low-level functionality for neural      //

// networks for the CUDA computing architectures.                //

///////////////////////////////////////////////////////////////////


#ifndef TMVA_DNN_ARCHITECTURES_CUDA

#define TMVA_DNN_ARCHITECTURES_CUDA


#include "TMVA/DNN/Functions.h"

#include "TMVA/DNN/CNN/ConvLayer.h"


#include "cuda.h"

#include "Cuda/CudaBuffers.h"

#include "Cuda/CudaMatrix.h"

#include "TMVA/DNN/DataLoader.h"

#include <utility>

#include <vector>


class TRandom;


namespace TMVA

{

namespace DNN

{


/** The TCuda architecture class.

 *

 * Low-level interface class for CUDA computing architectures. Contains as

 * public types the declaration of the scalar, matrix and buffer types

 * for this architecture as well as the remaining functions in the low-level

 * interface in the form of static members.

 */

template<typename AFloat = Real_t>
class TCuda
{
private:
   /** Static random generator instance; accessed through GetRandomGenerator()
    *  and (re)seeded through SetRandomSeed(). */
   static TRandom * fgRandomGen;
public:

    /** Scalar, matrix and buffer types exposed by this architecture. */
    using Scalar_t       = AFloat;
    using Matrix_t       = TCudaMatrix<AFloat>;
    using DeviceBuffer_t = TCudaDeviceBuffer<AFloat>;
    using HostBuffer_t   = TCudaHostBuffer<AFloat>;

   //____________________________________________________________________________
   //
   // Propagation
   //____________________________________________________________________________

   /** @name Forward Propagation
    * Low-level functions required for the forward propagation of activations
    * through the network.
    */
   ///@{
   /** Matrix-multiply \p input with the transpose of \p weights and
    *  write the results into \p output. */
   static void MultiplyTranspose(TCudaMatrix<AFloat> &output,
                                 const TCudaMatrix<AFloat> &input,
                                 const TCudaMatrix<AFloat> &weights);
   /** Add the vector \p biases row-wise to the matrix \p output. */
   static void AddRowWise(TCudaMatrix<AFloat> &output,
                          const TCudaMatrix<AFloat> &biases);
   ///@}

   /** @name Backward Propagation
    * Low-level functions required for the backward propagation of gradients
    * through the network.
    */
   ///@{
   /** Perform the complete backward propagation step. If the provided
    *  \p activationGradientsBackward matrix is not empty, compute the
    *  gradients of the objective function with respect to the activations
    *  of the previous layer (backward direction).
    *  Also compute the weight and the bias gradients. Modifies the values
    *  in \p df and thus produces a valid result only if it is applied the
    *  first time after the corresponding forward propagation has been
    *  performed. */
   static void Backward(TCudaMatrix<AFloat> & activationGradientsBackward,
                        TCudaMatrix<AFloat> & weightGradients,
                        TCudaMatrix<AFloat> & biasGradients,
                        TCudaMatrix<AFloat> & df,
                        const TCudaMatrix<AFloat> & activationGradients,
                        const TCudaMatrix<AFloat> & weights,
                        const TCudaMatrix<AFloat> & activationBackward);
   /** Backward pass for Recurrent Networks.
    *
    *  The trailing comments on the parameters give the expected matrix
    *  dimensions as written by the original author (B, H, D are not defined
    *  in this header; presumably batch size, state size and input size --
    *  TODO confirm).
    *  \return a reference to a Matrix_t; which matrix it refers to is not
    *          visible from this declaration. */
  static Matrix_t & RecurrentLayerBackward(TCudaMatrix<AFloat> & state_gradients_backward, // BxH
                                           TCudaMatrix<AFloat> & input_weight_gradients,
                                           TCudaMatrix<AFloat> & state_weight_gradients,
                                           TCudaMatrix<AFloat> & bias_gradients,
                                           TCudaMatrix<AFloat> & df, //DxH
                                           const TCudaMatrix<AFloat> & state, // BxH
                                           const TCudaMatrix<AFloat> & weights_input, // HxD
                                           const TCudaMatrix<AFloat> & weights_state, // HxH
                                           const TCudaMatrix<AFloat> & input,  // BxD
                                           TCudaMatrix<AFloat> & input_gradient);
   /** Adds the elements in matrix \p B scaled by \p beta to the elements in
    *  the matrix \p A. This is required for the weight update in the gradient
    *  descent step. \p beta defaults to 1.0. */
   static void ScaleAdd(TCudaMatrix<AFloat> & A,
                        const TCudaMatrix<AFloat> & B,
                        Scalar_t beta = 1.0);
   /** Copy the elements of matrix \p A into matrix \p B. */
   static void Copy(TCudaMatrix<AFloat> & B,
                    const TCudaMatrix<AFloat> & A);

   /** Copy from another type of matrix: the matrix \p A of type \p AMatrix_t
    *  is copied into the CUDA matrix \p B. The definition following this
    *  class converts \p A through a temporary TMatrixT<AFloat>. */
   template<typename AMatrix_t>
   static void CopyDiffArch(TCudaMatrix<Scalar_t> & B, const AMatrix_t & A);

   /** Above functions extended to vectors of matrices. */
   static void ScaleAdd(std::vector<TCudaMatrix<Scalar_t>> & A,
                        const std::vector<TCudaMatrix<Scalar_t>> & B,
                        Scalar_t beta = 1.0);

   /** Vector version of Copy. Note that here the non-const (destination)
    *  argument is named \p A and the const (source) argument \p B, i.e. the
    *  names are swapped with respect to the single-matrix overload. */
   static void Copy(std::vector<TCudaMatrix<Scalar_t>> & A,
                    const std::vector<TCudaMatrix<Scalar_t>> & B);

   /** Copy from another architecture, element by element. In this
    *  declaration the destination is named \p A and the source \p B; the
    *  out-of-class definition names them the other way round (destination
    *  B, source A). Only the names differ, the parameter order is the same. */
   template<typename AMatrix_t>
   static void CopyDiffArch(std::vector<TCudaMatrix<Scalar_t>> & A,
                    const std::vector<AMatrix_t> & B);

   ///@}

   //____________________________________________________________________________
   //
   // Activation Functions
   //____________________________________________________________________________

   /** @name Activation Functions
    * For each activation function, the low-level interface contains two routines:
    * one that applies the activation function to a matrix and one that evaluates
    * the derivatives of the activation function at the elements of a given matrix
    * and writes the results into the result matrix.
    */
   ///@{
   static void Identity(TCudaMatrix<AFloat> & B);
   static void IdentityDerivative(TCudaMatrix<AFloat> & B,
                                  const TCudaMatrix<AFloat> & A);

   static void Relu(TCudaMatrix<AFloat> & B);
   static void ReluDerivative(TCudaMatrix<AFloat> & B,
                              const TCudaMatrix<AFloat> & A);

   static void Sigmoid(TCudaMatrix<AFloat> & B);
   static void SigmoidDerivative(TCudaMatrix<AFloat> & B,
                                 const TCudaMatrix<AFloat> & A);

   static void Tanh(TCudaMatrix<AFloat> & B);
   static void TanhDerivative(TCudaMatrix<AFloat> & B,
                              const TCudaMatrix<AFloat> & A);

   static void SymmetricRelu(TCudaMatrix<AFloat> & B);
   static void SymmetricReluDerivative(TCudaMatrix<AFloat> & B,
                                       const TCudaMatrix<AFloat> & A);

   static void SoftSign(TCudaMatrix<AFloat> & B);
   static void SoftSignDerivative(TCudaMatrix<AFloat> & B,
                                  const TCudaMatrix<AFloat> & A);

   static void Gauss(TCudaMatrix<AFloat> & B);
   static void GaussDerivative(TCudaMatrix<AFloat> & B,
                               const TCudaMatrix<AFloat> & A);
   ///@}

   //____________________________________________________________________________
   //
   // Loss Functions
   //____________________________________________________________________________

   /** @name Loss Functions
    * Loss functions compute a scalar value given the \p output of the network
    * for a given training input and the expected network prediction \p Y that
    * quantifies the quality of the prediction. For each function also a routine
    * that computes the gradients (suffixed by Gradients) must be provided for
    * the starting of the backpropagation algorithm.
    */
   ///@{

   static AFloat MeanSquaredError(const TCudaMatrix<AFloat> &Y, const TCudaMatrix<AFloat> &output,
                                  const TCudaMatrix<AFloat> &weights);
   static void MeanSquaredErrorGradients(TCudaMatrix<AFloat> &dY, const TCudaMatrix<AFloat> &Y,
                                         const TCudaMatrix<AFloat> &output, const TCudaMatrix<AFloat> &weights);

   /** Sigmoid transformation is implicitly applied, thus \p output should
    *  hold the linear activations of the last layer in the net. */
   static AFloat CrossEntropy(const TCudaMatrix<AFloat> &Y, const TCudaMatrix<AFloat> &output,
                              const TCudaMatrix<AFloat> &weights);

   static void CrossEntropyGradients(TCudaMatrix<AFloat> &dY, const TCudaMatrix<AFloat> &Y,
                                     const TCudaMatrix<AFloat> &output, const TCudaMatrix<AFloat> &weights);

   /** Softmax transformation is implicitly applied, thus \p output should
    *  hold the linear activations of the last layer in the net. */
   static AFloat SoftmaxCrossEntropy(const TCudaMatrix<AFloat> &Y, const TCudaMatrix<AFloat> &output,
                                     const TCudaMatrix<AFloat> &weights);
   static void SoftmaxCrossEntropyGradients(TCudaMatrix<AFloat> &dY, const TCudaMatrix<AFloat> &Y,
                                            const TCudaMatrix<AFloat> &output, const TCudaMatrix<AFloat> &weights);
   ///@}

   //____________________________________________________________________________
   //
   // Output Functions
   //____________________________________________________________________________

   /** @name Output Functions
    * Output functions transform the activations \p output of the
    * output layer in the network to a valid prediction \p YHat for
    * the desired usage of the network, e.g. the identity function
    * for regression or the sigmoid transformation for two-class
    * classification. In the declarations below the second (const)
    * argument is left unnamed.
    */
   ///@{
   static void Sigmoid(TCudaMatrix<AFloat> &YHat,
                       const TCudaMatrix<AFloat> & );
   static void Softmax(TCudaMatrix<AFloat> &YHat,
                       const TCudaMatrix<AFloat> & );
   ///@}

   //____________________________________________________________________________
   //
   // Regularization
   //____________________________________________________________________________

   /** @name Regularization
    * For each regularization type two functions are required, one named
    * <tt><Type>Regularization</tt> that evaluates the corresponding
    * regularization functional for a given weight matrix and the
    * <tt>Add<Type>RegularizationGradients</tt>, that adds the regularization
    * component in the gradients to the provided matrix.
    */
   ///@{

   static AFloat L1Regularization(const TCudaMatrix<AFloat> & W);
   static void AddL1RegularizationGradients(TCudaMatrix<AFloat> & A,
                                            const TCudaMatrix<AFloat> & W,
                                            AFloat weightDecay);

   static AFloat L2Regularization(const TCudaMatrix<AFloat> & W);
   static void AddL2RegularizationGradients(TCudaMatrix<AFloat> & A,
                                            const TCudaMatrix<AFloat> & W,
                                            AFloat weightDecay);
   ///@}

   //____________________________________________________________________________
   //
   // Initialization
   //____________________________________________________________________________

   /** @name Initialization
    * For each initialization method, one function in the low-level interface
    * is provided. The naming scheme is <tt>Initialize<Type></tt> for a given
    * initialization method Type.
    */
   ///@{

   static void InitializeGauss(TCudaMatrix<AFloat> & A);
   static void InitializeUniform(TCudaMatrix<AFloat> & A);
   static void InitializeIdentity(TCudaMatrix<AFloat> & A);
   static void InitializeZero(TCudaMatrix<AFloat> & A);
   static void InitializeGlorotUniform(TCudaMatrix<AFloat> & A);
   static void InitializeGlorotNormal(TCudaMatrix<AFloat> & A);
   // Return the static instance of the random generator used for initialization.
   // If the generator does not exist yet, it is created on first use with a
   // random seed (e.g. seed = 0).
   static TRandom & GetRandomGenerator();
   // Set the random seed of the static generator.
   // If the static generator does not exist yet, it is created.
   static void SetRandomSeed(size_t seed);

   ///@}

   //____________________________________________________________________________
   //
   // Dropout
   //____________________________________________________________________________

   /** @name Dropout
    */
   ///@{

   /** Apply dropout with activation probability \p p to the given
    *  matrix \p A and scale the result by the reciprocal of \p p. */
   static void Dropout(TCudaMatrix<AFloat> & A, AFloat p);

   ///@}

   //____________________________________________________________________________
   //
   //  Convolutional Layer Propagation
   //____________________________________________________________________________

   /** @name Forward Propagation in Convolutional Layer
    */
   ///@{

   /** Attaches a CUDA stream to each matrix in order to accommodate parallel kernel launches. */
   static void PrepareInternals(std::vector<TCudaMatrix<AFloat>> & inputPrime);

   /** Calculate how many neurons "fit" in the output layer, given the input as well as the layer's hyperparameters. */
   static size_t calculateDimension(size_t imgDim, size_t fltDim, size_t padding, size_t stride);

   /** Transform the matrix \p B into local view format, suitable for
    *  convolution, and store it in matrix \p A. */
   static void Im2col(TCudaMatrix<AFloat> &A,
                      const TCudaMatrix<AFloat> &B,
                      size_t imgHeight,
                      size_t imgWidth,
                      size_t fltHeight,
                      size_t fltWidth,
                      size_t strideRows,
                      size_t strideCols,
                      size_t zeroPaddingHeight,
                      size_t zeroPaddingWidth);

   /** Intentionally empty on this architecture: the body is `{}` and every
    *  parameter is unnamed, so calling it has no effect. */
   static void Im2colIndices(std::vector<int> & /* V */, const TCudaMatrix<AFloat> & /* B */, size_t /* nLocalViews */,
                             size_t /* imgHeight */, size_t /* imgWidth */, size_t /* fltHeight */,
                             size_t /* fltWidth */, size_t /* strideRows */, size_t /* strideCols */,
                             size_t /* zeroPaddingHeight */, size_t /* zeroPaddingWidth */) {}
   /** Intentionally empty on this architecture: the body is `{}` and every
    *  parameter is unnamed, so calling it has no effect. */
   static void Im2colFast(TCudaMatrix<AFloat> & /* A */, const TCudaMatrix<AFloat> & /* B */,
                          const std::vector<int> & /* V */) {}

   /** Rotates the matrix \p B, which represents the weights,
    *  and stores the result in the matrix \p A. */
   static void RotateWeights(TCudaMatrix<AFloat> &A, const TCudaMatrix<AFloat> &B, size_t filterDepth,
                             size_t filterHeight, size_t filterWidth, size_t numFilters);

   /** Add the biases in the Convolutional Layer.  */
   static void AddConvBiases(TCudaMatrix<AFloat> &output, const TCudaMatrix<AFloat> &biases);

   /** Forward propagation in the Convolutional layer */
   static void ConvLayerForward(std::vector<TCudaMatrix<AFloat>> & output,
                                std::vector<TCudaMatrix<AFloat>> & derivatives,
                                const std::vector<TCudaMatrix<AFloat>> &input,
                                const TCudaMatrix<AFloat> &weights, const TCudaMatrix<AFloat> & biases,
                                const DNN::CNN::TConvParams & params, EActivationFunction activFunc,
                                std::vector<TCudaMatrix<AFloat>> & inputPrime);
   ///@}

   /** @name Backward Propagation in Convolutional Layer
    */
   ///@{

   /** Perform the complete backward propagation step in a Convolutional Layer.
    *  If the provided \p activationGradientsBackward matrix is not empty, compute the
    *  gradients of the objective function with respect to the activations
    *  of the previous layer (backward direction).
    *  Also compute the weight and the bias gradients. Modifies the values
    *  in \p df and thus produces a valid result only if it is applied the
    *  first time after the corresponding forward propagation has been
    *  performed. */
   static void ConvLayerBackward(std::vector<TCudaMatrix<AFloat>> &activationGradientsBackward,
                                 TCudaMatrix<AFloat> &weightGradients, TCudaMatrix<AFloat> &biasGradients,
                                 std::vector<TCudaMatrix<AFloat>> &df,
                                 const std::vector<TCudaMatrix<AFloat>> &activationGradients,
                                 const TCudaMatrix<AFloat> &weights,
                                 const std::vector<TCudaMatrix<AFloat>> &activationBackward, size_t batchSize,
                                 size_t inputHeight, size_t inputWidth, size_t depth, size_t height, size_t width,
                                 size_t filterDepth, size_t filterHeight, size_t filterWidth, size_t nLocalViews);

   /** Utility function for calculating the activation gradients of the layer
    *  before the convolutional layer. */
   static void CalculateConvActivationGradients(std::vector<TCudaMatrix<AFloat>> &activationGradientsBackward,
                                                std::vector<TCudaMatrix<AFloat>> &df,
                                                const TCudaMatrix<AFloat> &weights, size_t batchSize,
                                                size_t inputHeight, size_t inputWidth, size_t depth, size_t height,
                                                size_t width, size_t filterDepth, size_t filterHeight,
                                                size_t filterWidth);

   /** Utility function for calculating the weight gradients of the convolutional
    *  layer. */
   static void CalculateConvWeightGradients(TCudaMatrix<AFloat> &weightGradients, std::vector<TCudaMatrix<AFloat>> &df,
                                            const std::vector<TCudaMatrix<AFloat>> &activations_backward,
                                            size_t batchSize, size_t inputHeight, size_t inputWidth, size_t depth,
                                            size_t height, size_t width, size_t filterDepth, size_t filterHeight,
                                            size_t filterWidth, size_t nLocalViews);

   /** Utility function for calculating the bias gradients of the convolutional
    *  layer. */
   static void CalculateConvBiasGradients(TCudaMatrix<AFloat> &biasGradients, std::vector<TCudaMatrix<AFloat>> &df,
                                          size_t batchSize, size_t depth, size_t nLocalViews);

   ///@}

   //____________________________________________________________________________
   //
   //  Max Pooling Layer Propagation
   //____________________________________________________________________________
   /** @name Forward Propagation in Max Pooling Layer
    */
   ///@{

   /** Downsample the matrix \p C to the matrix \p A, using the max
    *  operation, such that the winning indices are stored in matrix
    *  \p B. */
   static void Downsample(TCudaMatrix<AFloat> &A, TCudaMatrix<AFloat> &B, const TCudaMatrix<AFloat> &C,
                          size_t imgHeight, size_t imgWidth, size_t fltHeight, size_t fltWidth,
                          size_t strideRows, size_t strideCols);
   ///@}

   /** @name Backward Propagation in Max Pooling Layer
    */
   ///@{

   /** Perform the complete backward propagation step in a Pooling Layer. Based on the
    *  winning indices stored in the index matrix, it just forwards the activation
    *  gradients to the previous layer. */
   static void MaxPoolLayerBackward(TCudaMatrix<AFloat> &activationGradientsBackward,
                                    const TCudaMatrix<AFloat> &activationGradients,
                                    const TCudaMatrix<AFloat> &indexMatrix,
                                    size_t imgHeight,
                                    size_t imgWidth,
                                    size_t fltHeight,
                                    size_t fltWidth,
                                    size_t strideRows,
                                    size_t strideCols,
                                    size_t nLocalViews);

   ///@}

   //____________________________________________________________________________
   //
   //  Reshape Layer Propagation
   //____________________________________________________________________________
   /** @name Forward and Backward Propagation in Reshape Layer
    */
   ///@{

   /** Transform the matrix \p B to a matrix with different dimensions \p A */
   static void Reshape(TCudaMatrix<AFloat> &A, const TCudaMatrix<AFloat> &B);

   /** Flattens the tensor \p B, such that each matrix is stretched into
    *  one row, resulting in a matrix \p A. */
   static void Flatten(TCudaMatrix<AFloat> &A, const std::vector<TCudaMatrix<AFloat>> &B, size_t size, size_t nRows,
                       size_t nCols);

   /** Transforms each row of \p B to a matrix and stores it in the tensor \p A. */
   static void Deflatten(std::vector<TCudaMatrix<AFloat>> &A, const TCudaMatrix<AFloat> &B, size_t index, size_t nRows,
                         size_t nCols);
   /** Rearrange data according to time: fill the B x T x D tensor \p out
    *  from the T x B x D tensor \p in. */
   static void Rearrange(std::vector<TCudaMatrix<AFloat>> &out, const std::vector<TCudaMatrix<AFloat>> &in);

   ///@}

   //____________________________________________________________________________
   //
   // Additional Arithmetic Functions
   //____________________________________________________________________________

   /** @name Additional Arithmetic Functions
    *
    * Additional arithmetic on CUDA matrices used to implement the low-level
    * interface.
    */
   ///@{

   /** Standard multiplication of two matrices \p A and \p B with the result being
    *  written into \p C.
    */
   static void Multiply(TCudaMatrix<AFloat> & C,
                        const TCudaMatrix<AFloat> & A,
                        const TCudaMatrix<AFloat> & B);
   /** Matrix multiplication of two matrices \p A and \p B^T (transposed) with the
    *  result being written into C.
    *
    *  NOTE(review): the parameters are actually named \p output, \p input and
    *  \p Weights, and this description is identical to what MultiplyTranspose
    *  documents. Which operand is transposed cannot be told from this
    *  declaration -- confirm against the implementation.
    */
   static void TransposeMultiply(TCudaMatrix<AFloat> & output,
                                 const TCudaMatrix<AFloat> & input,
                                 const TCudaMatrix<AFloat> & Weights);
   /** In-place Hadamard (element-wise) product of matrices \p A and \p B
    *  with the result being written into \p A.
    */
   static void Hadamard(TCudaMatrix<AFloat> & A, const TCudaMatrix<AFloat> & B);

   /** Sum columns of (m x n) matrix \p A and write the results into the first
    * m elements in \p B.
    *
    * NOTE(review): a column-wise sum of an (m x n) matrix has n entries;
    * confirm whether "m" is what is meant here.
    */
   static void SumColumns(TCudaMatrix<AFloat> & B, const TCudaMatrix<AFloat> & A);

   /** Sum rows of (m x n) matrix \p A and write the results into the first
   * m elements in \p B.
   */
   static void SumRows(TCudaMatrix<AFloat> & B, const TCudaMatrix<AFloat> & A);

   /** Compute the sum of all elements in \p A */
   static AFloat Sum(const TCudaMatrix<AFloat> &A);

   /** Check two matrices for equality, taking floating point arithmetic errors into account.
    *  The tolerance \p epsilon defaults to 0.1. */
   static bool AlmostEquals(const TCudaMatrix<AFloat> &A, const TCudaMatrix<AFloat> &B, double epsilon = 0.1);

   /** Add the constant \p beta to all the elements of matrix \p A and write the
    * result into \p A.
    */
   static void ConstAdd(TCudaMatrix<AFloat> &A, AFloat beta);

   /** Multiply all the elements of matrix \p A by the constant \p beta and write the
    * result into \p A.
    */
   static void ConstMult(TCudaMatrix<AFloat> &A, AFloat beta);

   /** Replace each element of the matrix \p A by its reciprocal and write the
    * result into \p A
    */
   static void ReciprocalElementWise(TCudaMatrix<AFloat> &A);

   /** Square each element of the matrix \p A and write the result into
    * \p A
    */
   static void SquareElementWise(TCudaMatrix<AFloat> &A);

   /** Take the square root of each element of the matrix \p A and write the
    * result into \p A
    */
   static void SqrtElementWise(TCudaMatrix<AFloat> &A);

  // Optimizer functions (Adam). In each of them \p A is the only non-const
  // matrix argument; the exact update formulas are defined by the
  // implementation and are not visible from these declarations.
   static void AdamUpdate(TCudaMatrix<AFloat> & A, const TCudaMatrix<AFloat> & M, const TCudaMatrix<AFloat> & V, AFloat alpha, AFloat eps);
   static void AdamUpdateFirstMom(TCudaMatrix<AFloat> & A, const TCudaMatrix<AFloat> & B, AFloat beta);
   static void AdamUpdateSecondMom(TCudaMatrix<AFloat> & A, const TCudaMatrix<AFloat> & B, AFloat beta);

};


//____________________________________________________________________________

template <typename AFloat>
template <typename AMatrix_t>
void TCuda<AFloat>::CopyDiffArch(TCudaMatrix<AFloat> &B,
                        const AMatrix_t &A)
{
   // Cross-architecture copy routed through the reference matrix type:
   //   1. convert A (any type implicitly convertible to TMatrixT<AFloat>),
   //   2. build a TCudaMatrix from that intermediate,
   //   3. copy the result into B.
   // Two intermediate objects are created per call, so this is not meant
   // for performance-critical paths.
   TMatrixT<AFloat> referenceMatrix = A;
   const TCudaMatrix<AFloat> converted(referenceMatrix);
   Copy(B, converted);
}


//____________________________________________________________________________

template <typename AFloat>
template <typename AMatrix_t>
void TCuda<AFloat>::CopyDiffArch(std::vector<TCudaMatrix<AFloat>> &B,
                            const std::vector<AMatrix_t> &A)
{
   // Element-wise cross-architecture copy: A[i] is copied into B[i] using the
   // single-matrix CopyDiffArch overload.
   //
   // B is the destination and A the source. The vectors are not resized;
   // only the entries present in both are copied. Bounding the loop by the
   // smaller size avoids indexing A out of range when it holds fewer
   // matrices than B (std::vector::operator[] performs no bounds check).
   const size_t nMatrices = (A.size() < B.size()) ? A.size() : B.size();
   for (size_t i = 0; i < nMatrices; ++i) {
      CopyDiffArch(B[i], A[i]);
   }
}


} // namespace DNN

} // namespace TMVA


#endif

ConvLayer.h

CudaBuffers.h

CudaMatrix.h

DataLoader.h

width
include TDocParser_001 C image html pict1_TDocParser_001 png width
Definition: TDocParser.cxx:121

TMVA::DNN::TCudaDeviceBuffer
TCudaDeviceBuffer.
Definition: CudaBuffers.h:98

TMVA::DNN::TCudaHostBuffer
TCudaHostBuffer.
Definition: CudaBuffers.h:43

TMVA::DNN::TCudaMatrix
TCudaMatrix Class.
Definition: CudaMatrix.h:99

TMVA::DNN::TCuda
The TCuda architecture class.
Definition: Cuda.h:47

TMVA::DNN::TCuda::fgRandomGen
static TRandom * fgRandomGen
Definition: Cuda.h:49

TMVA::DNN::TCuda::RotateWeights
static void RotateWeights(TCudaMatrix< AFloat > &A, const TCudaMatrix< AFloat > &B, size_t filterDepth, size_t filterHeight, size_t filterWidth, size_t numFilters)
Rotates the matrix B, which is representing a weights, and stores them in the matrix A.

TMVA::DNN::TCuda::CalculateConvActivationGradients
static void CalculateConvActivationGradients(std::vector< TCudaMatrix< AFloat > > &activationGradientsBackward, std::vector< TCudaMatrix< AFloat > > &df, const TCudaMatrix< AFloat > &weights, size_t batchSize, size_t inputHeight, size_t inputWidth, size_t depth, size_t height, size_t width, size_t filterDepth, size_t filterHeight, size_t filterWidth)
Utility function for calculating the activation gradients of the layer before the convolutional layer...

TMVA::DNN::TCuda::MultiplyTranspose
static void MultiplyTranspose(TCudaMatrix< AFloat > &output, const TCudaMatrix< AFloat > &input, const TCudaMatrix< AFloat > &weights)
Matrix-multiply input with the transpose of weights and write the results into output.

TMVA::DNN::TCuda::Multiply
static void Multiply(TCudaMatrix< AFloat > &C, const TCudaMatrix< AFloat > &A, const TCudaMatrix< AFloat > &B)
Standard multiplication of two matrices A and B with the result being written into C.

TMVA::DNN::TCuda::Softmax
static void Softmax(TCudaMatrix< AFloat > &YHat, const TCudaMatrix< AFloat > &)

TMVA::DNN::TCuda::AddL2RegularizationGradients
static void AddL2RegularizationGradients(TCudaMatrix< AFloat > &A, const TCudaMatrix< AFloat > &W, AFloat weightDecay)

TMVA::DNN::TCuda::Im2col
static void Im2col(TCudaMatrix< AFloat > &A, const TCudaMatrix< AFloat > &B, size_t imgHeight, size_t imgWidth, size_t fltHeight, size_t fltWidth, size_t strideRows, size_t strideCols, size_t zeroPaddingHeight, size_t zeroPaddingWidth)
Transform the matrix B in local view format, suitable for convolution, and store it in matrix A.

TMVA::DNN::TCuda::Copy
static void Copy(TCudaMatrix< AFloat > &B, const TCudaMatrix< AFloat > &A)
Copy the elements of matrix A into matrix B.

TMVA::DNN::TCuda::Rearrange
static void Rearrange(std::vector< TCudaMatrix< AFloat > > &out, const std::vector< TCudaMatrix< AFloat > > &in)
Rearrange data according to time: fill the B x T x D tensor out from the T x B x D tensor in.

TMVA::DNN::TCuda::Copy
static void Copy(std::vector< TCudaMatrix< Scalar_t > > &A, const std::vector< TCudaMatrix< Scalar_t > > &B)

TMVA::DNN::TCuda::InitializeGlorotNormal
static void InitializeGlorotNormal(TCudaMatrix< AFloat > &A)

TMVA::DNN::TCuda::InitializeGlorotUniform
static void InitializeGlorotUniform(TCudaMatrix< AFloat > &A)

TMVA::DNN::TCuda::Downsample
static void Downsample(TCudaMatrix< AFloat > &A, TCudaMatrix< AFloat > &B, const TCudaMatrix< AFloat > &C, size_t imgHeight, size_t imgWidth, size_t fltHeight, size_t fltWidth, size_t strideRows, size_t strideCols)
Downsample the matrix C to the matrix A, using max operation, such that the winning indices are store...

TMVA::DNN::TCuda::RecurrentLayerBackward
static Matrix_t & RecurrentLayerBackward(TCudaMatrix< AFloat > &state_gradients_backward, TCudaMatrix< AFloat > &input_weight_gradients, TCudaMatrix< AFloat > &state_weight_gradients, TCudaMatrix< AFloat > &bias_gradients, TCudaMatrix< AFloat > &df, const TCudaMatrix< AFloat > &state, const TCudaMatrix< AFloat > &weights_input, const TCudaMatrix< AFloat > &weights_state, const TCudaMatrix< AFloat > &input, TCudaMatrix< AFloat > &input_gradient)
Backward pass for Recurrent Networks.

TMVA::DNN::TCuda::SoftmaxCrossEntropy
static AFloat SoftmaxCrossEntropy(const TCudaMatrix< AFloat > &Y, const TCudaMatrix< AFloat > &output, const TCudaMatrix< AFloat > &weights)
Softmax transformation is implicitly applied, thus output should hold the linear activations of the l...

TMVA::DNN::TCuda::GaussDerivative
static void GaussDerivative(TCudaMatrix< AFloat > &B, const TCudaMatrix< AFloat > &A)

TMVA::DNN::TCuda::Relu
static void Relu(TCudaMatrix< AFloat > &B)

TMVA::DNN::TCuda::PrepareInternals
static void PrepareInternals(std::vector< TCudaMatrix< AFloat > > &inputPrime)
Attaches a CUDA stream to each matrix in order to accommodate parallel kernel launches.

TMVA::DNN::TCuda::ConstAdd
static void ConstAdd(TCudaMatrix< AFloat > &A, AFloat beta)
Add the constant beta to all the elements of matrix A and write the result into A.

TMVA::DNN::TCuda::SumColumns
static void SumColumns(TCudaMatrix< AFloat > &B, const TCudaMatrix< AFloat > &A)
Sum columns of (m x n) matrix A and write the results into the first m elements in B.

TMVA::DNN::TCuda::InitializeZero
static void InitializeZero(TCudaMatrix< AFloat > &A)

TMVA::DNN::TCuda::ScaleAdd
static void ScaleAdd(TCudaMatrix< AFloat > &A, const TCudaMatrix< AFloat > &B, Scalar_t beta=1.0)
Adds the elements in matrix B scaled by beta to the elements in the matrix A.

TMVA::DNN::TCuda::SoftSign
static void SoftSign(TCudaMatrix< AFloat > &B)

TMVA::DNN::TCuda::ConvLayerBackward
static void ConvLayerBackward(std::vector< TCudaMatrix< AFloat > > &activationGradientsBackward, TCudaMatrix< AFloat > &weightGradients, TCudaMatrix< AFloat > &biasGradients, std::vector< TCudaMatrix< AFloat > > &df, const std::vector< TCudaMatrix< AFloat > > &activationGradients, const TCudaMatrix< AFloat > &weights, const std::vector< TCudaMatrix< AFloat > > &activationBackward, size_t batchSize, size_t inputHeight, size_t inputWidth, size_t depth, size_t height, size_t width, size_t filterDepth, size_t filterHeight, size_t filterWidth, size_t nLocalViews)
Perform the complete backward propagation step in a Convolutional Layer.

TMVA::DNN::TCuda::SymmetricReluDerivative
static void SymmetricReluDerivative(TCudaMatrix< AFloat > &B, const TCudaMatrix< AFloat > &A)

TMVA::DNN::TCuda::MaxPoolLayerBackward
static void MaxPoolLayerBackward(TCudaMatrix< AFloat > &activationGradientsBackward, const TCudaMatrix< AFloat > &activationGradients, const TCudaMatrix< AFloat > &indexMatrix, size_t imgHeight, size_t imgWidth, size_t fltHeight, size_t fltWidth, size_t strideRows, size_t strideCols, size_t nLocalViews)
Perform the complete backward propagation step in a Pooling Layer.

TMVA::DNN::TCuda::calculateDimension
static size_t calculateDimension(size_t imgDim, size_t fltDim, size_t padding, size_t stride)
Calculate how many neurons "fit" in the output layer, given the input as well as the layer's hyperpar...

TMVA::DNN::TCuda::Hadamard
static void Hadamard(TCudaMatrix< AFloat > &A, const TCudaMatrix< AFloat > &B)
In-place Hadamard (element-wise) product of matrices A and B with the result being written into A.

TMVA::DNN::TCuda::L2Regularization
static AFloat L2Regularization(const TCudaMatrix< AFloat > &W)

TMVA::DNN::TCuda::Im2colIndices
static void Im2colIndices(std::vector< int > &, const TCudaMatrix< AFloat > &, size_t, size_t, size_t, size_t, size_t, size_t, size_t, size_t, size_t)
Definition: Cuda.h:329

TMVA::DNN::TCuda::MeanSquaredErrorGradients
static void MeanSquaredErrorGradients(TCudaMatrix< AFloat > &dY, const TCudaMatrix< AFloat > &Y, const TCudaMatrix< AFloat > &output, const TCudaMatrix< AFloat > &weights)

TMVA::DNN::TCuda::Flatten
static void Flatten(TCudaMatrix< AFloat > &A, const std::vector< TCudaMatrix< AFloat > > &B, size_t size, size_t nRows, size_t nCols)
Flattens the tensor B, such that each matrix is stretched into one row, resulting in a matrix A.

TMVA::DNN::TCuda::AdamUpdateFirstMom
static void AdamUpdateFirstMom(TCudaMatrix< AFloat > &A, const TCudaMatrix< AFloat > &B, AFloat beta)

TMVA::DNN::TCuda::CrossEntropy
static AFloat CrossEntropy(const TCudaMatrix< AFloat > &Y, const TCudaMatrix< AFloat > &output, const TCudaMatrix< AFloat > &weights)
Sigmoid transformation is implicitly applied, thus output should hold the linear activations of the l...

TMVA::DNN::TCuda::CalculateConvBiasGradients
static void CalculateConvBiasGradients(TCudaMatrix< AFloat > &biasGradients, std::vector< TCudaMatrix< AFloat > > &df, size_t batchSize, size_t depth, size_t nLocalViews)
Utility function for calculating the bias gradients of the convolutional layer.

TMVA::DNN::TCuda::CopyDiffArch
static void CopyDiffArch(TCudaMatrix< Scalar_t > &B, const AMatrix_t &A)
Definition: Cuda.h:539

TMVA::DNN::TCuda::AlmostEquals
static bool AlmostEquals(const TCudaMatrix< AFloat > &A, const TCudaMatrix< AFloat > &B, double epsilon=0.1)
Check two matrices for equality, taking floating point arithmetic errors into account.

TMVA::DNN::TCuda::Scalar_t
AFloat Scalar_t
Definition: Cuda.h:52

TMVA::DNN::TCuda::SquareElementWise
static void SquareElementWise(TCudaMatrix< AFloat > &A)
Square each element of the matrix A and write the result into A.

TMVA::DNN::TCuda::IdentityDerivative
static void IdentityDerivative(TCudaMatrix< AFloat > &B, const TCudaMatrix< AFloat > &A)

TMVA::DNN::TCuda::MeanSquaredError
static AFloat MeanSquaredError(const TCudaMatrix< AFloat > &Y, const TCudaMatrix< AFloat > &output, const TCudaMatrix< AFloat > &weights)

TMVA::DNN::TCuda::SumRows
static void SumRows(TCudaMatrix< AFloat > &B, const TCudaMatrix< AFloat > &A)
Sum rows of (m x n) matrix A and write the results into the first m elements in B.

TMVA::DNN::TCuda::Tanh
static void Tanh(TCudaMatrix< AFloat > &B)

TMVA::DNN::TCuda::SigmoidDerivative
static void SigmoidDerivative(TCudaMatrix< AFloat > &B, const TCudaMatrix< AFloat > &A)

TMVA::DNN::TCuda::ConvLayerForward
static void ConvLayerForward(std::vector< TCudaMatrix< AFloat > > &output, std::vector< TCudaMatrix< AFloat > > &derivatives, const std::vector< TCudaMatrix< AFloat > > &input, const TCudaMatrix< AFloat > &weights, const TCudaMatrix< AFloat > &biases, const DNN::CNN::TConvParams &params, EActivationFunction activFunc, std::vector< TCudaMatrix< AFloat > > &inputPrime)
Forward propagation in the Convolutional layer.

TMVA::DNN::TCuda::AdamUpdate
static void AdamUpdate(TCudaMatrix< AFloat > &A, const TCudaMatrix< AFloat > &M, const TCudaMatrix< AFloat > &V, AFloat alpha, AFloat eps)

TMVA::DNN::TCuda::ConstMult
static void ConstMult(TCudaMatrix< AFloat > &A, AFloat beta)
Multiply all the elements of matrix A by the constant beta and write the result into A.

TMVA::DNN::TCuda::ReciprocalElementWise
static void ReciprocalElementWise(TCudaMatrix< AFloat > &A)
Take the reciprocal of each element of the matrix A and write the result into A.

TMVA::DNN::TCuda::Identity
static void Identity(TCudaMatrix< AFloat > &B)

TMVA::DNN::TCuda::SoftSignDerivative
static void SoftSignDerivative(TCudaMatrix< AFloat > &B, const TCudaMatrix< AFloat > &A)

TMVA::DNN::TCuda::Sum
static AFloat Sum(const TCudaMatrix< AFloat > &A)
Compute the sum of all elements in A.

TMVA::DNN::TCuda::SqrtElementWise
static void SqrtElementWise(TCudaMatrix< AFloat > &A)
Take the square root of each element of the matrix A and write the result into A.

TMVA::DNN::TCuda::AddL1RegularizationGradients
static void AddL1RegularizationGradients(TCudaMatrix< AFloat > &A, const TCudaMatrix< AFloat > &W, AFloat weightDecay)

TMVA::DNN::TCuda::Reshape
static void Reshape(TCudaMatrix< AFloat > &A, const TCudaMatrix< AFloat > &B)
Transform the matrix B into a matrix A with different dimensions.

TMVA::DNN::TCuda::TanhDerivative
static void TanhDerivative(TCudaMatrix< AFloat > &B, const TCudaMatrix< AFloat > &A)

TMVA::DNN::TCuda::SetRandomSeed
static void SetRandomSeed(size_t seed)

TMVA::DNN::TCuda::AdamUpdateSecondMom
static void AdamUpdateSecondMom(TCudaMatrix< AFloat > &A, const TCudaMatrix< AFloat > &B, AFloat beta)

TMVA::DNN::TCuda::Im2colFast
static void Im2colFast(TCudaMatrix< AFloat > &, const TCudaMatrix< AFloat > &, const std::vector< int > &)
Definition: Cuda.h:333

TMVA::DNN::TCuda::L1Regularization
static AFloat L1Regularization(const TCudaMatrix< AFloat > &W)

TMVA::DNN::TCuda::Dropout
static void Dropout(TCudaMatrix< AFloat > &A, AFloat p)
Apply dropout with activation probability p to the given matrix A and scale the result by reciprocal ...

TMVA::DNN::TCuda::AddRowWise
static void AddRowWise(TCudaMatrix< AFloat > &output, const TCudaMatrix< AFloat > &biases)
Add the vector biases row-wise to the matrix output.

TMVA::DNN::TCuda::TransposeMultiply
static void TransposeMultiply(TCudaMatrix< AFloat > &output, const TCudaMatrix< AFloat > &input, const TCudaMatrix< AFloat > &Weights)
Matrix multiplication of two matrices A and B^T (transposed) with the result being written into C.

TMVA::DNN::TCuda::InitializeGauss
static void InitializeGauss(TCudaMatrix< AFloat > &A)

TMVA::DNN::TCuda::InitializeIdentity
static void InitializeIdentity(TCudaMatrix< AFloat > &A)

TMVA::DNN::TCuda::GetRandomGenerator
static TRandom & GetRandomGenerator()

TMVA::DNN::TCuda::ScaleAdd
static void ScaleAdd(std::vector< TCudaMatrix< Scalar_t > > &A, const std::vector< TCudaMatrix< Scalar_t > > &B, Scalar_t beta=1.0)
Above functions extended to vectors.

TMVA::DNN::TCuda::Sigmoid
static void Sigmoid(TCudaMatrix< AFloat > &B)

TMVA::DNN::TCuda::Gauss
static void Gauss(TCudaMatrix< AFloat > &B)

TMVA::DNN::TCuda::ReluDerivative
static void ReluDerivative(TCudaMatrix< AFloat > &B, const TCudaMatrix< AFloat > &A)

TMVA::DNN::TCuda::CalculateConvWeightGradients
static void CalculateConvWeightGradients(TCudaMatrix< AFloat > &weightGradients, std::vector< TCudaMatrix< AFloat > > &df, const std::vector< TCudaMatrix< AFloat > > &activations_backward, size_t batchSize, size_t inputHeight, size_t inputWidth, size_t depth, size_t height, size_t width, size_t filterDepth, size_t filterHeight, size_t filterWidth, size_t nLocalViews)
Utility function for calculating the weight gradients of the convolutional layer.

TMVA::DNN::TCuda::InitializeUniform
static void InitializeUniform(TCudaMatrix< AFloat > &A)

TMVA::DNN::TCuda::Deflatten
static void Deflatten(std::vector< TCudaMatrix< AFloat > > &A, const TCudaMatrix< AFloat > &B, size_t index, size_t nRows, size_t nCols)
Transforms each row of B to a matrix and stores it in the tensor A.

TMVA::DNN::TCuda::Backward
static void Backward(TCudaMatrix< AFloat > &activationGradientsBackward, TCudaMatrix< AFloat > &weightGradients, TCudaMatrix< AFloat > &biasGradients, TCudaMatrix< AFloat > &df, const TCudaMatrix< AFloat > &activationGradients, const TCudaMatrix< AFloat > &weights, const TCudaMatrix< AFloat > &activationBackward)
Perform the complete backward propagation step.

TMVA::DNN::TCuda::SymmetricRelu
static void SymmetricRelu(TCudaMatrix< AFloat > &B)

TMVA::DNN::TCuda::SoftmaxCrossEntropyGradients
static void SoftmaxCrossEntropyGradients(TCudaMatrix< AFloat > &dY, const TCudaMatrix< AFloat > &Y, const TCudaMatrix< AFloat > &output, const TCudaMatrix< AFloat > &weights)

TMVA::DNN::TCuda::Sigmoid
static void Sigmoid(TCudaMatrix< AFloat > &YHat, const TCudaMatrix< AFloat > &)

TMVA::DNN::TCuda::AddConvBiases
static void AddConvBiases(TCudaMatrix< AFloat > &output, const TCudaMatrix< AFloat > &biases)
Add the biases in the Convolutional Layer.

TMVA::DNN::TCuda::CrossEntropyGradients
static void CrossEntropyGradients(TCudaMatrix< AFloat > &dY, const TCudaMatrix< AFloat > &Y, const TCudaMatrix< AFloat > &output, const TCudaMatrix< AFloat > &weights)

TMatrixT
TMatrixT.
Definition: TMatrixT.h:39

TRandom
This is the base class for the ROOT Random number generators.
Definition: TRandom.h:27

ROOT::Math::beta
double beta(double x, double y)
Calculates the beta function.
Definition: SpecFuncMathCore.cxx:111

ClassificationKeras.output
output
Definition: ClassificationKeras.py:16

ROOT::Math::Cephes::B
static double B[]
Definition: SpecFuncCephes.cxx:178

ROOT::Math::Cephes::A
static double A[]
Definition: SpecFuncCephes.cxx:170

ROOT::Math::Cephes::C
static double C[]
Definition: SpecFuncCephes.cxx:187

ROOT::Math::GSLSimAn::Copy
void Copy(void *source, void *dest)
Definition: GSLSimAnnealing.cxx:149

TMVA::DNN::weightDecay
double weightDecay(double error, ItWeight itWeight, ItWeight itWeightEnd, double factorWeightDecay, EnumRegularization eRegularization)
compute the weight decay for regularization (L1 or L2)
Definition: NeuralNet.icc:496

TMVA::DNN::EActivationFunction
EActivationFunction
Enum that represents layer activation functions.
Definition: Functions.h:32

TMVA
Abstract ClassifierFactory template that handles arbitrary types.
Definition: GeneticMinimizer.h:21

TMVA::DNN::CNN::TConvParams
Definition: ConvLayer.h:155

Functions.h

epsilon
REAL epsilon
Definition: triangle.c:617