doc/v632/Cpu_8h_source.html

// @(#)root/tmva/tmva/dnn:$Id$

// Author: Simon Pfreundschuh 05/07/16


/*************************************************************************

 * Copyright (C) 2016, Simon Pfreundschuh                                *

 * All rights reserved.                                                  *

 *                                                                       *

 * For the licensing terms see $ROOTSYS/LICENSE.                         *

 * For the list of contributors see $ROOTSYS/README/CREDITS.             *

 *************************************************************************/


 //////////////////////////////////////////////////////////////////

 // Definition of the TCpu architecture, which provides a         //

 // multi-threaded CPU implementation of the low-level interface //

 // for networks on CPUs using BLAS and ROOT's TThreadExecutor   //

 //////////////////////////////////////////////////////////////////


#ifndef TMVA_DNN_ARCHITECTURES_CPU

#define TMVA_DNN_ARCHITECTURES_CPU


#include "TMVA/DNN/Functions.h"

#include "TMVA/DNN/CNN/ContextHandles.h"

//#include "TMVA/DNN/CNN/Descriptors.h"

#include "TMVA/DNN/GeneralLayer.h"

#include "TMVA/DNN/BatchNormLayer.h"

#include "TMVA/DNN/CNN/ConvLayer.h"

#include "TMVA/DNN/CNN/MaxPoolLayer.h"

#include "TMVA/DNN/RNN/RNNLayer.h"


#include "TMVA/DNN/Architectures/Cpu/CpuBuffer.h"

#include "TMVA/DNN/Architectures/Cpu/CpuMatrix.h"

#include "TMVA/DNN/Architectures/Cpu/CpuTensor.h"


#include <vector>

#include <string>


class TRandom;


namespace TMVA

{

namespace DNN

{

   //class EActivationFunction;

 // Empty placeholder types carrying no data. The TCpu class below aliases its
 // descriptor types to DummyDescriptor, its algorithm types to the
 // DummyConvolution*Algo structs, and its data-type / reduce-tensor / recurrent
 // descriptor types to DummyDataType.
 // NOTE(review): DummyFilterDescriptor, DummyConvolutionDescriptor,
 // DummyDropoutDescriptor, DummyPoolingDescriptor and DummyEmptyDescriptor are
 // not referenced in the visible part of this header -- confirm they are still needed.
 struct DummyDescriptor {};

 struct DummyFilterDescriptor {};

 struct DummyConvolutionDescriptor {};

 struct DummyDropoutDescriptor {};

 struct DummyPoolingDescriptor {};

 struct DummyConvolutionFwdAlgo {};

 struct DummyConvolutionBwdDataAlgo {};

 struct DummyConvolutionBwdFilterAlgo {};

 struct DummyDataType {};


 struct DummyEmptyDescriptor {};


/** The TCpu architecture class.

 *

 * Low-level interface class for multi-threaded CPU architectures. Contains as

 * public types the declaration of the scalar, matrix and data loader types

 * for this architecture as well as the remaining functions in the low-level

 * interface in the form of static members.

 */

template<typename AReal = Float_t>


class TCpu

{

private:

   // Class-wide (static) pointer to a TRandom generator. Presumably this is the
   // instance handed out by GetRandomGenerator() and seeded by SetRandomSeed();
   // its definition is not visible in this header -- confirm.
   static TRandom * fgRandomGen;

public:

   // Numeric and container types of this architecture. Host and device buffers
   // are the same type (TCpuBuffer) here.
   using Scalar_t       = AReal;

   using Tensor_t       = TCpuTensor<AReal>;

   using Matrix_t       = TCpuMatrix<AReal>;

   using HostBuffer_t   = TCpuBuffer<AReal>;

   using DeviceBuffer_t = TCpuBuffer<AReal>;


   // Descriptor types: every one of them is the empty DummyDescriptor struct.
   using ActivationDescriptor_t  = DummyDescriptor;

   using ConvolutionDescriptor_t = DummyDescriptor;

   using FilterDescriptor_t      = DummyDescriptor;

   using DropoutDescriptor_t     = DummyDescriptor;

   using PoolingDescriptor_t     = DummyDescriptor;

   using TensorDescriptor_t      = DummyDescriptor;


   // Algorithm / data-type selectors: again aliases of empty placeholder structs.
   using AlgorithmForward_t      = DummyConvolutionFwdAlgo;

   using AlgorithmBackward_t     = DummyConvolutionBwdDataAlgo;

   using AlgorithmHelper_t       = DummyConvolutionBwdFilterAlgo;

   using AlgorithmDataType_t     = DummyDataType;

   using ReduceTensorDescriptor_t = DummyDataType;

   using RecurrentDescriptor_t    = DummyDataType;


   // NOTE(review): a DummyEmptyDescriptor struct is declared above, yet this alias
   // points at DummyDescriptor -- confirm that this is intended.
   using EmptyDescriptor_t       = DummyDescriptor; // Used if a descriptor is not needed in a class


   // Generic and batch-normalization layer types instantiated for this architecture.
   using GenLayer_t              = VGeneralLayer<TCpu<AReal>>;

   using BNormLayer_t            = TBatchNormLayer<TCpu<AReal>>;

   using BNormDescriptors_t      = TDNNGenDescriptors<BNormLayer_t>;


   // Convolution and max-pooling layer types with their descriptor/workspace types.
   using ConvLayer_t             = CNN::TConvLayer<TCpu<AReal>>;

   using ConvDescriptors_t       = CNN::TCNNDescriptors<ConvLayer_t>;

   using ConvWorkspace_t         = CNN::TCNNWorkspace<ConvLayer_t>;

   using PoolingLayer_t          = CNN::TMaxPoolLayer<TCpu<AReal>>;

   using PoolingDescriptors_t    = CNN::TCNNDescriptors<PoolingLayer_t>;

   using PoolingWorkspace_t      = CNN::TCNNWorkspace<PoolingLayer_t>;


   // Recurrent-network descriptor and workspace types for this architecture.
   using RNNDescriptors_t = RNN::TRNNDescriptors<TCpu<AReal>>;

   using RNNWorkspace_t = RNN::TRNNWorkspace<TCpu<AReal>>;


   /** Memory layout used for the tensors created by this architecture: column-major. */
   static TMVA::Experimental::MemoryLayout GetTensorLayout()
   {
      const auto layout = TMVA::Experimental::MemoryLayout::ColumnMajor;
      return layout;
   }


   /** Create a tensor of shape {c, h*w, n} in the layout given by GetTensorLayout().
    *  NOTE(review): presumably n = batch size, c = channels, h/w = height/width -- confirm. */
   static Tensor_t CreateTensor(size_t n, size_t c, size_t h, size_t w)
   {
      const size_t hw = h * w;
      return Tensor_t({c, hw, n}, GetTensorLayout());
   }

   /** Same shape as above, but the tensor is constructed from the given \p buffer. */
   static Tensor_t CreateTensor(DeviceBuffer_t buffer, size_t n, size_t c, size_t h, size_t w)
   {
      const size_t hw = h * w;
      return Tensor_t(buffer, {c, hw, n}, GetTensorLayout());
   }


   /** Create a tensor of shape {t, w, b} in the layout given by GetTensorLayout(). */
   static Tensor_t CreateTensor(size_t b, size_t t, size_t w)
   {
      const auto layout = GetTensorLayout();
      return Tensor_t({t, w, b}, layout);
   }

   /** Same shape as above, but the tensor is constructed from the given \p buffer. */
   static Tensor_t CreateTensor(DeviceBuffer_t buffer, size_t b, size_t t, size_t w)
   {
      const auto layout = GetTensorLayout();
      return Tensor_t(buffer, {t, w, b}, layout);
   }


   // create a weight tensor/matrix vector   from another tensor/weight  vector using the given tensor shapes

   // this function is used by the optimizers to store intermediate weights representations


   static void  CreateWeightTensors( std::vector<Matrix_t> & newWeights, const std::vector<Matrix_t> & weights) {

      if (!newWeights.empty()) newWeights.clear();

      size_t n =  weights.size();

      for (size_t i = 0; i < n; ++i)

         newWeights.emplace_back( weights[i].GetNrows(), weights[i].GetNcols());

   }


   /** Tell callers whether this architecture is the cuDNN one; for TCpu it never is. */
   static bool IsCudnn()
   {
      const bool usesCudnn = false;
      return usesCudnn;
   }

   //____________________________________________________________________________

   //

   // Architecture Initialization

   //____________________________________________________________________________


   /** Initialize CNN data/operator descriptors. Not used at the moment.*/


   static void InitializeBNormDescriptors(TDescriptors * & /*descriptors*/,

                                          BNormLayer_t * /*L = nullptr*/) {}


   static void InitializeConvDescriptors(TDescriptors * & /*descriptors*/,

                                         ConvLayer_t * /*L = nullptr*/) {}


   static void InitializePoolDescriptors(TDescriptors * & /*descriptors*/,

                                         PoolingLayer_t * /*L = nullptr*/) {}


   static void InitializeRNNDescriptors(TDescriptors *& /*descriptors*/, GenLayer_t * /*L*/) {}

   static void InitializeLSTMDescriptors(TDescriptors *& /*descriptors*/, GenLayer_t * /*L*/) {}

   static void InitializeGRUDescriptors(TDescriptors *& /*descriptors*/, GenLayer_t * /*L*/) {}


   static void InitializeActivationDescriptor(ActivationDescriptor_t &/*descriptors*/, EActivationFunction /*activFunc */ , double /*coef*/ = 0.0) {}


   /** Release CNN data/operator descriptors. Not used at the moment.*/

   static void ReleaseConvDescriptors(TDescriptors * & /*descriptors*/) {}

   static void ReleasePoolDescriptors(TDescriptors * & /*descriptors*/) {}

   static void ReleaseBNormDescriptors(TDescriptors * & /*descriptors*/) {}

   static void ReleaseRNNDescriptors(TDescriptors *& /*descriptors*/) {}


   static void InitializeConvWorkspace(TWorkspace * & /*workspace*/,

                                       TDescriptors * & /*descriptors*/,

                                       const DNN::CNN::TConvParams & /*params*/,

                                       ConvLayer_t * /*L = nullptr*/) {}


   static void InitializePoolDropoutWorkspace(TWorkspace * & /*workspace*/,

                                       TDescriptors * & /*descriptors*/,

                                       const DNN::CNN::TConvParams & /*params*/,

                                       PoolingLayer_t * /*L = nullptr*/) {}


   static void InitializeRNNWorkspace(TWorkspace *& /*workspace*/, TDescriptors *& /*descriptors*/, GenLayer_t * /*L*/) {}

   static void InitializeLSTMWorkspace(TWorkspace *& /*workspace*/, TDescriptors *& /*descriptors*/, GenLayer_t * /*L*/){}

   static void InitializeGRUWorkspace(TWorkspace *& /*workspace*/, TDescriptors *& /*descriptors*/, GenLayer_t * /*L*/){}


   /** Empty implementation. Only used for certain cudnn on-device memory. */
   static void FreeConvWorkspace(TWorkspace *& /*workspace*/)
   {
   }

   /** Empty implementation; the workspace argument is ignored. */
   static void FreePoolDropoutWorkspace(TWorkspace *& /*workspace*/)
   {
   }

   /** Empty implementation; the workspace argument is ignored. */
   static void FreeRNNWorkspace(TWorkspace *& /*workspace*/)
   {
   }

   /** Empty implementation; the activation descriptor is ignored. */
   static void ReleaseDescriptor(ActivationDescriptor_t & /* activationDescr */)
   {
   }

   // Tensor initializers for the recurrent layers: empty, the layer is ignored.
   static void InitializeRNNTensors(GenLayer_t * /*layer*/)
   {
   }

   static void InitializeLSTMTensors(GenLayer_t * /*layer*/)
   {
   }

   static void InitializeGRUTensors(GenLayer_t * /*layer*/)
   {
   }


   //____________________________________________________________________________

   //

   // Propagation

   //____________________________________________________________________________


   /** @name Forward Propagation

    * Low-level functions required for the forward propagation of activations

    * through the network.

    */

   ///@{

   /** Matrix-multiply \p input with the transpose of \p weights and

    *  write the results into \p output. */

   static void MultiplyTranspose(Matrix_t &output, const Matrix_t &input, const Matrix_t &weights);

   /** Tensor overload: obtains matrices from \p output and \p input through
    *  GetMatrix() and forwards to the matrix version above.
    *  NOTE(review): nothing is copied back into \p output afterwards, so this
    *  presumably relies on GetMatrix() sharing storage with the tensor -- confirm. */
   static void MultiplyTranspose(Tensor_t &output, const Tensor_t &input, const Matrix_t &weights)
   {
      Matrix_t outMat = output.GetMatrix();
      MultiplyTranspose(outMat, input.GetMatrix(), weights);
      // Tensor_t::MatrixToTensor(outMat, output); // this maybe is not needed
   }


   /** Add the vectors biases row-wise to the matrix output */

   static void AddRowWise(Matrix_t &output,const Matrix_t &biases);

   /** Tensor overload: obtains a matrix from \p output through GetMatrix() and
    *  forwards to the matrix version above.
    *  NOTE(review): nothing is copied back into \p output afterwards, so this
    *  presumably relies on GetMatrix() sharing storage with the tensor -- confirm. */
   static void AddRowWise(Tensor_t &output, const Matrix_t &biases)
   {
      Matrix_t outMat = output.GetMatrix();
      AddRowWise(outMat, biases);
      // Tensor_t::MatrixToTensor(outMat, output); // this maybe is not needed
   }


   /** @name Backward Propagation (Dense Layers)

    * Low-level functions required for the backward propagation of gradients

    * through the network.

    */

   ///@{

   /** Perform the complete backward propagation step. If the provided

    *  \p activationGradientsBackward matrix is not empty, compute the

    *  gradients of the objective function with respect to the activations

    *  of the previous layer (backward direction).

    *  Also compute the weight and the bias gradients. Modifies the values

    *  in \p df and thus produces only a valid result, if it is applied the

    *  first time after the corresponding forward propagation has been per-

    *  formed. */

   // Writable arguments (non-const references): activationGradientsBackward,
   // weightGradients and biasGradients. All remaining arguments are taken by
   // const reference.
   // NOTE(review): the description above states that the values in \p df are
   // modified, but \p df is declared const here -- confirm against the
   // implementation, which is not visible in this header.
   static void Backward(Tensor_t & activationGradientsBackward,

                        Matrix_t & weightGradients,

                        Matrix_t & biasGradients,

                        const Tensor_t & df,

                        const Tensor_t & activationGradients,

                        const Matrix_t & weights,

                        const Tensor_t & activationBackward);


   /** Adds the elements of matrix \p B, scaled by \p beta, to the elements of

    *  the matrix \p A. This is required for the weight update in the gradient

    *  descent step. */

   // Matrix version: \p A is the writable argument, \p B is read-only; the
   // scale factor \p beta defaults to 1.0.
   static void ScaleAdd(Matrix_t & A,

                        const Matrix_t & B,

                        Scalar_t beta = 1.0);


   // Matrix copy. Note the argument naming: the writable argument is \p B and the
   // const one is \p A, i.e. the opposite naming of the tensor overload of Copy below.
   static void Copy(Matrix_t & B,

                    const Matrix_t & A);


   // copy from another type of matrix (writable \p B, const \p A of arbitrary type AMatrix_t)

   template<typename AMatrix_t>

   static void CopyDiffArch(Matrix_t & B, const AMatrix_t & A);


   /** Above functions extended to tensors */

   static void ScaleAdd(Tensor_t & A,

                        const Tensor_t & B,

                        Scalar_t beta = 1.0);


   // Tensor copy: here the writable argument is \p A and the const one is \p B.
   static void Copy(Tensor_t & A,

                    const Tensor_t & B);


   // copy from another tensor (writable \p A, const \p B of arbitrary type ATensor_t)

   template<typename ATensor_t>

   static void CopyDiffArch(Tensor_t & A,

                     const ATensor_t & B);


   // copy from vector of matrices of different types (writable \p A, const \p B)

   template<typename AMatrix_t>

   static void CopyDiffArch(std::vector<Matrix_t>  & A,

                      const std::vector<AMatrix_t> & B);


   ///@}


   //____________________________________________________________________________

   //

   // Activation Functions

   //____________________________________________________________________________


   /** @name Activation Functions

    * For each activation function, the low-level interface contains two routines.

    * One that applies the activation function to a matrix and one that evaluates

    * the derivatives of the activation function at the elements of a given matrix

    * and writes the results into the result matrix.

    */

   ///@{

   /*  impl using Matrix */

   /*inline void evaluate(Matrix_t &A, EActivationFunction f)

   {

    Tensor_t tA(A);

    evaluate<TCpu<AReal>>(tA,f);

   }*/


   // Forward entry point selected by \p activFunct. \p X is the only writable
   // argument (presumably transformed in place -- confirm). Defaults: coef = 0.0,
   // alpha = 1, beta = 0.
   // NOTE(review): \p activationDescr is passed by value; in this class
   // ActivationDescriptor_t is an alias of the empty DummyDescriptor struct.
   static void ActivationFunctionForward(Tensor_t & X, EActivationFunction activFunct,

                          const ActivationDescriptor_t activationDescr,

                          const double coef = 0.0, const Scalar_t alpha = 1,

                          const Scalar_t beta = 0);


   /** Computes the gradient of the activation function.
    *  \p dX is the only writable argument; \p Y, \p dY and \p X are read-only.
    *  Defaults: alpha = 1, beta = 0. */

   static void ActivationFunctionBackward(Tensor_t & dX, const Tensor_t & Y,

                                          const Tensor_t & dY,  const Tensor_t & X,

                                          EActivationFunction activFunct,

                                          const ActivationDescriptor_t activationDescr,

                                          const Scalar_t alpha = 1,

                                          const Scalar_t beta = 0);


   // Per-function entry points. Two shapes of declaration occur:
   //  - F(Tensor_t &B): a single writable tensor (presumably the activation is
   //    applied to B in place -- confirm against the implementation);
   //  - FDerivative(Tensor_t &B, const Tensor_t &A): B is writable, A is read-only
   //    (presumably B receives the derivative evaluated at the elements of A,
   //    in line with the section description above -- confirm).
   // Identity only has the derivative form.
   static void IdentityDerivative(Tensor_t & B,

                                  const Tensor_t &A);


   static void Relu(Tensor_t & B);

   static void ReluDerivative(Tensor_t & B,

                              const Tensor_t & A);


   static void Sigmoid(Tensor_t & B);

   static void SigmoidDerivative(Tensor_t & B,

                                 const Tensor_t & A);


   static void Tanh(Tensor_t & B);

   static void TanhDerivative(Tensor_t & B,

                              const Tensor_t & A);


   // fast tanh (only when VDT is available)

   static void FastTanh(Tensor_t &B);

   static void FastTanhDerivative(Tensor_t &B, const Tensor_t &A);


   static void SymmetricRelu(Tensor_t & B);

   static void SymmetricReluDerivative(Tensor_t & B,

                                       const Tensor_t & A);


   static void SoftSign(Tensor_t & B);

   static void SoftSignDerivative(Tensor_t & B,

                                  const Tensor_t & A);


   static void Gauss(Tensor_t & B);

   static void GaussDerivative(Tensor_t & B,

                               const Tensor_t & A);

   ///@}


   //____________________________________________________________________________

   //

   // Loss Functions

   //____________________________________________________________________________


   /** @name Loss Functions

    * Loss functions compute a scalar value given the \p output of the network

    * for a given training input and the expected network prediction \p Y that

    * quantifies the quality of the prediction. For each function also a routine

    * that computes the gradients (suffixed by Gradients) must be provided for

    * the starting of the backpropagation algorithm.

    */

   ///@{


   // Each loss comes as a pair: a function returning the scalar loss from the
   // read-only matrices \p Y, \p output and \p weights, and a *Gradients function
   // taking the same three inputs plus a writable \p dY for the result.
   // NOTE(review): \p weights presumably holds per-event weights rather than
   // network weights -- confirm against the implementation.
   static Scalar_t MeanSquaredError(const Matrix_t &Y, const Matrix_t &output,

                                    const Matrix_t &weights);

   static void MeanSquaredErrorGradients(Matrix_t &dY, const Matrix_t &Y,

                                         const Matrix_t &output, const Matrix_t &weights);


   /** Sigmoid transformation is implicitly applied, thus \p output should

    *  hold the linear activations of the last layer in the net. */

   static Scalar_t CrossEntropy(const Matrix_t &Y, const Matrix_t &output,

                                const Matrix_t &weights);


   // Gradient counterpart of CrossEntropy; writes into \p dY.
   static void CrossEntropyGradients(Matrix_t &dY, const Matrix_t &Y,

                                     const Matrix_t &output, const Matrix_t &weights);


   /** Softmax transformation is implicitly applied, thus \p output should

    *  hold the linear activations of the last layer in the net. */

   static Scalar_t SoftmaxCrossEntropy(const Matrix_t &Y, const Matrix_t &output,

                                       const Matrix_t &weights);

   // Gradient counterpart of SoftmaxCrossEntropy; writes into \p dY.
   static void SoftmaxCrossEntropyGradients(Matrix_t &dY, const Matrix_t &Y,

                                            const Matrix_t &output, const Matrix_t &weights);

   ///@}


   //____________________________________________________________________________

   //

   // Output Functions

   //____________________________________________________________________________


   /** @name Output Functions

    * Output functions transform the activations \p output of the

    * output layer in the network to a valid prediction \p YHat for

    * the desired usage of the network, e.g.  the identity function

    * for regression or the sigmoid transformation for two-class

    * classification.

    */

   ///@{

   // Both functions write the prediction into \p YHat. The second, unnamed
   // read-only matrix is presumably the \p output of the last layer mentioned in
   // the section description above -- confirm.
   static void Sigmoid(Matrix_t &YHat,

                        const Matrix_t & );

   static void Softmax(Matrix_t &YHat,

                       const Matrix_t & );

   ///@}


   //____________________________________________________________________________

   //

   // Regularization

   //____________________________________________________________________________


   /** @name Regularization

    * For each regularization type two functions are required, one named

    * <tt>`<Type>`Regularization</tt> that evaluates the corresponding

    * regularization functional for a given weight matrix and the

    * <tt>Add<Type>RegularizationGradients</tt>, that adds the regularization

    * component in the gradients to the provided matrix.

    */

   ///@{


   // L1: the functional returns a scalar for the read-only weight matrix \p W;
   // the gradient variant takes a writable \p A, the read-only \p W and a
   // \p weightDecay factor (per the section description above, the
   // regularization component is added to \p A).
   static Scalar_t L1Regularization(const Matrix_t & W);

   static void AddL1RegularizationGradients(Matrix_t & A,

                                            const Matrix_t & W,

                                            Scalar_t weightDecay);


   // L2: same pair of signatures as for L1.
   static Scalar_t L2Regularization(const Matrix_t & W);

   static void AddL2RegularizationGradients(Matrix_t & A,

                                            const Matrix_t & W,

                                            Scalar_t weightDecay);

   ///@}


   //____________________________________________________________________________

   //

   // Initialization

   //____________________________________________________________________________


   /** @name Initialization

    * For each initialization method, one function in the low-level interface

    * is provided. The naming scheme is <p>Initialize<Type></p> for a given

    * initialization method Type.

    */

   ///@{


   // One initializer per method; each takes the matrix \p A to fill by non-const
   // reference. InitializeZero additionally has a tensor overload.
   static void InitializeGauss(Matrix_t & A);

   static void InitializeUniform(Matrix_t & A);

   static void InitializeIdentity(Matrix_t & A);

   static void InitializeZero(Matrix_t & A);

   static void InitializeZero(Tensor_t &A);

   static void InitializeGlorotNormal(Matrix_t & A);

   static void InitializeGlorotUniform(Matrix_t & A);


   // Return the static instance of the random generator used for initialization.

   // If the generator does not exist yet, it is created on first use with a random seed (e.g. seed = 0).

   static TRandom & GetRandomGenerator();

   // Set the random seed of the static generator.

   // If the static generator does not exist yet, it is created.

   static void SetRandomSeed(size_t seed);

   ///@}


   //____________________________________________________________________________

   //

   // Dropout

   //____________________________________________________________________________


   /** @name Dropout

    */

   ///@{


   /** Apply dropout with activation probability \p p to the given

    *  tensor \p A and scale the result by reciprocal of \p p. */

   static void DropoutForward(Tensor_t & A,
                              TDescriptors * descriptors,
                              TWorkspace   * workspace,
                              Scalar_t p);

   /** Matrix convenience overload: wraps \p A in a Tensor_t and calls the tensor
    *  version above with null descriptor and workspace pointers. */
   static void DropoutForward(Matrix_t & A, Scalar_t p)
   {
      Tensor_t tensorOfA(A);
      TDescriptors *const noDescriptors = nullptr;
      TWorkspace *const noWorkspace = nullptr;
      DropoutForward(tensorOfA, noDescriptors, noWorkspace, p);
   }


   // Only needed for cuDNN


   /** Empty implementation: all three arguments are ignored. */
   static void DropoutBackward(Tensor_t & /*A */, TDescriptors * /*descriptors */, TWorkspace * /*workspace*/)
   {
   }


   ///@}


   //____________________________________________________________________________

   //

   // Batch Normalization

   //____________________________________________________________________________


   /** @name Batch Normalization Layer Propagation

    */

   ///@{


   /** The input from each batch are normalized during training to have zero mean and unit variance

     * and they are then scaled by two parameters, different for each input variable:

     *  - a scale factor `\gamma` gamma

     *  - an offset `\beta` beta */

   // NOTE(review): the parameter between \p mean and \p iVariance is unnamed; by
   // analogy with BatchNormLayerBackward (mean, variance, iVariance) it is
   // presumably the batch variance -- confirm.
   // Caller beware: here \p y directly follows \p x, whereas in
   // BatchNormLayerForwardInference \p y comes after \p gamma and \p beta.
   static void BatchNormLayerForwardTraining(int axis, const Tensor_t &x, Tensor_t &y, Matrix_t &gamma, Matrix_t &beta,

                                             Matrix_t &mean, Matrix_t &, Matrix_t &iVariance, Matrix_t &runningMeans,

                                             Matrix_t &runningVars, Scalar_t nTrainedBatches, Scalar_t momentum,

                                             Scalar_t epsilon, const TensorDescriptor_t &bnParDescriptor);


   /** During inference the inputs are not normalized using the batch mean but using the previously computed

     * running mean and variance. */

   static void BatchNormLayerForwardInference(int axis, const Tensor_t &x, Matrix_t &gamma, Matrix_t &beta,

                                              Tensor_t &y, const Matrix_t &runningMeans,

                                              const Matrix_t &runningVars, Scalar_t epsilon,

                                              const TensorDescriptor_t &);


   /** Backward step of the batch normalization layer. Writable arguments are \p dx, \p gamma,

    *  \p dgamma and \p dbeta; \p x, \p dy, \p mean, \p variance and \p iVariance are read-only. */

   static void BatchNormLayerBackward(int axis, const Tensor_t &x, const Tensor_t &dy, Tensor_t &dx,

                                      Matrix_t &gamma, //  Matrix_t &beta, (not needed)

                                      Matrix_t &dgamma, Matrix_t &dbeta, const Matrix_t &mean, const Matrix_t &variance,

                                      const Matrix_t &iVariance, Scalar_t epsilon, const TensorDescriptor_t &);


   // helper function for BNorm layer: returns a tensor built from \p x for the given \p axis

   static Tensor_t BatchNormLayerReshapeTensor(int axis, const Tensor_t &x);


   ///@}


   //____________________________________________________________________________

   //

   //  Convolutional Layer Propagation

   //____________________________________________________________________________


   /** @name Forward Propagation in Convolutional Layer

    */

   ///@{


   /** Calculate how many neurons "fit" in the output layer, given the input as well as the layer's hyperparameters.

    */

   // NOTE(review): presumably the usual (imgDim - fltDim + 2 * padding) / stride + 1
   // -- confirm against the implementation, which is not visible in this header.
   static size_t calculateDimension(size_t imgDim, size_t fltDim, size_t padding, size_t stride);


   /** Transform the matrix \p B into local view format, suitable for

    *  convolution, and store it in matrix \p A. */

   static void Im2col(Matrix_t &A, const Matrix_t &B, size_t imgHeight, size_t imgWidth, size_t fltHeight,

                      size_t fltWidth, size_t strideRows, size_t strideCols, size_t zeroPaddingHeight,

                      size_t zeroPaddingWidth);


   // Index-based variant: Im2colIndices fills the index vector \p V, and
   // Im2colFast takes such a vector as read-only input together with \p B to fill \p A.
   // NOTE(review): presumably V is computed once and reused across calls -- confirm.
   static void Im2colIndices(std::vector<int> &V, const Matrix_t &B, size_t nLocalViews, size_t imgHeight,

                             size_t imgWidth, size_t fltHeight, size_t fltWidth, size_t strideRows, size_t strideCols,

                             size_t zeroPaddingHeight, size_t zeroPaddingWidth);

   static void Im2colFast(Matrix_t &A, const Matrix_t &B, const std::vector<int> &V);


   /** Rotates the matrix \p B, which represents the weights,

    *  and stores the result in the matrix \p A. */

   static void RotateWeights(Matrix_t &A, const Matrix_t &B, size_t filterDepth, size_t filterHeight,

                             size_t filterWidth, size_t numFilters);


   /** Add the biases in the Convolutional Layer (\p output is writable, \p biases is read-only). */

   static void AddConvBiases(Matrix_t &output, const Matrix_t &biases);

   ///@}


   /** Dummy placeholder - preparation is currently only required for the CUDA architecture. */

   /** Empty implementation: the tensor argument is ignored. */
   static void PrepareInternals(Tensor_t & /*unused*/)
   {
   }


   /** Forward propagation in the Convolutional layer */

   // Writable arguments: \p output and \p inputActivationFunc; \p input, \p weights,
   // \p biases and \p params are read-only.
   // NOTE(review): the names of the inputPrime, descriptors and workspace parameters
   // are commented out in this declaration, so they are presumably unused by the CPU
   // implementation; the trailing "cuda architecture" remarks look carried over from
   // another backend -- confirm.
   static void ConvLayerForward(Tensor_t &output, Tensor_t &inputActivationFunc, const Tensor_t &input,

                                const Matrix_t &weights, const Matrix_t &biases, const DNN::CNN::TConvParams &params,

                                EActivationFunction activFunc, Tensor_t & /* inputPrime */,

                                const ConvDescriptors_t & /*descriptors*/, // Empty struct for cuda architecture

                                ConvWorkspace_t & /*workspace*/);          // Empty struct for cuda architecture

   // void * cudnnWorkspace = nullptr);          // Remains nullptr for cuda architecture


   /** @name Backward Propagation in Convolutional Layer

    */

   ///@{


   /** Perform the complete backward propagation step in a Convolutional Layer.

    *  If the provided \p activationGradientsBackward matrix is not empty, compute the

    *  gradients of the objective function with respect to the activations

    *  of the previous layer (backward direction).

    *  Also compute the weight and the bias gradients. Modifies the values

    *  in \p df and thus produces only a valid result, if it is applied the

    *  first time after the corresponding forward propagation has been per-

    *  formed. */

   // Unlike the dense-layer Backward, \p df and \p activationGradients are taken
   // by non-const reference here, matching the remark above that \p df is modified.
   // The descriptors and workspace parameter names are commented out in this declaration.
   static void

   ConvLayerBackward(Tensor_t &activationGradientsBackward, Matrix_t &weightGradients, Matrix_t &biasGradients,

                     Tensor_t &df, Tensor_t &activationGradients, const Matrix_t &weights,

                     const Tensor_t &activationBackward, const Tensor_t &outputTensor, EActivationFunction activFunc,

                     const ConvDescriptors_t & /*descriptors*/, ConvWorkspace_t & /*workspace*/, size_t batchSize,

                     size_t inputHeight, size_t inputWidth, size_t depth, size_t height, size_t width,

                     size_t filterDepth, size_t filterHeight, size_t filterWidth, size_t nLocalViews);


   /** Utility function for calculating the activation gradients of the layer

    *  before the convolutional layer. Writes into \p activationGradientsBackward;

    *  \p df and \p weights are read-only. */

   static void CalculateConvActivationGradients(Tensor_t &activationGradientsBackward, const Tensor_t &df,

                                                const Matrix_t &weights, size_t batchSize, size_t inputHeight,

                                                size_t inputWidth, size_t depth, size_t height, size_t width,

                                                size_t filterDepth, size_t filterHeight, size_t filterWidth);


   /** Utility function for calculating the weight gradients of the convolutional

    * layer. Writes into \p weightGradients; \p df and \p activations_backward are read-only. */

   static void CalculateConvWeightGradients(Matrix_t &weightGradients, const Tensor_t &df,

                                            const Tensor_t &activations_backward, size_t batchSize, size_t inputHeight,

                                            size_t inputWidth, size_t depth, size_t height, size_t width,

                                            size_t filterDepth, size_t filterHeight, size_t filterWidth,

                                            size_t nLocalViews);


   /** Utility function for calculating the bias gradients of the convolutional

    *  layer. Writes into \p biasGradients; \p df is read-only. */

   static void CalculateConvBiasGradients(Matrix_t &biasGradients, const Tensor_t &df, size_t batchSize, size_t depth,

                                          size_t nLocalViews);

   ///@}


   //____________________________________________________________________________

   //

   //  Max Pooling Layer Propagation

   //____________________________________________________________________________

   /** @name Forward Propagation in Max Pooling Layer

    */

   ///@{


   /** Downsample the matrix \p C to the matrix \p A, using max

    * operation, such that the winning indices are stored in matrix

    * \p B. */

   // Per the description above: \p A receives the downsampled values, \p B the
   // winning indices, and \p C is the read-only input. The descriptors and
   // workspace parameter names are commented out in this declaration.
   static void Downsample(Tensor_t &A, Tensor_t &B, const Tensor_t &C, const PoolingDescriptors_t & /*descriptors*/,

                          PoolingWorkspace_t & /*workspace*/, size_t imgHeight, size_t imgWidth, size_t fltHeight,

                          size_t fltWidth, size_t strideRows, size_t strideCols);


   ///@}


   /** @name Backward Propagation in Max Pooling Layer

    */

   ///@{

   /** Perform the complete backward propagation step in a Pooling Layer. Based on the

    *  winning indices stored in the index matrix, it just forwards the activation

    *  gradients to the previous layer. */

   // \p activationGradientsBackward is the only writable tensor; \p activationGradients
   // and \p indexMatrix are read-only inputs. The names of the inputActivation,
   // outputTensor, descriptors and workspace parameters are commented out in this
   // declaration (presumably unused by the CPU implementation -- confirm).
   static void MaxPoolLayerBackward(Tensor_t &activationGradientsBackward, const Tensor_t &activationGradients,

                                    const Tensor_t &indexMatrix, const Tensor_t & /*inputActivation*/,

                                    const Tensor_t & /*outputTensor*/, const PoolingDescriptors_t & /*descriptors*/,

                                    PoolingWorkspace_t & /*workspace*/, size_t imgHeight, size_t imgWidth,

                                    size_t fltHeight, size_t fltWidth, size_t strideRows, size_t strideCols,

                                    size_t nLocalViews);


                                     //// Recurrent Network Functions


   /** Backward pass for Recurrent Networks */

   // Returns a reference to a Matrix_t (which one is not visible from this
   // declaration). The trailing remarks give matrix shapes; presumably B = batch
   // size, H = state size and D = input size -- confirm.
   // NOTE(review): \p df is annotated DxH while \p state is BxH -- confirm that the
   // DxH remark is correct.
   static Matrix_t &RecurrentLayerBackward(Matrix_t &state_gradients_backward, // BxH

                                           Matrix_t &input_weight_gradients, Matrix_t &state_weight_gradients,

                                           Matrix_t &bias_gradients,

                                           Matrix_t &df,                  // DxH

                                           const Matrix_t &state,         // BxH

                                           const Matrix_t &weights_input, // HxD

                                           const Matrix_t &weights_state, // HxH

                                           const Matrix_t &input,         // BxD

                                           Matrix_t &input_gradient);


   // dummy RNN functions


   /** Dummy forward pass for recurrent layers: empty body, every argument is ignored. */
   static void RNNForward(const Tensor_t & /* x */,
                          const Matrix_t & /* hx */,
                          const Matrix_t & /* cx */,
                          const Tensor_t & /* weights */,
                          Tensor_t & /* y */,
                          Matrix_t & /* hy */,
                          Matrix_t & /* cy */,
                          const RNNDescriptors_t & /* descr */,
                          RNNWorkspace_t & /* workspace */,
                          bool /* isTraining */)
   {
      // intentionally empty
   }


   /** Dummy backward pass for recurrent layers: empty body, every argument is ignored. */
   static void RNNBackward(const Tensor_t & /* x */,
                           const Matrix_t & /* hx */,
                           const Matrix_t & /* cx */,
                           const Tensor_t & /* y */,
                           const Tensor_t & /* dy */,
                           const Matrix_t & /* dhy */,
                           const Matrix_t & /* dcy */,
                           const Tensor_t & /* weights */,
                           Tensor_t & /* dx */,
                           Matrix_t & /* dhx */,
                           Matrix_t & /* dcx */,
                           Tensor_t & /* dw */,
                           const RNNDescriptors_t & /* desc */,
                           RNNWorkspace_t & /* workspace */)
   {
      // intentionally empty
   }


   /** Backward pass for LSTM Network.
    *
    *  Only declared here; the definition lives in RecurrentPropagation.hxx.
    *  The grouping below is read off the parameter names and const qualifiers;
    *  the actual update rules are not visible in this header
    *  (TODO confirm against the definition).
    *
    *  Mutable (non-const) arguments:
    *   - state_gradients_backward, cell_gradients_backward
    *   - the four *_weight_gradients (input, forget, candidate, output)
    *   - the four *_state_weight_gradients (input, forget, candidate, output)
    *   - the four *_bias_gradients (input, forget, candidate, output)
    *   - di, df, dc, dout (presumably per-gate derivative buffers)
    *   - input_gradient, cell_gradient, cell_tanh
    *
    *  Read-only (const) arguments:
    *   - precStateActivations, precCellActivations
    *   - fInput, fForget, fCandidate, fOutput (presumably the gate values of
    *     the forward pass)
    *   - weights_input, weights_forget, weights_candidate, weights_output and
    *     their *_state counterparts
    *   - input
    *
    *  \return reference to a Matrix_t; presumably \p input_gradient -- TODO confirm.
    */
   static Matrix_t & LSTMLayerBackward(TCpuMatrix<Scalar_t> & state_gradients_backward,
                                          TCpuMatrix<Scalar_t> & cell_gradients_backward,
                                          TCpuMatrix<Scalar_t> & input_weight_gradients,
                                       TCpuMatrix<Scalar_t> & forget_weight_gradients,
                                       TCpuMatrix<Scalar_t> & candidate_weight_gradients,
                                       TCpuMatrix<Scalar_t> & output_weight_gradients,
                                       TCpuMatrix<Scalar_t> & input_state_weight_gradients,
                                       TCpuMatrix<Scalar_t> & forget_state_weight_gradients,
                                       TCpuMatrix<Scalar_t> & candidate_state_weight_gradients,
                                       TCpuMatrix<Scalar_t> & output_state_weight_gradients,
                                       TCpuMatrix<Scalar_t> & input_bias_gradients,
                                       TCpuMatrix<Scalar_t> & forget_bias_gradients,
                                       TCpuMatrix<Scalar_t> & candidate_bias_gradients,
                                       TCpuMatrix<Scalar_t> & output_bias_gradients,
                                       TCpuMatrix<Scalar_t> & di,
                                       TCpuMatrix<Scalar_t> & df,
                                       TCpuMatrix<Scalar_t> & dc,
                                       TCpuMatrix<Scalar_t> & dout,
                                       const TCpuMatrix<Scalar_t> & precStateActivations,
                                       const TCpuMatrix<Scalar_t> & precCellActivations,
                                       const TCpuMatrix<Scalar_t> & fInput,
                                       const TCpuMatrix<Scalar_t> & fForget,
                                       const TCpuMatrix<Scalar_t> & fCandidate,
                                       const TCpuMatrix<Scalar_t> & fOutput,
                                       const TCpuMatrix<Scalar_t> & weights_input,
                                       const TCpuMatrix<Scalar_t> & weights_forget,
                                       const TCpuMatrix<Scalar_t> & weights_candidate,
                                       const TCpuMatrix<Scalar_t> & weights_output,
                                       const TCpuMatrix<Scalar_t> & weights_input_state,
                                       const TCpuMatrix<Scalar_t> & weights_forget_state,
                                       const TCpuMatrix<Scalar_t> & weights_candidate_state,
                                       const TCpuMatrix<Scalar_t> & weights_output_state,
                                       const TCpuMatrix<Scalar_t> & input,
                                       TCpuMatrix<Scalar_t> & input_gradient,
                                       TCpuMatrix<Scalar_t> & cell_gradient,
                                       TCpuMatrix<Scalar_t> & cell_tanh);


   /** Backward pass for GRU Network.
    *
    *  Only declared here; the definition lives in RecurrentPropagation.hxx.
    *  The grouping below is read off the parameter names and const qualifiers;
    *  the actual update rules are not visible in this header
    *  (TODO confirm against the definition).
    *
    *  Mutable (non-const) arguments:
    *   - state_gradients_backward
    *   - the three *_weight_gradients (reset, update, candidate)
    *   - the three *_state_weight_gradients (reset, update, candidate)
    *   - the three *_bias_gradients (reset, update, candidate)
    *   - dr, du, dc (presumably per-gate derivative buffers)
    *   - input_gradient
    *
    *  Read-only (const) arguments:
    *   - precStateActivations
    *   - fReset, fUpdate, fCandidate (presumably the gate values of the
    *     forward pass)
    *   - weights_reset, weights_update, weights_candidate and their *_state
    *     counterparts
    *   - input
    *
    *  \p resetGateAfter is a plain flag; presumably it selects where the reset
    *  gate is applied in the candidate computation -- TODO confirm.
    *
    *  \return reference to a Matrix_t; presumably \p input_gradient -- TODO confirm.
    */
   static Matrix_t & GRULayerBackward(TCpuMatrix<Scalar_t> & state_gradients_backward,
                                      TCpuMatrix<Scalar_t> & reset_weight_gradients,
                                      TCpuMatrix<Scalar_t> & update_weight_gradients,
                                      TCpuMatrix<Scalar_t> & candidate_weight_gradients,
                                      TCpuMatrix<Scalar_t> & reset_state_weight_gradients,
                                      TCpuMatrix<Scalar_t> & update_state_weight_gradients,
                                      TCpuMatrix<Scalar_t> & candidate_state_weight_gradients,
                                      TCpuMatrix<Scalar_t> & reset_bias_gradients,
                                      TCpuMatrix<Scalar_t> & update_bias_gradients,
                                      TCpuMatrix<Scalar_t> & candidate_bias_gradients,
                                      TCpuMatrix<Scalar_t> & dr,
                                      TCpuMatrix<Scalar_t> & du,
                                      TCpuMatrix<Scalar_t> & dc,
                                      const TCpuMatrix<Scalar_t> & precStateActivations,
                                      const TCpuMatrix<Scalar_t> & fReset,
                                      const TCpuMatrix<Scalar_t> & fUpdate,
                                      const TCpuMatrix<Scalar_t> & fCandidate,
                                      const TCpuMatrix<Scalar_t> & weights_reset,
                                      const TCpuMatrix<Scalar_t> & weights_update,
                                      const TCpuMatrix<Scalar_t> & weights_candidate,
                                      const TCpuMatrix<Scalar_t> & weights_reset_state,
                                      const TCpuMatrix<Scalar_t> & weights_update_state,
                                      const TCpuMatrix<Scalar_t> & weights_candidate_state,
                                      const TCpuMatrix<Scalar_t> & input,
                                      TCpuMatrix<Scalar_t> & input_gradient,
                                      bool resetGateAfter);


   ///@}


   //____________________________________________________________________________

   //

   //  Reshape Layer Propagation

   //____________________________________________________________________________

   /** @name Forward and Backward Propagation in Reshape Layer

    */

   ///@{


   /** Transform the matrix \p B into the matrix \p A, which has different
    *  dimensions. \p A is the output; \p B is const and only read. */
   static void Reshape(Matrix_t &A, const Matrix_t &B);


   /** Flattens the tensor \p B such that each of its matrices is stretched
    *  into one row; the result is written to \p A. */
   static void Flatten(Tensor_t &A, const Tensor_t &B); // size_t size, size_t nRows, size_t nCols);


   /** Transforms each row of \p B to a matrix and stores it in the
    *  tensor \p A (\p B is const and only read). */
   static void Deflatten(Tensor_t &A, const Tensor_t &B); // size_t index, size_t nRows,size_t nCols);


   /** Rearrange data according to time: fill the B x T x D tensor \p out
    *  from the T x B x D tensor \p in. */
   static void Rearrange(Tensor_t &out, const Tensor_t &in);


   ///@}


   //____________________________________________________________________________

   //

   // Additional Arithmetic Functions

   //____________________________________________________________________________


   /** @name Additional Arithmetic Functions
    *
    * Additional arithmetic on CPU matrices used to implement the low-level
    * interface.
    */

   ///@{


   /** Standard multiplication of two matrices \p A and \p B with the result being
    *  written into \p C. \p A and \p B are const and only read.
    */
   static void Multiply(Matrix_t &C, const Matrix_t &A, const Matrix_t &B);

   /** Matrix multiplication involving a transposed operand, with the result
    *  being written into \p output.
    *
    *  Historically described as the product of A and B^T written into C; by
    *  parameter position that reads A = \p input, B = \p Weights, C = \p output.
    *  NOTE(review): confirm against the definition in Arithmetic.hxx which of
    *  the two operands is actually transposed.
    *
    *  \p alpha (default 1.0) and \p beta (default 0.) are presumably BLAS-style
    *  scale factors for the product and for the previous content of \p output
    *  -- TODO confirm.
    */
   static void TransposeMultiply(Matrix_t &output, const Matrix_t &input, const Matrix_t &Weights, Scalar_t alpha = 1.0,
                                 Scalar_t beta = 0.);

   /** In-place Hadamard (element-wise) product of \p A and \p B
    *  with the result being written into \p A. Declared once for tensors and
    *  once for matrices; \p B is const and only read in both.
    */
   static void Hadamard(Tensor_t &A, const Tensor_t &B);
   static void Hadamard(Matrix_t &A, const Matrix_t &B);
   // Disabled inline body that forwarded the matrix overload to the tensor one:
   // {
   //    Tensor_t tA(A);
   //    Hadamard( tA, Tensor_t(B));
   // }


   /** Sum columns of (m x n) matrix \p A and write the results into \p B
    *  (\p A is const and only read).
    *
    *  NOTE(review): the expected shape of \p B and the exact role of \p alpha
    *  (default 1.0) and \p beta (default 0.) are not visible in this header;
    *  presumably result = alpha * sums + beta * B -- TODO confirm against
    *  Arithmetic.hxx.
    */
   static void SumColumns(Matrix_t &B, const Matrix_t &A, Scalar_t alpha = 1.0, Scalar_t beta = 0.);


   /** Compute the sum of all elements in \p A.
    *  \return the sum as a Scalar_t; \p A is not modified. */
   static Scalar_t Sum(const Matrix_t &A);


   /** Check two matrices for equality, taking floating point arithmetic errors into account.
    *  \p epsilon is the tolerance and defaults to 0.1; whether it is applied as an
    *  absolute or a relative bound is not visible here -- see Arithmetic.hxx. */
   static bool AlmostEquals(const Matrix_t &A, const Matrix_t &B, double epsilon = 0.1);


   /** Add the constant \p beta to all the elements of matrix \p A and write the
    *  result back into \p A (in-place operation).
    */
   static void ConstAdd(Matrix_t &A, Scalar_t beta);


   /** Multiply all the elements of matrix \p A by the constant \p beta and write
    *  the result back into \p A (in-place operation).
    */
   static void ConstMult(Matrix_t &A, Scalar_t beta);


   /** Replace each element of the matrix \p A by its reciprocal; the result is
    *  written back into \p A (in-place operation).
    */
   static void ReciprocalElementWise(Matrix_t &A);


   /** Square each element of the matrix \p A and write the result back into
    *  \p A (in-place operation).
    */
   static void SquareElementWise(Matrix_t &A);


   /** Take the square root of each element of the matrix \p A and write the
    *  result back into \p A (in-place operation).
    */
   static void SqrtElementWise(Matrix_t &A);


   // optimizer functions
   // Update helpers for the Adam optimizer (going by their names). In every
   // call only \p A is mutable; the other matrices are const inputs.
   // The formulas are not visible in this header (AdamUpdateSecondMom is
   // defined in Arithmetic.hxx). Presumably M and V are the first and second
   // moment estimates, alpha the step size, eps a small stabilizing constant
   // and beta the moment decay rate -- TODO confirm against the definitions.
   static void AdamUpdate(Matrix_t &A, const Matrix_t &M, const Matrix_t &V, Scalar_t alpha, Scalar_t eps);
   static void AdamUpdateFirstMom(Matrix_t &A, const Matrix_t &B, Scalar_t beta);
   static void AdamUpdateSecondMom(Matrix_t &A, const Matrix_t &B, Scalar_t beta);


   // printing of tensor
   /** Print the tensor \p A to std::cout, prefixed by the label \p name
    *  (default "Cpu-tensor"), its size and its shape. When \p truncate is set,
    *  at most 10 entries per row are printed for 2-D and 3-D tensors. */
   static void PrintTensor(const Tensor_t &A, const std::string name = "Cpu-tensor", bool truncate = false);


};


//____________________________________________________________________________

template <typename AReal>
template <typename AMatrix_t>
void TCpu<AReal>::CopyDiffArch(TCpuMatrix<AReal> &B, const AMatrix_t &A)
{
   // Copy from a matrix of another architecture into the CPU matrix B, using
   // TMatrixT as the common intermediate representation. Two temporaries are
   // created on the way, so this is not an efficient path.
   TMatrixT<AReal> bridge = A; // implicit conversion; also works if A is a tensor
   const TCpuMatrix<AReal> staged(bridge);
   Copy(B, staged);
}


//____________________________________________________________________________

template <typename AReal>
template <typename ATensor_t>
void TCpu<AReal>::CopyDiffArch(TCpuTensor<AReal> &B, const ATensor_t &A)
{
   // Source and destination must hold the same number of elements.
   R__ASSERT(A.GetSize() == B.GetSize());

   // Walk over the first dimension and copy one slice at a time. For an input
   // of shape (B,D,H,W) each slice i is converted to a (D,HW) matrix, i.e. the
   // result is laid out as B,HW,D or (D,HW,B) in ColumnMajor format.
   const size_t nSlices = A.GetFirstSize();
   for (size_t slice = 0; slice < nSlices; ++slice) {
      // slice of A, converted to the intermediate TMatrixT representation
      TMatrixT<AReal> source = A.At(slice);
      // matrix (D,HW) obtained from the matching slice of B; it is the copy target
      TCpuMatrix<AReal> target = B.At(slice).GetMatrix();
      const TCpuMatrix<AReal> staged(source);
      Copy(target, staged);
   }
}


// Implementation using vector of matrices for the weights

template <typename AReal>
template <typename AMatrix_t>
void TCpu<AReal>::CopyDiffArch(std::vector<TCpuMatrix<AReal>> &A, const std::vector<AMatrix_t> &B)
{
   // Copy a list of matrices coming from another architecture, one entry at a
   // time, by delegating to the single-matrix overload.
   // Note the argument roles: here A is the destination and B the source,
   // which is the opposite of the single-matrix and tensor overloads.
   //
   // Every A[i] needs a matching B[i]; fail loudly instead of reading past the
   // end of a shorter source vector.
   R__ASSERT(B.size() >= A.size());
   for (size_t i = 0; i < A.size(); ++i) {
      CopyDiffArch(A[i], B[i]);
   }
}


/// Print a tensor to std::cout.
///
/// The first line holds the label \p name, the element count, the shape and
/// the buffer use count. The elements follow:
///  - rank 2: one "{ ... }" line per row,
///  - rank 3: one "{ ... }" line per (i,j) pair, grouped per first index,
///  - any other rank: the flat data buffer on a single line.
/// With \p truncate set, at most 10 entries per row are printed for rank 2 and
/// rank 3, followed by " ...... " when entries were left out.
/// An empty shape is printed as "{  }" instead of indexing past the end.
template <typename AReal>
void TCpu<AReal>::PrintTensor(const typename TCpu<AReal>::Tensor_t & A, const std::string name, bool truncate)
{
   std::cout << name << " size = " << A.GetSize() << " shape = { ";
   const auto shape = A.GetShape();
   // "k + 1 < size" instead of "k < size - 1": the latter wraps around for an
   // empty shape because size() is unsigned.
   for (size_t k = 0; k + 1 < shape.size(); ++k)
      std::cout << shape[k] << " , ";
   if (shape.size() > 0)
      std::cout << shape.back();
   std::cout << " } ";

   // print elements
   // need to find way to nice printing all elements
   std::cout << " tensor count " << A.GetBufferUseCount() << std::endl;
   if (shape.size() == 2) {
      const size_t nCols = shape[1];
      const size_t nShown = truncate ? std::min(nCols, size_t(10)) : nCols;
      for (size_t i = 0; i < shape[0]; ++i) {
         std::cout << "{ ";
         for (size_t j = 0; j < nShown; ++j) {
            std::cout << A(i,j) << " ";
         }
         if (truncate && nShown < nCols) std::cout << " ...... ";
         std::cout << " } " << std::endl;
      }
   } else if (shape.size() == 3) {
      const size_t width = A.GetWSize();
      const size_t nShown = truncate ? std::min(width, size_t(10)) : width;
      for (size_t i = 0; i < A.GetFirstSize(); ++i) {
         std::cout << "{ ";
         for (size_t j = 0; j < A.GetHSize(); ++j) {
            std::cout << "{ ";
            for (size_t k = 0; k < nShown; ++k) {
               std::cout << A(i,j,k) << " ";
            }
            if (truncate && nShown < width) std::cout << " ...... ";
            std::cout << " } " << std::endl;
         }
         std::cout << " } " << std::endl;
      }
   } else {
      // any other rank: dump the flat buffer
      for (size_t l = 0; l < A.GetSize(); ++l) {
         std::cout << A.GetData()[l] << " ";
      }
      std::cout << "\n";
   }
}


} // namespace DNN

} // namespace TMVA


#endif

BatchNormLayer.h

ContextHandles.h

ConvLayer.h

CpuBuffer.h

CpuMatrix.h

CpuTensor.h

GeneralLayer.h

MaxPoolLayer.h

RNNLayer.h

b
#define b(i)
Definition RSha256.hxx:100

c
#define c(i)
Definition RSha256.hxx:101

h
#define h(i)
Definition RSha256.hxx:106

X
#define X(type, name)

TRangeDynCast
ROOT::Detail::TRangeCast< T, true > TRangeDynCast
TRangeDynCast is an adapter class that allows the typed iteration through a TCollection.
Definition TCollection.h:358

R__ASSERT
#define R__ASSERT(e)
Definition TError.h:118

w
winID w
Definition TGWin32VirtualGLProxy.cxx:39

p
winID h TVirtualViewer3D TVirtualGLPainter p
Definition TGWin32VirtualGLProxy.cxx:51

input
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void input
Definition TGWin32VirtualXProxy.cxx:142

width
Option_t Option_t width
Definition TGWin32VirtualXProxy.cxx:56

height
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t height
Definition TGWin32VirtualXProxy.cxx:164

name
char name[80]
Definition TGX11.cxx:110

AReal

ROOT::Detail::TRangeCast
Definition TCollection.h:311

TMVA::DNN::CNN::TConvLayer
Definition ConvLayer.h:75

TMVA::DNN::CNN::TMaxPoolLayer
Generic Max Pooling Layer class.
Definition MaxPoolLayer.h:59

TMVA::DNN::TCpuMatrix
The TCpuMatrix class.
Definition CpuMatrix.h:86

TMVA::DNN::TCpuTensor
Definition CpuTensor.h:40

TMVA::DNN::TCpuTensor::GetBufferUseCount
size_t GetBufferUseCount() const
Definition CpuTensor.h:300

TMVA::DNN::TCpuTensor::GetWSize
size_t GetWSize() const
Definition CpuTensor.h:177

TMVA::DNN::TCpuTensor::GetFirstSize
size_t GetFirstSize() const
Definition CpuTensor.h:155

TMVA::DNN::TCpuTensor::GetHSize
size_t GetHSize() const
Definition CpuTensor.h:168

TMVA::DNN::TCpu
The TCpu architecture class.
Definition Cpu.h:65

TMVA::DNN::TCpu::CalculateConvBiasGradients
static void CalculateConvBiasGradients(Matrix_t &biasGradients, const Tensor_t &df, size_t batchSize, size_t depth, size_t nLocalViews)
Utility function for calculating the bias gradients of the convolutional layer.
Definition Propagation.hxx:587

TMVA::DNN::TCpu::Deflatten
static void Deflatten(Tensor_t &A, const Tensor_t &B)
Transforms each row of B to a matrix and stores it in the tensor A.
Definition Propagation.hxx:944

TMVA::DNN::TCpu::FastTanh
static void FastTanh(Tensor_t &B)
Definition ActivationFunctions.hxx:158

TMVA::DNN::TCpu::TransposeMultiply
static void TransposeMultiply(Matrix_t &output, const Matrix_t &input, const Matrix_t &Weights, Scalar_t alpha=1.0, Scalar_t beta=0.)
Matrix multiplication of two matrices A and B^T (transposed) with the result being written into C.
Definition Arithmetic.hxx:77

TMVA::DNN::TCpu::fgRandomGen
static TRandom * fgRandomGen
Definition Cpu.h:67

TMVA::DNN::TCpu::CreateTensor
static Tensor_t CreateTensor(DeviceBuffer_t buffer, size_t n, size_t c, size_t h, size_t w)
Definition Cpu.h:111

TMVA::DNN::TCpu::PoolingWorkspace_t
CNN::TCNNWorkspace< PoolingLayer_t > PoolingWorkspace_t
Definition Cpu.h:100

TMVA::DNN::TCpu::L1Regularization
static Scalar_t L1Regularization(const Matrix_t &W)
Definition Regularization.hxx:27

TMVA::DNN::TCpu::MaxPoolLayerBackward
static void MaxPoolLayerBackward(Tensor_t &activationGradientsBackward, const Tensor_t &activationGradients, const Tensor_t &indexMatrix, const Tensor_t &, const Tensor_t &, const PoolingDescriptors_t &, PoolingWorkspace_t &, size_t imgHeight, size_t imgWidth, size_t fltHeight, size_t fltWidth, size_t strideRows, size_t strideCols, size_t nLocalViews)
Perform the complete backward propagation step in a Pooling Layer.
Definition Propagation.hxx:650

TMVA::DNN::TCpu::ScaleAdd
static void ScaleAdd(Matrix_t &A, const Matrix_t &B, Scalar_t beta=1.0)
Adds the elements in matrix B scaled by beta to the elements in the matrix A.
Definition Arithmetic.hxx:248

TMVA::DNN::TCpu::AddL1RegularizationGradients
static void AddL1RegularizationGradients(Matrix_t &A, const Matrix_t &W, Scalar_t weightDecay)
Definition Regularization.hxx:60

TMVA::DNN::TCpu::InitializeLSTMTensors
static void InitializeLSTMTensors(GenLayer_t *)
Definition Cpu.h:177

TMVA::DNN::TCpu::AddRowWise
static void AddRowWise(Tensor_t &output, const Matrix_t &biases)
Definition Cpu.h:203

TMVA::DNN::TCpu::ConstAdd
static void ConstAdd(Matrix_t &A, Scalar_t beta)
Add the constant beta to all the elements of matrix A and write the result into A.
Definition Arithmetic.hxx:302

TMVA::DNN::TCpu::TensorDescriptor_t
DummyDescriptor TensorDescriptor_t
Definition Cpu.h:80

TMVA::DNN::TCpu::PoolingDescriptors_t
CNN::TCNNDescriptors< PoolingLayer_t > PoolingDescriptors_t
Definition Cpu.h:99

TMVA::DNN::TCpu::SumColumns
static void SumColumns(Matrix_t &B, const Matrix_t &A, Scalar_t alpha=1.0, Scalar_t beta=0.)
Sum columns of (m x n) matrix A and write the results into the first m elements in A.
Definition Arithmetic.hxx:212

TMVA::DNN::TCpu::Sigmoid
static void Sigmoid(Tensor_t &B)

TMVA::DNN::TCpu::ConvLayerForward
static void ConvLayerForward(Tensor_t &output, Tensor_t &inputActivationFunc, const Tensor_t &input, const Matrix_t &weights, const Matrix_t &biases, const DNN::CNN::TConvParams &params, EActivationFunction activFunc, Tensor_t &, const ConvDescriptors_t &, ConvWorkspace_t &)
Forward propagation in the Convolutional layer.
Definition Propagation.hxx:326

TMVA::DNN::TCpu::CreateTensor
static Tensor_t CreateTensor(DeviceBuffer_t buffer, size_t b, size_t t, size_t w)
Definition Cpu.h:118

TMVA::DNN::TCpu::DropoutBackward
static void DropoutBackward(Tensor_t &, TDescriptors *, TWorkspace *)
Definition Cpu.h:459

TMVA::DNN::TCpu::Sum
static Scalar_t Sum(const Matrix_t &A)
Compute the sum of all elements in A.

TMVA::DNN::TCpu::InitializeLSTMWorkspace
static void InitializeLSTMWorkspace(TWorkspace *&, TDescriptors *&, GenLayer_t *)
Definition Cpu.h:167

TMVA::DNN::TCpu::ConvWorkspace_t
CNN::TCNNWorkspace< ConvLayer_t > ConvWorkspace_t
Definition Cpu.h:97

TMVA::DNN::TCpu::Sigmoid
static void Sigmoid(Matrix_t &YHat, const Matrix_t &)

TMVA::DNN::TCpu::ConvDescriptors_t
CNN::TCNNDescriptors< ConvLayer_t > ConvDescriptors_t
Definition Cpu.h:96

TMVA::DNN::TCpu::Tensor_t
TCpuTensor< AReal > Tensor_t
Definition Cpu.h:70

TMVA::DNN::TCpu::SymmetricReluDerivative
static void SymmetricReluDerivative(Tensor_t &B, const Tensor_t &A)
Definition ActivationFunctions.hxx:181

TMVA::DNN::TCpu::InitializeBNormDescriptors
static void InitializeBNormDescriptors(TDescriptors *&, BNormLayer_t *)
Initialize CNN data/operator descriptors.
Definition Cpu.h:139

TMVA::DNN::TCpu::AlmostEquals
static bool AlmostEquals(const Matrix_t &A, const Matrix_t &B, double epsilon=0.1)
Check two matrices for equality, taking floating point arithmetic errors into account.
Definition Arithmetic.hxx:194

TMVA::DNN::TCpu::Hadamard
static void Hadamard(Tensor_t &A, const Tensor_t &B)
In-place Hadamard (element-wise) product of matrices A and B with the result being written into A.
Definition Arithmetic.hxx:152

TMVA::DNN::TCpu::InitializeIdentity
static void InitializeIdentity(Matrix_t &A)
Definition Initialization.hxx:133

TMVA::DNN::TCpu::ReleasePoolDescriptors
static void ReleasePoolDescriptors(TDescriptors *&)
Definition Cpu.h:154

TMVA::DNN::TCpu::InitializePoolDropoutWorkspace
static void InitializePoolDropoutWorkspace(TWorkspace *&, TDescriptors *&, const DNN::CNN::TConvParams &, PoolingLayer_t *)
Definition Cpu.h:162

TMVA::DNN::TCpu::Im2colFast
static void Im2colFast(Matrix_t &A, const Matrix_t &B, const std::vector< int > &V)
Definition Propagation.hxx:235

TMVA::DNN::TCpu::SqrtElementWise
static void SqrtElementWise(Matrix_t &A)
Square root each element of the matrix A and write the result into A.
Definition Arithmetic.hxx:334

TMVA::DNN::TCpu::AddRowWise
static void AddRowWise(Matrix_t &output, const Matrix_t &biases)
Add the vectors biases row-wise to the matrix output.

TMVA::DNN::TCpu::SoftmaxCrossEntropyGradients
static void SoftmaxCrossEntropyGradients(Matrix_t &dY, const Matrix_t &Y, const Matrix_t &output, const Matrix_t &weights)
Definition LossFunctions.hxx:180

TMVA::DNN::TCpu::InitializeGRUDescriptors
static void InitializeGRUDescriptors(TDescriptors *&, GenLayer_t *)
Definition Cpu.h:148

TMVA::DNN::TCpu::SymmetricRelu
static void SymmetricRelu(Tensor_t &B)
Definition ActivationFunctions.hxx:173

TMVA::DNN::TCpu::PrintTensor
static void PrintTensor(const Tensor_t &A, const std::string name="Cpu-tensor", bool truncate=false)
Definition Cpu.h:862

TMVA::DNN::TCpu::GetRandomGenerator
static TRandom & GetRandomGenerator()
Definition Initialization.hxx:35

TMVA::DNN::TCpu::MultiplyTranspose
static void MultiplyTranspose(Tensor_t &output, const Tensor_t &input, const Matrix_t &weights)
Definition Cpu.h:194

TMVA::DNN::TCpu::DropoutForward
static void DropoutForward(Tensor_t &A, TDescriptors *descriptors, TWorkspace *workspace, Scalar_t p)
Apply dropout with activation probability p to the given tensor A and scale the result by reciprocal ...

TMVA::DNN::TCpu::FreePoolDropoutWorkspace
static void FreePoolDropoutWorkspace(TWorkspace *&)
Definition Cpu.h:171

TMVA::DNN::TCpu::CreateTensor
static Tensor_t CreateTensor(size_t b, size_t t, size_t w)
Definition Cpu.h:114

TMVA::DNN::TCpu::Softmax
static void Softmax(Matrix_t &YHat, const Matrix_t &)
Definition OutputFunctions.hxx:33

TMVA::DNN::TCpu::CalculateConvActivationGradients
static void CalculateConvActivationGradients(Tensor_t &activationGradientsBackward, const Tensor_t &df, const Matrix_t &weights, size_t batchSize, size_t inputHeight, size_t inputWidth, size_t depth, size_t height, size_t width, size_t filterDepth, size_t filterHeight, size_t filterWidth)
Utility function for calculating the activation gradients of the layer before the convolutional layer...
Definition Propagation.hxx:425

TMVA::DNN::TCpu::TanhDerivative
static void TanhDerivative(Tensor_t &B, const Tensor_t &A)
Definition ActivationFunctions.hxx:110

TMVA::DNN::TCpu::InitializeGRUWorkspace
static void InitializeGRUWorkspace(TWorkspace *&, TDescriptors *&, GenLayer_t *)
Definition Cpu.h:168

TMVA::DNN::TCpu::BatchNormLayerForwardTraining
static void BatchNormLayerForwardTraining(int axis, const Tensor_t &x, Tensor_t &y, Matrix_t &gamma, Matrix_t &beta, Matrix_t &mean, Matrix_t &, Matrix_t &iVariance, Matrix_t &runningMeans, Matrix_t &runningVars, Scalar_t nTrainedBatches, Scalar_t momentum, Scalar_t epsilon, const TensorDescriptor_t &bnParDescriptor)
The input from each batch are normalized during training to have zero mean and unit variance and they...
Definition Propagation.hxx:709

TMVA::DNN::TCpu::Multiply
static void Multiply(Matrix_t &C, const Matrix_t &A, const Matrix_t &B)
Standard multiplication of two matrices A and B with the result being written into C.
Definition Arithmetic.hxx:42

TMVA::DNN::TCpu::Backward
static void Backward(Tensor_t &activationGradientsBackward, Matrix_t &weightGradients, Matrix_t &biasGradients, const Tensor_t &df, const Tensor_t &activationGradients, const Matrix_t &weights, const Tensor_t &activationBackward)
Perform the complete backward propagation step.
Definition Propagation.hxx:100

TMVA::DNN::TCpu::InitializeUniform
static void InitializeUniform(Matrix_t &A)
Definition Initialization.hxx:61

TMVA::DNN::TCpu::ActivationFunctionForward
static void ActivationFunctionForward(Tensor_t &X, EActivationFunction activFunct, const ActivationDescriptor_t activationDescr, const double coef=0.0, const Scalar_t alpha=1, const Scalar_t beta=0)
Definition ActivationFunctions.hxx:32

TMVA::DNN::TCpu::SoftSignDerivative
static void SoftSignDerivative(Tensor_t &B, const Tensor_t &A)
Definition ActivationFunctions.hxx:200

TMVA::DNN::TCpu::AdamUpdateSecondMom
static void AdamUpdateSecondMom(Matrix_t &A, const Matrix_t &B, Scalar_t beta)
Definition Arithmetic.hxx:369

TMVA::DNN::TCpu::Copy
static void Copy(Matrix_t &B, const Matrix_t &A)
Definition Arithmetic.hxx:269

TMVA::DNN::TCpu::ReleaseBNormDescriptors
static void ReleaseBNormDescriptors(TDescriptors *&)
Definition Cpu.h:155

TMVA::DNN::TCpu::SetRandomSeed
static void SetRandomSeed(size_t seed)
Definition Initialization.hxx:29

TMVA::DNN::TCpu::FreeConvWorkspace
static void FreeConvWorkspace(TWorkspace *&)
Only used for certain cudnn on-device memory.
Definition Cpu.h:170

TMVA::DNN::TCpu::LSTMLayerBackward
static Matrix_t & LSTMLayerBackward(TCpuMatrix< Scalar_t > &state_gradients_backward, TCpuMatrix< Scalar_t > &cell_gradients_backward, TCpuMatrix< Scalar_t > &input_weight_gradients, TCpuMatrix< Scalar_t > &forget_weight_gradients, TCpuMatrix< Scalar_t > &candidate_weight_gradients, TCpuMatrix< Scalar_t > &output_weight_gradients, TCpuMatrix< Scalar_t > &input_state_weight_gradients, TCpuMatrix< Scalar_t > &forget_state_weight_gradients, TCpuMatrix< Scalar_t > &candidate_state_weight_gradients, TCpuMatrix< Scalar_t > &output_state_weight_gradients, TCpuMatrix< Scalar_t > &input_bias_gradients, TCpuMatrix< Scalar_t > &forget_bias_gradients, TCpuMatrix< Scalar_t > &candidate_bias_gradients, TCpuMatrix< Scalar_t > &output_bias_gradients, TCpuMatrix< Scalar_t > &di, TCpuMatrix< Scalar_t > &df, TCpuMatrix< Scalar_t > &dc, TCpuMatrix< Scalar_t > &dout, const TCpuMatrix< Scalar_t > &precStateActivations, const TCpuMatrix< Scalar_t > &precCellActivations, const TCpuMatrix< Scalar_t > &fInput, const TCpuMatrix< Scalar_t > &fForget, const TCpuMatrix< Scalar_t > &fCandidate, const TCpuMatrix< Scalar_t > &fOutput, const TCpuMatrix< Scalar_t > &weights_input, const TCpuMatrix< Scalar_t > &weights_forget, const TCpuMatrix< Scalar_t > &weights_candidate, const TCpuMatrix< Scalar_t > &weights_output, const TCpuMatrix< Scalar_t > &weights_input_state, const TCpuMatrix< Scalar_t > &weights_forget_state, const TCpuMatrix< Scalar_t > &weights_candidate_state, const TCpuMatrix< Scalar_t > &weights_output_state, const TCpuMatrix< Scalar_t > &input, TCpuMatrix< Scalar_t > &input_gradient, TCpuMatrix< Scalar_t > &cell_gradient, TCpuMatrix< Scalar_t > &cell_tanh)
Backward pass for LSTM Network.
Definition RecurrentPropagation.hxx:75

TMVA::DNN::TCpu::L2Regularization
static Scalar_t L2Regularization(const Matrix_t &W)
Definition Regularization.hxx:98

TMVA::DNN::TCpu::CreateWeightTensors
static void CreateWeightTensors(std::vector< Matrix_t > &newWeights, const std::vector< Matrix_t > &weights)
Definition Cpu.h:124

TMVA::DNN::TCpu::AddL2RegularizationGradients
static void AddL2RegularizationGradients(Matrix_t &A, const Matrix_t &W, Scalar_t weightDecay)
Definition Regularization.hxx:132

TMVA::DNN::TCpu::InitializeGauss
static void InitializeGauss(Matrix_t &A)
Definition Initialization.hxx:43

TMVA::DNN::TCpu::Reshape
static void Reshape(Matrix_t &A, const Matrix_t &B)
Transform the matrix B to a matrix with different dimensions A.
Definition Propagation.hxx:893

TMVA::DNN::TCpu::IdentityDerivative
static void IdentityDerivative(Tensor_t &B, const Tensor_t &A)
Definition ActivationFunctions.hxx:56

TMVA::DNN::TCpu::RecurrentLayerBackward
static Matrix_t & RecurrentLayerBackward(Matrix_t &state_gradients_backward, Matrix_t &input_weight_gradients, Matrix_t &state_weight_gradients, Matrix_t &bias_gradients, Matrix_t &df, const Matrix_t &state, const Matrix_t &weights_input, const Matrix_t &weights_state, const Matrix_t &input, Matrix_t &input_gradient)
Backward pass for Recurrent Networks.
Definition RecurrentPropagation.hxx:26

TMVA::DNN::TCpu::Rearrange
static void Rearrange(Tensor_t &out, const Tensor_t &in)
Rearrange data according to time: fill the B x T x D tensor out from the T x B x D tensor in.
Definition Propagation.hxx:968

TMVA::DNN::TCpu::MultiplyTranspose
static void MultiplyTranspose(Matrix_t &output, const Matrix_t &input, const Matrix_t &weights)
Matrix-multiply input with the transpose of weights and write the results into output.

TMVA::DNN::TCpu::CrossEntropyGradients
static void CrossEntropyGradients(Matrix_t &dY, const Matrix_t &Y, const Matrix_t &output, const Matrix_t &weights)
Definition LossFunctions.hxx:120

TMVA::DNN::TCpu::InitializeGRUTensors
static void InitializeGRUTensors(GenLayer_t *)
Definition Cpu.h:178

TMVA::DNN::TCpu::InitializeRNNDescriptors
static void InitializeRNNDescriptors(TDescriptors *&, GenLayer_t *)
Definition Cpu.h:146

TMVA::DNN::TCpu::GRULayerBackward
static Matrix_t & GRULayerBackward(TCpuMatrix< Scalar_t > &state_gradients_backward, TCpuMatrix< Scalar_t > &reset_weight_gradients, TCpuMatrix< Scalar_t > &update_weight_gradients, TCpuMatrix< Scalar_t > &candidate_weight_gradients, TCpuMatrix< Scalar_t > &reset_state_weight_gradients, TCpuMatrix< Scalar_t > &update_state_weight_gradients, TCpuMatrix< Scalar_t > &candidate_state_weight_gradients, TCpuMatrix< Scalar_t > &reset_bias_gradients, TCpuMatrix< Scalar_t > &update_bias_gradients, TCpuMatrix< Scalar_t > &candidate_bias_gradients, TCpuMatrix< Scalar_t > &dr, TCpuMatrix< Scalar_t > &du, TCpuMatrix< Scalar_t > &dc, const TCpuMatrix< Scalar_t > &precStateActivations, const TCpuMatrix< Scalar_t > &fReset, const TCpuMatrix< Scalar_t > &fUpdate, const TCpuMatrix< Scalar_t > &fCandidate, const TCpuMatrix< Scalar_t > &weights_reset, const TCpuMatrix< Scalar_t > &weights_update, const TCpuMatrix< Scalar_t > &weights_candidate, const TCpuMatrix< Scalar_t > &weights_reset_state, const TCpuMatrix< Scalar_t > &weights_update_state, const TCpuMatrix< Scalar_t > &weights_candidate_state, const TCpuMatrix< Scalar_t > &input, TCpuMatrix< Scalar_t > &input_gradient, bool resetGateAfter)
Backward pass for GRU Network.
Definition RecurrentPropagation.hxx:193

TMVA::DNN::TCpu::RNNBackward
static void RNNBackward(const Tensor_t &, const Matrix_t &, const Matrix_t &, const Tensor_t &, const Tensor_t &, const Matrix_t &, const Matrix_t &, const Tensor_t &, Tensor_t &, Matrix_t &, Matrix_t &, Tensor_t &, const RNNDescriptors_t &, RNNWorkspace_t &)
Definition Cpu.h:637

TMVA::DNN::TCpu::CalculateConvWeightGradients
static void CalculateConvWeightGradients(Matrix_t &weightGradients, const Tensor_t &df, const Tensor_t &activations_backward, size_t batchSize, size_t inputHeight, size_t inputWidth, size_t depth, size_t height, size_t width, size_t filterDepth, size_t filterHeight, size_t filterWidth, size_t nLocalViews)
Utility function for calculating the weight gradients of the convolutional layer.
Definition Propagation.hxx:494

TMVA::DNN::TCpu::calculateDimension
static size_t calculateDimension(size_t imgDim, size_t fltDim, size_t padding, size_t stride)
Calculate how many neurons "fit" in the output layer, given the input as well as the layer's hyperpar...
Definition Propagation.hxx:314

TMVA::DNN::TCpu::BatchNormLayerBackward
static void BatchNormLayerBackward(int axis, const Tensor_t &x, const Tensor_t &dy, Tensor_t &dx, Matrix_t &gamma, Matrix_t &dgamma, Matrix_t &dbeta, const Matrix_t &mean, const Matrix_t &variance, const Matrix_t &iVariance, Scalar_t epsilon, const TensorDescriptor_t &)
Definition Propagation.hxx:835

TMVA::DNN::TCpu::InitializeConvWorkspace
static void InitializeConvWorkspace(TWorkspace *&, TDescriptors *&, const DNN::CNN::TConvParams &, ConvLayer_t *)
Definition Cpu.h:158

TMVA::DNN::TCpu::ConvLayerBackward
static void ConvLayerBackward(Tensor_t &activationGradientsBackward, Matrix_t &weightGradients, Matrix_t &biasGradients, Tensor_t &df, Tensor_t &activationGradients, const Matrix_t &weights, const Tensor_t &activationBackward, const Tensor_t &outputTensor, EActivationFunction activFunc, const ConvDescriptors_t &, ConvWorkspace_t &, size_t batchSize, size_t inputHeight, size_t inputWidth, size_t depth, size_t height, size_t width, size_t filterDepth, size_t filterHeight, size_t filterWidth, size_t nLocalViews)
Perform the complete backward propagation step in a Convolutional Layer.
Definition Propagation.hxx:380

TMVA::DNN::TCpu::InitializePoolDescriptors
static void InitializePoolDescriptors(TDescriptors *&, PoolingLayer_t *)
Definition Cpu.h:144

TMVA::DNN::TCpu::InitializeZero
static void InitializeZero(Matrix_t &A)

TMVA::DNN::TCpu::BatchNormLayerReshapeTensor
static Tensor_t BatchNormLayerReshapeTensor(int axis, const Tensor_t &x)
Definition Propagation.hxx:693

TMVA::DNN::TCpu::PrepareInternals
static void PrepareInternals(Tensor_t &)
Dummy placeholder - preparation is currently only required for the CUDA architecture.
Definition Cpu.h:536

TMVA::DNN::TCpu::MeanSquaredErrorGradients
static void MeanSquaredErrorGradients(Matrix_t &dY, const Matrix_t &Y, const Matrix_t &output, const Matrix_t &weights)
Definition LossFunctions.hxx:54

TMVA::DNN::TCpu::MeanSquaredError
static Scalar_t MeanSquaredError(const Matrix_t &Y, const Matrix_t &output, const Matrix_t &weights)
Definition LossFunctions.hxx:27

TMVA::DNN::TCpu::InitializeGlorotUniform
static void InitializeGlorotUniform(Matrix_t &A)
Sample from a uniform distribution in the range [-lim, +lim], where lim = sqrt(6/(N_in+N_out)).
Definition Initialization.hxx:114

TMVA::DNN::TCpu::Relu
static void Relu(Tensor_t &B)
Definition ActivationFunctions.hxx:65

TMVA::DNN::TCpu::ActivationFunctionBackward
static void ActivationFunctionBackward(Tensor_t &dX, const Tensor_t &Y, const Tensor_t &dY, const Tensor_t &X, EActivationFunction activFunct, const ActivationDescriptor_t activationDescr, const Scalar_t alpha=1, const Scalar_t beta=0)
Computes the gradient of the activation function.
Definition ActivationFunctions.hxx:41

TMVA::DNN::TCpu::SquareElementWise
static void SquareElementWise(Matrix_t &A)
Square each element of the matrix A and write the result into A.
Definition Arithmetic.hxx:326

TMVA::DNN::TCpu::Im2colIndices
static void Im2colIndices(std::vector< int > &V, const Matrix_t &B, size_t nLocalViews, size_t imgHeight, size_t imgWidth, size_t fltHeight, size_t fltWidth, size_t strideRows, size_t strideCols, size_t zeroPaddingHeight, size_t zeroPaddingWidth)
Definition Propagation.hxx:183

TMVA::DNN::TCpu::Flatten
static void Flatten(Tensor_t &A, const Tensor_t &B)
Flattens the tensor B such that each matrix is stretched into one row, resulting in a matrix A.
Definition Propagation.hxx:908

TMVA::DNN::TCpu::AddConvBiases
static void AddConvBiases(Matrix_t &output, const Matrix_t &biases)
Add the biases in the Convolutional Layer.
Definition Propagation.hxx:289

TMVA::DNN::TCpu::CrossEntropy
static Scalar_t CrossEntropy(const Matrix_t &Y, const Matrix_t &output, const Matrix_t &weights)
Sigmoid transformation is implicitly applied, thus output should hold the linear activations of the l...
Definition LossFunctions.hxx:77

TMVA::DNN::TCpu::InitializeRNNTensors
static void InitializeRNNTensors(GenLayer_t *)
Definition Cpu.h:176

TMVA::DNN::TCpu::Im2col
static void Im2col(Matrix_t &A, const Matrix_t &B, size_t imgHeight, size_t imgWidth, size_t fltHeight, size_t fltWidth, size_t strideRows, size_t strideCols, size_t zeroPaddingHeight, size_t zeroPaddingWidth)
Transform the matrix B in local view format, suitable for convolution, and store it in matrix A.
Definition Propagation.hxx:132

TMVA::DNN::TCpu::ReleaseConvDescriptors
static void ReleaseConvDescriptors(TDescriptors *&)
Release CNN data/operator descriptors.
Definition Cpu.h:153

TMVA::DNN::TCpu::InitializeRNNWorkspace
static void InitializeRNNWorkspace(TWorkspace *&, TDescriptors *&, GenLayer_t *)
Definition Cpu.h:166

TMVA::DNN::TCpu::CreateTensor
static Tensor_t CreateTensor(size_t n, size_t c, size_t h, size_t w)
Definition Cpu.h:108

TMVA::DNN::TCpu::InitializeGlorotNormal
static void InitializeGlorotNormal(Matrix_t &A)
Truncated normal initialization (Glorot, also called Xavier normal). The values are sampled with a norm...
Definition Initialization.hxx:85

TMVA::DNN::TCpu::InitializeLSTMDescriptors
static void InitializeLSTMDescriptors(TDescriptors *&, GenLayer_t *)
Definition Cpu.h:147

TMVA::DNN::TCpu::FreeRNNWorkspace
static void FreeRNNWorkspace(TWorkspace *&)
Definition Cpu.h:172

TMVA::DNN::TCpu::GaussDerivative
static void GaussDerivative(Tensor_t &B, const Tensor_t &A)
Definition ActivationFunctions.hxx:221

TMVA::DNN::TCpu::BatchNormLayerForwardInference
static void BatchNormLayerForwardInference(int axis, const Tensor_t &x, Matrix_t &gamma, Matrix_t &beta, Tensor_t &y, const Matrix_t &runningMeans, const Matrix_t &runningVars, Scalar_t epsilon, const TensorDescriptor_t &)
During inference the inputs are not normalized using the batch mean but the previously computed at ru...
Definition Propagation.hxx:794

TMVA::DNN::TCpu::AdamUpdateFirstMom
static void AdamUpdateFirstMom(Matrix_t &A, const Matrix_t &B, Scalar_t beta)
Definition Arithmetic.hxx:357

TMVA::DNN::TCpu::DropoutForward
static void DropoutForward(Matrix_t &A, Scalar_t p)
Definition Cpu.h:453

TMVA::DNN::TCpu::Downsample
static void Downsample(Tensor_t &A, Tensor_t &B, const Tensor_t &C, const PoolingDescriptors_t &, PoolingWorkspace_t &, size_t imgHeight, size_t imgWidth, size_t fltHeight, size_t fltWidth, size_t strideRows, size_t strideCols)
Downsample the matrix C to the matrix A, using max operation, such that the winning indices are store...
Definition Propagation.hxx:605

TMVA::DNN::TCpu::InitializeConvDescriptors
static void InitializeConvDescriptors(TDescriptors *&, ConvLayer_t *)
Definition Cpu.h:142

TMVA::DNN::TCpu::IsCudnn
static bool IsCudnn()
Definition Cpu.h:131

TMVA::DNN::TCpu::ConstMult
static void ConstMult(Matrix_t &A, Scalar_t beta)
Multiply all the elements of matrix A by the constant beta and write the result into A.
Definition Arithmetic.hxx:310

TMVA::DNN::TCpu::SigmoidDerivative
static void SigmoidDerivative(Tensor_t &B, const Tensor_t &A)
Definition ActivationFunctions.hxx:90

TMVA::DNN::TCpu::RNNForward
static void RNNForward(const Tensor_t &, const Matrix_t &, const Matrix_t &, const Tensor_t &, Tensor_t &, Matrix_t &, Matrix_t &, const RNNDescriptors_t &, RNNWorkspace_t &, bool)
Definition Cpu.h:631

TMVA::DNN::TCpu::CopyDiffArch
static void CopyDiffArch(Matrix_t &B, const AMatrix_t &A)
Definition Cpu.h:820

TMVA::DNN::TCpu::SoftmaxCrossEntropy
static Scalar_t SoftmaxCrossEntropy(const Matrix_t &Y, const Matrix_t &output, const Matrix_t &weights)
Softmax transformation is implicitly applied, thus output should hold the linear activations of the l...
Definition LossFunctions.hxx:144

TMVA::DNN::TCpu::InitializeZero
static void InitializeZero(Tensor_t &A)

TMVA::DNN::TCpu::FastTanhDerivative
static void FastTanhDerivative(Tensor_t &B, const Tensor_t &A)
Definition ActivationFunctions.hxx:165

TMVA::DNN::TCpu::InitializeActivationDescriptor
static void InitializeActivationDescriptor(ActivationDescriptor_t &, EActivationFunction, double=0.0)
Definition Cpu.h:150

TMVA::DNN::TCpu::ReleaseDescriptor
static void ReleaseDescriptor(ActivationDescriptor_t &)
Definition Cpu.h:174

TMVA::DNN::TCpu::ReleaseRNNDescriptors
static void ReleaseRNNDescriptors(TDescriptors *&)
Definition Cpu.h:156

TMVA::DNN::TCpu::GetTensorLayout
static TMVA::Experimental::MemoryLayout GetTensorLayout()
Definition Cpu.h:106

TMVA::DNN::TCpu::RotateWeights
static void RotateWeights(Matrix_t &A, const Matrix_t &B, size_t filterDepth, size_t filterHeight, size_t filterWidth, size_t numFilters)
Rotates the matrix B, which represents the weights, and stores the result in the matrix A.
Definition Propagation.hxx:273

TMVA::DNN::TCpu::ReluDerivative
static void ReluDerivative(Tensor_t &B, const Tensor_t &A)
Definition ActivationFunctions.hxx:73

TMVA::DNN::TCpu::ReciprocalElementWise
static void ReciprocalElementWise(Matrix_t &A)
Take the reciprocal of each element of the matrix A and write the result into A.
Definition Arithmetic.hxx:318

TMVA::DNN::TCpu::AdamUpdate
static void AdamUpdate(Matrix_t &A, const Matrix_t &M, const Matrix_t &V, Scalar_t alpha, Scalar_t eps)
Adam updates.
Definition Arithmetic.hxx:343

TMVA::Experimental::RTensor::GetSize
std::size_t GetSize() const
Definition RTensor.hxx:242

TMVA::Experimental::RTensor::GetData
Value_t * GetData()
Definition RTensor.hxx:245

TMVA::Experimental::RTensor::GetShape
const Shape_t & GetShape() const
Definition RTensor.hxx:243

TRandom
This is the base class for the ROOT Random number generators.
Definition TRandom.h:27

y
Double_t y[n]
Definition legend1.C:17

x
Double_t x[n]
Definition legend1.C:17

n
const Int_t n
Definition legend1.C:16

TMVA::DNN::Tanh
std::shared_ptr< std::function< double(double)> > Tanh
Definition NeuralNet.cxx:29

TMVA::DNN::weightDecay
double weightDecay(double error, ItWeight itWeight, ItWeight itWeightEnd, double factorWeightDecay, EnumRegularization eRegularization)
compute the weight decay for regularization (L1 or L2)
Definition NeuralNet.icc:498

TMVA::DNN::EActivationFunction
EActivationFunction
Enum that represents layer activation functions.
Definition Functions.h:32

TMVA::DNN::Gauss
std::shared_ptr< std::function< double(double)> > Gauss
Definition NeuralNet.cxx:12

TMVA::DNN::SoftSign
std::shared_ptr< std::function< double(double)> > SoftSign
Definition NeuralNet.cxx:32

TMVA::Experimental::MemoryLayout
MemoryLayout
Memory layout type (copy from RTensor.hxx)
Definition CudaTensor.h:47

TMVA
create variable transformations
Definition GeneticMinimizer.h:22

TMVA::DNN::CNN::TCNNDescriptors
Definition ContextHandles.h:51

TMVA::DNN::CNN::TCNNWorkspace
Definition ContextHandles.h:62

TMVA::DNN::CNN::TConvParams
Definition ConvLayer.h:44

TMVA::DNN::DummyConvolutionBwdDataAlgo
Definition Cpu.h:50

TMVA::DNN::DummyConvolutionBwdFilterAlgo
Definition Cpu.h:51

TMVA::DNN::DummyConvolutionDescriptor
Definition Cpu.h:46

TMVA::DNN::DummyConvolutionFwdAlgo
Definition Cpu.h:49

TMVA::DNN::DummyDataType
Definition Cpu.h:52

TMVA::DNN::DummyDescriptor
Definition Cpu.h:44

TMVA::DNN::DummyDropoutDescriptor
Definition Cpu.h:47

TMVA::DNN::DummyEmptyDescriptor
Definition Cpu.h:54

TMVA::DNN::DummyFilterDescriptor
Definition Cpu.h:45

TMVA::DNN::DummyPoolingDescriptor
Definition Cpu.h:48

TMVA::DNN::RNN::TRNNDescriptors
Definition ContextHandles.h:95

TMVA::DNN::RNN::TRNNWorkspace
Definition ContextHandles.h:132

TMVA::DNN::TDescriptors
Definition ContextHandles.h:29

TMVA::DNN::TWorkspace
Definition ContextHandles.h:32

l
TLine l
Definition textangle.C:4

Functions.h

output
static void output()