17 #ifndef TMVA_DNN_ARCHITECTURES_CUDA_DEVICE 18 #define TMVA_DNN_ARCHITECTURES_CUDA_DEVICE 21 #include "vector_types.h" 50 return dim3(1, BlockSize);
57 return dim3(BlockDimX, BlockDimY);
62 template<
typename AFloat>
69 return dim3(1, gridDim);
74 template<
typename AFloat>
83 return dim3(gridDimX, gridDimY);
87 template<
typename AFloat>
static constexpr int BlockSize
static dim3 GridDims1D(const TCudaMatrix< AFloat > &A)
static int NThreads(const TCudaMatrix< AFloat > &A)
static constexpr int BlockDimY
static dim3 BlockDims2D()
static dim3 GridDims2D(const TCudaMatrix< AFloat > &A)
Abstract ClassifierFactory template that handles arbitrary types.
static dim3 BlockDims1D()
static constexpr int BlockDimX