19#define ERRCHECK(err) __checkCudaErrors((err), __func__, __FILE__, __LINE__)
25 throw std::runtime_error(
errMsg.str());
30namespace CudaInterface {
32DeviceMemory::DeviceMemory(std::size_t
n, std::size_t
typeSize) : _size{
n}
38PinnedHostMemory::PinnedHostMemory(std::size_t
n, std::size_t
typeSize) : _size{
n}
84 auto stream =
reinterpret_cast<cudaStream_t *
>(ptr);
98 ERRCHECK(::cudaEventRecord(event, stream));
106CudaStream::CudaStream()
108 auto stream =
new cudaStream_t;
118bool CudaStream::isActive()
149 ERRCHECK(::cudaEventElapsedTime(&
ret, begin, end));
static void __checkCudaErrors(cudaError_t error, std::string func, std::string file, int line)
RooAbsData * _data
Pointer to original input dataset.
ROOT::Detail::TRangeCast< T, true > TRangeDynCast
TRangeDynCast is an adapter class that allows the typed iteration through a TCollection.
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t dest
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t src
void cudaEventRecord(CudaEvent &event, CudaStream &stream)
Records a CUDA event.
float cudaEventElapsedTime(CudaEvent &begin, CudaEvent &end)
Calculates the elapsed time between two CUDA events.
Namespace for dispatching RooFit computations to various backends.