This is the interface that should be implemented to provide optimised computation functions for implementations of RooAbsReal::doEval().
The class RooBatchComputeInterface provides the mechanism for external modules (like RooFit) to call functions from the library. The power lies in the virtual functions that can resolve to different implementations for the functionality; for example, calling a function through dispatchCuda will resolve to efficient CUDA implementations.
This interface contains the signatures of the compute functions of every PDF that has an optimised implementation available. These are the functions that perform the actual computations in batches.
Several implementations of this interface may be provided, e.g. SSE, AVX, AVX2. At run time, the fastest implementation of this interface is selected and, using a virtual call, the computation is dispatched to the best backend.
See also: RooBatchCompute::dispatch, RooBatchComputeClass, RF_ARCH
Definition at line 162 of file RooBatchCompute.h.
|
virtual | ~RooBatchComputeInterface ()=default |
|
virtual Architecture | architecture () const =0 |
|
virtual std::string | architectureName () const =0 |
|
virtual void | compute (Config const &cfg, Computer, std::span< double > output, VarSpan, ArgSpan)=0 |
|
virtual std::unique_ptr< AbsBufferManager > | createBufferManager () const =0 |
|
virtual void | cudaEventRecord (CudaInterface::CudaEvent *, CudaInterface::CudaStream *) const =0 |
|
virtual bool | cudaStreamIsActive (CudaInterface::CudaStream *) const =0 |
|
virtual void | cudaStreamWaitForEvent (CudaInterface::CudaStream *, CudaInterface::CudaEvent *) const =0 |
|
virtual void | deleteCudaEvent (CudaInterface::CudaEvent *) const =0 |
|
virtual void | deleteCudaStream (CudaInterface::CudaStream *) const =0 |
|
virtual CudaInterface::CudaEvent * | newCudaEvent (bool forTiming) const =0 |
|
virtual CudaInterface::CudaStream * | newCudaStream () const =0 |
|
virtual ReduceNLLOutput | reduceNLL (Config const &cfg, std::span< const double > probas, std::span< const double > weights, std::span< const double > offsetProbas)=0 |
|
virtual double | reduceSum (Config const &cfg, InputArr input, size_t n)=0 |
|