#include <cstddef>
#include <memory>
|
| template<class T > |
| void | RooBatchCompute::CudaInterface::copyDeviceToDevice (const T *src, T *dest, std::size_t n, CudaStream *=nullptr) |
| | Copies data from one memory location on the CUDA device to another location on the same device (device-to-device copy).
|
| |
| template<class T > |
| void | RooBatchCompute::CudaInterface::copyDeviceToHost (const T *src, T *dest, std::size_t n, CudaStream *=nullptr) |
| | Copies data from the CUDA device to the host.
|
| |
| template<class T > |
| void | RooBatchCompute::CudaInterface::copyHostToDevice (const T *src, T *dest, std::size_t n, CudaStream *=nullptr) |
| | Copies data from the host to the CUDA device.
|
| |
| float | RooBatchCompute::CudaInterface::cudaEventElapsedTime (CudaEvent &begin, CudaEvent &end) |
| | Calculates the elapsed time between two CUDA events.
|
| |
| void | RooBatchCompute::CudaInterface::cudaEventRecord (CudaEvent &event, CudaStream &stream) |
| | Records a CUDA event.
|
| |