15#ifndef GPURECONSTRUCTIONCUDA_H
16#define GPURECONSTRUCTIONCUDA_H
36struct GPUReconstructionCUDAInternals;
47 template <
class T, int32_t I = 0,
typename... Args>
49 template <
class T, int32_t I = 0,
typename... Args>
51 template <
class T,
int32_t I>
54 template <
class T,
class S>
79 void GetITSTraits(
std::unique_ptr<
o2::its::TrackerTraits>* trackerTraits,
std::unique_ptr<
o2::its::VertexerTraits>* vertexerTraits,
std::unique_ptr<
o2::its::
TimeFrame>* timeFrame) override;
90 int32_t genRTC(std::string&
filename, uint32_t& nCompile);
91 void getRTCKernelCalls(std::vector<std::string>& kernels);
93 void loadKernelModules(
bool perKernel);
94 const char *mRtcSrcExtension =
".src", *mRtcBinExtension =
".o";
o2::gpu::GPUReconstruction * GPUReconstruction_Create_CUDA(const o2::gpu::GPUSettingsDeviceBackend &cfg)
int32_t ExitDevice_Runtime() override
GPUReconstructionCUDAInternals * mInternals
int32_t unregisterMemoryForGPU_internal(const void *ptr) override
bool IsEventDone(deviceEvent *evList, int32_t nEvents=1) override
GPUReconstructionCUDA(const GPUSettingsDeviceBackend &cfg)
size_t WriteToConstantMemory(size_t offset, const void *src, size_t size, int32_t stream=-1, deviceEvent *ev=nullptr) override
void startGPUProfiling() override
int32_t InitDevice_Runtime() override
void StreamWaitForEvents(int32_t stream, deviceEvent *evList, int32_t nEvents=1) override
void runKernelBackend(const krnlSetupTime &_xyz, const Args &... args)
void SetONNXGPUStream(Ort::SessionOptions &session_options, int32_t stream, int32_t *deviceId) override
void RecordMarker(deviceEvent *ev, int32_t stream) override
bool CanQueryMaxMemory() override
void SynchronizeEvents(deviceEvent *evList, int32_t nEvents=1) override
size_t GPUMemCpy(void *dst, const void *src, size_t size, int32_t stream, int32_t toGPU, deviceEvent *ev=nullptr, deviceEvent *evList=nullptr, int32_t nEvents=1) override
void endGPUProfiling() override
int32_t registerMemoryForGPU_internal(const void *ptr, size_t size) override
int32_t GPUDebug(const char *state="UNKNOWN", int32_t stream=-1, bool force=false) override
void SynchronizeStream(int32_t stream) override
void GetITSTraits(std::unique_ptr< o2::its::TrackerTraits > *trackerTraits, std::unique_ptr< o2::its::VertexerTraits > *vertexerTraits, std::unique_ptr< o2::its::TimeFrame > *timeFrame) override
void PrintKernelOccupancies() override
void runKernelBackendTimed(const krnlSetupTime &_xyz, const Args &... args)
void SynchronizeGPU() override
~GPUReconstructionCUDA() override
virtual int32_t GPUChkErrInternal(const int64_t error, const char *file, int32_t line) const override
std::unique_ptr< threadContext > GetThreadContext() override
void ReleaseEvent(deviceEvent ev) override
virtual void * getGPUPointer(void *ptr)
typedef void(APIENTRYP PFNGLCULLFACEPROC)(GLenum mode)
a couple of static helper functions to create timestamp values for CCDB queries or override obsolete ...
Defining DataPointCompositeObject explicitly as copiable.