|
| | GPUChainITS (GPUReconstruction *rec) |
| |
| | GPUChain (GPUReconstruction *rec) |
| |
| int32_t | GetThread () |
| |
| GPUConstantMem * | processors () |
| |
| GPUConstantMem * | processorsShadow () |
| |
| GPUConstantMem * | processorsDevice () |
| |
| GPUParam & | param () |
| |
| const GPUConstantMem * | processors () const |
| |
| void | SynchronizeStream (int32_t stream) |
| |
| void | SetONNXGPUStream (Ort::SessionOptions &opt, int32_t stream, int32_t *deviceId) |
| |
| void | SynchronizeEvents (deviceEvent *evList, int32_t nEvents=1) |
| |
| void | SynchronizeEventAndRelease (deviceEvent &ev, bool doGPU=true) |
| |
| template<class T > |
| void | CondWaitEvent (T &cond, deviceEvent *ev) |
| |
| bool | IsEventDone (deviceEvent *evList, int32_t nEvents=1) |
| |
| void | RecordMarker (deviceEvent *ev, int32_t stream) |
| |
| virtual std::unique_ptr< GPUReconstructionProcessing::threadContext > | GetThreadContext () |
| |
| void | SynchronizeGPU () |
| |
| void | ReleaseEvent (deviceEvent ev, bool doGPU=true) |
| |
| void | StreamWaitForEvents (int32_t stream, deviceEvent *evList, int32_t nEvents=1) |
| |
| int32_t | GPUDebug (const char *state="UNKNOWN", int32_t stream=-1) |
| |
| void | TransferMemoryResourceToGPU (RecoStep step, GPUMemoryResource *res, int32_t stream=-1, deviceEvent *ev=nullptr, deviceEvent *evList=nullptr, int32_t nEvents=1) |
| |
| void | TransferMemoryResourceToHost (RecoStep step, GPUMemoryResource *res, int32_t stream=-1, deviceEvent *ev=nullptr, deviceEvent *evList=nullptr, int32_t nEvents=1) |
| |
| void | TransferMemoryResourcesToGPU (RecoStep step, GPUProcessor *proc, int32_t stream=-1, bool all=false) |
| |
| void | TransferMemoryResourcesToHost (RecoStep step, GPUProcessor *proc, int32_t stream=-1, bool all=false) |
| |
| void | TransferMemoryResourceLinkToGPU (RecoStep step, int16_t res, int32_t stream=-1, deviceEvent *ev=nullptr, deviceEvent *evList=nullptr, int32_t nEvents=1) |
| |
| void | TransferMemoryResourceLinkToHost (RecoStep step, int16_t res, int32_t stream=-1, deviceEvent *ev=nullptr, deviceEvent *evList=nullptr, int32_t nEvents=1) |
| |
| void | WriteToConstantMemory (RecoStep step, size_t offset, const void *src, size_t size, int32_t stream=-1, deviceEvent *ev=nullptr) |
| |
| void | GPUMemCpy (RecoStep step, void *dst, const void *src, size_t size, int32_t stream, int32_t toGPU, deviceEvent *ev=nullptr, deviceEvent *evList=nullptr, int32_t nEvents=1) |
| |
| void | GPUMemCpyAlways (RecoStep step, void *dst, const void *src, size_t size, int32_t stream, int32_t toGPU, deviceEvent *ev=nullptr, deviceEvent *evList=nullptr, int32_t nEvents=1) |
| |
| template<class T > |
| void | AllocateIOMemoryHelper (uint32_t n, const T *&ptr, std::unique_ptr< T[]> &u) |
| |
| template<class T , class S > |
| uint32_t | DumpData (FILE *fp, const T *const *entries, const S *num, InOutPointerType type) |
| |
| template<class T , class S > |
| size_t | ReadData (FILE *fp, const T **entries, S *num, std::unique_ptr< T[]> *mem, InOutPointerType type, T **nonConstPtrs=nullptr) |
| |
| template<class T > |
| void | DumpFlatObjectToFile (const T *obj, const char *file) |
| |
| template<class T > |
| std::unique_ptr< T > | ReadFlatObjectFromFile (const char *file) |
| |
| template<class T > |
| void | DumpStructToFile (const T *obj, const char *file) |
| |
| template<class T > |
| std::unique_ptr< T > | ReadStructFromFile (const char *file) |
| |
| template<class T > |
| void | ReadStructFromFile (const char *file, T *obj) |
| |
| template<class S , int32_t I = 0, typename... Args> requires (sizeof(S) >= 0) |
| void | runKernel (GPUReconstructionProcessing::krnlSetup &&setup, Args const &... args) |
| |
| template<class S , int32_t I = 0> |
| GPUReconstructionProcessing::krnlProperties | getKernelProperties () |
| |
| template<class T , int32_t I = 0> |
| HighResTimer & | getKernelTimer (RecoStep step, int32_t num=0, size_t addMemorySize=0, bool increment=true) |
| |
| template<class T , int32_t J = -1> |
| HighResTimer & | getTimer (const char *name, int32_t num=-1) |
| |
| krnlExec | GetGrid (uint32_t totalItems, uint32_t nThreads, int32_t stream, GPUReconstruction::krnlDeviceType d=GPUReconstruction::krnlDeviceType::Auto, GPUDataTypes::RecoStep st=GPUDataTypes::RecoStep::NoRecoStep) |
| |
| krnlExec | GetGrid (uint32_t totalItems, int32_t stream, GPUReconstruction::krnlDeviceType d=GPUReconstruction::krnlDeviceType::Auto, GPUDataTypes::RecoStep st=GPUDataTypes::RecoStep::NoRecoStep) |
| |
| krnlExec | GetGridBlk (uint32_t nBlocks, int32_t stream, GPUReconstruction::krnlDeviceType d=GPUReconstruction::krnlDeviceType::Auto, GPUDataTypes::RecoStep st=GPUDataTypes::RecoStep::NoRecoStep) |
| |
| krnlExec | GetGridBlkStep (uint32_t nBlocks, int32_t stream, GPUDataTypes::RecoStep st=GPUDataTypes::RecoStep::NoRecoStep) |
| |
| krnlExec | GetGridAuto (int32_t stream, GPUReconstruction::krnlDeviceType d=GPUReconstruction::krnlDeviceType::Auto, GPUDataTypes::RecoStep st=GPUDataTypes::RecoStep::NoRecoStep) |
| |
| krnlExec | GetGridAutoStep (int32_t stream, GPUDataTypes::RecoStep st=GPUDataTypes::RecoStep::NoRecoStep) |
| |
| uint32_t | BlockCount () const |
| |
| uint32_t | WarpSize () const |
| |
| uint32_t | ThreadCount () const |
| |
| size_t | AllocateRegisteredMemory (GPUProcessor *proc) |
| |
| size_t | AllocateRegisteredMemory (int16_t res, GPUOutputControl *control=nullptr) |
| |
| template<class T > |
| void | SetupGPUProcessor (T *proc, bool allocate) |
| |
| GPUChain * | GetNextChainInQueue () |
| |
| virtual int32_t | DoStuckProtection (int32_t stream, deviceEvent event) |
| |
| template<class T , class S , typename... Args> |
| bool | DoDebugAndDump (RecoStep step, uint32_t mask, T &processor, S T::*func, Args &&... args) |
| |
| template<class T , class S , typename... Args> |
| bool | DoDebugAndDump (RecoStep step, uint32_t mask, bool transfer, T &processor, S T::*func, Args &&... args) |
| |
| template<typename... Args> |
| bool | DoDebugDump (uint32_t mask, std::function< void(Args &...)> func, Args &... args) |
| |
| template<class S , typename... Args> |
| bool | DoDebugDump (uint32_t mask, S *func, Args &&... args) |
| |
| template<class T , class S , typename... Args> |
| int32_t | runRecoStep (RecoStep step, S T::*func, Args... args) |
| |
Definition at line 32 of file GPUChainITS.h.