15#if !defined(GPURECONSTRUCTIONPROCESSING_H)
16#define GPURECONSTRUCTIONPROCESSING_H
19#include "GPUReconstructionKernelIncludes.h"
28struct GPUDefParameters;
30namespace gpu_reconstruction_kernels
38 v =
reinterpret_cast<void*&
>(
val);
43 return reinterpret_cast<T&
>(
v);
48 return reinterpret_cast<T*
>(
this);
79 template <
class T,
int32_t I>
82 template <
class T,
int32_t I = 0>
92 virtual std::unique_ptr<gpu_reconstruction_kernels::threadContext>
GetThreadContext()
override;
114 std::vector<std::vector<deviceEvent>>
mEvents;
118 std::unique_ptr<HighResTimer[]>
timer;
129 std::vector<std::unique_ptr<timerMeta>>
mTimers;
132 template <
class T,
int32_t I = 0>
134 template <
class T, int32_t J = -1>
141 uint32_t getNextTimerId();
142 timerMeta* getTimerById(uint32_t
id,
bool increment =
true);
145 static std::atomic_flag mTimerFlag;
152 events = (T*)
mEvents.back().data();
155template <
class T,
int32_t I>
158 static int32_t
id = getNextTimerId();
159 timerMeta* timer = getTimerById(
id, increment);
160 if (timer ==
nullptr) {
161 timer = insertTimer(
id, GetKernelName<T, I>(), -1,
NSECTORS, 0, step);
164 timer->
memSize += addMemorySize;
166 if (num < 0 || num >= timer->
num) {
167 throw std::runtime_error(
"Invalid timer requested");
172template <
class T,
int32_t J>
175 static int32_t
id = getNextTimerId();
177 if (timer ==
nullptr) {
179 timer = insertTimer(
id,
name, J,
max, 1, RecoStep::NoRecoStep);
184 if (num < 0 || num >= timer->
num) {
185 throw std::runtime_error(
"Invalid timer requested");
static constexpr int32_t N_RECO_STEPS
static constexpr int32_t N_GENERAL_STEPS
virtual std::unique_ptr< gpu_reconstruction_kernels::threadContext > GetThreadContext() override
auto & getRecoStepTimer(RecoStep step)
HighResTimer & getGeneralStepTimer(GeneralStep step)
RecoStepTimerMeta mTimersRecoSteps[GPUDataTypes::N_RECO_STEPS]
static const char * GetKernelName()
void runParallelOuterLoop(bool doGPU, uint32_t nThreads, std::function< void(uint32_t)> lambda)
std::vector< std::vector< deviceEvent > > mEvents
static uint32_t GetKernelNum()
int32_t mActiveHostKernelThreads
std::vector< std::unique_ptr< timerMeta > > mTimers
void SetNActiveThreads(int32_t n)
GPUDefParameters * mParCPU
HighResTimer mTimersGeneralSteps[GPUDataTypes::N_GENERAL_STEPS]
uint32_t getNActiveThreadsOuterLoop() const
HighResTimer & getKernelTimer(RecoStep step, int32_t num=0, size_t addMemorySize=0, bool increment=true)
int32_t getNKernelHostThreads(bool splitCores)
const std::string & GetKernelName(int32_t i) const
static const std::vector< std::string > mKernelNames
uint32_t mNActiveThreadsOuterLoop
GPUDefParameters * mParDevice
uint32_t SetAndGetNActiveThreadsOuterLoop(bool condition, uint32_t max)
HighResTimer & getTimer(const char *name, int32_t num=-1)
~GPUReconstructionProcessing() override
void SetNActiveThreadsOuterLoop(uint32_t f)
void AddGPUEvents(T *&events)
int32_t getGeneralStepNum(GeneralStep step, bool validCheck=true)
static constexpr uint32_t NSECTORS
GPUSettingsProcessing mProcessingSettings
int32_t getRecoStepNum(RecoStep step, bool validCheck=true)
static int32_t getHostThreadIndex()
GLuint const GLchar * name
GLint GLint GLsizei GLint GLenum GLenum type
constexpr deviceEvent()=default
constexpr deviceEvent(std::nullptr_t p)