Project
Loading...
Searching...
No Matches
GPUReconstructionOCLKernels.cxx
Go to the documentation of this file.
1// Copyright 2019-2020 CERN and copyright holders of ALICE O2.
2// See https://alice-o2.web.cern.ch/copyright for details of the copyright holders.
3// All rights not expressly granted are reserved.
4//
5// This software is distributed under the terms of the GNU General Public
6// License v3 (GPL Version 3), copied verbatim in the file "COPYING".
7//
8// In applying this license CERN does not waive the privileges and immunities
9// granted to it by virtue of its status as an Intergovernmental Organization
10// or submit itself to any jurisdiction.
11
14
16
17template <>
18inline void GPUReconstructionOCLBackend::runKernelBackendInternal<GPUMemClean16, 0>(const krnlSetupTime& _xyz, void* const& ptr, uint64_t const& size)
19{
20 cl_int4 val0 = {0, 0, 0, 0};
21 GPUChkErr(clEnqueueFillBuffer(mInternals->command_queue[_xyz.x.stream], mInternals->mem_gpu, &val0, sizeof(val0), (char*)ptr - (char*)mDeviceMemoryBase, (size + sizeof(val0) - 1) & ~(sizeof(val0) - 1), _xyz.z.evList == nullptr ? 0 : _xyz.z.nEvents, _xyz.z.evList->getEventList<cl_event>(), _xyz.z.ev->getEventList<cl_event>()));
22}
23
24template <class T, int32_t I, typename... Args>
25inline void GPUReconstructionOCLBackend::runKernelBackendInternal(const krnlSetupTime& _xyz, const Args&... args)
26{
27 cl_kernel k = getKernelObject<cl_kernel, T, I>();
28 auto& x = _xyz.x;
29 auto& y = _xyz.y;
30 auto& z = _xyz.z;
31 GPUChkErr(OCLsetKernelParameters(k, mInternals->mem_gpu, mInternals->mem_constant, y.index, args...));
32
33 cl_event ev;
34 cl_event* evr;
35 bool tmpEvent = false;
36 if (z.ev == nullptr && mProcessingSettings.deviceTimers && mProcessingSettings.debugLevel > 0) {
37 evr = &ev;
38 tmpEvent = true;
39 } else {
40 evr = (cl_event*)z.ev;
41 }
42 GPUChkErr(clExecuteKernelA(mInternals->command_queue[x.stream], k, x.nThreads, x.nThreads * x.nBlocks, evr, (cl_event*)z.evList, z.nEvents));
43 if (mProcessingSettings.deviceTimers && mProcessingSettings.debugLevel > 0) {
44 cl_ulong time_start, time_end;
45 GPUChkErr(clWaitForEvents(1, evr));
46 GPUChkErr(clGetEventProfilingInfo(*evr, CL_PROFILING_COMMAND_START, sizeof(time_start), &time_start, nullptr));
47 GPUChkErr(clGetEventProfilingInfo(*evr, CL_PROFILING_COMMAND_END, sizeof(time_end), &time_end, nullptr));
48 _xyz.t = (time_end - time_start) * 1.e-9f;
49 if (tmpEvent) {
50 GPUChkErr(clReleaseEvent(ev));
51 }
52 }
53}
54
55template <class T, int32_t I, typename... Args>
57{
58 std::apply([this, &args](auto&... vals) { runKernelBackendInternal<T, I, Args...>(args.s, vals...); }, args.v);
59}
60
61template <class T, int32_t I>
63{
64 std::string name(GetKernelName<T, I>());
65 std::string kname("krnl_" + name);
66
67 cl_int ocl_error;
68 cl_kernel krnl = clCreateKernel(mInternals->program, kname.c_str(), &ocl_error);
69 if (GPUChkErrI(ocl_error)) {
70 GPUError("Error creating OPENCL Kernel: %s", name.c_str());
71 return 1;
72 }
73 mInternals->kernels.emplace_back(krnl);
74 return 0;
75}
76
77template <class S, class T, int32_t I>
79{
80 return mInternals->kernels[GetKernelNum<T, I>()];
81}
82
83int32_t GPUReconstructionOCLBackend::AddKernels()
84{
85#define GPUCA_KRNL(x_class, ...) \
86 if (AddKernel<GPUCA_M_KRNL_TEMPLATE(x_class)>()) { \
87 return 1; \
88 }
89#include "GPUReconstructionKernelList.h"
90#undef GPUCA_KRNL
91 return 0;
92}
93
94#define GPUCA_KRNL(x_class, x_attributes, x_arguments, x_forward, x_types, ...) template void GPUReconstructionOCLBackend::runKernelBackend<GPUCA_M_KRNL_TEMPLATE(x_class)>(const krnlSetupArgs<GPUCA_M_KRNL_TEMPLATE(x_class) GPUCA_M_STRIP(x_types)>& args);
95#include "GPUReconstructionKernelList.h"
96#undef GPUCA_KRNL
#define GPUChkErrI(x)
#define GPUChkErr(x)
TBranch * ptr
void runKernelBackend(const krnlSetupArgs< T, I, Args... > &args)
void runKernelBackendInternal(const krnlSetupTime &_xyz, const Args &... args)
GPUReconstructionOCLInternals * mInternals
GPUSettingsProcessing mProcessingSettings
GLint GLenum GLint x
Definition glcorearb.h:403
GLsizeiptr size
Definition glcorearb.h:659
GLuint const GLchar * name
Definition glcorearb.h:781
GLdouble GLdouble GLdouble z
Definition glcorearb.h:843
cl_command_queue command_queue[GPUCA_MAX_STREAMS]
std::tuple< typename std::conditional<(sizeof(Args) > sizeof(void *)), const Args &, const Args >::type... > v