Project
Loading...
Searching...
No Matches
GPUReconstructionKernels.h
Go to the documentation of this file.
1// Copyright 2019-2020 CERN and copyright holders of ALICE O2.
2// See https://alice-o2.web.cern.ch/copyright for details of the copyright holders.
3// All rights not expressly granted are reserved.
4//
5// This software is distributed under the terms of the GNU General Public
6// License v3 (GPL Version 3), copied verbatim in the file "COPYING".
7//
8// In applying this license CERN does not waive the privileges and immunities
9// granted to it by virtue of its status as an Intergovernmental Organization
10// or submit itself to any jurisdiction.
11
14
15#ifndef GPURECONSTRUCTIONKERNELS_H
16#define GPURECONSTRUCTIONKERNELS_H
17
18#include "GPUReconstruction.h"
19
20namespace o2::gpu
21{
22
23namespace gpu_reconstruction_kernels
24{
25
26template <class T, int32_t I = 0>
28 using t = T;
29 static constexpr int32_t i = I;
30};
31
32struct krnlExec {
33 constexpr krnlExec(uint32_t b, uint32_t t, int32_t s, GPUReconstruction::krnlDeviceType d = GPUReconstruction::krnlDeviceType::Auto) : nBlocks(b), nThreads(t), stream(s), device(d), step(GPUDataTypes::RecoStep::NoRecoStep) {}
34 constexpr krnlExec(uint32_t b, uint32_t t, int32_t s, GPUDataTypes::RecoStep st) : nBlocks(b), nThreads(t), stream(s), device(GPUReconstruction::krnlDeviceType::Auto), step(st) {}
35 constexpr krnlExec(uint32_t b, uint32_t t, int32_t s, GPUReconstruction::krnlDeviceType d, GPUDataTypes::RecoStep st) : nBlocks(b), nThreads(t), stream(s), device(d), step(st) {}
36 uint32_t nBlocks;
37 uint32_t nThreads;
38 int32_t stream;
41};
43 constexpr krnlRunRange() = default;
44 constexpr krnlRunRange(uint32_t v) : index(v) {}
45 uint32_t index = 0;
46};
47struct krnlEvent {
48 constexpr krnlEvent(deviceEvent* e = nullptr, deviceEvent* el = nullptr, int32_t n = 1) : ev(e), evList(el), nEvents(n) {}
51 int32_t nEvents;
52};
53
55 krnlProperties(int32_t t = 0, int32_t b = 1, int32_t b2 = 0) : nThreads(t), minBlocks(b), forceBlocks(b2) {}
56 uint32_t nThreads;
57 uint32_t minBlocks;
58 uint32_t forceBlocks;
59 uint32_t total() { return forceBlocks ? forceBlocks : (nThreads * minBlocks); }
60};
61
62struct krnlSetup {
63 krnlSetup(const krnlExec& xx, const krnlRunRange& yy = {0}, const krnlEvent& zz = {nullptr, nullptr, 0}) : x(xx), y(yy), z(zz) {}
67};
68
69struct krnlSetupTime : public krnlSetup {
70 double& t;
71};
72
73template <class T, int32_t I = 0, typename... Args>
75 krnlSetupArgs(const krnlExec& xx, const krnlRunRange& yy, const krnlEvent& zz, double& tt, const Args&... args) : s{{xx, yy, zz}, tt}, v(args...) {}
77 std::tuple<typename std::conditional<(sizeof(Args) > sizeof(void*)), const Args&, const Args>::type...> v;
78};
79
80} // namespace gpu_reconstruction_kernels
81
82template <class T>
84{
85 public:
87
88 protected:
95 template <class S, int32_t I = 0, typename... Args>
97
98 virtual void runKernelImpl(const int num, const void* args)
99 {
100 switch (num) { // clang-format off
101#define GPUCA_KRNL(x_class, x_attributes, x_arguments, x_forward, x_types, x_num) \
102 case x_num: { \
103 const auto& args2 = *(const krnlSetupArgs<GPUCA_M_KRNL_TEMPLATE(x_class) GPUCA_M_STRIP(x_types)>*)args; \
104 T::template runKernelBackend<GPUCA_M_KRNL_TEMPLATE(x_class)>(args2); \
105 break; \
106 }
107#include "GPUReconstructionKernelList.h"
108#undef GPUCA_KRNL
109 } // clang-format on
110 }
111};
112
113} // namespace o2::gpu
114
115#endif
double num
benchmark::State & st
GPUReconstructionKernels(const GPUSettingsDeviceBackend &cfg)
virtual void runKernelImpl(const int num, const void *args)
GLdouble n
Definition glcorearb.h:1982
GLint GLenum GLint x
Definition glcorearb.h:403
const GLdouble * v
Definition glcorearb.h:832
GLuint index
Definition glcorearb.h:781
GLboolean GLboolean GLboolean b
Definition glcorearb.h:1233
GLint GLint GLsizei GLint GLenum GLenum type
Definition glcorearb.h:275
GLuint GLuint stream
Definition glcorearb.h:1806
GLdouble GLdouble GLdouble z
Definition glcorearb.h:843
constexpr krnlEvent(deviceEvent *e=nullptr, deviceEvent *el=nullptr, int32_t n=1)
constexpr krnlExec(uint32_t b, uint32_t t, int32_t s, GPUReconstruction::krnlDeviceType d, GPUDataTypes::RecoStep st)
constexpr krnlExec(uint32_t b, uint32_t t, int32_t s, GPUDataTypes::RecoStep st)
constexpr krnlExec(uint32_t b, uint32_t t, int32_t s, GPUReconstruction::krnlDeviceType d=GPUReconstruction::krnlDeviceType::Auto)
krnlProperties(int32_t t=0, int32_t b=1, int32_t b2=0)
krnlSetupArgs(const krnlExec &xx, const krnlRunRange &yy, const krnlEvent &zz, double &tt, const Args &... args)
krnlSetup(const krnlExec &xx, const krnlRunRange &yy={0}, const krnlEvent &zz={nullptr, nullptr, 0})