Project
Loading...
Searching...
No Matches
GPUReconstructionCUDAInternals.h
Go to the documentation of this file.
1
// Copyright 2019-2020 CERN and copyright holders of ALICE O2.
2
// See https://alice-o2.web.cern.ch/copyright for details of the copyright holders.
3
// All rights not expressly granted are reserved.
4
//
5
// This software is distributed under the terms of the GNU General Public
6
// License v3 (GPL Version 3), copied verbatim in the file "COPYING".
7
//
8
// In applying this license CERN does not waive the privileges and immunities
9
// granted to it by virtue of its status as an Intergovernmental Organization
10
// or submit itself to any jurisdiction.
11
14
15
// All CUDA-header related stuff goes here, so we can run CING over GPUReconstructionCUDA
16
17
#ifndef GPURECONSTRUCTIONCUDAINTERNALS_H
18
#define GPURECONSTRUCTIONCUDAINTERNALS_H
19
20
#include <cuda.h>
21
#include "
GPULogging.h
"
22
#include <vector>
23
#include <memory>
24
#include <string>
25
#include "
GPUCommonHelpers.h
"
26
27
namespace
o2::gpu
28
{
29
30
struct
GPUReconstructionCUDAInternals
{
31
std::vector<std::unique_ptr<CUmodule>>
kernelModules
;
// module for RTC compilation
32
std::vector<std::unique_ptr<CUfunction>>
kernelFunctions
;
// vector of ptrs to RTC kernels
33
cudaStream_t
Streams
[
GPUCA_MAX_STREAMS
];
// Pointer to array of CUDA Streams
34
35
static
void
getArgPtrs
(
const
void
** pArgs) {}
36
template
<
typename
T,
typename
... Args>
37
static
void
getArgPtrs
(
const
void
** pArgs,
const
T& arg,
const
Args&... args)
38
{
39
*pArgs = &arg;
40
getArgPtrs
(pArgs + 1, args...);
41
}
42
};
43
44
class
GPUDebugTiming
45
{
46
public
:
47
GPUDebugTiming
(
bool
d,
gpu_reconstruction_kernels::deviceEvent
* t, cudaStream_t* s,
const
gpu_reconstruction_kernels::krnlSetupTime
&
x
,
GPUReconstructionCUDABackend
*
r
) : mDeviceTimers(t), mStreams(s), mXYZ(
x
), mRec(
r
), mDo(d)
48
{
49
if
(mDo) {
50
if
(mDeviceTimers) {
51
mRec->GPUChkErr(cudaEventRecord(mDeviceTimers[0].get<cudaEvent_t>(), mStreams[mXYZ.
x
.
stream
]));
52
}
else
{
53
mTimer.
ResetStart
();
54
}
55
}
56
}
57
~GPUDebugTiming
()
58
{
59
if
(mDo && mXYZ.
t
== 0.) {
60
if
(mDeviceTimers) {
61
mRec->GPUChkErr(cudaEventRecord(mDeviceTimers[1].get<cudaEvent_t>(), mStreams[mXYZ.
x
.
stream
]));
62
mRec->GPUChkErr(cudaEventSynchronize(mDeviceTimers[1].get<cudaEvent_t>()));
63
float
v
;
64
mRec->GPUChkErr(cudaEventElapsedTime(&
v
, mDeviceTimers[0].get<cudaEvent_t>(), mDeviceTimers[1].get<cudaEvent_t>()));
65
mXYZ.
t
=
v
* 1.e-3f;
66
}
else
{
67
mRec->GPUChkErr(cudaStreamSynchronize(mStreams[mXYZ.
x
.
stream
]));
68
mXYZ.
t
= mTimer.
GetCurrentElapsedTime
();
69
}
70
}
71
}
72
73
private
:
74
gpu_reconstruction_kernels::deviceEvent
* mDeviceTimers;
75
cudaStream_t* mStreams;
76
const
gpu_reconstruction_kernels::krnlSetupTime
& mXYZ;
77
GPUReconstructionCUDABackend
* mRec;
78
HighResTimer
mTimer;
79
bool
mDo;
80
};
81
82
static_assert
(std::is_convertible<cudaEvent_t, void*>::value,
"CUDA event type incompatible to deviceEvent"
);
83
84
}
// namespace o2::gpu
85
86
#endif
GPUCommonHelpers.h
GPUCA_MAX_STREAMS
#define GPUCA_MAX_STREAMS
Definition
GPUDefParametersDefault.h:584
GPULogging.h
HighResTimer
Definition
timer.h:21
HighResTimer::GetCurrentElapsedTime
double GetCurrentElapsedTime(bool reset=false)
Definition
timer.cxx:110
HighResTimer::ResetStart
void ResetStart()
Definition
timer.cxx:63
o2::gpu::GPUDebugTiming
Definition
GPUReconstructionCUDAInternals.h:45
o2::gpu::GPUDebugTiming::~GPUDebugTiming
~GPUDebugTiming()
Definition
GPUReconstructionCUDAInternals.h:57
o2::gpu::GPUDebugTiming::GPUDebugTiming
GPUDebugTiming(bool d, gpu_reconstruction_kernels::deviceEvent *t, cudaStream_t *s, const gpu_reconstruction_kernels::krnlSetupTime &x, GPUReconstructionCUDABackend *r)
Definition
GPUReconstructionCUDAInternals.h:47
o2::gpu::GPUReconstructionCUDABackend
Definition
GPUReconstructionCUDA.h:33
x
GLint GLenum GLint x
Definition
glcorearb.h:403
v
const GLdouble * v
Definition
glcorearb.h:832
r
GLboolean r
Definition
glcorearb.h:1233
o2::gpu
Definition
TrackTRD.h:35
o2::gpu::GPUReconstructionCUDAInternals
Definition
GPUReconstructionCUDAInternals.h:30
o2::gpu::GPUReconstructionCUDAInternals::getArgPtrs
static void getArgPtrs(const void **pArgs)
Definition
GPUReconstructionCUDAInternals.h:35
o2::gpu::GPUReconstructionCUDAInternals::Streams
cudaStream_t Streams[GPUCA_MAX_STREAMS]
Definition
GPUReconstructionCUDAInternals.h:33
o2::gpu::GPUReconstructionCUDAInternals::getArgPtrs
static void getArgPtrs(const void **pArgs, const T &arg, const Args &... args)
Definition
GPUReconstructionCUDAInternals.h:37
o2::gpu::GPUReconstructionCUDAInternals::kernelModules
std::vector< std::unique_ptr< CUmodule > > kernelModules
Definition
GPUReconstructionCUDAInternals.h:31
o2::gpu::GPUReconstructionCUDAInternals::kernelFunctions
std::vector< std::unique_ptr< CUfunction > > kernelFunctions
Definition
GPUReconstructionCUDAInternals.h:32
o2::gpu::gpu_reconstruction_kernels::deviceEvent
Definition
GPUReconstructionProcessing.h:32
o2::gpu::gpu_reconstruction_kernels::krnlExec::stream
int32_t stream
Definition
GPUReconstructionKernels.h:38
o2::gpu::gpu_reconstruction_kernels::krnlSetupTime
Definition
GPUReconstructionKernels.h:69
o2::gpu::gpu_reconstruction_kernels::krnlSetupTime::t
double & t
Definition
GPUReconstructionKernels.h:70
o2::gpu::gpu_reconstruction_kernels::krnlSetup::x
krnlExec x
Definition
GPUReconstructionKernels.h:64
GPU
GPUTracking
Base
cuda
GPUReconstructionCUDAInternals.h
Generated on Thu Apr 3 2025 21:05:45 for Project by
1.9.8