Project
Loading...
Searching...
No Matches
GPUReconstructionDeviceBase.cxx
Go to the documentation of this file.
1// Copyright 2019-2020 CERN and copyright holders of ALICE O2.
2// See https://alice-o2.web.cern.ch/copyright for details of the copyright holders.
3// All rights not expressly granted are reserved.
4//
5// This software is distributed under the terms of the GNU General Public
6// License v3 (GPL Version 3), copied verbatim in the file "COPYING".
7//
8// In applying this license CERN does not waive the privileges and immunities
9// granted to it by virtue of its status as an Intergovernmental Organization
10// or submit itself to any jurisdiction.
11
14
17
18#include "GPUTPCTracker.h"
19
20using namespace o2::gpu;
21
22#if defined(_WIN32)
23#include "../utils/pthread_mutex_win32_wrapper.h"
24#else
25#include <cerrno>
26#include <unistd.h>
27#endif
28#include <cstring>
29
30class GPUTPCRow;
31
32#define SemLockName "AliceHLTTPCGPUTrackerInitLockSem"
33
35{
36 if (sizeCheck != sizeof(GPUReconstructionDeviceBase)) {
37 GPUFatal("Mismatch of C++ object size between GPU compilers!");
38 }
39}
40
42
44{
45#ifdef _WIN32
46 HANDLE* semLock = new HANDLE;
47 *semLock = CreateSemaphore(nullptr, 1, 1, SemLockName);
48 if (*semLock == nullptr) {
49 GPUError("Error creating GPUInit Semaphore");
50 return (1);
51 }
52 WaitForSingleObject(*semLock, INFINITE);
53#elif !defined(__APPLE__) // GPU not supported on MacOS anyway
54 sem_t* semLock = sem_open(SemLockName, O_CREAT, 0x01B6, 1);
55 if (semLock == SEM_FAILED) {
56 GPUError("Error creating GPUInit Semaphore");
57 return (1);
58 }
59 timespec semtime;
60 clock_gettime(CLOCK_REALTIME, &semtime);
61 semtime.tv_sec += 10;
62 while (sem_timedwait(semLock, &semtime) != 0) {
63 GPUError("Global Lock for GPU initialisation was not released for 10 seconds, assuming another thread died");
64 GPUWarning("Resetting the global lock");
65 sem_post(semLock);
66 }
67#else
68 void* semLock = nullptr;
69#endif
70 pLock = semLock;
71 return 0;
72}
73
75{
76// Release the global named semaphore that locks GPU Initialization
77#ifdef _WIN32
78 HANDLE* h = (HANDLE*)sem;
79 ReleaseSemaphore(*h, 1, nullptr);
80 CloseHandle(*h);
81 delete h;
82#elif !defined(__APPLE__) // GPU not supported on MacOS anyway
83 sem_t* pSem = (sem_t*)sem;
84 sem_post(pSem);
85 sem_unlink(SemLockName);
86#endif
87}
88
90{
91 // cpu_set_t mask;
92 // CPU_ZERO(&mask);
93 // CPU_SET(0, &mask);
94 // sched_setaffinity(0, sizeof(mask), &mask);
95
96 if (mProcessingSettings.memoryAllocationStrategy == GPUMemoryResource::ALLOCATION_INDIVIDUAL) {
97 GPUError("Individual memory allocation strategy unsupported for device\n");
98 return (1);
99 }
100 if (mProcessingSettings.nStreams > GPUCA_MAX_STREAMS) {
101 GPUError("Too many straems requested %d > %d\n", mProcessingSettings.nStreams, GPUCA_MAX_STREAMS);
102 return (1);
103 }
104
105 void* semLock = nullptr;
106 if (mProcessingSettings.globalInitMutex && GetGlobalLock(semLock)) {
107 return (1);
108 }
109
110 if (mProcessingSettings.deviceTimers) {
112 }
113
114 int32_t retVal = InitDevice_Runtime();
115 if (retVal) {
116 GPUImportant("GPU Tracker initialization failed");
117 return (1);
118 }
119
120 if (mProcessingSettings.globalInitMutex) {
121 ReleaseGlobalLock(semLock);
122 }
123
127
131
132 if (mMaster == nullptr || mProcessingSettings.debugLevel >= 2) {
133 GPUInfo("GPU Tracker initialization successfull"); // Verbosity reduced because GPU backend will print GPUImportant message!
134 }
135
136 return (retVal);
137}
138
139void* GPUReconstructionDeviceBase::GPUProcessorProcessors::SetPointersDeviceProcessor(void* mem)
140{
141 // Don't run constructor / destructor here, this will be just local memcopy of Processors in GPU Memory
143 return mem;
144}
145
155
157{
158 return IsGPU();
159}
160
162{
163 return IsGPU();
164}
165
173
175{
176 auto& list = getDeviceConstantMemRegistratorsVector();
177 for (uint32_t i = 0; i < list.size(); i++) {
178 auto* ptr = list[i]();
179 if (ptr == nullptr) {
180 GPUFatal("Error registering constant memory");
181 }
182 mDeviceConstantMemList.emplace_back(ptr);
183 }
184}
185
186size_t GPUReconstructionDeviceBase::TransferMemoryInternal(GPUMemoryResource* res, int32_t stream, deviceEvent* ev, deviceEvent* evList, int32_t nEvents, bool toGPU, const void* src, void* dst)
187{
188 if (!(res->Type() & GPUMemoryResource::MEMORY_GPU)) {
189 if (mProcessingSettings.debugLevel >= 4) {
190 GPUInfo("Skipped transfer of non-GPU memory resource: %s", res->Name());
191 }
192 return 0;
193 }
194 if (mProcessingSettings.debugLevel >= 3 && (strcmp(res->Name(), "ErrorCodes") || mProcessingSettings.debugLevel >= 4)) {
195 GPUInfo("Copying to %s: %s - %ld bytes", toGPU ? "GPU" : "Host", res->Name(), (int64_t)res->Size());
196 }
197 return GPUMemCpy(dst, src, res->Size(), stream, toGPU, ev, evList, nEvents);
198}
int32_t i
#define GPUCA_MAX_STREAMS
#define SemLockName
int32_t retVal
uint32_t res
Definition RawData.h:0
TBranch * ptr
Class for time synchronization of RawReader instances.
static void computePointerWithAlignment(T *&basePtr, S *&objPtr, size_t nEntries=1)
void InitGPUProcessor(GPUReconstruction *rec, ProcessorType type=PROCESSOR_TYPE_CPU, GPUProcessor *slaveProcessor=nullptr)
virtual size_t GPUMemCpy(void *dst, const void *src, size_t size, int32_t stream, int32_t toGPU, deviceEvent *ev=nullptr, deviceEvent *evList=nullptr, int32_t nEvents=1)
int32_t unregisterMemoryForGPU_internal(const void *ptr) override
virtual int32_t InitDevice_Runtime()=0
size_t TransferMemoryInternal(GPUMemoryResource *res, int32_t stream, deviceEvent *ev, deviceEvent *evList, int32_t nEvents, bool toGPU, const void *src, void *dst) override
GPUReconstructionDeviceBase(const GPUSettingsDeviceBackend &cfg, size_t sizeCheck)
int32_t registerMemoryForGPU_internal(const void *ptr, size_t size) override
int32_t unregisterMemoryForGPU_internal(const void *ptr) override
std::unordered_set< const void * > mRegisteredMemoryPtrs
GPUSettingsProcessing mProcessingSettings
int16_t RegisterMemoryAllocation(T *proc, void *(T::*setPtr)(void *), int32_t type, const char *name="", const GPUMemoryReuse &re=GPUMemoryReuse())
void ClearAllocatedMemory(bool clearOutputs=true)
size_t AllocateRegisteredMemory(GPUProcessor *proc, bool resetCustom=false)
GLenum src
Definition glcorearb.h:1767
GLsizeiptr size
Definition glcorearb.h:659
GLenum GLenum dst
Definition glcorearb.h:1767
GLuint GLuint stream
Definition glcorearb.h:1806
Definition list.h:40
const int nEvents
Definition test_Fifo.cxx:27