Project
Loading...
Searching...
No Matches
GPUChainTracking.cxx
Go to the documentation of this file.
1// Copyright 2019-2020 CERN and copyright holders of ALICE O2.
2// See https://alice-o2.web.cern.ch/copyright for details of the copyright holders.
3// All rights not expressly granted are reserved.
4//
5// This software is distributed under the terms of the GNU General Public
6// License v3 (GPL Version 3), copied verbatim in the file "COPYING".
7//
8// In applying this license CERN does not waive the privileges and immunities
9// granted to it by virtue of its status as an Intergovernmental Organization
10// or submit itself to any jurisdiction.
11
14
17#include <fstream>
18#include <chrono>
19
20#include "GPUChainTracking.h"
21#include "GPUChainTrackingGetters.inc"
22#include "GPUReconstructionIO.h"
24#include "GPUTPCGMMergedTrack.h"
26#include "GPUTPCTrack.h"
27#include "GPUTPCHitId.h"
28#include "GPUTPCClusterData.h"
29#include "TPCZSLinkMapping.h"
30#include "GPUTRDTrackletWord.h"
32#include "GPUTPCMCInfo.h"
33#include "GPUTRDTrack.h"
34#include "GPUTRDTracker.h"
35#include "AliHLTTPCRawCluster.h"
38#include "GPUQA.h"
39#include "GPULogging.h"
42#include "GPUNewCalibValues.h"
43#include "GPUTriggerOutputs.h"
44#include "GPUDefParametersRuntime.h"
45
47#include "GPUHostDataTypes.h"
49#include "GPUTrackingRefit.h"
50#include "CalibdEdxContainer.h"
51
52#include "TPCFastTransform.h"
54
55#include "utils/linux_helpers.h"
56#include "utils/strtag.h"
57using namespace o2::gpu;
58
59#include "GPUO2DataTypes.h"
60
61using namespace o2::tpc;
62using namespace o2::trd;
63
// Constructs the tracking chain on top of GPUChain(rec).
// The initializer list binds mIOPtrs to processors()->ioPtrs, allocates the host and shadow
// GPUTrackingInputProvider objects, the ClusterNativeAccess object, the GPUTriggerOutputs buffer and the
// std::ofstream used as debug file, and stores the maxTPCHits / maxTRDTracklets limits.
// NOTE(review): the statements of the constructor body are not visible in this listing.
64GPUChainTracking::GPUChainTracking(GPUReconstruction* rec, uint32_t maxTPCHits, uint32_t maxTRDTracklets) : GPUChain(rec), mIOPtrs(processors()->ioPtrs), mInputsHost(new GPUTrackingInputProvider), mInputsShadow(new GPUTrackingInputProvider), mClusterNativeAccess(new ClusterNativeAccess), mTriggerBuffer(new GPUTriggerOutputs), mMaxTPCHits(maxTPCHits), mMaxTRDTracklets(maxTRDTracklets), mDebugFile(new std::ofstream)
65{
69}
70
72
74{
75 if (mRec->IsGPU()) {
79 }
80
82 if (GetRecoSteps() & RecoStep::TPCSectorTracking) {
83 for (uint32_t i = 0; i < NSECTORS; i++) {
84 mRec->RegisterGPUProcessor(&processors()->tpcTrackers[i], GetRecoStepsGPU() & RecoStep::TPCSectorTracking);
85 }
86 }
87 if (GetRecoSteps() & RecoStep::TPCMerging) {
88 mRec->RegisterGPUProcessor(&processors()->tpcMerger, GetRecoStepsGPU() & RecoStep::TPCMerging);
89 }
90 if (GetRecoSteps() & RecoStep::TRDTracking) {
91 mRec->RegisterGPUProcessor(&processors()->trdTrackerGPU, GetRecoStepsGPU() & RecoStep::TRDTracking);
92 }
93 if (GetRecoSteps() & RecoStep::TRDTracking) {
94 mRec->RegisterGPUProcessor(&processors()->trdTrackerO2, GetRecoStepsGPU() & RecoStep::TRDTracking);
95 }
96 if (GetRecoSteps() & RecoStep::TPCCompression) {
97 mRec->RegisterGPUProcessor(&processors()->tpcCompressor, GetRecoStepsGPU() & RecoStep::TPCCompression);
98 }
99 if (GetRecoSteps() & RecoStep::TPCDecompression) {
100 mRec->RegisterGPUProcessor(&processors()->tpcDecompressor, GetRecoStepsGPU() & RecoStep::TPCDecompression);
101 }
102 if (GetRecoSteps() & RecoStep::TPCClusterFinding) {
103 for (uint32_t i = 0; i < NSECTORS; i++) {
104 mRec->RegisterGPUProcessor(&processors()->tpcClusterer[i], GetRecoStepsGPU() & RecoStep::TPCClusterFinding);
105#ifdef GPUCA_HAS_ONNX
106 mRec->RegisterGPUProcessor(&processors()->tpcNNClusterer[i], GetRecoStepsGPU() & RecoStep::TPCClusterFinding);
107#endif
108 }
109 }
110 if (GetRecoSteps() & RecoStep::Refit) {
111 mRec->RegisterGPUProcessor(&processors()->trackingRefit, GetRecoStepsGPU() & RecoStep::Refit);
112 }
113#ifdef GPUCA_KERNEL_DEBUGGER_OUTPUT
114 mRec->RegisterGPUProcessor(&processors()->debugOutput, true);
115#endif
117}
118
120{
121 if (mRec->IsGPU()) {
123 }
124 memcpy((void*)&processorsShadow()->trdTrackerGPU, (const void*)&processors()->trdTrackerGPU, sizeof(processors()->trdTrackerGPU));
125 if (GetRecoStepsGPU() & RecoStep::TPCSectorTracking) {
126 for (uint32_t i = 0; i < NSECTORS; i++) {
127 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->tpcTrackers[i], &processors()->tpcTrackers[i]);
128 }
129 }
130 if (GetRecoStepsGPU() & RecoStep::TPCMerging) {
131 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->tpcMerger, &processors()->tpcMerger);
132 }
133 if (GetRecoStepsGPU() & RecoStep::TRDTracking) {
134 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->trdTrackerGPU, &processors()->trdTrackerGPU);
135 }
136
137 memcpy((void*)&processorsShadow()->trdTrackerO2, (const void*)&processors()->trdTrackerO2, sizeof(processors()->trdTrackerO2));
138 if (GetRecoStepsGPU() & RecoStep::TRDTracking) {
139 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->trdTrackerO2, &processors()->trdTrackerO2);
140 }
141 if (GetRecoStepsGPU() & RecoStep::TPCCompression) {
142 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->tpcCompressor, &processors()->tpcCompressor);
143 }
144 if (GetRecoStepsGPU() & RecoStep::TPCDecompression) {
145 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->tpcDecompressor, &processors()->tpcDecompressor);
146 }
147 if (GetRecoStepsGPU() & RecoStep::TPCClusterFinding) {
148 for (uint32_t i = 0; i < NSECTORS; i++) {
149 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->tpcClusterer[i], &processors()->tpcClusterer[i]);
150#ifdef GPUCA_HAS_ONNX
151 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->tpcNNClusterer[i], &processors()->tpcNNClusterer[i]);
152#endif
153 }
154 }
155 if (GetRecoStepsGPU() & RecoStep::Refit) {
156 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->trackingRefit, &processors()->trackingRefit);
157 }
158#ifdef GPUCA_KERNEL_DEBUGGER_OUTPUT
159 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->debugOutput, &processors()->debugOutput);
160#endif
161}
162
163void GPUChainTracking::MemorySize(size_t& gpuMem, size_t& pageLockedHostMem)
164{
165 gpuMem = GPUCA_MEMORY_SIZE;
166 pageLockedHostMem = GPUCA_HOST_MEMORY_SIZE;
167}
168
170{
172 GPUError("Invalid Reconstruction Step Setting: dEdx requires TPC Merger to be active");
173 return false;
174 }
176 GPUError("Invalid GPU Reconstruction Step Setting: dEdx requires TPC Merger to be active");
177 return false;
178 }
180 GPUError("Invalid Reconstruction Step Setting: Tracking requires TPC Conversion to be active");
181 return false;
182 }
184 GPUError("Invalid input, TPC Clusterizer needs TPC raw input");
185 return false;
186 }
188 GPUError("Invalid input / output / step, merger cannot read/store sectors tracks and needs TPC conversion");
189 return false;
190 }
192 if ((GetRecoSteps() & GPUDataTypes::RecoStep::TPCMerging) && !tpcClustersAvail) {
193 GPUError("Invalid Inputs for track merging, TPC Clusters required");
194 return false;
195 }
196#ifndef GPUCA_TPC_GEOMETRY_O2
198 GPUError("Can not run TPC GPU Cluster Finding with Run 2 Data");
199 return false;
200 }
201#endif
203 GPUError("Missing input for TPC Cluster conversion / sector tracking / compression / dEdx: TPC Clusters required");
204 return false;
205 }
207 GPUError("Input for TPC merger missing");
208 return false;
209 }
211 GPUError("Input for TPC compressor missing");
212 return false;
213 }
215 GPUError("Input for TRD Tracker missing");
216 return false;
217 }
219 GPUError("TPC Raw / TPC Clusters / TRD Tracklets cannot be output");
220 return false;
221 }
223 GPUError("No TPC Merged Track Output available");
224 return false;
225 }
227 GPUError("No TPC Compression Output available");
228 return false;
229 }
231 GPUError("No TRD Tracker Output available");
232 return false;
233 }
234 if ((GetRecoSteps() & GPUDataTypes::RecoStep::TPCdEdx) && (processors()->calibObjects.dEdxCalibContainer == nullptr)) {
235 GPUError("Cannot run dE/dx without dE/dx calibration container object");
236 return false;
237 }
238 if ((GetRecoSteps() & GPUDataTypes::RecoStep::TPCClusterFinding) && processors()->calibObjects.tpcPadGain == nullptr) {
239 GPUError("Cannot run gain calibration without calibration object");
240 return false;
241 }
242 if ((GetRecoSteps() & GPUDataTypes::RecoStep::TPCClusterFinding) && processors()->calibObjects.tpcZSLinkMapping == nullptr && mIOPtrs.tpcZS != nullptr) {
243 GPUError("Cannot run TPC ZS Decoder without mapping object. (tpczslinkmapping.dump missing?)");
244 return false;
245 }
246 return true;
247}
248
// Validates the processing / reconstruction settings. Each check logs a message via GPUError and
// returns false on the first violated constraint; true is returned when all visible checks pass.
// NOTE(review): the signature line of this definition is not visible in this listing; it is presumably
// GPUChainTracking::ValidateSettings() - confirm against the header.
250{
 // Effective gather mode: the explicit tpcCompressionGatherMode setting, or the par_COMP_GATHER_MODE
 // GPU parameter when the setting is -1.
251 int32_t gatherMode = mRec->GetProcessingSettings().tpcCompressionGatherMode == -1 ? mRec->getGPUParameters(mRec->GetRecoStepsGPU() & GPUDataTypes::RecoStep::TPCCompression).par_COMP_GATHER_MODE : mRec->GetProcessingSettings().tpcCompressionGatherMode;
252 if ((param().rec.tpc.nWays & 1) == 0) {
253 GPUError("nWay setting musst be odd number!");
254 return false;
255 }
256 if (param().rec.tpc.mergerInterpolateErrors && param().rec.tpc.nWays < 3) {
257 GPUError("Cannot do error interpolation with NWays < 3!");
258 return false;
259 }
260 if (param().continuousMaxTimeBin > (int32_t)GPUSettings::TPC_MAX_TF_TIME_BIN) {
261 GPUError("configured max time bin exceeds 256 orbits");
262 return false;
263 }
 // Stream budget for GPU cluster finding: max(lanes + 1, 2 * lanes), plus one more in double-pipeline mode.
264 if ((GetRecoStepsGPU() & RecoStep::TPCClusterFinding) && std::max(GetProcessingSettings().nTPCClustererLanes + 1, GetProcessingSettings().nTPCClustererLanes * 2) + (GetProcessingSettings().doublePipeline ? 1 : 0) > (int32_t)mRec->NStreams()) {
265 GPUError("NStreams of %d insufficient for %d nTPCClustererLanes", mRec->NStreams(), (int32_t)GetProcessingSettings().nTPCClustererLanes);
266 return false;
267 }
268 if ((mRec->GetRecoStepsGPU() & GPUDataTypes::RecoStep::TPCCompression) && GetProcessingSettings().noGPUMemoryRegistration && gatherMode != 3) {
269 GPUError("noGPUMemoryRegistration only possible with gather mode 3 (set to %d / %d)", mRec->GetProcessingSettings().tpcCompressionGatherMode, gatherMode);
270 return false;
271 }
272 if (mRec->IsGPU() && (GetProcessingSettings().clusterizerZSSanityCheck || GetProcessingSettings().mergerSanityCheck)) {
273 GPUError("Clusterizer and merger Sanity checks only supported when not running on GPU");
274 return false;
275 }
276 if (GetProcessingSettings().tpcWriteClustersAfterRejection && (mRec->IsGPU() || param().rec.tpc.compressionTypeMask || !(GetRecoSteps() & GPUDataTypes::RecoStep::TPCCompression))) {
277 GPUError("tpcWriteClustersAfterRejection requires compressionTypeMask = 0, no GPU usage, and compression enabled");
278 return false;
279 }
 // Double-pipeline specific checks.
 // NOTE(review): several condition lines inside this branch are not visible in this listing, so only the
 // error messages and the gatherMode == 1 check can be read here.
280 if (GetProcessingSettings().doublePipeline) {
282 GPUError("Invalid outputs for double pipeline mode 0x%x", (uint32_t)GetRecoStepsOutputs());
283 return false;
284 }
289 GPUError("Must use external output for double pipeline mode");
290 return false;
291 }
292 if (gatherMode == 1) {
293 GPUError("Double pipeline incompatible to compression mode 1");
294 return false;
295 }
297 GPUError("Invalid reconstruction settings for double pipeline: Needs compression and cluster finding");
298 return false;
299 }
300 }
 // NOTE(review): the first two operands both test GetRecoStepsGPU() for TPCCompression, so the condition
 // has the form `X && !X`, is always false, and this check can never fire. Given the error message
 // ("compression on CPU"), the first operand presumably should be GetRecoSteps() - confirm and fix.
301 if ((GetRecoStepsGPU() & GPUDataTypes::RecoStep::TPCCompression) && !(GetRecoStepsGPU() & GPUDataTypes::RecoStep::TPCCompression) && (gatherMode == 1 || gatherMode == 3)) {
302 GPUError("Invalid tpcCompressionGatherMode for compression on CPU");
303 return false;
304 }
305 if (GetProcessingSettings().tpcApplyClusterFilterOnCPU > 0 && (GetRecoStepsGPU() & GPUDataTypes::RecoStep::TPCClusterFinding || GetProcessingSettings().runMC)) {
306 GPUError("tpcApplyClusterFilterOnCPU cannot be used with GPU clusterization or with MC labels");
307 return false;
308 }
 // Constraints that only apply when TRD tracking is among the enabled reconstruction steps.
309 if (GetRecoSteps() & RecoStep::TRDTracking) {
310 if (GetProcessingSettings().trdTrackModelO2 && (GetProcessingSettings().createO2Output == 0 || (GetMatLUT() == nullptr && !GetProcessingSettings().willProvideO2PropagatorLate))) {
311 GPUError("TRD tracking can only run on O2 TPC tracks if createO2Output is enabled (%d), and matBudLUT is available (0x%p)", (int32_t)GetProcessingSettings().createO2Output, (void*)GetMatLUT());
312 return false;
313 }
314 if ((GetRecoStepsGPU() & RecoStep::TRDTracking) && !GetProcessingSettings().trdTrackModelO2 && GetProcessingSettings().createO2Output > 1) {
315 GPUError("TRD tracking can only run on GPU TPC tracks if the createO2Output setting does not suppress them");
316 return false;
317 }
 // NOTE(review): this check also covers the Refit step, but it is only evaluated inside the
 // TRDTracking branch above - confirm that this nesting is intended.
318 if ((((GetRecoStepsGPU() & RecoStep::TRDTracking) && GetProcessingSettings().trdTrackModelO2) || ((GetRecoStepsGPU() & RecoStep::Refit) && !param().rec.trackingRefitGPUModel)) && (!GetProcessingSettings().o2PropagatorUseGPUField || (GetMatLUT() == nullptr && !GetProcessingSettings().willProvideO2PropagatorLate))) {
319 GPUError("Cannot use TRD tracking or Refit on GPU without GPU polynomial field map (%d) or matlut table (%p)", (int32_t)GetProcessingSettings().o2PropagatorUseGPUField, (void*)GetMatLUT());
320 return false;
321 }
322 }
323 return true;
324}
325
327{
328 const auto& threadContext = GetThreadContext();
329 if (GetProcessingSettings().debugLevel >= 1) {
330 printf("Enabled Reconstruction Steps: 0x%x (on GPU: 0x%x)", (int32_t)GetRecoSteps().get(), (int32_t)GetRecoStepsGPU().get());
331 for (uint32_t i = 0; i < sizeof(GPUDataTypes::RECO_STEP_NAMES) / sizeof(GPUDataTypes::RECO_STEP_NAMES[0]); i++) {
332 if (GetRecoSteps().isSet(1u << i)) {
333 printf(" - %s", GPUDataTypes::RECO_STEP_NAMES[i]);
334 if (GetRecoStepsGPU().isSet(1u << i)) {
335 printf(" (G)");
336 }
337 }
338 }
339 printf("\n");
340 }
341 if (!ValidateSteps()) {
342 return 1;
343 }
344
345 for (uint32_t i = 0; i < mSubOutputControls.size(); i++) {
346 if (mSubOutputControls[i] == nullptr) {
348 }
349 }
350
351 if (!ValidateSettings()) {
352 return 1;
353 }
354
357 if (!qa) {
358 qa.reset(new GPUQA(this));
359 }
360 }
363 if (mEventDisplay == nullptr) {
364 throw std::runtime_error("Error loading event display");
365 }
366 }
367
370
371 if (mRec->IsGPU()) {
373 UpdateGPUCalibObjectsPtrs(-1); // First initialization, for users not using RunChain
375 WriteToConstantMemory(RecoStep::NoRecoStep, (char*)&processors()->errorCodes - (char*)processors(), &processorsShadow()->errorCodes, sizeof(processorsShadow()->errorCodes), -1);
376 TransferMemoryResourceLinkToGPU(RecoStep::NoRecoStep, mInputsHost->mResourceErrorCodes);
377 }
378
379 if (GetProcessingSettings().debugLevel >= 6) {
380 std::string filename = std::string(mRec->IsGPU() ? "GPU" : "CPU") + (mRec->slaveId() != -1 ? (std::string("_slave") + std::to_string(mRec->slaveId())) : std::string(mRec->slavesExist() ? "_master" : "")) + GetProcessingSettings().debugLogSuffix + ".out";
381 mDebugFile->open(filename.c_str());
382 }
383
384 return 0;
385}
386
388{
389 if (processors()->calibObjects.fastTransform && (ptrMask == nullptr || ptrMask->fastTransform)) {
390 memcpy((void*)mFlatObjectsShadow.mCalibObjects.fastTransform, (const void*)processors()->calibObjects.fastTransform, sizeof(*processors()->calibObjects.fastTransform));
391 memcpy((void*)mFlatObjectsShadow.mTpcTransformBuffer, (const void*)processors()->calibObjects.fastTransform->getFlatBufferPtr(), processors()->calibObjects.fastTransform->getFlatBufferSize());
392 mFlatObjectsShadow.mCalibObjects.fastTransform->clearInternalBufferPtr();
395 }
396 if (processors()->calibObjects.fastTransformMShape && (ptrMask == nullptr || ptrMask->fastTransformMShape)) {
397 memcpy((void*)mFlatObjectsShadow.mCalibObjects.fastTransformMShape, (const void*)processors()->calibObjects.fastTransformMShape, sizeof(*processors()->calibObjects.fastTransformMShape));
398 memcpy((void*)mFlatObjectsShadow.mTpcTransformMShapeBuffer, (const void*)processors()->calibObjects.fastTransformMShape->getFlatBufferPtr(), processors()->calibObjects.fastTransformMShape->getFlatBufferSize());
399 mFlatObjectsShadow.mCalibObjects.fastTransformMShape->clearInternalBufferPtr();
402 }
403 if (processors()->calibObjects.fastTransformRef && (ptrMask == nullptr || ptrMask->fastTransformRef)) {
404 memcpy((void*)mFlatObjectsShadow.mCalibObjects.fastTransformRef, (const void*)processors()->calibObjects.fastTransformRef, sizeof(*processors()->calibObjects.fastTransformRef));
405 memcpy((void*)mFlatObjectsShadow.mTpcTransformRefBuffer, (const void*)processors()->calibObjects.fastTransformRef->getFlatBufferPtr(), processors()->calibObjects.fastTransformRef->getFlatBufferSize());
406 mFlatObjectsShadow.mCalibObjects.fastTransformRef->clearInternalBufferPtr();
409 }
410 if (processors()->calibObjects.fastTransformHelper && (ptrMask == nullptr || ptrMask->fastTransformHelper)) {
411 memcpy((void*)mFlatObjectsShadow.mCalibObjects.fastTransformHelper, (const void*)processors()->calibObjects.fastTransformHelper, sizeof(*processors()->calibObjects.fastTransformHelper));
415 }
416 if (processors()->calibObjects.dEdxCalibContainer && (ptrMask == nullptr || ptrMask->dEdxCalibContainer)) {
417 memcpy((void*)mFlatObjectsShadow.mCalibObjects.dEdxCalibContainer, (const void*)processors()->calibObjects.dEdxCalibContainer, sizeof(*processors()->calibObjects.dEdxCalibContainer));
418 memcpy((void*)mFlatObjectsShadow.mdEdxSplinesBuffer, (const void*)processors()->calibObjects.dEdxCalibContainer->getFlatBufferPtr(), processors()->calibObjects.dEdxCalibContainer->getFlatBufferSize());
419 mFlatObjectsShadow.mCalibObjects.dEdxCalibContainer->clearInternalBufferPtr();
422 }
423 if (processors()->calibObjects.matLUT && (ptrMask == nullptr || ptrMask->matLUT)) {
424 memcpy((void*)mFlatObjectsShadow.mCalibObjects.matLUT, (const void*)processors()->calibObjects.matLUT, sizeof(*processors()->calibObjects.matLUT));
425 memcpy((void*)mFlatObjectsShadow.mMatLUTBuffer, (const void*)processors()->calibObjects.matLUT->getFlatBufferPtr(), processors()->calibObjects.matLUT->getFlatBufferSize());
426 mFlatObjectsShadow.mCalibObjects.matLUT->clearInternalBufferPtr();
429 }
430 if (processors()->calibObjects.trdGeometry && (ptrMask == nullptr || ptrMask->trdGeometry)) {
431 memcpy((void*)mFlatObjectsShadow.mCalibObjects.trdGeometry, (const void*)processors()->calibObjects.trdGeometry, sizeof(*processors()->calibObjects.trdGeometry));
432 mFlatObjectsShadow.mCalibObjects.trdGeometry->clearInternalBufferPtr();
433 }
434 if (processors()->calibObjects.tpcPadGain && (ptrMask == nullptr || ptrMask->tpcPadGain)) {
435 memcpy((void*)mFlatObjectsShadow.mCalibObjects.tpcPadGain, (const void*)processors()->calibObjects.tpcPadGain, sizeof(*processors()->calibObjects.tpcPadGain));
436 }
437 if (processors()->calibObjects.tpcZSLinkMapping && (ptrMask == nullptr || ptrMask->tpcZSLinkMapping)) {
438 memcpy((void*)mFlatObjectsShadow.mCalibObjects.tpcZSLinkMapping, (const void*)processors()->calibObjects.tpcZSLinkMapping, sizeof(*processors()->calibObjects.tpcZSLinkMapping));
439 }
440 if (processors()->calibObjects.o2Propagator && (ptrMask == nullptr || ptrMask->o2Propagator)) {
441 memcpy((void*)mFlatObjectsShadow.mCalibObjects.o2Propagator, (const void*)processors()->calibObjects.o2Propagator, sizeof(*processors()->calibObjects.o2Propagator));
442 mFlatObjectsShadow.mCalibObjects.o2Propagator->setGPUField(&processorsDevice()->param.polynomialField);
444 }
446 memcpy((void*)&processorsShadow()->calibObjects, (void*)&mFlatObjectsDevice.mCalibObjects, sizeof(mFlatObjectsDevice.mCalibObjects));
447}
448
450{
451 WriteToConstantMemory(RecoStep::NoRecoStep, (char*)&processors()->calibObjects - (char*)processors(), &mFlatObjectsDevice.mCalibObjects, sizeof(mFlatObjectsDevice.mCalibObjects), stream);
452}
453
455{
459 }
460 if (mIOPtrs.tpcZS && param().rec.fwdTPCDigitsAsClusters) {
461 throw std::runtime_error("Forwading zero-suppressed hits not supported");
462 }
464 return 0;
465}
466
468{
470 if (!qa) {
471 qa.reset(new GPUQA(this));
472 }
473 if (!GetQA()->IsInitialized()) {
474 return GetQA()->InitQA();
475 }
476 return 0;
477}
478
480{
481 if (GetProcessingSettings().runQA && GetQA()->IsInitialized() && !(mConfigQA && mConfigQA->shipToQC) && !mQAFromForeignChain) {
482 GetQA()->UpdateChain(this);
484 }
485 if (GetProcessingSettings().debugLevel >= 6) {
486 mDebugFile->close();
487 }
489 mCompressionStatistics->Finish();
490 }
491 return 0;
492}
493
495{
496 char* fastTransformBase = (char*)mem;
500 }
504 }
508 }
511 }
512 if ((char*)mem - fastTransformBase < mChainTracking->GetProcessingSettings().fastTransformObjectsMinMemorySize) {
513 mem = fastTransformBase + mChainTracking->GetProcessingSettings().fastTransformObjectsMinMemorySize; // TODO: Fixme and do proper dynamic allocation
514 }
517 }
520 }
521 char* dummyPtr;
525 } else if (mChainTracking->GetProcessingSettings().lateO2MatLutProvisioningSize) {
526 computePointerWithAlignment(mem, dummyPtr, mChainTracking->GetProcessingSettings().lateO2MatLutProvisioningSize);
527 }
531 }
534 }
537 mCalibObjects.o2Propagator = nullptr; // Always reserve memory for o2::Propagator, since it may be propagatred only during run() not during init().
538 }
540 mem = (char*)mem + mChainTracking->GetProcessingSettings().calibObjectsExtraMemorySize; // TODO: Fixme and do proper dynamic allocation
541 }
542 return mem;
543}
544
546{
547 std::memset((void*)&mIOPtrs, 0, sizeof(mIOPtrs));
549 new (&mIOMem) InOutMemory;
550 mClusterNativeAccessReduced.reset(nullptr);
551 if (mClusterNativeAccess.get()) {
552 memset((void*)mClusterNativeAccess.get(), 0, sizeof(*mClusterNativeAccess));
553 }
554}
555
557{
558 for (uint32_t i = 0; i < NSECTORS; i++) {
563 }
565 std::memset(mIOMem.clusterNativeAccess.get(), 0, sizeof(ClusterNativeAccess)); // ClusterNativeAccess has no its own constructor
579}
580
// Takes ownership of the given TPC fast-transform object and its correction-maps helper by moving them
// into mTPCFastTransformU and mTPCFastTransformHelperU.
// NOTE(review): two further statements of this body are not visible in this listing.
581void GPUChainTracking::SetTPCFastTransform(std::unique_ptr<TPCFastTransform>&& tpcFastTransform, std::unique_ptr<CorrectionMapsHelper>&& tpcTransformHelper)
582{
583 mTPCFastTransformU = std::move(tpcFastTransform);
584 mTPCFastTransformHelperU = std::move(tpcTransformHelper);
587}
588
// Takes ownership of the given material lookup table by moving it into mMatLUTU.
// NOTE(review): one further statement of this body is not visible in this listing.
589void GPUChainTracking::SetMatLUT(std::unique_ptr<o2::base::MatLayerCylSet>&& lut)
590{
591 mMatLUTU = std::move(lut);
593}
594
// Takes ownership of the given flat TRD geometry by moving it into mTRDGeometryU.
// NOTE(review): one further statement of this body is not visible in this listing.
595void GPUChainTracking::SetTRDGeometry(std::unique_ptr<o2::trd::GeometryFlat>&& geo)
596{
597 mTRDGeometryU = std::move(geo);
599}
600
// Applies the calibration updates queued in mNewCalibValues / mNewCalibObjects.
//   stream      - forwarded to the GPU transfers and calib-object updates issued here
//   updateSlave - together with mRec->slavesExist(), forces the calib object pointers to be re-sent on GPU
// Returns 1 if mRec->UpdateSettings() was called or the GPU calib object pointers were re-sent,
// 0 otherwise. mMutexUpdateCalib is held for the whole function, and both queues are reset at the end.
// NOTE(review): several lines (including the `if` statements guarding some of the sections below) are
// not visible in this listing, so the visible braces do not balance.
601int32_t GPUChainTracking::DoQueuedUpdates(int32_t stream, bool updateSlave)
602{
603 int32_t retVal = 0;
604 std::unique_ptr<GPUSettingsGRP> grp;
605 const GPUSettingsProcessing* p = nullptr;
606 std::lock_guard lk(mMutexUpdateCalib);
 // Only copy the GRP settings when at least one queued value actually changes them.
608 if (mNewCalibValues->newSolenoidField || mNewCalibValues->newContinuousMaxTimeBin || mNewCalibValues->newTPCTimeBinCut) {
609 grp = std::make_unique<GPUSettingsGRP>(mRec->GetGRPSettings());
610 if (mNewCalibValues->newSolenoidField) {
611 grp->solenoidBzNominalGPU = mNewCalibValues->solenoidField;
612 }
613 if (mNewCalibValues->newContinuousMaxTimeBin) {
614 grp->grpContinuousMaxTimeBin = mNewCalibValues->continuousMaxTimeBin;
615 }
616 if (mNewCalibValues->newTPCTimeBinCut) {
617 grp->tpcCutTimeBin = mNewCalibValues->tpcTimeBinCut;
618 }
619 }
620 }
621 if (GetProcessingSettings().tpcDownscaledEdx != 0) {
623 }
624 if (grp || p) {
625 mRec->UpdateSettings(grp.get(), p);
626 retVal = 1;
627 }
 // The XOR fires when "propagator has a GPU field" and the o2PropagatorUseGPUField setting disagree in
 // either direction; the message text only describes one of the two cases.
629 if (mNewCalibObjects->o2Propagator && ((mNewCalibObjects->o2Propagator->getGPUField() != nullptr) ^ GetProcessingSettings().o2PropagatorUseGPUField)) {
630 GPUFatal("GPU magnetic field for propagator requested, but received an O2 propagator without GPU field");
631 }
 // Both structures are walked as flat arrays of pointers: only entries that are non-null in the queued
 // set overwrite the corresponding entry of processors()->calibObjects.
632 void* const* pSrc = (void* const*)mNewCalibObjects.get();
633 void** pDst = (void**)&processors()->calibObjects;
634 for (uint32_t i = 0; i < sizeof(processors()->calibObjects) / sizeof(void*); i++) {
635 if (pSrc[i]) {
636 pDst[i] = pSrc[i];
637 }
638 }
 // Re-send the permanent memory of whichever TRD tracker variant is selected by trdTrackModelO2.
640 if (GetProcessingSettings().trdTrackModelO2) {
642 if (mRec->IsGPU()) {
643 TransferMemoryResourceLinkToGPU(RecoStep::NoRecoStep, processors()->trdTrackerO2.MemoryPermanent(), stream);
644 }
645 } else {
647 if (mRec->IsGPU()) {
648 TransferMemoryResourceLinkToGPU(RecoStep::NoRecoStep, processors()->trdTrackerGPU.MemoryPermanent(), stream);
649 }
650 }
651 }
652 if (mRec->IsGPU()) {
 // Snapshot the raw bytes of both flat-object structures so that a change can be detected afterwards.
 // NOTE(review): the statement between the snapshot and the comparison is not visible in this listing.
653 std::array<uint8_t, sizeof(GPUTrackingFlatObjects)> oldFlatPtrs, oldFlatPtrsDevice;
654 memcpy(oldFlatPtrs.data(), (void*)&mFlatObjectsShadow, oldFlatPtrs.size());
655 memcpy(oldFlatPtrsDevice.data(), (void*)&mFlatObjectsDevice, oldFlatPtrsDevice.size());
657 bool ptrsChanged = memcmp(oldFlatPtrs.data(), (void*)&mFlatObjectsShadow, oldFlatPtrs.size()) || memcmp(oldFlatPtrsDevice.data(), (void*)&mFlatObjectsDevice, oldFlatPtrsDevice.size());
658 if (ptrsChanged) {
659 GPUInfo("Updating all calib objects since pointers changed");
660 }
 // A null mask makes UpdateGPUCalibObjects copy every available object; otherwise only the queued ones.
661 UpdateGPUCalibObjects(stream, ptrsChanged ? nullptr : mNewCalibObjects.get());
662 }
663 }
664
665 if ((mUpdateNewCalibObjects || (mRec->slavesExist() && updateSlave)) && mRec->IsGPU()) {
666 UpdateGPUCalibObjectsPtrs(stream); // Reinitialize
667 retVal = 1;
668 }
669 mNewCalibObjects.reset(nullptr);
670 mNewCalibValues.reset(nullptr);
672 return retVal;
673}
674
676{
677 if ((((GetRecoSteps() & RecoStep::TRDTracking) && !GetProcessingSettings().trdTrackModelO2 && !GetProcessingSettings().willProvideO2PropagatorLate) || ((GetRecoSteps() & RecoStep::Refit) && !param().rec.trackingRefitGPUModel)) && processors()->calibObjects.o2Propagator == nullptr) {
678 GPUFatal("Cannot run TRD tracking or refit with o2 track model without o2 propagator"); // This check must happen during run, since o2::Propagator cannot be available during init
679 }
680 if (GetProcessingSettings().autoAdjustHostThreads && !mRec->IsGPU()) {
682 }
683 const auto threadContext = GetThreadContext();
684 if (GetProcessingSettings().runCompressionStatistics && mCompressionStatistics == nullptr) {
686 }
687 const bool needQA = GPUQA::QAAvailable() && (GetProcessingSettings().runQA || (GetProcessingSettings().eventDisplay && (mIOPtrs.nMCInfosTPC || GetProcessingSettings().runMC)));
688 if (needQA && GetQA()->IsInitialized() == false) {
689 if (GetQA()->InitQA(GetProcessingSettings().runQA ? -GetProcessingSettings().runQA : -1)) {
690 return 1;
691 }
692 }
693 if (needQA) {
694 mFractionalQAEnabled = GetProcessingSettings().qcRunFraction == 100.f || (uint32_t)(rand() % 10000) < (uint32_t)(GetProcessingSettings().qcRunFraction * 100);
695 }
696 if (GetProcessingSettings().debugLevel >= 6) {
697 *mDebugFile << "\n\nProcessing event " << mRec->getNEventsProcessed() << std::endl;
698 }
700
701 mRec->getGeneralStepTimer(GeneralStep::Prepare).Start();
702 try {
704 } catch (const std::bad_alloc& e) {
705 GPUError("Memory Allocation Error");
706 return (1);
707 }
708 mRec->getGeneralStepTimer(GeneralStep::Prepare).Stop();
709
711
712 SynchronizeStream(0); // Synchronize all init copies that might be ongoing
713
714 if (GetProcessingSettings().debugOnFailure) {
715 mRec->setDebugDumpCallback([this]() { DoDebugRawDump(); });
716 }
717
719 if (runRecoStep(RecoStep::TPCDecompression, &GPUChainTracking::RunTPCDecompression)) {
720 return 1;
721 }
722 } else if (mIOPtrs.tpcPackedDigits || mIOPtrs.tpcZS) {
723 if (runRecoStep(RecoStep::TPCClusterFinding, &GPUChainTracking::RunTPCClusterizer, false)) {
724 return 1;
725 }
726 }
727
728 if (GetProcessingSettings().autoAdjustHostThreads && !mRec->IsGPU() && mIOPtrs.clustersNative) {
730 }
731
733 return 1;
734 }
735
736 mRec->PushNonPersistentMemory(qStr2Tag("TPCSLCD1")); // 1st stack level for TPC tracking sector data
738 if (runRecoStep(RecoStep::TPCSectorTracking, &GPUChainTracking::RunTPCTrackingSectors)) {
739 return 1;
740 }
741
742 if (runRecoStep(RecoStep::TPCMerging, &GPUChainTracking::RunTPCTrackingMerger, false)) {
743 return 1;
744 }
746 mRec->PopNonPersistentMemory(RecoStep::TPCSectorTracking, qStr2Tag("TPCSLCD1")); // Release 1st stack level, TPC sector data not needed after merger
748 }
749
751 if (GetProcessingSettings().doublePipeline) {
753 if (foreignChain && foreignChain->mIOPtrs.tpcZS) {
754 if (GetProcessingSettings().debugLevel >= 3) {
755 GPUInfo("Preempting tpcZS input of foreign chain");
756 }
757 mPipelineFinalizationCtx.reset(new GPUChainTrackingFinalContext);
758 mPipelineFinalizationCtx->rec = this->mRec;
759 foreignChain->mPipelineNotifyCtx = mPipelineFinalizationCtx.get();
760 }
761 }
762 if (runRecoStep(RecoStep::TPCCompression, &GPUChainTracking::RunTPCCompression)) {
763 return 1;
764 }
765 }
766
767 if (runRecoStep(RecoStep::TRDTracking, &GPUChainTracking::RunTRDTracking)) {
768 return 1;
769 }
770
771 if (runRecoStep(RecoStep::Refit, &GPUChainTracking::RunRefit)) {
772 return 1;
773 }
774
775 if (!GetProcessingSettings().doublePipeline) { // Synchronize with output copies running asynchronously
776 SynchronizeStream(OutputStream());
777 }
778
779 if (GetProcessingSettings().autoAdjustHostThreads && !mRec->IsGPU()) {
781 }
782
783 int32_t retVal = 0;
784 if (CheckErrorCodes(false, false, mRec->getErrorCodeOutput())) { // TODO: Eventually, we should use GPUReconstruction::CheckErrorCodes
785 retVal = 3;
786 if (!GetProcessingSettings().ignoreNonFatalGPUErrors) {
787 return retVal;
788 }
789 }
790
791 if (GetProcessingSettings().doublePipeline) {
792 return retVal;
793 }
794 int32_t retVal2 = RunChainFinalize();
795 return retVal2 ? retVal2 : retVal;
796}
797
// Runs the end-of-event steps that follow the reconstruction: the optional output sanity check, QA
// (when available and enabled for this event via mFractionalQAEnabled) and the event-display handling.
// Returns 0 normally, 1 if the event display could not be started, and 2 when the display control
// value 2 was set, in which case the display is shut down and detached from the settings.
// NOTE(review): several lines are not visible in this listing, among them the bodies of the
// compression-statistics and showOutputStat branches and the condition guarding the display section.
798int32_t GPUChainTracking::RunChainFinalize()
799{
800 if (mIOPtrs.clustersNative && (GetRecoSteps() & RecoStep::TPCCompression) && GetProcessingSettings().runCompressionStatistics) {
803 }
804
805 if (GetProcessingSettings().outputSanityCheck) {
806 OutputSanityCheck();
807 }
808
 // NOTE(review): unlike the needQA expression at listing line 687, this one has no `|| runMC`
 // term - confirm that the difference is intended.
809 const bool needQA = GPUQA::QAAvailable() && (GetProcessingSettings().runQA || (GetProcessingSettings().eventDisplay && mIOPtrs.nMCInfosTPC));
810 if (needQA && mFractionalQAEnabled) {
811 mRec->getGeneralStepTimer(GeneralStep::QA).Start();
812 GetQA()->UpdateChain(this);
813 GetQA()->RunQA(!GetProcessingSettings().runQA);
814 mRec->getGeneralStepTimer(GeneralStep::QA).Stop();
 // The QA runtime is only printed at debug level 0.
815 if (GetProcessingSettings().debugLevel == 0) {
816 GPUInfo("Total QA runtime: %d us", (int32_t)(mRec->getGeneralStepTimer(GeneralStep::QA).GetElapsedTime() * 1000000));
817 }
818 }
819
820 if (GetProcessingSettings().showOutputStat) {
822 }
823
825
826 // PrintMemoryRelations();
827
 // First event: start the display. Later events: advance the running display to the next event.
829 if (!mDisplayRunning) {
830 GPUInfo("Starting Event Display...");
831 if (mEventDisplay->StartDisplay()) {
832 GPUError("Error starting Event Display");
833 return (1);
834 }
835 mDisplayRunning = true;
836 } else {
837 mEventDisplay->ShowNextEvent();
838 }
839
840 mEventDisplay->WaitTillEventShown();
841
 // Drain any pending key presses before prompting for a new one.
842 if (GetProcessingSettings().eventDisplay->EnableSendKey()) {
843 while (kbhit()) {
844 getch();
845 }
846 GPUInfo("Press key for next event!");
847 }
848
 // Poll every 10 ms until the display control value becomes non-zero or 'n' is pressed.
 // Key 27 sets display control to 2, 'n' leaves the loop, and any other key is forwarded to the
 // display once the previously sent key has been consumed (getSendKey() == 0).
 // iKey is only assigned and read when EnableSendKey() is true.
849 int32_t iKey;
850 do {
851 usleep(10000);
852 if (GetProcessingSettings().eventDisplay->EnableSendKey()) {
853 iKey = kbhit() ? getch() : 0;
854 if (iKey == 27) {
855 GetProcessingSettings().eventDisplay->setDisplayControl(2);
856 } else if (iKey == 'n') {
857 break;
858 } else if (iKey) {
859 while (GetProcessingSettings().eventDisplay->getSendKey() != 0) {
860 usleep(1000);
861 }
862 GetProcessingSettings().eventDisplay->setSendKey(iKey);
863 }
864 }
865 } while (GetProcessingSettings().eventDisplay->getDisplayControl() == 0);
 // Display control 2: shut the display down and clear the pointer stored in the processing settings.
866 if (GetProcessingSettings().eventDisplay->getDisplayControl() == 2) {
867 mDisplayRunning = false;
868 GetProcessingSettings().eventDisplay->DisplayExit();
869 const_cast<GPUSettingsProcessing&>(GetProcessingSettings()).eventDisplay = nullptr; // TODO: fixme - eventDisplay should probably not be put into ProcessingSettings in the first place
870 return (2);
871 }
872 GetProcessingSettings().eventDisplay->setDisplayControl(0);
873 GPUInfo("Loading next event...");
874
875 mEventDisplay->BlockTillNextEvent();
876 }
877
878 return 0;
879}
880
882{
883 if (mPipelineFinalizationCtx) {
884 {
885 std::unique_lock<std::mutex> lock(mPipelineFinalizationCtx->mutex);
886 auto* ctx = mPipelineFinalizationCtx.get();
887 mPipelineFinalizationCtx->cond.wait(lock, [ctx]() { return ctx->ready; });
888 }
889 mPipelineFinalizationCtx.reset();
890 }
891 return RunChainFinalize();
892}
893
894int32_t GPUChainTracking::CheckErrorCodes(bool cpuOnly, bool forceShowErrors, std::vector<std::array<uint32_t, 4>>* fillErrors)
895{
896 int32_t retVal = 0;
897 bool hasDebugError = false;
898 for (int32_t i = 0; i < 1 + (!cpuOnly && mRec->IsGPU()); i++) {
899 if (i) {
900 const auto& threadContext = GetThreadContext();
901 if (GetProcessingSettings().doublePipeline) {
902 TransferMemoryResourceLinkToHost(RecoStep::NoRecoStep, mInputsHost->mResourceErrorCodes, 0);
904 } else {
905 TransferMemoryResourceLinkToHost(RecoStep::NoRecoStep, mInputsHost->mResourceErrorCodes);
906 }
907 }
908 if (processors()->errorCodes.hasError()) {
909 static int32_t errorsShown = 0;
910 static bool quiet = false;
911 static std::chrono::time_point<std::chrono::steady_clock> silenceFrom;
912 if (!quiet && errorsShown++ >= 10 && GetProcessingSettings().throttleAlarms && !forceShowErrors) {
913 silenceFrom = std::chrono::steady_clock::now();
914 quiet = true;
915 } else if (quiet) {
916 auto currentTime = std::chrono::steady_clock::now();
917 std::chrono::duration<double> elapsed_seconds = currentTime - silenceFrom;
918 if (elapsed_seconds.count() > 60 * 10) {
919 quiet = false;
920 errorsShown = 1;
921 }
922 }
923 retVal = 1;
924 if (GetProcessingSettings().throttleAlarms && !forceShowErrors) {
925 GPUWarning("GPUReconstruction suffered from an error in the %s part", i ? "GPU" : "CPU");
926 } else {
927 GPUError("GPUReconstruction suffered from an error in the %s part", i ? "GPU" : "CPU");
928 }
929 if (!quiet) {
930 processors()->errorCodes.printErrors(GetProcessingSettings().throttleAlarms && !forceShowErrors);
931 }
932 if (fillErrors) {
933 uint32_t nErrors = processors()->errorCodes.getNErrors();
934 const uint32_t* pErrors = processors()->errorCodes.getErrorPtr();
935 for (uint32_t j = 0; j < nErrors; j++) {
936 fillErrors->emplace_back(std::array<uint32_t, 4>{pErrors[4 * j], pErrors[4 * j + 1], pErrors[4 * j + 2], pErrors[4 * j + 3]});
937 }
938 }
939 if ((GetProcessingSettings().debugOnFailure & 1) || (GetProcessingSettings().debugOnFailure & 4)) {
940 if (GetProcessingSettings().debugOnFailureErrorMask == (uint64_t)-1) {
941 hasDebugError = true;
942 } else {
943 uint32_t nErrors = processors()->errorCodes.getNErrors();
944 const uint32_t* pErrors = processors()->errorCodes.getErrorPtr();
945 for (uint32_t j = 0; j < nErrors; j++) {
946 if (GetProcessingSettings().debugOnFailureErrorMask & (1 << pErrors[4 * j])) {
947 hasDebugError = true;
948 break;
949 }
950 }
951 }
952 }
953 }
954 }
955 ClearErrorCodes(cpuOnly);
956 if (hasDebugError) {
958 }
959 return retVal;
960}
961
963{
965 if (mRec->IsGPU() && !cpuOnly) {
966 const auto& threadContext = GetThreadContext();
967 WriteToConstantMemory(RecoStep::NoRecoStep, (char*)&processors()->errorCodes - (char*)processors(), &processorsShadow()->errorCodes, sizeof(processorsShadow()->errorCodes), 0);
968 TransferMemoryResourceLinkToGPU(RecoStep::NoRecoStep, mInputsHost->mResourceErrorCodes, 0);
969 }
970}
971
973{
974 std::lock_guard lk(mMutexUpdateCalib);
975 if (mNewCalibObjects) {
976 void* const* pSrc = (void* const*)&obj;
977 void** pDst = (void**)mNewCalibObjects.get();
978 for (uint32_t i = 0; i < sizeof(*mNewCalibObjects) / sizeof(void*); i++) {
979 if (pSrc[i]) {
980 pDst[i] = pSrc[i];
981 }
982 }
983 } else {
985 }
986 if (mNewCalibValues) {
987 mNewCalibValues->updateFrom(&vals);
988 } else {
989 mNewCalibValues.reset(new GPUNewCalibValues(vals));
990 }
992}
993
995{
996 return (mRec->IsGPU() ? processorsShadow() : processors())->calibObjects.o2Propagator;
997}
998
1000{
1002 if ((prop->getGPUField() != nullptr) ^ GetProcessingSettings().o2PropagatorUseGPUField) {
1003 GPUFatal("GPU magnetic field for propagator requested, but received an O2 propagator without GPU field");
1004 }
1005}
Definition of container class for dE/dx corrections.
Helper class to access correction maps.
int32_t i
#define GPUCA_MEMORY_SIZE
#define GPUCA_HOST_MEMORY_SIZE
int32_t retVal
Online TRD tracker based on extrapolated TPC tracks.
Used for storing the MC labels for the TRD tracklets.
TRD Tracklet word for GPU tracker - 32bit tracklet info + half chamber ID + index.
Definition of a container to keep Monte Carlo truth external to simulation objects.
uint32_t j
Definition RawData.h:0
uint32_t c
Definition RawData.h:2
Definition of TPCFastTransform class.
void Start()
Definition timer.cxx:64
double GetElapsedTime()
Definition timer.cxx:115
void Stop()
Definition timer.cxx:76
bool isSet(const bitfield &v) const
Definition bitfield.h:66
size_t getFlatBufferSize() const
Gives size of the flat buffer.
Definition FlatObject.h:256
void SetMatLUT(std::unique_ptr< o2::base::MatLayerCylSet > &&lut)
std::unique_ptr< o2::base::MatLayerCylSet > mMatLUTU
const o2::base::Propagator * GetDeviceO2Propagator()
std::unique_ptr< o2::tpc::ClusterNativeAccess > mClusterNativeAccess
void SetTRDGeometry(std::unique_ptr< o2::trd::GeometryFlat > &&geo)
GPUChainTracking * mQAFromForeignChain
void SetO2Propagator(const o2::base::Propagator *prop)
std::unique_ptr< GPUQA > mQA
std::unique_ptr< CorrectionMapsHelper > mTPCFastTransformHelperU
GPUTrackingFlatObjects mFlatObjectsDevice
int32_t RunTPCClusterizer(bool synchronizeOutput=true)
void UpdateGPUCalibObjectsPtrs(int32_t stream)
int32_t RunTPCTrackingMerger(bool synchronizeOutput=true)
std::unique_ptr< GPUTrackingInputProvider > mInputsHost
std::unique_ptr< GPUTPCClusterStatistics > mCompressionStatistics
const o2::base::MatLayerCylSet * GetMatLUT() const
std::array< GPUOutputControl *, GPUTrackingOutputs::count()> mSubOutputControls
std::unique_ptr< std::ofstream > mDebugFile
void SetUpdateCalibObjects(const GPUCalibObjectsConst &obj, const GPUNewCalibValues &vals)
std::unique_ptr< GPUCalibObjectsConst > mNewCalibObjects
std::unique_ptr< o2::trd::GeometryFlat > mTRDGeometryU
GPUTrackingFlatObjects mFlatObjectsShadow
void RegisterPermanentMemoryAndProcessors() override
void RegisterGPUProcessors() override
void ClearErrorCodes(bool cpuOnly=false)
const GPUQA * GetQA() const
void MemorySize(size_t &gpuMem, size_t &pageLockedHostMem) override
void SetTPCFastTransform(std::unique_ptr< TPCFastTransform > &&tpcFastTransform, std::unique_ptr< CorrectionMapsHelper > &&tpcTransformHelper)
int32_t DoQueuedUpdates(int32_t stream, bool updateSlave=true)
std::unique_ptr< GPUNewCalibValues > mNewCalibValues
int32_t CheckErrorCodes(bool cpuOnly=false, bool forceShowErrors=false, std::vector< std::array< uint32_t, 4 > > *fillErrors=nullptr) override
std::unique_ptr< TPCFastTransform > mTPCFastTransformU
int32_t PrepareEvent() override
GPUChainTracking(GPUReconstruction *rec, uint32_t maxTPCHits=GPUCA_MAX_CLUSTERS, uint32_t maxTRDTracklets=GPUCA_MAX_TRD_TRACKLETS)
void UpdateGPUCalibObjects(int32_t stream, const GPUCalibObjectsConst *ptrMask=nullptr)
GPUTrackingInOutPointers & mIOPtrs
struct o2::gpu::GPUChainTracking::InOutMemory mIOMem
const o2::tpc::CalibdEdxContainer * GetdEdxCalibContainer() const
std::unique_ptr< GPUTrackingInputProvider > mInputsShadow
const GPUSettingsQA * mConfigQA
int32_t FinalizePipelinedProcessing() override
std::unique_ptr< GPUDisplayInterface > mEventDisplay
std::unique_ptr< o2::tpc::ClusterNativeAccess > mClusterNativeAccessReduced
void TransferMemoryResourceLinkToGPU(RecoStep step, int16_t res, int32_t stream=-1, deviceEvent *ev=nullptr, deviceEvent *evList=nullptr, int32_t nEvents=1)
Definition GPUChain.h:124
GPUConstantMem * processorsDevice()
Definition GPUChain.h:86
GPUReconstruction::RecoStepField GetRecoStepsGPU() const
Definition GPUChain.h:72
GPUReconstruction::RecoStepField GetRecoSteps() const
Definition GPUChain.h:71
void WriteToConstantMemory(RecoStep step, size_t offset, const void *src, size_t size, int32_t stream=-1, deviceEvent *ev=nullptr)
Definition GPUChain.h:127
GPUChain * GetNextChainInQueue()
Definition GPUChain.h:225
GPUReconstruction::InOutTypeField GetRecoStepsOutputs() const
Definition GPUChain.h:74
virtual std::unique_ptr< GPUReconstructionProcessing::threadContext > GetThreadContext()
Definition GPUChain.h:109
GPUConstantMem * processors()
Definition GPUChain.h:84
GPUParam & param()
Definition GPUChain.h:87
const GPUSettingsProcessing & GetProcessingSettings() const
Definition GPUChain.h:76
void SynchronizeStream(int32_t stream)
Definition GPUChain.h:89
GPUReconstructionCPU * mRec
Definition GPUChain.h:79
GPUConstantMem * processorsShadow()
Definition GPUChain.h:85
GPUReconstruction::InOutTypeField GetRecoStepsInputs() const
Definition GPUChain.h:73
static constexpr int32_t NSECTORS
Definition GPUChain.h:58
void TransferMemoryResourceLinkToHost(RecoStep step, int16_t res, int32_t stream=-1, deviceEvent *ev=nullptr, deviceEvent *evList=nullptr, int32_t nEvents=1)
Definition GPUChain.h:125
void AllocateIOMemoryHelper(uint32_t n, const T *&ptr, std::unique_ptr< T[]> &u)
Definition GPUChain.h:139
int32_t runRecoStep(RecoStep step, S T::*func, Args... args)
Definition GPUChain.h:289
GPUReconstruction * rec()
Definition GPUChain.h:66
static constexpr const char *const RECO_STEP_NAMES[]
static GPUDisplayInterface * getDisplay(GPUDisplayFrontendInterface *frontend, GPUChainTracking *chain, GPUQA *qa, const GPUParam *param=nullptr, const GPUCalibObjectsConst *calib=nullptr, const GPUSettingsDisplay *config=nullptr, const GPUSettingsProcessing *proc=nullptr)
const uint32_t * getErrorPtr() const
Definition GPUErrors.cxx:96
void setMemory(GPUglobalref() uint32_t *m)
Definition GPUErrors.h:37
bool printErrors(bool silent=false, uint64_t mask=0)
Definition GPUErrors.cxx:61
uint32_t getNErrors() const
Definition GPUErrors.cxx:91
static void computePointerWithAlignment(T *&basePtr, S *&objPtr, size_t nEntries=1)
void InitGPUProcessor(GPUReconstruction *rec, ProcessorType type=PROCESSOR_TYPE_CPU, GPUProcessor *slaveProcessor=nullptr)
static bool QAAvailable()
Definition GPUQA.h:56
int32_t DrawQAHistograms()
Definition GPUQA.h:46
void UpdateChain(GPUChainTracking *chain)
Definition GPUQA.h:58
static bool IsInitialized()
Definition GPUQA.h:57
int32_t InitQA(int32_t tasks=0)
Definition GPUQA.h:44
void RunQA(bool matchOnly=false)
Definition GPUQA.h:45
HighResTimer & getGeneralStepTimer(GeneralStep step)
const GPUDefParameters & getGPUParameters(bool doGPU) const override
std::vector< std::array< uint32_t, 4 > > * getErrorCodeOutput()
void PopNonPersistentMemory(RecoStep step, uint64_t tag)
RecoStepField GetRecoStepsGPU() const
void RegisterGPUDeviceProcessor(GPUProcessor *proc, GPUProcessor *slaveProcessor)
void RegisterGPUProcessor(T *proc, bool deviceSlave)
void setDebugDumpCallback(std::function< void()> &&callback=std::function< void()>(nullptr))
void ResetRegisteredMemoryPointers(GPUProcessor *proc)
int16_t RegisterMemoryAllocation(T *proc, void *(T::*setPtr)(void *), int32_t type, const char *name="", const GPUMemoryReuse &re=GPUMemoryReuse())
void UpdateSettings(const GPUSettingsGRP *g, const GPUSettingsProcessing *p=nullptr, const GPUSettingsRecDynamic *d=nullptr)
void PushNonPersistentMemory(uint64_t tag)
GPUMemorySizeScalers * MemoryScalers()
const GPUSettingsProcessing & GetProcessingSettings() const
const GPUSettingsGRP & GetGRPSettings() const
GPUOutputControl & OutputControl()
static constexpr const uint32_t TPC_MAX_TF_TIME_BIN
Definition GPUSettings.h:47
GLenum GLfloat param
Definition glcorearb.h:271
GLuint GLuint stream
Definition glcorearb.h:1806
GPUCalibObjectsTemplate< ConstPtr > GPUCalibObjectsConst
Global TPC definitions and constants.
Definition SimTraits.h:167
Defining DataPointCompositeObject explicitly as copiable.
std::string to_string(gsl::span< T, Size > span)
Definition common.h:52
std::string filename()
std::unique_ptr< GPUDisplayFrontendInterface > eventDisplay
GPUReconstruction * rec
constexpr T qStr2Tag(const char *str)
Definition strtag.h:22
S< o2::trd::GeometryFlat >::type * trdGeometry
S< o2::tpc::CalibdEdxContainer >::type * dEdxCalibContainer
S< TPCZSLinkMapping >::type * tpcZSLinkMapping
S< TPCFastTransform >::type * fastTransform
S< TPCPadGainCalib >::type * tpcPadGain
S< o2::base::PropagatorImpl< float > >::type * o2Propagator
S< o2::base::MatLayerCylSet >::type * matLUT
S< CorrectionMapsHelper >::type * fastTransformHelper
S< TPCFastTransform >::type * fastTransformRef
S< TPCFastTransform >::type * fastTransformMShape
std::unique_ptr< GPUTPCMCInfo[]> mcInfosTPC
std::unique_ptr< GPUTRDTrackletWord[]> trdTracklets
std::unique_ptr< GPUTPCMCInfoCol[]> mcInfosTPCCol
std::unique_ptr< GPUTPCGMMergedTrackHit[]> mergedTrackHits
std::unique_ptr< int32_t[]> trdTrackletIdxFirst
std::unique_ptr< GPUTPCGMMergedTrack[]> mergedTracks
std::unique_ptr< AliHLTTPCClusterMCLabel[]> mcLabelsTPC
std::unique_ptr< GPUTPCClusterData[]> clusterData[NSECTORS]
std::unique_ptr< o2::tpc::ClusterNative[]> clustersNative
std::unique_ptr< float[]> trdTriggerTimes
std::unique_ptr< GPUTPCTrack[]> sectorTracks[NSECTORS]
std::unique_ptr< GPUTRDSpacePoint[]> trdSpacePoints
std::unique_ptr< uint8_t[]> trdTrigRecMask
std::unique_ptr< o2::tpc::ClusterNativeAccess > clusterNativeAccess
std::unique_ptr< AliHLTTPCRawCluster[]> rawClusters[NSECTORS]
std::unique_ptr< GPUTPCHitId[]> sectorClusters[NSECTORS]
std::unique_ptr< GPUTRDTrackGPU[]> trdTracks
GPUTRDTrackerGPU trdTrackerGPU
GPUCalibObjectsConst calibObjects
const GPUTPCHitId * sectorClusters[NSECTORS]
const o2::tpc::ClusterNativeAccess * clustersNative
const GPUTPCMCInfo * mcInfosTPC
const o2::tpc::CompressedClustersFlat * tpcCompressedClusters
const AliHLTTPCClusterMCLabel * mcLabelsTPC
const GPUTRDSpacePoint * trdSpacePoints
const GPUTPCTrack * sectorTracks[NSECTORS]
const GPUTRDTrackGPU * trdTracks
const GPUTRDTrackletWord * trdTracklets
const GPUTrackingInOutZS * tpcZS
const AliHLTTPCRawCluster * rawClusters[NSECTORS]
const GPUTPCClusterData * clusterData[NSECTORS]
const GPUTPCGMMergedTrackHit * mergedTrackHits
const GPUTrackingInOutDigits * tpcPackedDigits
const GPUTPCMCInfoCol * mcInfosTPCCol
const GPUTPCGMMergedTrack * mergedTracks
size_t getIndex(const GPUOutputControl &v)
GPUOutputControl sharedClusterMap
GPUOutputControl compressedClusters