Project
Loading...
Searching...
No Matches
GPUChainTracking.cxx
Go to the documentation of this file.
1// Copyright 2019-2020 CERN and copyright holders of ALICE O2.
2// See https://alice-o2.web.cern.ch/copyright for details of the copyright holders.
3// All rights not expressly granted are reserved.
4//
5// This software is distributed under the terms of the GNU General Public
6// License v3 (GPL Version 3), copied verbatim in the file "COPYING".
7//
8// In applying this license CERN does not waive the privileges and immunities
9// granted to it by virtue of its status as an Intergovernmental Organization
10// or submit itself to any jurisdiction.
11
14
17#include <fstream>
18#include <chrono>
19
20#include "GPUChainTracking.h"
21#include "GPUChainTrackingGetters.inc"
22#include "GPUReconstructionIO.h"
24#include "GPUTPCGMMergedTrack.h"
26#include "GPUTPCTrack.h"
27#include "GPUTPCHitId.h"
28#include "GPUTPCClusterData.h"
29#include "TPCZSLinkMapping.h"
30#include "GPUTRDTrackletWord.h"
32#include "GPUTPCMCInfo.h"
33#include "GPUTRDTrack.h"
34#include "GPUTRDTracker.h"
35#include "AliHLTTPCRawCluster.h"
37#include "GPUTRDRecoParam.h"
39#include "GPUQA.h"
40#include "GPULogging.h"
43#include "GPUNewCalibValues.h"
44#include "GPUTriggerOutputs.h"
45#include "GPUDefParametersRuntime.h"
46
48#include "GPUHostDataTypes.h"
50#include "GPUTrackingRefit.h"
51#include "CalibdEdxContainer.h"
52
53#include "TPCFastTransform.h"
55
56#include "utils/linux_helpers.h"
57#include "utils/strtag.h"
58using namespace o2::gpu;
59
60#include "GPUO2DataTypes.h"
61
62using namespace o2::tpc;
63using namespace o2::trd;
64
// Constructs the tracking chain on top of GPUChain(rec).
// The initializer list initializes mIOPtrs from processors()->ioPtrs, allocates two GPUTrackingInputProvider
// instances (mInputsHost, mInputsShadow), a ClusterNativeAccess, a GPUTriggerOutputs buffer and a std::ofstream
// for mDebugFile, and stores the maxTPCHits / maxTRDTracklets limits passed by the caller.
// NOTE(review): listing lines 67-69 (the constructor body) are not present in this extract.
65GPUChainTracking::GPUChainTracking(GPUReconstruction* rec, uint32_t maxTPCHits, uint32_t maxTRDTracklets) : GPUChain(rec), mIOPtrs(processors()->ioPtrs), mInputsHost(new GPUTrackingInputProvider), mInputsShadow(new GPUTrackingInputProvider), mClusterNativeAccess(new ClusterNativeAccess), mTriggerBuffer(new GPUTriggerOutputs), mMaxTPCHits(maxTPCHits), mMaxTRDTracklets(maxTRDTracklets), mDebugFile(new std::ofstream)
66{
70}
71
73
75{
76 if (mRec->IsGPU()) {
80 }
81
83 if (GetRecoSteps() & RecoStep::TPCSectorTracking) {
84 for (uint32_t i = 0; i < NSECTORS; i++) {
85 mRec->RegisterGPUProcessor(&processors()->tpcTrackers[i], GetRecoStepsGPU() & RecoStep::TPCSectorTracking);
86 }
87 }
88 if (GetRecoSteps() & RecoStep::TPCMerging) {
89 mRec->RegisterGPUProcessor(&processors()->tpcMerger, GetRecoStepsGPU() & RecoStep::TPCMerging);
90 }
91 if (GetRecoSteps() & RecoStep::TRDTracking) {
92 mRec->RegisterGPUProcessor(&processors()->trdTrackerGPU, GetRecoStepsGPU() & RecoStep::TRDTracking);
93 }
94 if (GetRecoSteps() & RecoStep::TRDTracking) {
95 mRec->RegisterGPUProcessor(&processors()->trdTrackerO2, GetRecoStepsGPU() & RecoStep::TRDTracking);
96 }
97 if (GetRecoSteps() & RecoStep::TPCCompression) {
98 mRec->RegisterGPUProcessor(&processors()->tpcCompressor, GetRecoStepsGPU() & RecoStep::TPCCompression);
99 }
100 if (GetRecoSteps() & RecoStep::TPCDecompression) {
101 mRec->RegisterGPUProcessor(&processors()->tpcDecompressor, GetRecoStepsGPU() & RecoStep::TPCDecompression);
102 }
103 if (GetRecoSteps() & RecoStep::TPCClusterFinding) {
104 for (uint32_t i = 0; i < NSECTORS; i++) {
105 mRec->RegisterGPUProcessor(&processors()->tpcClusterer[i], GetRecoStepsGPU() & RecoStep::TPCClusterFinding);
106#ifdef GPUCA_HAS_ONNX
107 mRec->RegisterGPUProcessor(&processors()->tpcNNClusterer[i], GetRecoStepsGPU() & RecoStep::TPCClusterFinding);
108#endif
109 }
110 }
111 if (GetRecoSteps() & RecoStep::Refit) {
112 mRec->RegisterGPUProcessor(&processors()->trackingRefit, GetRecoStepsGPU() & RecoStep::Refit);
113 }
114#ifdef GPUCA_KERNEL_DEBUGGER_OUTPUT
115 mRec->RegisterGPUProcessor(&processors()->debugOutput, true);
116#endif
118}
119
121{
122 if (mRec->IsGPU()) {
124 }
125 memcpy((void*)&processorsShadow()->trdTrackerGPU, (const void*)&processors()->trdTrackerGPU, sizeof(processors()->trdTrackerGPU));
126 if (GetRecoStepsGPU() & RecoStep::TPCSectorTracking) {
127 for (uint32_t i = 0; i < NSECTORS; i++) {
128 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->tpcTrackers[i], &processors()->tpcTrackers[i]);
129 }
130 }
131 if (GetRecoStepsGPU() & RecoStep::TPCMerging) {
132 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->tpcMerger, &processors()->tpcMerger);
133 }
134 if (GetRecoStepsGPU() & RecoStep::TRDTracking) {
135 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->trdTrackerGPU, &processors()->trdTrackerGPU);
136 }
137
138 memcpy((void*)&processorsShadow()->trdTrackerO2, (const void*)&processors()->trdTrackerO2, sizeof(processors()->trdTrackerO2));
139 if (GetRecoStepsGPU() & RecoStep::TRDTracking) {
140 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->trdTrackerO2, &processors()->trdTrackerO2);
141 }
142 if (GetRecoStepsGPU() & RecoStep::TPCCompression) {
143 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->tpcCompressor, &processors()->tpcCompressor);
144 }
145 if (GetRecoStepsGPU() & RecoStep::TPCDecompression) {
146 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->tpcDecompressor, &processors()->tpcDecompressor);
147 }
148 if (GetRecoStepsGPU() & RecoStep::TPCClusterFinding) {
149 for (uint32_t i = 0; i < NSECTORS; i++) {
150 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->tpcClusterer[i], &processors()->tpcClusterer[i]);
151#ifdef GPUCA_HAS_ONNX
152 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->tpcNNClusterer[i], &processors()->tpcNNClusterer[i]);
153#endif
154 }
155 }
156 if (GetRecoStepsGPU() & RecoStep::Refit) {
157 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->trackingRefit, &processors()->trackingRefit);
158 }
159#ifdef GPUCA_KERNEL_DEBUGGER_OUTPUT
160 mRec->RegisterGPUDeviceProcessor(&processorsShadow()->debugOutput, &processors()->debugOutput);
161#endif
162}
163
// Reports the memory sizes requested by this chain through the two output references.
//   gpuMem            [out] set to GPUCA_MEMORY_SIZE
//   pageLockedHostMem [out] set to GPUCA_HOST_MEMORY_SIZE
// Any previous content of the two arguments is overwritten; nothing else is read or modified here.
164void GPUChainTracking::MemorySize(size_t& gpuMem, size_t& pageLockedHostMem)
165{
166 gpuMem = GPUCA_MEMORY_SIZE;
167 pageLockedHostMem = GPUCA_HOST_MEMORY_SIZE;
168}
169
171{
173 GPUError("Invalid Reconstruction Step Setting: dEdx requires TPC Merger to be active");
174 return false;
175 }
177 GPUError("Invalid GPU Reconstruction Step Setting: dEdx requires TPC Merger to be active");
178 return false;
179 }
181 GPUError("Invalid Reconstruction Step Setting: Tracking requires TPC Conversion to be active");
182 return false;
183 }
185 GPUError("Invalid input, TPC Clusterizer needs TPC raw input");
186 return false;
187 }
189 GPUError("Invalid input / output / step, merger cannot read/store sectors tracks and needs TPC conversion");
190 return false;
191 }
193 if ((GetRecoSteps() & gpudatatypes::RecoStep::TPCMerging) && !tpcClustersAvail) {
194 GPUError("Invalid Inputs for track merging, TPC Clusters required");
195 return false;
196 }
197#ifndef GPUCA_TPC_GEOMETRY_O2
199 GPUError("Can not run TPC GPU Cluster Finding with Run 2 Data");
200 return false;
201 }
202#endif
204 GPUError("Missing input for TPC Cluster conversion / sector tracking / compression / dEdx: TPC Clusters required");
205 return false;
206 }
208 GPUError("Input for TPC merger missing");
209 return false;
210 }
212 GPUError("Input for TPC compressor missing");
213 return false;
214 }
216 GPUError("Input for TRD Tracker missing");
217 return false;
218 }
220 GPUError("TPC Raw / TPC Clusters / TRD Tracklets cannot be output");
221 return false;
222 }
224 GPUError("No TPC Merged Track Output available");
225 return false;
226 }
228 GPUError("No TPC Compression Output available");
229 return false;
230 }
232 GPUError("No TRD Tracker Output available");
233 return false;
234 }
235 if ((GetRecoSteps() & gpudatatypes::RecoStep::TPCdEdx) && (processors()->calibObjects.dEdxCalibContainer == nullptr)) {
236 GPUError("Cannot run dE/dx without dE/dx calibration container object");
237 return false;
238 }
239 if ((GetRecoSteps() & gpudatatypes::RecoStep::TPCClusterFinding) && processors()->calibObjects.tpcPadGain == nullptr) {
240 GPUError("Cannot run gain calibration without calibration object");
241 return false;
242 }
243 if ((GetRecoSteps() & gpudatatypes::RecoStep::TPCClusterFinding) && processors()->calibObjects.tpcZSLinkMapping == nullptr && mIOPtrs.tpcZS != nullptr) {
244 GPUError("Cannot run TPC ZS Decoder without mapping object. (tpczslinkmapping.dump missing?)");
245 return false;
246 }
247 return true;
248}
249
251{
252 int32_t gatherMode = mRec->GetProcessingSettings().tpcCompressionGatherMode == -1 ? mRec->getGPUParameters(mRec->GetRecoStepsGPU() & gpudatatypes::RecoStep::TPCCompression).par_COMP_GATHER_MODE : mRec->GetProcessingSettings().tpcCompressionGatherMode;
253 if ((param().rec.tpc.nWays & 1) == 0) {
254 GPUError("nWay setting musst be odd number!");
255 return false;
256 }
257 if (param().rec.tpc.mergerInterpolateErrors && param().rec.tpc.nWays < 3) {
258 GPUError("Cannot do error interpolation with NWays < 3!");
259 return false;
260 }
261 if (param().continuousMaxTimeBin > (int32_t)GPUSettings::TPC_MAX_TF_TIME_BIN) {
262 GPUError("configured max time bin exceeds 256 orbits");
263 return false;
264 }
265 if ((GetRecoStepsGPU() & RecoStep::TPCClusterFinding) && std::max(GetProcessingSettings().nTPCClustererLanes + 1, GetProcessingSettings().nTPCClustererLanes * 2) + (GetProcessingSettings().doublePipeline ? 1 : 0) > (int32_t)mRec->NStreams()) {
266 GPUError("NStreams of %d insufficient for %d nTPCClustererLanes", mRec->NStreams(), (int32_t)GetProcessingSettings().nTPCClustererLanes);
267 return false;
268 }
269 if ((mRec->GetRecoStepsGPU() & gpudatatypes::RecoStep::TPCCompression) && GetProcessingSettings().noGPUMemoryRegistration && gatherMode != 3) {
270 GPUError("noGPUMemoryRegistration only possible with gather mode 3 (set to %d / %d)", mRec->GetProcessingSettings().tpcCompressionGatherMode, gatherMode);
271 return false;
272 }
273 if (mRec->IsGPU() && (GetProcessingSettings().clusterizerZSSanityCheck || GetProcessingSettings().mergerSanityCheck)) {
274 GPUError("Clusterizer and merger Sanity checks only supported when not running on GPU");
275 return false;
276 }
277 if (GetProcessingSettings().tpcWriteClustersAfterRejection && (mRec->IsGPU() || param().rec.tpc.compressionTypeMask || !(GetRecoSteps() & gpudatatypes::RecoStep::TPCCompression))) {
278 GPUError("tpcWriteClustersAfterRejection requires compressionTypeMask = 0, no GPU usage, and compression enabled");
279 return false;
280 }
281 if (GetProcessingSettings().doublePipeline) {
282 if (GetProcessingSettings().tpcFreeAllocatedMemoryAfterProcessing) {
283 GPUError("Cannot use double pipeline with tpcFreeAllocatedMemoryAfterProcessing");
284 return false;
285 }
287 GPUError("Invalid outputs for double pipeline mode 0x%x", (uint32_t)GetRecoStepsOutputs());
288 return false;
289 }
294 GPUError("Must use external output for double pipeline mode");
295 return false;
296 }
297 if (gatherMode == 1) {
298 GPUError("Double pipeline incompatible to compression mode 1");
299 return false;
300 }
302 GPUError("Invalid reconstruction settings for double pipeline: Needs compression and cluster finding");
303 return false;
304 }
305 }
// Reject gather modes 1 and 3 when TPC compression is enabled but is not among the steps running on the GPU.
// The first operand has to test GetRecoSteps(): with GetRecoStepsGPU() on both sides the condition had the
// form "A && !A" and this check could never trigger.
306 if ((GetRecoSteps() & gpudatatypes::RecoStep::TPCCompression) && !(GetRecoStepsGPU() & gpudatatypes::RecoStep::TPCCompression) && (gatherMode == 1 || gatherMode == 3)) {
307 GPUError("Invalid tpcCompressionGatherMode for compression on CPU");
308 return false;
309 }
310 if (GetProcessingSettings().tpcApplyClusterFilterOnCPU > 0 && (GetRecoStepsGPU() & gpudatatypes::RecoStep::TPCClusterFinding || GetProcessingSettings().runMC)) {
311 GPUError("tpcApplyClusterFilterOnCPU cannot be used with GPU clusterization or with MC labels");
312 return false;
313 }
314 if (GetRecoSteps() & RecoStep::TRDTracking) {
315 if (GetProcessingSettings().trdTrackModelO2 && (GetProcessingSettings().createO2Output == 0 || (GetMatLUT() == nullptr && !GetProcessingSettings().willProvideO2PropagatorLate))) {
316 GPUError("TRD tracking can only run on O2 TPC tracks if createO2Output is enabled (%d), and matBudLUT is available (0x%p)", (int32_t)GetProcessingSettings().createO2Output, (void*)GetMatLUT());
317 return false;
318 }
319 if ((GetRecoStepsGPU() & RecoStep::TRDTracking) && !GetProcessingSettings().trdTrackModelO2 && GetProcessingSettings().createO2Output > 1) {
320 GPUError("TRD tracking can only run on GPU TPC tracks if the createO2Output setting does not suppress them");
321 return false;
322 }
323 if ((((GetRecoStepsGPU() & RecoStep::TRDTracking) && GetProcessingSettings().trdTrackModelO2) || ((GetRecoStepsGPU() & RecoStep::Refit) && !param().rec.trackingRefitGPUModel)) && (!GetProcessingSettings().o2PropagatorUseGPUField || (GetMatLUT() == nullptr && !GetProcessingSettings().willProvideO2PropagatorLate))) {
324 GPUError("Cannot use TRD tracking or Refit on GPU without GPU polynomial field map (%d) or matlut table (%p)", (int32_t)GetProcessingSettings().o2PropagatorUseGPUField, (void*)GetMatLUT());
325 return false;
326 }
327 }
328 return true;
329}
330
332{
333 const auto& threadContext = GetThreadContext();
334 if (GetProcessingSettings().debugLevel >= 1) {
335 printf("Enabled Reconstruction Steps: 0x%x (on GPU: 0x%x)", (int32_t)GetRecoSteps().get(), (int32_t)GetRecoStepsGPU().get());
336 for (uint32_t i = 0; i < sizeof(gpudatatypes::RECO_STEP_NAMES) / sizeof(gpudatatypes::RECO_STEP_NAMES[0]); i++) {
337 if (GetRecoSteps().isSet(1u << i)) {
338 printf(" - %s", gpudatatypes::RECO_STEP_NAMES[i]);
339 if (GetRecoStepsGPU().isSet(1u << i)) {
340 printf(" (G)");
341 }
342 }
343 }
344 printf("\n");
345 }
346 if (!ValidateSteps()) {
347 return 1;
348 }
349
350 for (uint32_t i = 0; i < mSubOutputControls.size(); i++) {
351 if (mSubOutputControls[i] == nullptr) {
353 }
354 }
355
356 if (!ValidateSettings()) {
357 return 1;
358 }
359
362 if (!qa) {
363 qa.reset(new GPUQA(this));
364 }
365 }
368 if (mEventDisplay == nullptr) {
369 throw std::runtime_error("Error loading event display");
370 }
371 }
372
375
376 if (mRec->IsGPU()) {
378 UpdateGPUCalibObjectsPtrs(-1); // First initialization, for users not using RunChain
380 WriteToConstantMemory(RecoStep::NoRecoStep, (char*)&processors()->errorCodes - (char*)processors(), &processorsShadow()->errorCodes, sizeof(processorsShadow()->errorCodes), -1);
381 TransferMemoryResourceLinkToGPU(RecoStep::NoRecoStep, mInputsHost->mResourceErrorCodes);
382 }
383
384 if (GetProcessingSettings().debugLevel >= 6) {
385 std::string filename = std::string(mRec->IsGPU() ? "GPU" : "CPU") + (mRec->slaveId() != -1 ? (std::string("_slave") + std::to_string(mRec->slaveId())) : std::string(mRec->slavesExist() ? "_master" : "")) + GetProcessingSettings().debugLogSuffix + ".out";
386 mDebugFile->open(filename.c_str());
387 }
388
389 return 0;
390}
391
393{
394 if (processors()->calibObjects.fastTransform && (ptrMask == nullptr || ptrMask->fastTransform)) {
395 memcpy((void*)mFlatObjectsShadow.mCalibObjects.fastTransform, (const void*)processors()->calibObjects.fastTransform, sizeof(*processors()->calibObjects.fastTransform));
396 memcpy((void*)mFlatObjectsShadow.mTpcTransformBuffer, (const void*)processors()->calibObjects.fastTransform->getFlatBufferPtr(), processors()->calibObjects.fastTransform->getFlatBufferSize());
397 mFlatObjectsShadow.mCalibObjects.fastTransform->clearInternalBufferPtr();
400 }
401 if (processors()->calibObjects.fastTransformMShape && (ptrMask == nullptr || ptrMask->fastTransformMShape)) {
402 memcpy((void*)mFlatObjectsShadow.mCalibObjects.fastTransformMShape, (const void*)processors()->calibObjects.fastTransformMShape, sizeof(*processors()->calibObjects.fastTransformMShape));
403 memcpy((void*)mFlatObjectsShadow.mTpcTransformMShapeBuffer, (const void*)processors()->calibObjects.fastTransformMShape->getFlatBufferPtr(), processors()->calibObjects.fastTransformMShape->getFlatBufferSize());
404 mFlatObjectsShadow.mCalibObjects.fastTransformMShape->clearInternalBufferPtr();
407 }
408 if (processors()->calibObjects.fastTransformRef && (ptrMask == nullptr || ptrMask->fastTransformRef)) {
409 memcpy((void*)mFlatObjectsShadow.mCalibObjects.fastTransformRef, (const void*)processors()->calibObjects.fastTransformRef, sizeof(*processors()->calibObjects.fastTransformRef));
410 memcpy((void*)mFlatObjectsShadow.mTpcTransformRefBuffer, (const void*)processors()->calibObjects.fastTransformRef->getFlatBufferPtr(), processors()->calibObjects.fastTransformRef->getFlatBufferSize());
411 mFlatObjectsShadow.mCalibObjects.fastTransformRef->clearInternalBufferPtr();
414 }
415 if (processors()->calibObjects.fastTransformHelper && (ptrMask == nullptr || ptrMask->fastTransformHelper)) {
416 memcpy((void*)mFlatObjectsShadow.mCalibObjects.fastTransformHelper, (const void*)processors()->calibObjects.fastTransformHelper, sizeof(*processors()->calibObjects.fastTransformHelper));
420 }
421 if (processors()->calibObjects.dEdxCalibContainer && (ptrMask == nullptr || ptrMask->dEdxCalibContainer)) {
422 memcpy((void*)mFlatObjectsShadow.mCalibObjects.dEdxCalibContainer, (const void*)processors()->calibObjects.dEdxCalibContainer, sizeof(*processors()->calibObjects.dEdxCalibContainer));
423 memcpy((void*)mFlatObjectsShadow.mdEdxSplinesBuffer, (const void*)processors()->calibObjects.dEdxCalibContainer->getFlatBufferPtr(), processors()->calibObjects.dEdxCalibContainer->getFlatBufferSize());
424 mFlatObjectsShadow.mCalibObjects.dEdxCalibContainer->clearInternalBufferPtr();
427 }
428 if (processors()->calibObjects.matLUT && (ptrMask == nullptr || ptrMask->matLUT)) {
429 memcpy((void*)mFlatObjectsShadow.mCalibObjects.matLUT, (const void*)processors()->calibObjects.matLUT, sizeof(*processors()->calibObjects.matLUT));
430 memcpy((void*)mFlatObjectsShadow.mMatLUTBuffer, (const void*)processors()->calibObjects.matLUT->getFlatBufferPtr(), processors()->calibObjects.matLUT->getFlatBufferSize());
431 mFlatObjectsShadow.mCalibObjects.matLUT->clearInternalBufferPtr();
434 }
435 if (processors()->calibObjects.trdGeometry && (ptrMask == nullptr || ptrMask->trdGeometry)) {
436 memcpy((void*)mFlatObjectsShadow.mCalibObjects.trdGeometry, (const void*)processors()->calibObjects.trdGeometry, sizeof(*processors()->calibObjects.trdGeometry));
437 mFlatObjectsShadow.mCalibObjects.trdGeometry->clearInternalBufferPtr();
438 }
439 if (processors()->calibObjects.trdRecoParam && (ptrMask == nullptr || ptrMask->trdRecoParam)) {
440 memcpy((void*)mFlatObjectsShadow.mCalibObjects.trdRecoParam, (const void*)processors()->calibObjects.trdRecoParam, sizeof(*processors()->calibObjects.trdRecoParam));
441 }
442 if (processors()->calibObjects.tpcPadGain && (ptrMask == nullptr || ptrMask->tpcPadGain)) {
443 memcpy((void*)mFlatObjectsShadow.mCalibObjects.tpcPadGain, (const void*)processors()->calibObjects.tpcPadGain, sizeof(*processors()->calibObjects.tpcPadGain));
444 }
445 if (processors()->calibObjects.tpcZSLinkMapping && (ptrMask == nullptr || ptrMask->tpcZSLinkMapping)) {
446 memcpy((void*)mFlatObjectsShadow.mCalibObjects.tpcZSLinkMapping, (const void*)processors()->calibObjects.tpcZSLinkMapping, sizeof(*processors()->calibObjects.tpcZSLinkMapping));
447 }
448 if (processors()->calibObjects.o2Propagator && (ptrMask == nullptr || ptrMask->o2Propagator)) {
449 memcpy((void*)mFlatObjectsShadow.mCalibObjects.o2Propagator, (const void*)processors()->calibObjects.o2Propagator, sizeof(*processors()->calibObjects.o2Propagator));
450 mFlatObjectsShadow.mCalibObjects.o2Propagator->setGPUField(&processorsDevice()->param.polynomialField);
452 }
454 memcpy((void*)&processorsShadow()->calibObjects, (void*)&mFlatObjectsDevice.mCalibObjects, sizeof(mFlatObjectsDevice.mCalibObjects));
455}
456
458{
459 WriteToConstantMemory(RecoStep::NoRecoStep, (char*)&processors()->calibObjects - (char*)processors(), &mFlatObjectsDevice.mCalibObjects, sizeof(mFlatObjectsDevice.mCalibObjects), stream);
460}
461
463{
467 }
468 if (mIOPtrs.tpcZS && param().rec.fwdTPCDigitsAsClusters) {
469 throw std::runtime_error("Forwading zero-suppressed hits not supported");
470 }
472 return 0;
473}
474
476{
478 if (!qa) {
479 qa.reset(new GPUQA(this));
480 }
481 if (!GetQA()->IsInitialized()) {
483 }
484 return 0;
485}
486
488{
489 if (GetProcessingSettings().runQA && GetQA()->IsInitialized() && !(mConfigQA && mConfigQA->shipToQC) && !mQAFromForeignChain) {
490 GetQA()->UpdateChain(this);
492 }
493 if (GetProcessingSettings().debugLevel >= 6) {
494 mDebugFile->close();
495 }
497 mCompressionStatistics->Finish();
498 }
499 return 0;
500}
501
503{
504 char* fastTransformBase = (char*)mem;
508 }
512 }
516 }
519 }
520 if ((char*)mem - fastTransformBase < mChainTracking->GetProcessingSettings().fastTransformObjectsMinMemorySize) {
521 mem = fastTransformBase + mChainTracking->GetProcessingSettings().fastTransformObjectsMinMemorySize; // TODO: Fixme and do proper dynamic allocation
522 }
525 }
528 }
529 char* dummyPtr;
533 } else if (mChainTracking->GetProcessingSettings().lateO2MatLutProvisioningSize) {
534 computePointerWithAlignment(mem, dummyPtr, mChainTracking->GetProcessingSettings().lateO2MatLutProvisioningSize);
535 }
539 }
542 }
545 }
548 mCalibObjects.o2Propagator = nullptr; // Always reserve memory for o2::Propagator, since it may be propagatred only during run() not during init().
549 }
551 mem = (char*)mem + mChainTracking->GetProcessingSettings().calibObjectsExtraMemorySize; // TODO: Fixme and do proper dynamic allocation
552 }
553 return mem;
554}
555
557{
558 std::memset((void*)&mIOPtrs, 0, sizeof(mIOPtrs));
560 new (&mIOMem) InOutMemory;
561 mClusterNativeAccessReduced.reset(nullptr);
562 if (mClusterNativeAccess.get()) {
563 memset((void*)mClusterNativeAccess.get(), 0, sizeof(*mClusterNativeAccess));
564 }
565}
566
568{
569 for (uint32_t i = 0; i < NSECTORS; i++) {
574 }
576 std::memset(mIOMem.clusterNativeAccess.get(), 0, sizeof(ClusterNativeAccess)); // ClusterNativeAccess has no its own constructor
590}
591
// Takes ownership of the TPC fast-transform object and of its correction-maps helper by moving both
// unique_ptrs into the members mTPCFastTransformU and mTPCFastTransformHelperU. The caller's pointers are
// left in the moved-from state.
// NOTE(review): listing lines 596-597 are missing from this extract; whatever they do with the newly
// stored objects is not visible here.
592void GPUChainTracking::SetTPCFastTransform(std::unique_ptr<TPCFastTransform>&& tpcFastTransform, std::unique_ptr<CorrectionMapsHelper>&& tpcTransformHelper)
593{
594 mTPCFastTransformU = std::move(tpcFastTransform);
595 mTPCFastTransformHelperU = std::move(tpcTransformHelper);
598}
599
// Takes ownership of the material lookup table by moving the unique_ptr into mMatLUTU.
// NOTE(review): listing line 603 is missing from this extract, so any follow-up use of the stored object is not visible here.
600void GPUChainTracking::SetMatLUT(std::unique_ptr<o2::base::MatLayerCylSet>&& lut)
601{
602 mMatLUTU = std::move(lut);
604}
605
// Takes ownership of the flat TRD geometry by moving the unique_ptr into mTRDGeometryU.
// NOTE(review): listing line 609 is missing from this extract, so any follow-up use of the stored object is not visible here.
606void GPUChainTracking::SetTRDGeometry(std::unique_ptr<o2::trd::GeometryFlat>&& geo)
607{
608 mTRDGeometryU = std::move(geo);
610}
611
// Takes ownership of the TRD reconstruction parameters by moving the unique_ptr into mTRDRecoParamU.
// NOTE(review): listing line 615 is missing from this extract, so any follow-up use of the stored object is not visible here.
612void GPUChainTracking::SetTRDRecoParam(std::unique_ptr<GPUTRDRecoParam>&& par)
613{
614 mTRDRecoParamU = std::move(par);
616}
617
// Applies the calibration values and calibration objects queued in mNewCalibValues / mNewCalibObjects.
// mMutexUpdateCalib is held (std::lock_guard) from the point of declaration until the function returns.
//   stream      - forwarded to the GPU transfer / update calls made below.
//   updateSlave - combined with mRec->slavesExist(); if both are true, UpdateGPUCalibObjectsPtrs() is called
//                 on GPU even when mUpdateNewCalibObjects is not set.
// Returns 1 if settings were pushed through mRec->UpdateSettings() or the GPU calib-object pointers were
// refreshed, otherwise 0.
// NOTE(review): listing lines 624, 639, 645, 656, 658, 663, 673 and 688 are absent from this extract, so a few
// closing braces below have no visible opener and the statements on those lines are unknown.
618int32_t GPUChainTracking::DoQueuedUpdates(int32_t stream, bool updateSlave)
619{
620 int32_t retVal = 0;
621 std::unique_ptr<GPUSettingsGRP> grp;
622 const GPUSettingsProcessing* p = nullptr;
623 std::lock_guard lk(mMutexUpdateCalib);
// If any scalar calibration value is flagged as new, start from a copy of the current GRP settings and
// overwrite only the flagged fields.
625 if (mNewCalibValues->newSolenoidField || mNewCalibValues->newContinuousMaxTimeBin || mNewCalibValues->newTPCTimeBinCut) {
626 grp = std::make_unique<GPUSettingsGRP>(mRec->GetGRPSettings());
627 if (mNewCalibValues->newSolenoidField) {
628 grp->solenoidBzNominalGPU = mNewCalibValues->solenoidField;
629 }
630 if (mNewCalibValues->newContinuousMaxTimeBin) {
631 grp->grpContinuousMaxTimeBin = mNewCalibValues->continuousMaxTimeBin;
632 }
633 if (mNewCalibValues->newTPCTimeBinCut) {
634 grp->tpcCutTimeBin = mNewCalibValues->tpcTimeBinCut;
635 }
636 }
637 }
638 if (GetProcessingSettings().tpcDownscaledEdx != 0) {
640 }
// Push the modified settings only if at least one of the two pointers was populated above.
641 if (grp || p) {
642 mRec->UpdateSettings(grp.get(), p);
643 retVal = 1;
644 }
// The XOR fires when exactly one of "propagator carries a GPU field" and "o2PropagatorUseGPUField" holds.
646 if (mNewCalibObjects->o2Propagator && ((mNewCalibObjects->o2Propagator->getGPUField() != nullptr) ^ GetProcessingSettings().o2PropagatorUseGPUField)) {
647 GPUFatal("GPU magnetic field for propagator requested, but received an O2 propagator without GPU field");
648 }
// Overlay every non-null entry of the queued object set onto processors()->calibObjects.
// Both structures are walked as flat arrays of void*, so this relies on them consisting of pointers only.
649 void* const* pSrc = (void* const*)mNewCalibObjects.get();
650 void** pDst = (void**)&processors()->calibObjects;
651 for (uint32_t i = 0; i < sizeof(processors()->calibObjects) / sizeof(void*); i++) {
652 if (pSrc[i]) {
653 pDst[i] = pSrc[i];
654 }
655 }
657 if (GetProcessingSettings().trdTrackModelO2) {
659 if (mRec->IsGPU()) {
660 TransferMemoryResourceLinkToGPU(RecoStep::NoRecoStep, processors()->trdTrackerO2.MemoryPermanent(), stream);
661 }
662 } else {
664 if (mRec->IsGPU()) {
665 TransferMemoryResourceLinkToGPU(RecoStep::NoRecoStep, processors()->trdTrackerGPU.MemoryPermanent(), stream);
666 }
667 }
668 }
669 if (mRec->IsGPU()) {
// Byte-wise snapshots of both flat-object descriptors, compared with memcmp further down to detect a change.
670 std::array<uint8_t, sizeof(GPUTrackingFlatObjects)> oldFlatPtrs, oldFlatPtrsDevice;
671 memcpy(oldFlatPtrs.data(), (void*)&mFlatObjectsShadow, oldFlatPtrs.size());
672 memcpy(oldFlatPtrsDevice.data(), (void*)&mFlatObjectsDevice, oldFlatPtrsDevice.size());
674 bool ptrsChanged = memcmp(oldFlatPtrs.data(), (void*)&mFlatObjectsShadow, oldFlatPtrs.size()) || memcmp(oldFlatPtrsDevice.data(), (void*)&mFlatObjectsDevice, oldFlatPtrsDevice.size());
675 if (ptrsChanged) {
676 GPUInfo("Updating all calib objects since pointers changed");
677 }
// A nullptr mask requests an update of all objects; otherwise the queued set is passed as the mask.
678 UpdateGPUCalibObjects(stream, ptrsChanged ? nullptr : mNewCalibObjects.get());
679 }
680 }
681
682 if ((mUpdateNewCalibObjects || (mRec->slavesExist() && updateSlave)) && mRec->IsGPU()) {
683 UpdateGPUCalibObjectsPtrs(stream); // Reinitialize
684 retVal = 1;
685 }
// The queued updates have been processed; release them.
686 mNewCalibObjects.reset(nullptr);
687 mNewCalibValues.reset(nullptr);
689 return retVal;
690}
691
693{
694 if ((((GetRecoSteps() & RecoStep::TRDTracking) && !GetProcessingSettings().trdTrackModelO2 && !GetProcessingSettings().willProvideO2PropagatorLate) || ((GetRecoSteps() & RecoStep::Refit) && !param().rec.trackingRefitGPUModel)) && processors()->calibObjects.o2Propagator == nullptr) {
695 GPUFatal("Cannot run TRD tracking or refit with o2 track model without o2 propagator"); // This check must happen during run, since o2::Propagator cannot be available during init
696 }
697 if (GetProcessingSettings().autoAdjustHostThreads && !mRec->IsGPU()) {
699 }
700 const auto threadContext = GetThreadContext();
701 if (GetProcessingSettings().runCompressionStatistics && mCompressionStatistics == nullptr) {
703 }
704 const bool needQA = GPUQA::QAAvailable() && (GetProcessingSettings().runQA || (GetProcessingSettings().eventDisplay && (mIOPtrs.nMCInfosTPC || GetProcessingSettings().runMC)));
705 if (needQA && GetQA()->IsInitialized() == false) {
707 return 1;
708 }
709 }
710 if (needQA) {
711 mFractionalQAEnabled = GetProcessingSettings().qcRunFraction == 100.f || (uint32_t)(rand() % 10000) < (uint32_t)(GetProcessingSettings().qcRunFraction * 100);
712 }
713 if (GetProcessingSettings().debugLevel >= 6) {
714 *mDebugFile << "\n\nProcessing event " << mRec->getNEventsProcessed() << std::endl;
715 }
717
718 mRec->getGeneralStepTimer(GeneralStep::Prepare).Start();
719 try {
721 } catch (const std::bad_alloc& e) {
722 GPUError("Memory Allocation Error");
723 return (1);
724 }
725 mRec->getGeneralStepTimer(GeneralStep::Prepare).Stop();
726
728
729 SynchronizeStream(0); // Synchronize all init copies that might be ongoing
730
731 if (GetProcessingSettings().debugOnFailure) {
732 mRec->setDebugDumpCallback([this]() { DoDebugRawDump(); });
733 }
734
736 if (runRecoStep(RecoStep::TPCDecompression, &GPUChainTracking::RunTPCDecompression)) {
737 return 1;
738 }
739 } else if (mIOPtrs.tpcPackedDigits || mIOPtrs.tpcZS) {
740 if (runRecoStep(RecoStep::TPCClusterFinding, &GPUChainTracking::RunTPCClusterizer, false)) {
741 return 1;
742 }
743 }
744
745 if (GetProcessingSettings().autoAdjustHostThreads && !mRec->IsGPU() && mIOPtrs.clustersNative) {
747 }
748
750 return 1;
751 }
752
753 mRec->PushNonPersistentMemory(qStr2Tag("TPCSLCD1")); // 1st stack level for TPC tracking sector data
755 if (runRecoStep(RecoStep::TPCSectorTracking, &GPUChainTracking::RunTPCTrackingSectors)) {
756 return 1;
757 }
758
759 if (runRecoStep(RecoStep::TPCMerging, &GPUChainTracking::RunTPCTrackingMerger, false)) {
760 return 1;
761 }
763 mRec->PopNonPersistentMemory(RecoStep::TPCSectorTracking, qStr2Tag("TPCSLCD1")); // Release 1st stack level, TPC sector data not needed after merger
765 }
766
768 if (GetProcessingSettings().doublePipeline) {
770 if (foreignChain && foreignChain->mIOPtrs.tpcZS) {
771 if (GetProcessingSettings().debugLevel >= 3) {
772 GPUInfo("Preempting tpcZS input of foreign chain");
773 }
774 mPipelineFinalizationCtx.reset(new GPUChainTrackingFinalContext);
775 mPipelineFinalizationCtx->rec = this->mRec;
776 foreignChain->mPipelineNotifyCtx = mPipelineFinalizationCtx.get();
777 }
778 }
779 if (runRecoStep(RecoStep::TPCCompression, &GPUChainTracking::RunTPCCompression)) {
780 return 1;
781 }
782 }
783
784 if (runRecoStep(RecoStep::TRDTracking, &GPUChainTracking::RunTRDTracking)) {
785 return 1;
786 }
787
788 if (runRecoStep(RecoStep::Refit, &GPUChainTracking::RunRefit)) {
789 return 1;
790 }
791
792 if (!GetProcessingSettings().doublePipeline) { // Synchronize with output copies running asynchronously
793 SynchronizeStream(OutputStream());
794 }
795
796 if (GetProcessingSettings().autoAdjustHostThreads && !mRec->IsGPU()) {
798 }
799
800 int32_t retVal = 0;
801 if (CheckErrorCodes(false, false, mRec->getErrorCodeOutput())) { // TODO: Eventually, we should use GPUReconstruction::CheckErrorCodes
802 retVal = 3;
803 if (!GetProcessingSettings().ignoreNonFatalGPUErrors) {
804 return retVal;
805 }
806 }
807
808 if (GetProcessingSettings().doublePipeline) {
809 return retVal;
810 }
811 int32_t retVal2 = RunChainFinalize();
812 return retVal2 ? retVal2 : retVal;
813}
814
// Final stage after the reconstruction steps: optional output sanity check, QA, and the interactive
// event-display loop.
// Returns 0 on normal completion, 1 if the event display fails to start, and 2 if the display control
// value is 2 after the key loop (the display is then shut down and detached from the processing settings).
// NOTE(review): listing lines 818-819, 838, 841 and 845 are absent from this extract. The brace closed at
// listing line 893 is opened on one of the missing lines, so the condition guarding the display block is not visible.
815int32_t GPUChainTracking::RunChainFinalize()
816{
817 if (mIOPtrs.clustersNative && (GetRecoSteps() & RecoStep::TPCCompression) && GetProcessingSettings().runCompressionStatistics) {
820 }
821
822 if (GetProcessingSettings().outputSanityCheck) {
823 OutputSanityCheck();
824 }
825
// QA is needed when runQA is set, or when an event display is configured and TPC MC info is present.
826 const bool needQA = GPUQA::QAAvailable() && (GetProcessingSettings().runQA || (GetProcessingSettings().eventDisplay && mIOPtrs.nMCInfosTPC));
827 if (needQA && mFractionalQAEnabled) {
828 mRec->getGeneralStepTimer(GeneralStep::QA).Start();
829 GetQA()->UpdateChain(this);
// The argument is true when runQA itself is off, i.e. QA was enabled only through the event-display branch of needQA.
830 GetQA()->RunQA(!GetProcessingSettings().runQA);
831 mRec->getGeneralStepTimer(GeneralStep::QA).Stop();
832 if (GetProcessingSettings().debugLevel == 0) {
833 GPUInfo("Total QA runtime: %d us", (int32_t)(mRec->getGeneralStepTimer(GeneralStep::QA).GetElapsedTime() * 1000000));
834 }
835 }
836
837 if (GetProcessingSettings().showOutputStat) {
839 }
840
842
843 // PrintMemoryRelations();
844
// First call starts the display; later calls advance it to the next event.
846 if (!mDisplayRunning) {
847 GPUInfo("Starting Event Display...");
848 if (mEventDisplay->StartDisplay()) {
849 GPUError("Error starting Event Display");
850 return (1);
851 }
852 mDisplayRunning = true;
853 } else {
854 mEventDisplay->ShowNextEvent();
855 }
856
857 mEventDisplay->WaitTillEventShown();
858
// Discard key presses that are already pending before prompting the user.
859 if (GetProcessingSettings().eventDisplay->EnableSendKey()) {
860 while (kbhit()) {
861 getch();
862 }
863 GPUInfo("Press key for next event!");
864 }
865
// Poll every 10 ms until the display control value becomes non-zero or 'n' is pressed.
866 int32_t iKey;
867 do {
868 usleep(10000);
869 if (GetProcessingSettings().eventDisplay->EnableSendKey()) {
870 iKey = kbhit() ? getch() : 0;
// 27 is the ASCII code of ESC: request display control value 2, which is handled after the loop.
871 if (iKey == 27) {
872 GetProcessingSettings().eventDisplay->setDisplayControl(2);
873 } else if (iKey == 'n') {
874 break;
875 } else if (iKey) {
// Wait until the previously posted key has been cleared (getSendKey() == 0) before posting the new one.
876 while (GetProcessingSettings().eventDisplay->getSendKey() != 0) {
877 usleep(1000);
878 }
879 GetProcessingSettings().eventDisplay->setSendKey(iKey);
880 }
881 }
882 } while (GetProcessingSettings().eventDisplay->getDisplayControl() == 0);
883 if (GetProcessingSettings().eventDisplay->getDisplayControl() == 2) {
884 mDisplayRunning = false;
885 GetProcessingSettings().eventDisplay->DisplayExit();
886 const_cast<GPUSettingsProcessing&>(GetProcessingSettings()).eventDisplay = nullptr; // TODO: fixme - eventDisplay should probably not be put into ProcessingSettings in the first place
887 return (2);
888 }
// Reset the control value so the next call waits for a fresh request.
889 GetProcessingSettings().eventDisplay->setDisplayControl(0);
890 GPUInfo("Loading next event...");
891
892 mEventDisplay->BlockTillNextEvent();
893 }
894
895 return 0;
896}
897
// Body of a member function whose signature line (listing line 898) is absent from this extract.
// NOTE(review): presumably GPUChainTracking::FinalizePipelinedProcessing() - confirm against the upstream file.
// If a pipeline finalization context is pending, block until its `ready` flag is set, drop the
// context, and then return whatever RunChainFinalize() returns.
899{
900 if (mPipelineFinalizationCtx) {
// Inner scope: the unique_lock goes out of scope before reset() below is called.
901 {
902 std::unique_lock<std::mutex> lock(mPipelineFinalizationCtx->mutex);
// Raw pointer copy so the wait predicate can read `ready` without capturing `this`.
903 auto* ctx = mPipelineFinalizationCtx.get();
// Sleeps on the context's condition variable until the predicate reports ready == true.
904 mPipelineFinalizationCtx->cond.wait(lock, [ctx]() { return ctx->ready; });
905 }
906 mPipelineFinalizationCtx.reset();
907 }
908 return RunChainFinalize();
909}
910
911int32_t GPUChainTracking::CheckErrorCodes(bool cpuOnly, bool forceShowErrors, std::vector<std::array<uint32_t, 4>>* fillErrors)
912{
913 int32_t retVal = 0;
914 bool hasDebugError = false;
915 for (int32_t i = 0; i < 1 + (!cpuOnly && mRec->IsGPU()); i++) {
916 if (i) {
917 const auto& threadContext = GetThreadContext();
918 if (GetProcessingSettings().doublePipeline) {
919 TransferMemoryResourceLinkToHost(RecoStep::NoRecoStep, mInputsHost->mResourceErrorCodes, 0);
921 } else {
922 TransferMemoryResourceLinkToHost(RecoStep::NoRecoStep, mInputsHost->mResourceErrorCodes);
923 }
924 }
925 if (processors()->errorCodes.hasError()) {
926 static int32_t errorsShown = 0;
927 static bool quiet = false;
928 static std::chrono::time_point<std::chrono::steady_clock> silenceFrom;
929 if (!quiet && errorsShown++ >= 10 && GetProcessingSettings().throttleAlarms && !forceShowErrors) {
930 silenceFrom = std::chrono::steady_clock::now();
931 quiet = true;
932 } else if (quiet) {
933 auto currentTime = std::chrono::steady_clock::now();
934 std::chrono::duration<double> elapsed_seconds = currentTime - silenceFrom;
935 if (elapsed_seconds.count() > 60 * 10) {
936 quiet = false;
937 errorsShown = 1;
938 }
939 }
940 retVal = 1;
941 if (GetProcessingSettings().throttleAlarms && !forceShowErrors) {
942 GPUWarning("GPUReconstruction suffered from an error in the %s part", i ? "GPU" : "CPU");
943 } else {
944 GPUError("GPUReconstruction suffered from an error in the %s part", i ? "GPU" : "CPU");
945 }
946 if (!quiet) {
947 processors()->errorCodes.printErrors(GetProcessingSettings().throttleAlarms && !forceShowErrors);
948 }
949 if (fillErrors) {
950 uint32_t nErrors = processors()->errorCodes.getNErrors();
951 const uint32_t* pErrors = processors()->errorCodes.getErrorPtr();
952 for (uint32_t j = 0; j < nErrors; j++) {
953 fillErrors->emplace_back(std::array<uint32_t, 4>{pErrors[4 * j], pErrors[4 * j + 1], pErrors[4 * j + 2], pErrors[4 * j + 3]});
954 }
955 }
956 if ((GetProcessingSettings().debugOnFailure & 1) || (GetProcessingSettings().debugOnFailure & 4)) {
957 if (GetProcessingSettings().debugOnFailureErrorMask == (uint64_t)-1) {
958 hasDebugError = true;
959 } else {
960 uint32_t nErrors = processors()->errorCodes.getNErrors();
961 const uint32_t* pErrors = processors()->errorCodes.getErrorPtr();
962 for (uint32_t j = 0; j < nErrors; j++) {
963 if (GetProcessingSettings().debugOnFailureErrorMask & (1 << pErrors[4 * j])) {
964 hasDebugError = true;
965 break;
966 }
967 }
968 }
969 }
970 }
971 }
972 ClearErrorCodes(cpuOnly);
973 if (hasDebugError) {
975 }
976 return retVal;
977}
978
// Body of a member function whose signature line (listing line 979) is absent from this extract.
// NOTE(review): presumably GPUChainTracking::ClearErrorCodes(bool cpuOnly) - confirm against the upstream file.
// NOTE(review): listing line 981 (first statement of the body) is absent from this extract as well.
980{
// Device side is only touched when running on a GPU and the caller did not ask for cpuOnly.
982 if (mRec->IsGPU() && !cpuOnly) {
// Binding to a const reference keeps the returned thread context alive until the end of this scope.
983 const auto& threadContext = GetThreadContext();
// Copy the shadow errorCodes object into constant memory, at the byte offset errorCodes has inside the processors struct (stream 0).
984 WriteToConstantMemory(RecoStep::NoRecoStep, (char*)&processors()->errorCodes - (char*)processors(), &processorsShadow()->errorCodes, sizeof(processorsShadow()->errorCodes), 0);
// Push the host error-code resource to the GPU on stream 0.
985 TransferMemoryResourceLinkToGPU(RecoStep::NoRecoStep, mInputsHost->mResourceErrorCodes, 0);
986 }
987}
988
// Body of a member function whose signature line (listing line 989) is absent from this extract.
// NOTE(review): presumably GPUChainTracking::SetUpdateCalibObjects(obj, vals) - confirm against the upstream file.
// Stores new calibration objects and values in mNewCalibObjects / mNewCalibValues, merging with
// anything already stored there. All of it happens under mMutexUpdateCalib.
990{
991 std::lock_guard lk(mMutexUpdateCalib);
992 if (mNewCalibObjects) {
// Objects already stored: view both structs as flat arrays of void* and overwrite only the
// slots for which obj carries a non-null pointer.
// NOTE(review): assumes GPUCalibObjectsConst consists solely of pointer members - confirm.
993 void* const* pSrc = (void* const*)&obj;
994 void** pDst = (void**)mNewCalibObjects.get();
995 for (uint32_t i = 0; i < sizeof(*mNewCalibObjects) / sizeof(void*); i++) {
996 if (pSrc[i]) {
997 pDst[i] = pSrc[i];
998 }
999 }
1000 } else {
// Nothing stored yet: keep a copy of obj.
1001 mNewCalibObjects.reset(new GPUCalibObjectsConst(obj));
1002 }
1003 if (mNewCalibValues) {
// Values already stored: let the existing object merge in vals.
1004 mNewCalibValues->updateFrom(&vals);
1005 } else {
1006 mNewCalibValues.reset(new GPUNewCalibValues(vals));
1007 }
// NOTE(review): listing line 1008 is absent from this extract.
1009}
1010
// Body of a member function whose signature line (listing line 1011) is absent from this extract.
// NOTE(review): presumably GPUChainTracking::GetDeviceO2Propagator() - confirm against the upstream file.
// Returns the o2Propagator pointer from the calibObjects of processorsShadow() when running on a
// GPU, and from those of processors() otherwise.
1012{
1013 return (mRec->IsGPU() ? processorsShadow() : processors())->calibObjects.o2Propagator;
1014}
1015
// Body of a member function whose signature line (listing line 1016) is absent from this extract.
// NOTE(review): presumably GPUChainTracking::SetO2Propagator(prop) - confirm against the upstream file.
// NOTE(review): listing line 1018 (first statement of the body) is absent from this extract as well.
1017{
// Fatal if "propagator has a GPU field" and the o2PropagatorUseGPUField setting disagree (XOR).
// NOTE(review): the XOR also fires when a GPU field is present but not requested, while the
// message below only describes the opposite case - confirm which is intended.
1019 if ((prop->getGPUField() != nullptr) ^ GetProcessingSettings().o2PropagatorUseGPUField) {
1020 GPUFatal("GPU magnetic field for propagator requested, but received an O2 propagator without GPU field");
1021 }
1022}
1023
1024void GPUChainTracking::ApplySyncSettings(GPUSettingsProcessing& proc, GPUSettingsRec& rec, gpudatatypes::RecoStepField& steps, bool syncMode, int32_t dEdxMode)
1025{
1026 if (syncMode) {
1027 rec.useMatLUT = false;
1028 }
1029 if (proc.rtc.optSpecialCode == -1) {
1030 proc.rtc.optSpecialCode = syncMode;
1031 }
1032 if (dEdxMode != -2) {
1033 steps.setBits(gpudatatypes::RecoStep::TPCdEdx, dEdxMode == -1 ? !syncMode : (dEdxMode > 0));
1034 }
1035}
Definition of container class for dE/dx corrections.
Helper class to access correction maps.
int32_t i
#define GPUCA_MEMORY_SIZE
#define GPUCA_HOST_MEMORY_SIZE
int32_t retVal
Online TRD tracker based on extrapolated TPC tracks.
Used for storing the MC labels for the TRD tracklets.
TRD Tracklet word for GPU tracker - 32bit tracklet info + half chamber ID + index.
Definition of a container to keep Monte Carlo truth external to simulation objects.
uint32_t j
Definition RawData.h:0
uint32_t c
Definition RawData.h:2
Definition of TPCFastTransform class.
void Start()
Definition timer.cxx:64
double GetElapsedTime()
Definition timer.cxx:115
void Stop()
Definition timer.cxx:76
bitfield & setBits(const bitfield v, bool w)
Definition bitfield.h:45
bool isSet(const bitfield &v) const
Definition bitfield.h:66
size_t getFlatBufferSize() const
Gives size of the flat buffer.
Definition FlatObject.h:256
void SetMatLUT(std::unique_ptr< o2::base::MatLayerCylSet > &&lut)
static void ApplySyncSettings(GPUSettingsProcessing &proc, GPUSettingsRec &rec, gpudatatypes::RecoStepField &steps, bool syncMode, int32_t dEdxMode=-2)
std::unique_ptr< o2::base::MatLayerCylSet > mMatLUTU
const o2::base::Propagator * GetDeviceO2Propagator()
std::unique_ptr< o2::tpc::ClusterNativeAccess > mClusterNativeAccess
std::unique_ptr< GPUTRDRecoParam > mTRDRecoParamU
void SetTRDGeometry(std::unique_ptr< o2::trd::GeometryFlat > &&geo)
GPUChainTracking * mQAFromForeignChain
void SetO2Propagator(const o2::base::Propagator *prop)
std::unique_ptr< GPUQA > mQA
std::unique_ptr< CorrectionMapsHelper > mTPCFastTransformHelperU
GPUTrackingFlatObjects mFlatObjectsDevice
int32_t RunTPCClusterizer(bool synchronizeOutput=true)
void UpdateGPUCalibObjectsPtrs(int32_t stream)
int32_t RunTPCTrackingMerger(bool synchronizeOutput=true)
std::unique_ptr< GPUTrackingInputProvider > mInputsHost
std::unique_ptr< GPUTPCClusterStatistics > mCompressionStatistics
const o2::base::MatLayerCylSet * GetMatLUT() const
void SetTRDRecoParam(std::unique_ptr< GPUTRDRecoParam > &&par)
std::array< GPUOutputControl *, GPUTrackingOutputs::count()> mSubOutputControls
std::unique_ptr< std::ofstream > mDebugFile
void SetUpdateCalibObjects(const GPUCalibObjectsConst &obj, const GPUNewCalibValues &vals)
std::unique_ptr< GPUCalibObjectsConst > mNewCalibObjects
std::unique_ptr< o2::trd::GeometryFlat > mTRDGeometryU
GPUTrackingFlatObjects mFlatObjectsShadow
void RegisterPermanentMemoryAndProcessors() override
void RegisterGPUProcessors() override
void ClearErrorCodes(bool cpuOnly=false)
const GPUQA * GetQA() const
void MemorySize(size_t &gpuMem, size_t &pageLockedHostMem) override
void SetTPCFastTransform(std::unique_ptr< TPCFastTransform > &&tpcFastTransform, std::unique_ptr< CorrectionMapsHelper > &&tpcTransformHelper)
int32_t DoQueuedUpdates(int32_t stream, bool updateSlave=true)
std::unique_ptr< GPUNewCalibValues > mNewCalibValues
int32_t CheckErrorCodes(bool cpuOnly=false, bool forceShowErrors=false, std::vector< std::array< uint32_t, 4 > > *fillErrors=nullptr) override
std::unique_ptr< TPCFastTransform > mTPCFastTransformU
int32_t PrepareEvent() override
GPUChainTracking(GPUReconstruction *rec, uint32_t maxTPCHits=GPUCA_MAX_CLUSTERS, uint32_t maxTRDTracklets=GPUCA_MAX_TRD_TRACKLETS)
void UpdateGPUCalibObjects(int32_t stream, const GPUCalibObjectsConst *ptrMask=nullptr)
GPUTrackingInOutPointers & mIOPtrs
struct o2::gpu::GPUChainTracking::InOutMemory mIOMem
const o2::tpc::CalibdEdxContainer * GetdEdxCalibContainer() const
std::unique_ptr< GPUTrackingInputProvider > mInputsShadow
const GPUSettingsQA * mConfigQA
int32_t FinalizePipelinedProcessing() override
std::unique_ptr< GPUDisplayInterface > mEventDisplay
std::unique_ptr< o2::tpc::ClusterNativeAccess > mClusterNativeAccessReduced
void TransferMemoryResourceLinkToGPU(RecoStep step, int16_t res, int32_t stream=-1, deviceEvent *ev=nullptr, deviceEvent *evList=nullptr, int32_t nEvents=1)
Definition GPUChain.h:124
GPUConstantMem * processorsDevice()
Definition GPUChain.h:86
GPUReconstruction::RecoStepField GetRecoStepsGPU() const
Definition GPUChain.h:72
GPUReconstruction::RecoStepField GetRecoSteps() const
Definition GPUChain.h:71
void WriteToConstantMemory(RecoStep step, size_t offset, const void *src, size_t size, int32_t stream=-1, deviceEvent *ev=nullptr)
Definition GPUChain.h:127
GPUChain * GetNextChainInQueue()
Definition GPUChain.h:225
GPUReconstruction::InOutTypeField GetRecoStepsOutputs() const
Definition GPUChain.h:74
virtual std::unique_ptr< GPUReconstructionProcessing::threadContext > GetThreadContext()
Definition GPUChain.h:109
GPUConstantMem * processors()
Definition GPUChain.h:84
GPUParam & param()
Definition GPUChain.h:87
const GPUSettingsProcessing & GetProcessingSettings() const
Definition GPUChain.h:76
void SynchronizeStream(int32_t stream)
Definition GPUChain.h:89
GPUReconstructionCPU * mRec
Definition GPUChain.h:79
GPUConstantMem * processorsShadow()
Definition GPUChain.h:85
GPUReconstruction::InOutTypeField GetRecoStepsInputs() const
Definition GPUChain.h:73
static constexpr int32_t NSECTORS
Definition GPUChain.h:58
void TransferMemoryResourceLinkToHost(RecoStep step, int16_t res, int32_t stream=-1, deviceEvent *ev=nullptr, deviceEvent *evList=nullptr, int32_t nEvents=1)
Definition GPUChain.h:125
void AllocateIOMemoryHelper(uint32_t n, const T *&ptr, std::unique_ptr< T[]> &u)
Definition GPUChain.h:139
int32_t runRecoStep(RecoStep step, S T::*func, Args... args)
Definition GPUChain.h:287
GPUReconstruction * rec()
Definition GPUChain.h:66
static GPUDisplayInterface * getDisplay(GPUDisplayFrontendInterface *frontend, GPUChainTracking *chain, GPUQA *qa, const GPUParam *param=nullptr, const GPUCalibObjectsConst *calib=nullptr, const GPUSettingsDisplay *config=nullptr, const GPUSettingsProcessing *proc=nullptr)
const uint32_t * getErrorPtr() const
Definition GPUErrors.cxx:96
void setMemory(GPUglobalref() uint32_t *m)
Definition GPUErrors.h:37
bool printErrors(bool silent=false, uint64_t mask=0)
Definition GPUErrors.cxx:61
uint32_t getNErrors() const
Definition GPUErrors.cxx:91
static void computePointerWithAlignment(T *&basePtr, S *&objPtr, size_t nEntries=1)
void InitGPUProcessor(GPUReconstruction *rec, ProcessorType type=PROCESSOR_TYPE_CPU, GPUProcessor *slaveProcessor=nullptr)
static bool QAAvailable()
Definition GPUQA.h:57
int32_t DrawQAHistograms()
Definition GPUQA.h:47
void UpdateChain(GPUChainTracking *chain)
Definition GPUQA.h:59
static bool IsInitialized()
Definition GPUQA.h:58
int32_t InitQA(int32_t tasks=0)
Definition GPUQA.h:45
void RunQA(bool matchOnly=false)
Definition GPUQA.h:46
HighResTimer & getGeneralStepTimer(GeneralStep step)
const GPUDefParameters & getGPUParameters(bool doGPU) const override
std::vector< std::array< uint32_t, 4 > > * getErrorCodeOutput()
RecoStepField GetRecoStepsGPU() const
void RegisterGPUDeviceProcessor(GPUProcessor *proc, GPUProcessor *slaveProcessor)
void RegisterGPUProcessor(T *proc, bool deviceSlave)
void setDebugDumpCallback(std::function< void()> &&callback=std::function< void()>(nullptr))
void ResetRegisteredMemoryPointers(GPUProcessor *proc)
int16_t RegisterMemoryAllocation(T *proc, void *(T::*setPtr)(void *), int32_t type, const char *name="", const GPUMemoryReuse &re=GPUMemoryReuse())
void PopNonPersistentMemory(RecoStep step, uint64_t tag, const GPUProcessor *proc=nullptr)
void UpdateSettings(const GPUSettingsGRP *g, const GPUSettingsProcessing *p=nullptr, const GPUSettingsRecDynamic *d=nullptr)
void PushNonPersistentMemory(uint64_t tag)
GPUMemorySizeScalers * MemoryScalers()
const GPUSettingsProcessing & GetProcessingSettings() const
const GPUSettingsGRP & GetGRPSettings() const
GPUOutputControl & OutputControl()
static constexpr const uint32_t TPC_MAX_TF_TIME_BIN
Definition GPUSettings.h:47
GLenum GLfloat param
Definition glcorearb.h:271
GLuint GLuint stream
Definition glcorearb.h:1806
GPUCalibObjectsTemplate< ConstPtr > GPUCalibObjectsConst
Global TPC definitions and constants.
Definition SimTraits.h:168
Defining DataPointCompositeObject explicitly as copiable.
std::string to_string(gsl::span< T, Size > span)
Definition common.h:52
std::string filename()
std::unique_ptr< GPUDisplayFrontendInterface > eventDisplay
GPUReconstruction * rec
constexpr T qStr2Tag(const char(&str)[N])
Definition strtag.h:24
S< o2::trd::GeometryFlat >::type * trdGeometry
S< o2::tpc::CalibdEdxContainer >::type * dEdxCalibContainer
S< TPCZSLinkMapping >::type * tpcZSLinkMapping
S< TPCFastTransform >::type * fastTransform
S< GPUTRDRecoParam >::type * trdRecoParam
S< TPCPadGainCalib >::type * tpcPadGain
S< o2::base::PropagatorImpl< float > >::type * o2Propagator
S< o2::base::MatLayerCylSet >::type * matLUT
S< CorrectionMapsHelper >::type * fastTransformHelper
S< TPCFastTransform >::type * fastTransformRef
S< TPCFastTransform >::type * fastTransformMShape
std::unique_ptr< GPUTPCMCInfo[]> mcInfosTPC
std::unique_ptr< GPUTRDTrackletWord[]> trdTracklets
std::unique_ptr< GPUTPCMCInfoCol[]> mcInfosTPCCol
std::unique_ptr< GPUTPCGMMergedTrackHit[]> mergedTrackHits
std::unique_ptr< int32_t[]> trdTrackletIdxFirst
std::unique_ptr< GPUTPCGMMergedTrack[]> mergedTracks
std::unique_ptr< AliHLTTPCClusterMCLabel[]> mcLabelsTPC
std::unique_ptr< GPUTPCClusterData[]> clusterData[NSECTORS]
std::unique_ptr< o2::tpc::ClusterNative[]> clustersNative
std::unique_ptr< float[]> trdTriggerTimes
std::unique_ptr< GPUTPCTrack[]> sectorTracks[NSECTORS]
std::unique_ptr< GPUTRDSpacePoint[]> trdSpacePoints
std::unique_ptr< uint8_t[]> trdTrigRecMask
std::unique_ptr< o2::tpc::ClusterNativeAccess > clusterNativeAccess
std::unique_ptr< AliHLTTPCRawCluster[]> rawClusters[NSECTORS]
std::unique_ptr< GPUTPCHitId[]> sectorClusters[NSECTORS]
std::unique_ptr< GPUTRDTrackGPU[]> trdTracks
GPUTRDTrackerGPU trdTrackerGPU
GPUCalibObjectsConst calibObjects
const GPUTPCHitId * sectorClusters[NSECTORS]
const o2::tpc::ClusterNativeAccess * clustersNative
const o2::tpc::CompressedClustersFlat * tpcCompressedClusters
const AliHLTTPCClusterMCLabel * mcLabelsTPC
const GPUTRDSpacePoint * trdSpacePoints
const GPUTPCTrack * sectorTracks[NSECTORS]
const GPUTRDTrackGPU * trdTracks
const GPUTRDTrackletWord * trdTracklets
const GPUTrackingInOutZS * tpcZS
const AliHLTTPCRawCluster * rawClusters[NSECTORS]
const GPUTPCClusterData * clusterData[NSECTORS]
const GPUTPCGMMergedTrackHit * mergedTrackHits
const GPUTrackingInOutDigits * tpcPackedDigits
const GPUTPCMCInfoCol * mcInfosTPCCol
const GPUTPCGMMergedTrack * mergedTracks
size_t getIndex(const GPUOutputControl &v)
GPUOutputControl sharedClusterMap
GPUOutputControl compressedClusters