23#include <condition_variable>
51struct GPUReconstructionPipelineQueue {
55 std::condition_variable c;
62 std::queue<GPUReconstructionPipelineQueue*>
queue;
64 std::condition_variable
cond;
// Byte distance between two raw pointers (a - b).
// Pointer subtraction is only defined on object pointers of the same type,
// so both operands are viewed as char* to get a difference in bytes.
// Note: the result is signed and may be negative when a precedes b.
static ptrdiff_t ptrDiff(void* a, void* b)
{
  return static_cast<char*>(a) - static_cast<char*>(b);
}
81 throw std::invalid_argument(
"device type of master and slave GPUReconstruction does not match");
84 throw std::invalid_argument(
"Cannot be slave to a slave");
98 mROOTDump = GPUROOTDumpCore::getAndCreate();
105 GPUError(
"GPU Reconstruction not properly deinitialized!");
109void GPUReconstruction::GetITSTraits(std::unique_ptr<o2::its::TrackerTraits>* trackerTraits, std::unique_ptr<o2::its::VertexerTraits>* vertexerTraits, std::unique_ptr<o2::its::TimeFrame>* timeFrame)
114 if (vertexerTraits) {
124 return std::max<int32_t>(0, tbb::this_task_arena::current_thread_index());
130 throw std::runtime_error(
"Must not call init on slave!");
136 for (uint32_t
i = 0;
i <
mSlaves.size();
i++) {
139 GPUError(
"Error initialization slave (before deviceinit)");
154 for (uint32_t
i = 0;
i <
mSlaves.size();
i++) {
162 GPUError(
"Error initialization slave (deviceinit)");
166 GPUError(
"Error initialization slave (permanent memory)");
177 for (uint32_t
i = 0;
i <
mSlaves.size();
i++) {
182 GPUError(
"Error initialization slave (after device init)");
192static uint32_t getDefaultNThreads()
194 const char* tbbEnv = getenv(
"TBB_NUM_THREADS");
195 uint32_t tbbNum = tbbEnv ? atoi(tbbEnv) : 0;
199 const char* ompEnv = getenv(
"OMP_NUM_THREADS");
200 uint32_t ompNum = ompEnv ? atoi(ompEnv) : 0;
204 return tbb::info::default_concurrency();
212 printf(
"\nConfig Dump %s\n",
mMaster ?
"Slave" :
"Master");
215 for (uint32_t
i = 0;
i <
mChains.size();
i++) {
259#ifndef GPUCA_NO_FAST_MATH
260 GPUError(
"Warning, deterministicGPUReconstruction needs GPUCA_NO_FAST_MATH for being fully deterministic, without only most indeterminism by concurrency is removed, but floating point effects remain!");
264 if (
param().
rec.tpc.looperInterpolationInExtraPass == -1) {
265 param().
rec.tpc.looperInterpolationInExtraPass = 0;
314 GPUFatal(
"Must not use both nHostThreads and ompThreads at the same time!");
317 GPUWarning(
"You are using the deprecated ompThreads option, please switch to nHostThreads!");
327 mThreading = std::make_shared<GPUReconstructionThreading>();
328 mThreading->control = std::make_unique<tbb::global_control>(tbb::global_control::max_allowed_parallelism,
mMaxHostThreads);
346 GPUError(
"Invalid value for nTPCClustererLanes: %d",
mProcessingSettings.nTPCClustererLanes);
351 GPUError(
"Must use double pipeline mode only with exactly one chain that must support it");
360 for (uint32_t
i = 0;
i <
mChains.size();
i++) {
364 mChains[
i]->RegisterPermanentMemoryAndProcessors();
365 size_t memPrimary, memPageLocked;
366 mChains[
i]->MemorySize(memPrimary, memPageLocked);
368 memPageLocked = memPrimary;
395 for (uint32_t
i = 0;
i <
mChains.size();
i++) {
396 mChains[
i]->RegisterGPUProcessors();
408 for (uint32_t
i = 0;
i <
mChains.size();
i++) {
433 for (uint32_t
i = 0;
i <
mChains.size();
i++) {
444 for (uint32_t
i = 0;
i <
mSlaves.size();
i++) {
446 GPUError(
"Error exiting slave");
475 auto& re = it->second;
476 if (proc ==
nullptr || re.proc == proc) {
478 resMain.mOverrideSize = 0;
479 for (uint32_t
i = 0;
i < re.res.size();
i++) {
481 resMain.mOverrideSize = std::max<size_t>(resMain.mOverrideSize, ptrDiff(
res.SetPointers((
void*)1), (
char*)1));
490 GPUInfo(
"Allocating memory %p", (
void*)proc);
503 GPUInfo(
"Allocating memory done");
511 GPUInfo(
"Allocating Permanent Memory");
522 GPUInfo(
"Permanent Memory Done");
529 if (
res->mReuse >= 0) {
531 if (
ptr ==
nullptr) {
532 GPUError(
"Invalid reuse ptr (%s)",
res->mName);
533 throw std::bad_alloc();
538 throw std::bad_alloc();
541 std::cout <<
"Reused (" << device <<
") " <<
res->mName <<
": " <<
retVal <<
"\n";
545 if (memorypool ==
nullptr) {
546 GPUError(
"Cannot allocate memory from uninitialized pool");
547 throw std::bad_alloc();
551 retVal = ptrDiff((
res->*setPtr)((
char*)1), (
char*)(1));
552 memorypoolend = (
void*)((
char*)memorypoolend - GPUProcessor::getAlignmentMod<GPUCA_MEMALIGN>(memorypoolend));
553 if (retVal < res->mOverrideSize) {
556 retVal += GPUProcessor::getAlignment<GPUCA_MEMALIGN>(
retVal);
557 memorypoolend = (
char*)memorypoolend -
retVal;
562 memorypool = (
char*)((
res->*setPtr)(
ptr));
564 if (retVal < res->mOverrideSize) {
566 memorypool = (
char*)
ptr +
res->mOverrideSize;
568 memorypool = (
void*)((
char*)memorypool + GPUProcessor::getAlignment<GPUCA_MEMALIGN>(memorypool));
570 if (memorypoolend ? (memorypool > memorypoolend) : ((size_t)ptrDiff(memorypool, memorybase) > memorysize)) {
571 std::cerr <<
"Memory pool size exceeded (" << device <<
") (" <<
res->mName <<
": " << (memorypoolend ? (memorysize + ptrDiff(memorypool, memorypoolend)) : ptrDiff(memorypool, memorybase)) <<
" < " << memorysize <<
"\n";
572 throw std::bad_alloc();
575 std::cout <<
"Allocated (" << device <<
") " <<
res->mName <<
": " <<
retVal <<
" - available: " << (memorypoolend ? ptrDiff(memorypoolend, memorypool) : (memorysize - ptrDiff(memorypool, memorybase))) <<
"\n";
584 if (
res->mPtrDevice &&
res->mReuse < 0) {
587 res->mSize = std::max((
size_t)
res->SetPointers((
void*)1) - 1,
res->mOverrideSize);
588 if (
res->mReuse >= 0) {
590 GPUError(
"Invalid reuse, insufficient size: %ld < %ld", (int64_t)
mMemoryResources[
res->mReuse].mSize, (int64_t)
res->mSize);
591 throw std::bad_alloc();
597 res->mPtr = GPUProcessor::alignPointer<GPUCA_BUFFER_ALIGNMENT>(
res->mPtrDevice);
598 res->SetPointers(
res->mPtr);
600 std::cout << (
res->mReuse >= 0 ?
"Reused " :
"Allocated ") <<
res->mName <<
": " <<
res->mSize <<
"\n";
606 GPUError(
"Got buffer with insufficient alignment");
607 throw std::bad_alloc();
611 if (
res->mPtr !=
nullptr) {
612 GPUError(
"Double allocation! (%s)",
res->mName);
613 throw std::bad_alloc();
621 res->mSize = std::max((
size_t)
res->SetPointers((
void*)1) - 1,
res->mOverrideSize);
622 res->mPtr = control->
allocator(CAMath::nextMultipleOf<GPUCA_BUFFER_ALIGNMENT>(
res->mSize));
623 res->mSize = std::max<size_t>(ptrDiff(
res->SetPointers(
res->mPtr),
res->mPtr),
res->mOverrideSize);
625 std::cout <<
"Allocated (from callback) " <<
res->mName <<
": " <<
res->mSize <<
"\n";
628 void* dummy =
nullptr;
635 GPUError(
"Got buffer with insufficient alignment");
636 throw std::bad_alloc();
640 if (
res->mProcessor->mLinkedProcessor ==
nullptr) {
641 GPUError(
"Device Processor not set (%s)",
res->mName);
642 throw std::bad_alloc();
648 }
else if (
size !=
res->mSize) {
649 GPUError(
"Inconsistent device memory allocation (%s: device %lu vs %lu)",
res->mName,
size,
res->mSize);
650 throw std::bad_alloc();
653 GPUError(
"Got buffer with insufficient alignment");
654 throw std::bad_alloc();
674 return res->mReuse >= 0 ? 0 :
res->mSize;
680 throw std::runtime_error(
"Requested invalid memory typo for unmanaged allocation");
684 return GPUProcessor::alignPointer<GPUCA_BUFFER_ALIGNMENT>(
mUnmanagedChunks.back().get());
690 if (pool > poolend) {
691 GPUError(
"Insufficient unmanaged memory: missing %ld bytes", ptrDiff(pool, poolend));
692 throw std::bad_alloc();
714 throw std::bad_alloc();
730 return GPUProcessor::alignPointer<GPUCA_BUFFER_ALIGNMENT>(
mVolatileChunks.back().get());
747 size_t size = ptrDiff(
res->SetPointers(basePtr), basePtr);
748 if (basePtr &&
size > std::max(
res->mSize,
res->mOverrideSize)) {
749 std::cerr <<
"Updated pointers exceed available memory size: " <<
size <<
" > " << std::max(
res->mSize,
res->mOverrideSize) <<
" - host - " <<
res->mName <<
"\n";
750 throw std::bad_alloc();
755 size_t size = ptrDiff(
res->SetDevicePointers(basePtr), basePtr);
756 if (basePtr &&
size > std::max(
res->mSize,
res->mOverrideSize)) {
757 std::cerr <<
"Updated pointers exceed available memory size: " <<
size <<
" > " << std::max(
res->mSize,
res->mOverrideSize) <<
" - GPU - " <<
res->mName <<
"\n";
758 throw std::bad_alloc();
780 std::cout <<
"Freeing " <<
res->mName <<
": size " <<
res->mSize <<
" (reused " <<
res->mReuse <<
")\n";
786 res->mPtrDevice =
nullptr;
817 GPUFatal(
"Trying to pop memory state from empty stack");
824 printf(
"Allocated Device memory after %30s (%8s): %'13zd (non temporary %'13zd, blocked %'13zd)\n",
GPUDataTypes::RECO_STEP_NAMES[
getRecoStepNum(step,
true)],
qTag2Str(std::get<3>(
mNonPersistentMemoryStack.back())).c_str(), ptrDiff(
mDeviceMemoryPool,
mDeviceMemoryBase) + ptrDiff((
char*)
mDeviceMemoryBase +
mDeviceMemorySize,
mDeviceMemoryPoolEnd), ptrDiff(
mDeviceMemoryPool,
mDeviceMemoryBase),
mDeviceMemoryPoolBlocked ? ptrDiff((
char*)
mDeviceMemoryBase +
mDeviceMemorySize,
mDeviceMemoryPoolBlocked) : 0);
826 printf(
"Allocated Host memory after %30s (%8s): %'13zd (non temporary %'13zd, blocked %'13zd)\n",
GPUDataTypes::RECO_STEP_NAMES[
getRecoStepNum(step,
true)],
qTag2Str(std::get<3>(
mNonPersistentMemoryStack.back())).c_str(), ptrDiff(
mHostMemoryPool,
mHostMemoryBase) + ptrDiff((
char*)
mHostMemoryBase +
mHostMemorySize,
mHostMemoryPoolEnd), ptrDiff(
mHostMemoryPool,
mHostMemoryBase),
mHostMemoryPoolBlocked ? ptrDiff((
char*)
mHostMemoryBase +
mHostMemorySize,
mHostMemoryPoolBlocked) : 0);
834 if (
res->mReuse < 0) {
838 res->mPtrDevice =
nullptr;
847 throw std::runtime_error(
"temporary memory stack already blocked");
856 throw std::runtime_error(
"cannot unblock while there is stacked memory");
900 printf(
"Memory Allocation: Host %'zd / %'zu (Permanent %'zd), Device %'zd / %'zu, (Permanent %'zd) %zu chunks\n",
908 std::map<std::string, std::array<size_t, 3>>
sizes;
911 if (
res.mReuse >= 0) {
918 if (
res.mPtrDevice) {
925 printf(
"%59s CPU / %9s GPU\n",
"",
"");
926 for (
auto it =
sizes.begin(); it !=
sizes.end(); it++) {
927 printf(
"Allocation %30s %s: Size %'14zu / %'14zu\n", it->first.c_str(), it->second[2] ?
"P" :
" ", it->second[0], it->second[1]);
930 for (uint32_t
i = 0;
i <
mChains.size();
i++) {
931 mChains[
i]->PrintMemoryStatistics();
965constexpr static inline int32_t getStepNum(T step,
bool validCheck, int32_t N,
const char* err =
"Invalid step num")
967 static_assert(
sizeof(step) ==
sizeof(uint32_t),
"Invalid step enum size");
968 int32_t
retVal = 8 *
sizeof(uint32_t) - 1 - CAMath::Clz((uint32_t)step);
969 if ((uint32_t)step == 0 ||
retVal >= N) {
973 throw std::runtime_error(
"Invalid General Step");
986 throw std::invalid_argument(
"Cannot start double pipeline mode");
989 GPUInfo(
"Pipeline worker started");
991 bool terminate =
false;
997 GPUReconstructionPipelineQueue* q;
1006 q->retVal = q->chain->RunChain();
1009 std::lock_guard<std::mutex> lk(q->m);
1015 GPUInfo(
"Pipeline worker ended");
1028 std::unique_ptr<GPUReconstructionPipelineQueue> qu(
new GPUReconstructionPipelineQueue);
1029 GPUReconstructionPipelineQueue* q = qu.get();
1030 q->chain = terminate ? nullptr :
mChains[0].get();
1031 q->op = terminate ? 1 : 0;
1032 std::unique_lock<std::mutex> lkdone(q->m);
1036 throw std::runtime_error(
"Must not enqueue work after termination request");
1042 q->c.wait(lkdone, [&q]() {
return q->done; });
1049 return mChains[0]->FinalizePipelinedProcessing();
1063 for (uint32_t
i = 0;
i <
mChains.size();
i++) {
1082 for (uint32_t
i = 0;
i <
mChains.size();
i++) {
1094 f +=
"settings.dump";
1096 for (uint32_t
i = 0;
i <
mChains.size();
i++) {
1129 f +=
"settings.dump";
1135 for (uint32_t
i = 0;
i <
mChains.size();
i++) {
1158 GPUError(
"Cannot update settings while initialized");
1159 throw std::runtime_error(
"Settings updated while initialized");
#define GPUCA_OPERATOR_NEW_ALIGNMENT
#define GPUCA_BUFFER_ALIGNMENT
#define GPUCA_GPUReconstructionUpdateDefaults()
bool isSet(const bitfield &v) const
const GPUSettingsDisplay * GetEventDisplayConfig() const
const GPUSettingsQA * GetQAConfig() const
static void dumpConfig(const GPUSettingsRec *rec, const GPUSettingsProcessing *proc, const GPUSettingsQA *qa, const GPUSettingsDisplay *display, const GPUSettingsDeviceBackend *device, const GPURecoStepConfiguration *workflow)
static constexpr const char *const RECO_STEP_NAMES[]
static constexpr int32_t N_RECO_STEPS
static constexpr int32_t N_GENERAL_STEPS
void * SetDevicePointers(void *ptr)
void * SetPointers(void *ptr)
static void computePointerWithAlignment(T *&basePtr, S *&objPtr, size_t nEntries=1)
void InitGPUProcessor(GPUReconstruction *rec, ProcessorType type=PROCESSOR_TYPE_CPU, GPUProcessor *slaveProcessor=nullptr)
ProcessorType mGPUProcessorType
GPURecoStepConfiguration mRecoSteps
int32_t InitPhaseBeforeDevice()
std::unordered_set< const void * > mRegisteredMemoryPtrs
int32_t InitPhasePermanentMemory()
std::vector< std::unique_ptr< GPUChain > > mChains
GPUDataTypes::RecoStep RecoStep
GPUReconstruction * mMaster
void * AllocateVolatileMemory(size_t size, bool device)
std::unique_ptr< GPUMemorySizeScalers > mMemoryScalers
virtual void UpdateAutomaticProcessingSettings()
void AllocateRegisteredForeignMemory(int16_t res, GPUReconstruction *rec, GPUOutputControl *control=nullptr)
void SetInputControl(void *ptr, size_t size)
GPUConstantMem * mDeviceConstantMem
void ConstructGPUProcessor(GPUProcessor *proc)
void TerminatePipelineWorker()
std::shared_ptr< GPUROOTDumpCore > mROOTDump
void PopNonPersistentMemory(RecoStep step, uint64_t tag)
size_t AllocateRegisteredMemoryHelper(GPUMemoryResource *res, void *&ptr, void *&memorypool, void *memorybase, size_t memorysize, void *(GPUMemoryResource::*SetPointers)(void *), void *&memorypoolend, const char *device)
GPUConstantMem * processors()
void ReturnVolatileMemory()
void ComputeReuseMax(GPUProcessor *proc)
void SetMemoryExternalInput(int16_t res, void *ptr)
int32_t getGeneralStepNum(GeneralStep step, bool validCheck=true)
static constexpr uint32_t NSECTORS
GPUOutputControl mInputControl
RecoStepField GetRecoStepsGPU() const
void RegisterGPUDeviceProcessor(GPUProcessor *proc, GPUProcessor *slaveProcessor)
std::vector< GPUReconstruction * > mSlaves
std::unique_ptr< T > ReadStructFromFile(const char *file)
virtual void GetITSTraits(std::unique_ptr< o2::its::TrackerTraits > *trackerTraits, std::unique_ptr< o2::its::VertexerTraits > *vertexerTraits, std::unique_ptr< o2::its::TimeFrame > *timeFrame)
std::vector< std::tuple< void *, void *, size_t, uint64_t > > mNonPersistentMemoryStack
void UpdateDynamicSettings(const GPUSettingsRecDynamic *d)
std::vector< GPUMemoryResource > mMemoryResources
std::unique_ptr< GPUReconstructionPipelineContext > mPipelineContext
std::unique_ptr< GPUConstantMem > mHostConstantMem
size_t AllocateRegisteredPermanentMemory()
void ResetRegisteredMemoryPointers(GPUProcessor *proc)
void DumpStructToFile(const T *obj, const char *file)
void AllocateRegisteredMemoryInternal(GPUMemoryResource *res, GPUOutputControl *control, GPUReconstruction *recPool)
virtual int32_t registerMemoryForGPU_internal(const void *ptr, size_t size)=0
virtual size_t WriteToConstantMemory(size_t offset, const void *src, size_t size, int32_t stream=-1, gpu_reconstruction_kernels::deviceEvent *ev=nullptr)=0
std::unordered_map< GPUMemoryReuse::ID, MemoryReuseMeta > mMemoryReuse1to1
size_t mDeviceMemoryUsedMax
std::vector< std::unique_ptr< char[]> > mUnmanagedChunks
std::vector< ProcessorData > mProcessors
void ReturnVolatileDeviceMemory()
void * AllocateVolatileDeviceMemory(size_t size)
virtual int32_t InitDevice()=0
void SetSettings(float solenoidBzNominalGPU, const GPURecoStepConfiguration *workflow=nullptr)
virtual ~GPUReconstruction()
int32_t mMaxBackendThreads
virtual std::unique_ptr< gpu_reconstruction_kernels::threadContext > GetThreadContext()=0
void UnblockStackedMemory()
GPUReconstruction(const GPUReconstruction &)=delete
static constexpr GeometryType geometryType
GPUSettingsProcessing mProcessingSettings
GPUDataTypes::GeometryType GeometryType
void WriteConstantParams()
void FreeRegisteredMemory(GPUProcessor *proc, bool freeCustom=false, bool freePermanent=false)
void UpdateMaxMemoryUsed()
std::vector< std::unique_ptr< char[]> > mVolatileChunks
virtual RecoStepField AvailableGPURecoSteps()
static constexpr const char *const IOTYPENAMES[]
void UpdateSettings(const GPUSettingsGRP *g, const GPUSettingsProcessing *p=nullptr, const GPUSettingsRecDynamic *d=nullptr)
int32_t CheckErrorCodes(bool cpuOnly=false, bool forceShowErrors=false, std::vector< std::array< uint32_t, 4 > > *fillErrors=nullptr)
void ClearAllocatedMemory(bool clearOutputs=true)
static constexpr const char *const GEOMETRY_TYPE_NAMES[]
GPUOutputControl mOutputControl
size_t mHostMemoryUsedMax
GPUSettingsGRP mGRPSettings
void * mDeviceMemoryPoolEnd
virtual int32_t ExitDevice()=0
void PrintMemoryOverview()
virtual bool CanQueryMaxMemory()
void * AllocateUnmanagedMemory(size_t size, int32_t type)
void PrintMemoryStatistics()
void PushNonPersistentMemory(uint64_t tag)
int32_t getRecoStepNum(RecoStep step, bool validCheck=true)
virtual int32_t unregisterMemoryForGPU_internal(const void *ptr)=0
int32_t InitPhaseAfterDevice()
static int32_t getHostThreadIndex()
GPUDataTypes::GeneralStep GeneralStep
void * mDeviceMemoryPermanent
void BlockStackedMemory(GPUReconstruction *rec)
void DumpSettings(const char *dir="")
void * mHostMemoryPoolBlocked
int32_t unregisterMemoryForGPU(const void *ptr)
int32_t registerMemoryForGPU(const void *ptr, size_t size)
GPUSettingsDeviceBackend mDeviceBackendSettings
int32_t EnqueuePipeline(bool terminate=false)
std::shared_ptr< GPUReconstructionThreading > mThreading
std::vector< GPUMemoryResource * > mNonPersistentIndividualAllocations
void * mHostMemoryPoolEnd
void * mDeviceMemoryPoolBlocked
void * mVolatileMemoryStart
GPUChain * GetNextChainInQueue()
void * mHostMemoryPermanent
size_t AllocateRegisteredMemory(GPUProcessor *proc, bool resetCustom=false)
int32_t ReadSettings(const char *dir="")
void SetOutputControl(const GPUOutputControl &v)
void SetSector(int32_t iSector)
#define TPC_MAX_FRAGMENT_LEN_GPU
#define TPC_MAX_FRAGMENT_LEN_HOST
GLuint GLsizei const GLuint const GLintptr const GLsizeiptr * sizes
GLboolean GLboolean GLboolean b
GLint GLint GLsizei GLint GLenum GLenum type
typedef void(APIENTRYP PFNGLCULLFACEPROC)(GLenum mode)
GLboolean GLboolean GLboolean GLboolean a
GLubyte GLubyte GLubyte GLubyte w
std::string qTag2Str(const T tag)
GPUTPCTracker tpcTrackers[GPUCA_NSECTORS]
GPUTPCClusterFinder tpcClusterer[GPUCA_NSECTORS]
GPUSettingsProcessing configProcessing
GPUSettingsO2 ReadConfigurableParam()
GPUSettingsRec configReconstruction
void set(void *p, size_t s)
std::function< void *(size_t)> allocator
void SetDefaults(float solenoidBz)
void UpdateSettings(const GPUSettingsGRP *g, const GPUSettingsProcessing *p=nullptr, const GPURecoStepConfiguration *w=nullptr, const GPUSettingsRecDynamic *d=nullptr)
GPUDataTypes::RecoStepField stepsGPUMask
GPUDataTypes::InOutTypeField outputs
GPUDataTypes::RecoStepField steps
GPUDataTypes::InOutTypeField inputs
std::condition_variable cond
std::queue< GPUReconstructionPipelineQueue * > queue
GPUReconstruction * master
float solenoidBzNominalGPU