GPUTPCNNClusterizerHost.cxx
// Copyright 2019-2020 CERN and copyright holders of ALICE O2.
// See https://alice-o2.web.cern.ch/copyright for details of the copyright holders.
// All rights not expressly granted are reserved.
//
// This software is distributed under the terms of the GNU General Public
// License v3 (GPL Version 3), copied verbatim in the file "COPYING".
//
// In applying this license CERN does not waive the privileges and immunities
// granted to it by virtue of its status as an Intergovernmental Organization
// or submit itself to any jurisdiction.

#include "GPUTPCNNClusterizerHost.h"

#include "GPUTPCNNClusterizer.h"
#include "GPUSettings.h"
#include "GPUReconstruction.h"
#include "GPUTPCGeometry.h"
#include "clusterFinderDefs.h"

#ifdef GPUCA_HAS_ONNX
#include <onnxruntime_cxx_api.h>
#endif

using namespace o2::gpu;

void GPUTPCNNClusterizerHost::init(const GPUSettingsProcessingNNclusterizer& settings, bool useDeterministicMode)
{
  std::string class_model_path = settings.nnClassificationPath, reg_model_path = settings.nnRegressionPath;
  std::vector<std::string> reg_model_paths_local;
  std::vector<std::string> evalMode = o2::utils::Str::tokenize(settings.nnEvalMode, ':');

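  // nnEvalMode is expected to have the form "<classification>:<regression>", e.g. "c1:r1" or "c2:r2",
  // selecting which classification network and which regression network(s) are loaded below.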
  if (settings.nnLoadFromCCDB) {
    reg_model_path = settings.nnLocalFolder + "/net_regression_c1.onnx"; // Must match NeuralNetworkClusterizer.cxx, otherwise the networks might be loaded from the wrong place
    if (evalMode[0] == "c1") {
      class_model_path = settings.nnLocalFolder + "/net_classification_c1.onnx";
    } else if (evalMode[0] == "c2") {
      class_model_path = settings.nnLocalFolder + "/net_classification_c2.onnx";
    }

    if (evalMode[1] == "r2") {
      reg_model_path += ":" + settings.nnLocalFolder + "/net_regression_c2.onnx";
    }
  }

  mOrtOptions = {
    {"model-path", class_model_path},
    {"device-type", settings.nnInferenceDevice},
    {"allocate-device-memory", std::to_string(settings.nnInferenceAllocateDevMem)},
    {"intra-op-num-threads", std::to_string(settings.nnInferenceIntraOpNumThreads)},
    {"inter-op-num-threads", std::to_string(settings.nnInferenceInterOpNumThreads)},
    {"enable-optimizations", std::to_string(settings.nnInferenceEnableOrtOptimization)},
    {"deterministic-compute", std::to_string(useDeterministicMode ? 1 : settings.nnInferenceUseDeterministicCompute)}, // TODO: This unfortunately doesn't guarantee determinism (25.07.2025)
    {"enable-profiling", std::to_string(settings.nnInferenceOrtProfiling)},
    {"profiling-output-path", settings.nnInferenceOrtProfilingPath},
    {"logging-level", std::to_string(settings.nnInferenceVerbosity)},
    {"onnx-environment-name", "c1"}};

  mModelsUsed[0] = true;

  reg_model_paths_local = o2::utils::Str::tokenize(reg_model_path, ':');

  if (!settings.nnClusterizerUseCfRegression) {
    if (reg_model_paths_local.size() == 1) {
      mOrtOptions["model-path"] = reg_model_paths_local[0];
      mOrtOptions["onnx-environment-name"] = "r1";
      mModelsUsed[1] = true;
    } else {
      mOrtOptions["model-path"] = reg_model_paths_local[0];
      mOrtOptions["onnx-environment-name"] = "r1";
      mModelsUsed[1] = true;
      mOrtOptions["model-path"] = reg_model_paths_local[1];
      mOrtOptions["onnx-environment-name"] = "r2";
      mModelsUsed[2] = true;
    }
  }
}
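
// A minimal sketch (not part of this file's interface; the Ort objects and names below are
// assumptions) of how the key-value pairs collected in mOrtOptions above typically map onto
// ONNX Runtime session options; the model wrapper consuming mOrtOptions is assumed to do the
// equivalent internally:
//
//   Ort::SessionOptions opts;
//   opts.SetIntraOpNumThreads(std::stoi(mOrtOptions["intra-op-num-threads"]));
//   opts.SetInterOpNumThreads(std::stoi(mOrtOptions["inter-op-num-threads"]));
//   if (std::stoi(mOrtOptions["enable-optimizations"])) {
//     opts.SetGraphOptimizationLevel(GraphOptimizationLevel::ORT_ENABLE_ALL);
//   }
//   if (std::stoi(mOrtOptions["enable-profiling"])) {
//     opts.EnableProfiling(mOrtOptions["profiling-output-path"].c_str());
//   }
//   Ort::Session session(env, mOrtOptions["model-path"].c_str(), opts);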

void GPUTPCNNClusterizerHost::initClusterizer(const GPUSettingsProcessingNNclusterizer& settings, GPUTPCNNClusterizer& clustererNN, int32_t maxFragmentLen, int32_t maxAllowedTimebin)
{
  clustererNN.mNnClusterizerUseCfRegression = settings.nnClusterizerUseCfRegression;
  clustererNN.mNnClusterizerSizeInputRow = settings.nnClusterizerSizeInputRow;
  clustererNN.mNnClusterizerSizeInputPad = settings.nnClusterizerSizeInputPad;
  clustererNN.mNnClusterizerSizeInputTime = settings.nnClusterizerSizeInputTime;
  clustererNN.mNnClusterizerFullRowSize = 2 * settings.nnClusterizerSizeInputRow + 1;
  clustererNN.mNnClusterizerFullPadSize = 2 * settings.nnClusterizerSizeInputPad + 1;
  clustererNN.mNnClusterizerFullTimeSize = 2 * settings.nnClusterizerSizeInputTime + 1;
  clustererNN.mNnClusterizerRowTimeSizeFull = clustererNN.mNnClusterizerRowTimeSize + (settings.nnClusterizerAddIndexData ? 3 : 0);
  clustererNN.mNnClusterizerRowTimeSizeThreads = clustererNN.mNnClusterizerRowTimeSize + (settings.nnClusterizerAddIndexData ? 1 : 0);
  clustererNN.mNnClusterizerElementSize = clustererNN.mNnClusterizerChargeArraySize + (settings.nnClusterizerAddIndexData ? 3 : 0);
  // clustererNN.mBoundaryMapSizeRow = 3 * clustererNN.mNnClusterizerSizeInputRow + o2::tpc::constants::MAXGLOBALPADROW;
  // clustererNN.mBoundaryPadding = 11; // padding on each side to account for pad_offset. N=11 since then mIsBoundary = 24320 ~< (1.5 x 2^14 = 24576) && N must be bigger than (NPads[row(end_iroc + 1)] - NPads[row(end_iroc)])/2 (=6) for pad_offset to work
  // clustererNN.mBoundaryMapSizePadsPerRow = GPUTPCGeometry::NPads(o2::tpc::constants::MAXGLOBALPADROW - 1) + 2 * clustererNN.mBoundaryPadding;
  // clustererNN.mBoundaryMapSize = clustererNN.mBoundaryMapSizeRow * clustererNN.mBoundaryMapSizePadsPerRow;
  // clustererNN.mIndexLookupSize = 3 * clustererNN.mNnClusterizerChargeArraySize; // local row, pad, time shift from flat index
  clustererNN.mNnClusterizerAddIndexData = settings.nnClusterizerAddIndexData;
  clustererNN.mNnClusterizerBatchedMode = settings.nnClusterizerBatchedMode;
  clustererNN.mNnClusterizerBoundaryFillValue = settings.nnClusterizerBoundaryFillValue;
  clustererNN.mNnSigmoidTrafoClassThreshold = settings.nnSigmoidTrafoClassThreshold;
  clustererNN.mNnClusterizerUseClassification = settings.nnClusterizerUseClassification;
  clustererNN.mNnClusterizerSetDeconvolutionFlags = (bool)settings.nnClusterizerSetDeconvolutionFlags;
  clustererNN.maxFragmentLen = maxFragmentLen == -1 ? TPC_MAX_FRAGMENT_LEN_GPU : maxFragmentLen;
  clustererNN.maxAllowedTimebin = maxAllowedTimebin == -1 ? TPC_MAX_FRAGMENT_LEN_GPU : maxAllowedTimebin;
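  // If the sigmoid transformation is enabled, the user threshold t (a probability) is mapped
  // through the inverse sigmoid (logit), log(t / (1 - t)), so the cut can be applied directly
  // to the raw network output before any sigmoid is evaluated.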
  if (clustererNN.mNnSigmoidTrafoClassThreshold) {
    clustererNN.mNnClassThreshold = (float)std::log(settings.nnClassThreshold / (1.f - settings.nnClassThreshold));
  } else {
    clustererNN.mNnClassThreshold = settings.nnClassThreshold;
  }
  if (settings.nnClusterizerVerbosity < 0) {
    clustererNN.mNnClusterizerVerbosity = settings.nnInferenceVerbosity;
  } else {
    clustererNN.mNnClusterizerVerbosity = settings.nnClusterizerVerbosity;
  }
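  // The DType flags are true when the configured dtype string contains "32" (32-bit float tensors);
  // other values presumably select a 16-bit type.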
  clustererNN.mNnInferenceInputDType = settings.nnInferenceInputDType.find("32") != std::string::npos;
  clustererNN.mNnInferenceOutputDType = settings.nnInferenceOutputDType.find("32") != std::string::npos;
  if (!settings.nnClusterizerUseCfRegression) {
    if (mModelClass.getNumOutputNodes()[0][1] == 1 || !mModelReg2.isInitialized()) {
    } else {
    }
  }
}
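
// A minimal usage sketch (caller-side names such as nnHost, settings and clustererNN are
// assumptions, not part of this file): the host object is configured first, then the
// per-fragment clusterizer is filled from the same settings.
//
//   GPUTPCNNClusterizerHost nnHost;
//   nnHost.init(settings);                         // builds mOrtOptions and resolves model paths
//   nnHost.initClusterizer(settings, clustererNN); // maxFragmentLen / maxAllowedTimebin default to -1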

// void GPUTPCNNClusterizerHost::createBoundary(GPUTPCNNClusterizer& clustererNN)
// {
//   // Call after init of the clustererNN elements
//   for (int r = 0; r < clustererNN.mBoundaryMapSizeRow; r++) {
//     int8_t skipCheckInRow = 0;
//     for (int p = 0; p < clustererNN.mBoundaryMapSizePadsPerRow; p++) {
//       int32_t i = r * clustererNN.mBoundaryMapSizePadsPerRow + p;
//       clustererNN.mIsBoundary[i] = 1;
//       if (!skipCheckInRow && (p >= clustererNN.mBoundaryPadding || r >= clustererNN.mNnClusterizerSizeInputRow)) {
//         if (r < (GPUTPCGeometry::EndIROC() + clustererNN.mNnClusterizerSizeInputRow)) {
//           clustererNN.mIsBoundary[i] = (int32_t)((p - clustererNN.mBoundaryPadding) >= static_cast<int>(GPUTPCGeometry::NPads(r - clustererNN.mNnClusterizerSizeInputRow)));
//         } else if (r >= (GPUTPCGeometry::EndIROC() + 2 * clustererNN.mNnClusterizerSizeInputRow) && r < (o2::tpc::constants::MAXGLOBALPADROW + 2 * clustererNN.mNnClusterizerSizeInputRow)) {
//           clustererNN.mIsBoundary[i] = (int32_t)((p - clustererNN.mBoundaryPadding) >= static_cast<int>(GPUTPCGeometry::NPads(r - 2 * clustererNN.mNnClusterizerSizeInputRow)));
//         }
//         skipCheckInRow = (clustererNN.mIsBoundary[i] == 1); // No need to check further pads in this row
//       }
//     }
//   }
// }

// void GPUTPCNNClusterizerHost::createIndexLookup(GPUTPCNNClusterizer& clustererNN)
// {
//   for (int32_t i = 0; i < clustererNN.mNnClusterizerChargeArraySize; i++) {
//     int32_t r = CAMath::Floor(i / ((2 * clustererNN.mNnClusterizerSizeInputPad + 1) * (2 * clustererNN.mNnClusterizerSizeInputTime + 1))) - clustererNN.mNnClusterizerSizeInputRow;
//     int32_t rest_1 = i % ((2 * clustererNN.mNnClusterizerSizeInputPad + 1) * (2 * clustererNN.mNnClusterizerSizeInputTime + 1));
//     int32_t p = CAMath::Floor(rest_1 / (2 * clustererNN.mNnClusterizerSizeInputTime + 1)) - clustererNN.mNnClusterizerSizeInputPad;
//     int32_t t = (rest_1 % (2 * clustererNN.mNnClusterizerSizeInputTime + 1)) - clustererNN.mNnClusterizerSizeInputTime;
//     clustererNN.mIndexLookup[3 * i] = r;
//     clustererNN.mIndexLookup[3 * i + 1] = p;
//     clustererNN.mIndexLookup[3 * i + 2] = t;
//   }
// }

// MockedOrtAllocator implementation, used to route ONNX Runtime allocations to GPUReconstruction's direct (volatile) memory
struct MockedOrtAllocator : public OrtAllocator {
  MockedOrtAllocator(GPUReconstruction* = nullptr, OrtMemoryInfo* = nullptr);
  ~MockedOrtAllocator();

  void* Alloc(size_t size);
  void Free(void* p);
  const OrtMemoryInfo* Info() const;
  void* Reserve(size_t size);
  size_t NumAllocations() const;
  size_t NumReserveAllocations() const;

  void LeakCheck();

 private:
  MockedOrtAllocator(const MockedOrtAllocator&) = delete;
  MockedOrtAllocator& operator=(const MockedOrtAllocator&) = delete;

  std::atomic<size_t> memory_inuse{0};
  std::atomic<size_t> num_allocations{0};
  std::atomic<size_t> num_reserve_allocations{0};
  OrtMemoryInfo* mMemoryInfoInternal;
  GPUReconstruction* mRecInternal;
};

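// The constructor below wires the C-style OrtAllocator function pointers to the C++ member
// functions: each lambda receives the base OrtAllocator* and downcasts it back to the
// MockedOrtAllocator, so ONNX Runtime can drive this allocator through its plain C interface.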
MockedOrtAllocator::MockedOrtAllocator(GPUReconstruction* r, OrtMemoryInfo* info)
{
  OrtAllocator::version = ORT_API_VERSION;
  OrtAllocator::Alloc = [](OrtAllocator* this_, size_t size) { return static_cast<MockedOrtAllocator*>(this_)->Alloc(size); };
  OrtAllocator::Free = [](OrtAllocator* this_, void* p) { static_cast<MockedOrtAllocator*>(this_)->Free(p); };
  OrtAllocator::Info = [](const OrtAllocator* this_) { return static_cast<const MockedOrtAllocator*>(this_)->Info(); };
  OrtAllocator::Reserve = [](OrtAllocator* this_, size_t size) { return static_cast<MockedOrtAllocator*>(this_)->Reserve(size); };
  mRecInternal = r;
  mMemoryInfoInternal = info;
}

MockedOrtAllocator::~MockedOrtAllocator()
{
  // Ort::GetApi().ReleaseMemoryInfo(mMemoryInfoInternal);
  (void)0; // Suppress warning for empty destructor
}

void* MockedOrtAllocator::Alloc(size_t size)
{
  LOG(info) << "(ORT) Allocating direct memory of size " << size << " bytes";
  return mRecInternal->AllocateDirectMemory(size, GPUMemoryResource::MEMORY_GPU | GPUMemoryResource::MEMORY_STACK);
}

void* MockedOrtAllocator::Reserve(size_t size)
{
  LOG(info) << "(ORT) Reserving direct memory of size " << size << " bytes";
  return mRecInternal->AllocateDirectMemory(size, GPUMemoryResource::MEMORY_GPU | GPUMemoryResource::MEMORY_STACK);
}

void MockedOrtAllocator::Free(void* p)
{
  // LOG(info) << "(ORT) Freeing volatile memory " << p;
}

const OrtMemoryInfo* MockedOrtAllocator::Info() const
{
  return mMemoryInfoInternal;
}

size_t MockedOrtAllocator::NumAllocations() const
{
  return num_allocations.load();
}

size_t MockedOrtAllocator::NumReserveAllocations() const
{
  return num_reserve_allocations.load();
}

void MockedOrtAllocator::LeakCheck()
{
  if (memory_inuse.load()) {
    LOG(warning) << "(ORT) Memory leak detected: " << memory_inuse.load() << " bytes still in use";
  }
}

void GPUTPCNNClusterizerHost::directOrtAllocator(Ort::Env* env, Ort::MemoryInfo* memInfo, GPUReconstruction* rec, bool recreate)
{
  mMockedAlloc = std::make_shared<MockedOrtAllocator>(rec, (OrtMemoryInfo*)(*memInfo));
  if (recreate) {
    Ort::ThrowOnError(Ort::GetApi().UnregisterAllocator((OrtEnv*)(*env), (OrtMemoryInfo*)(*memInfo)));
  }
  Ort::ThrowOnError(Ort::GetApi().RegisterAllocator((OrtEnv*)(*env), mMockedAlloc.get()));
  memInfo = (Ort::MemoryInfo*)mMockedAlloc->Info();
}
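
// A minimal sketch (assuming env and a model path are set up elsewhere) of how a session picks
// up the allocator registered above; ONNX Runtime only consults environment-registered
// allocators when the corresponding session config entry is enabled:
//
//   Ort::SessionOptions opts;
//   opts.AddConfigEntry("session.use_env_allocators", "1");
//   Ort::Session session(*env, modelPath, opts); // Alloc()/Reserve() above now serve ORT requests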

{
  return mMockedAlloc->Info();
}