Project
Loading...
Searching...
No Matches
GPUMemorySizeScalers.cxx
Go to the documentation of this file.
1// Copyright 2019-2020 CERN and copyright holders of ALICE O2.
2// See https://alice-o2.web.cern.ch/copyright for details of the copyright holders.
3// All rights not expressly granted are reserved.
4//
5// This software is distributed under the terms of the GNU General Public
6// License v3 (GPL Version 3), copied verbatim in the file "COPYING".
7//
8// In applying this license CERN does not waive the privileges and immunities
9// granted to it by virtue of its status as an Intergovernmental Organization
10// or submit itself to any jurisdiction.
11
14
16#include "GPUTPCGeometry.h"
17#include "GPULogging.h"
18
19#include <random>
20
21using namespace o2::gpu;
22
23void GPUMemorySizeScalers::rescaleMaxMem(size_t newAvailableMemory)
24{
26 double scaleFactor = (double)newAvailableMemory / tmp.availableMemory;
27 if (scaleFactor != 1.) {
28 GPUInfo("Rescaling buffer size limits from %lu to %lu bytes of memory (factor %f)", tmp.availableMemory, newAvailableMemory, scaleFactor);
29 }
30 tpcMaxPeaks = (double)tmp.tpcMaxPeaks * scaleFactor;
31 tpcMaxClusters = (double)tmp.tpcMaxClusters * scaleFactor;
32 tpcMaxStartHits = (double)tmp.tpcMaxStartHits * scaleFactor;
33 tpcMaxRowStartHits = (double)tmp.tpcMaxRowStartHits * scaleFactor;
34 tpcMaxTracklets = (double)tmp.tpcMaxTracklets * scaleFactor;
35 tpcMaxTrackletHits = (double)tmp.tpcMaxTrackletHits * scaleFactor;
36 tpcMaxSectorTracks = (double)tmp.tpcMaxSectorTracks * scaleFactor;
37 tpcMaxSectorTrackHits = (double)tmp.tpcMaxSectorTrackHits * scaleFactor;
38 tpcMaxMergedTracks = (double)tmp.tpcMaxMergedTracks * scaleFactor;
39 tpcMaxMergedTrackHits = (double)tmp.tpcMaxMergedTrackHits * scaleFactor;
40 availableMemory = newAvailableMemory;
41}
42
44{
45 if (!doFuzzing) {
46 return scalingFactor;
47 }
48 static std::uniform_int_distribution<uint32_t> dist(0, 1000000);
49 static std::mt19937 rng;
50 if (fuzzSeed) {
51 rng = std::mt19937(fuzzSeed);
52 fuzzLimit = dist(rng) / 10;
53 fuzzSeed = 0;
54 }
55 if (dist(rng) > fuzzLimit) {
56 return scalingFactor;
57 }
58 return scalingFactor * 0.000001 * dist(rng);
59}
60
62{
63 fuzzSeed = seed;
64 doFuzzing = true;
65}
66
67size_t GPUMemorySizeScalers::getValue(size_t maxVal, size_t val)
68{
69 return returnMaxVal ? maxVal : (std::min<size_t>(maxVal, offset + val) * (doFuzzing == 0 ? scalingFactor : getScalingFactor()) * temporaryFactor);
70}
71
72size_t GPUMemorySizeScalers::NTPCPeaks(size_t tpcDigits, bool perSector) { return getValue(perSector ? tpcMaxPeaks : (GPUTPCGeometry::NSECTORS * tpcMaxPeaks), hitOffset + tpcDigits * tpcPeaksPerDigit); }
73size_t GPUMemorySizeScalers::NTPCClusters(size_t tpcDigits, bool perSector) { return getValue(perSector ? tpcMaxSectorClusters : tpcMaxClusters, (conservativeMemoryEstimate ? 1.0 : tpcClustersPerPeak) * NTPCPeaks(tpcDigits, perSector)); }
74size_t GPUMemorySizeScalers::NTPCStartHits(size_t tpcHits) { return getValue(tpcMaxStartHits, tpcHits * tpcStartHitsPerHit); }
75size_t GPUMemorySizeScalers::NTPCRowStartHits(size_t tpcHits) { return getValue(tpcMaxRowStartHits, std::max<size_t>(NTPCStartHits(tpcHits) * (tpcHits < 30000000 ? 20 : 12) / GPUTPCGeometry::NROWS, tpcMinRowStartHits)); }
76size_t GPUMemorySizeScalers::NTPCTracklets(size_t tpcHits, bool lowField) { return getValue(tpcMaxTracklets, NTPCStartHits(tpcHits) * (lowField ? tpcTrackletsPerStartHitLowField : tpcTrackletsPerStartHit)); }
77size_t GPUMemorySizeScalers::NTPCTrackletHits(size_t tpcHits, bool lowField) { return getValue(tpcMaxTrackletHits, hitOffset + tpcHits * (lowField ? tpcTrackletHitsPerHitLowField : tpcTrackletHitsPerHit)); }
78size_t GPUMemorySizeScalers::NTPCSectorTracks(size_t tpcHits) { return getValue(tpcMaxSectorTracks, tpcHits * tpcSectorTracksPerHit); }
79size_t GPUMemorySizeScalers::NTPCSectorTrackHits(size_t tpcHits, uint8_t withRejection) { return getValue(tpcMaxSectorTrackHits, tpcHits * (withRejection ? tpcSectorTrackHitsPerHitWithRejection : tpcSectorTrackHitsPerHit)); }
80size_t GPUMemorySizeScalers::NTPCMergedTracks(size_t tpcSectorTracks) { return getValue(tpcMaxMergedTracks, tpcSectorTracks * (conservativeMemoryEstimate ? 1.0 : tpcMergedTrackPerSectorTrack)); }
81size_t GPUMemorySizeScalers::NTPCMergedTrackHits(size_t tpcSectorTrackHitss) { return getValue(tpcMaxMergedTrackHits, tpcSectorTrackHitss * tpcMergedTrackHitPerSectorHit); }
82size_t GPUMemorySizeScalers::NTPCUnattachedHitsBase1024(int32_t type) { return (returnMaxVal || conservativeMemoryEstimate) ? 1024 : std::min<size_t>(1024, tpcCompressedUnattachedHitsBase1024[type] * (doFuzzing == 0 ? scalingFactor : getScalingFactor()) * temporaryFactor); }
static constexpr uint32_t NROWS
static constexpr uint32_t NSECTORS
GLint GLint GLsizei GLint GLenum GLenum type
Definition glcorearb.h:275
GLintptr offset
Definition glcorearb.h:660
GLuint GLfloat * val
Definition glcorearb.h:1582
size_t NTPCTracklets(size_t tpcHits, bool lowField)
size_t NTPCUnattachedHitsBase1024(int32_t type)
size_t NTPCRowStartHits(size_t tpcHits)
size_t NTPCMergedTracks(size_t tpcSectorTracks)
size_t NTPCSectorTracks(size_t tpcHits)
size_t NTPCTrackletHits(size_t tpcHits, bool lowField)
size_t NTPCPeaks(size_t tpcDigits, bool perSector=false)
size_t NTPCClusters(size_t tpcDigits, bool perSector=false)
void rescaleMaxMem(size_t newAvailableMemory)
size_t NTPCMergedTrackHits(size_t tpcSectorTrackHitss)
size_t NTPCSectorTrackHits(size_t tpcHits, uint8_t withRejection=0)
size_t getValue(size_t maxVal, size_t val)