Project
Loading...
Searching...
No Matches
GPUReconstructionConvert.cxx
Go to the documentation of this file.
1// Copyright 2019-2020 CERN and copyright holders of ALICE O2.
2// See https://alice-o2.web.cern.ch/copyright for details of the copyright holders.
3// All rights not expressly granted are reserved.
4//
5// This software is distributed under the terms of the GNU General Public
6// License v3 (GPL Version 3), copied verbatim in the file "COPYING".
7//
8// In applying this license CERN does not waive the privileges and immunities
9// granted to it by virtue of its status as an Intergovernmental Organization
10// or submit itself to any jurisdiction.
11
14
15#ifdef GPUCA_O2_LIB
17#include "TPCBase/Sector.h"
19#include "TPCBase/Mapper.h"
20#endif
21
23#include "TPCFastTransform.h"
24#include "GPUTPCClusterData.h"
25#include "GPUO2DataTypes.h"
26#include "GPUDataTypes.h"
27#include "GPUTPCGeometry.h"
28#include "AliHLTTPCRawCluster.h" // VS: It can not be removed. Used in line 93.
29#include "GPUParam.h"
30#include "GPULogging.h"
31#include <algorithm>
32#include <vector>
33
34#include "clusterFinderDefs.h"
40#include "TPCBase/RDHUtils.h"
41#include "TPCBase/CRU.h"
43
44#include <oneapi/tbb.h>
45
46using namespace o2::gpu;
47using namespace o2::tpc;
48using namespace o2::tpc::constants;
49using namespace std::string_literals;
50
51void GPUReconstructionConvert::ConvertNativeToClusterData(o2::tpc::ClusterNativeAccess* native, std::unique_ptr<GPUTPCClusterData[]>* clusters, uint32_t* nClusters, const TPCFastTransform* transform, int32_t continuousMaxTimeBin)
52{
53 memset(nClusters, 0, NSECTORS * sizeof(nClusters[0]));
54 uint32_t offset = 0;
55 for (uint32_t i = 0; i < NSECTORS; i++) {
56 uint32_t nClSector = 0;
57 for (int32_t j = 0; j < GPUCA_ROW_COUNT; j++) {
58 nClSector += native->nClusters[i][j];
59 }
60 nClusters[i] = nClSector;
61 clusters[i].reset(new GPUTPCClusterData[nClSector]);
62 nClSector = 0;
63 for (int32_t j = 0; j < GPUCA_ROW_COUNT; j++) {
64 for (uint32_t k = 0; k < native->nClusters[i][j]; k++) {
65 const auto& clin = native->clusters[i][j][k];
66 float x = 0, y = 0, z = 0;
67 if (continuousMaxTimeBin == 0) {
68 transform->Transform(i, j, clin.getPad(), clin.getTime(), x, y, z);
69 } else {
70 transform->TransformInTimeFrame(i, j, clin.getPad(), clin.getTime(), x, y, z, continuousMaxTimeBin);
71 }
72 auto& clout = clusters[i].get()[nClSector];
73 clout.x = x;
74 clout.y = y;
75 clout.z = z;
76 clout.row = j;
77 clout.amp = clin.qTot;
78 clout.flags = clin.getFlags();
79 clout.id = offset + k;
80 nClSector++;
81 }
82 native->clusterOffset[i][j] = offset;
83 offset += native->nClusters[i][j];
84 }
85 }
86}
87
88void GPUReconstructionConvert::ConvertRun2RawToNative(o2::tpc::ClusterNativeAccess& native, std::unique_ptr<ClusterNative[]>& nativeBuffer, const AliHLTTPCRawCluster** rawClusters, uint32_t* nRawClusters)
89{
90 memset((void*)&native, 0, sizeof(native));
91 for (uint32_t i = 0; i < NSECTORS; i++) {
92 for (uint32_t j = 0; j < nRawClusters[i]; j++) {
93 native.nClusters[i][rawClusters[i][j].GetPadRow()]++;
94 }
95 native.nClustersTotal += nRawClusters[i];
96 }
97 nativeBuffer.reset(new ClusterNative[native.nClustersTotal]);
98 native.clustersLinear = nativeBuffer.get();
99 native.setOffsetPtrs();
100 for (uint32_t i = 0; i < NSECTORS; i++) {
101 for (uint32_t j = 0; j < GPUCA_ROW_COUNT; j++) {
102 native.nClusters[i][j] = 0;
103 }
104 for (uint32_t j = 0; j < nRawClusters[i]; j++) {
105 const AliHLTTPCRawCluster& org = rawClusters[i][j];
106 int32_t row = org.GetPadRow();
107 ClusterNative& c = nativeBuffer[native.clusterOffset[i][row] + native.nClusters[i][row]++];
108 c.setTimeFlags(org.GetTime(), org.GetFlags());
109 c.setPad(org.GetPad());
110 c.setSigmaTime(CAMath::Sqrt(org.GetSigmaTime2()));
111 c.setSigmaPad(CAMath::Sqrt(org.GetSigmaPad2()));
112 c.qMax = org.GetQMax();
113 c.qTot = org.GetCharge();
114 }
115 }
116}
117
119{
120 float retVal = 0;
121 for (uint32_t i = 0; i < NSECTORS; i++) {
122 for (uint32_t j = 0; j < GPUCA_ROW_COUNT; j++) {
123 for (uint32_t k = 0; k < native.nClusters[i][j]; k++) {
124 if (native.clusters[i][j][k].getTime() > retVal) {
125 retVal = native.clusters[i][j][k].getTime();
126 }
127 }
128 }
129 }
130 return ceil(retVal);
131}
132
134{
135 float retVal = 0;
136 for (uint32_t i = 0; i < NSECTORS; i++) {
137 for (uint32_t k = 0; k < digits.nTPCDigits[i]; k++) {
138 if (digits.tpcDigits[i][k].getTimeStamp() > retVal) {
139 retVal = digits.tpcDigits[i][k].getTimeStamp();
140 }
141 }
142 }
143 return ceil(retVal);
144}
145
147{
148 float retVal = 0;
149 for (uint32_t i = 0; i < NSECTORS; i++) {
150 int32_t firstHBF = zspages.sector[i].count[0] ? o2::raw::RDHUtils::getHeartBeatOrbit(*(const o2::header::RAWDataHeader*)zspages.sector[i].zsPtr[0][0]) : 0;
151 for (uint32_t j = 0; j < GPUTrackingInOutZS::NENDPOINTS; j++) {
152 for (uint32_t k = 0; k < zspages.sector[i].count[j]; k++) {
153 const char* page = (const char*)zspages.sector[i].zsPtr[j][k];
154 for (uint32_t l = 0; l < zspages.sector[i].nZSPtr[j][k]; l++) {
157 int32_t nTimeBinSpan = hdr->nTimeBinSpan;
159 TPCZSHDRV2* hdr2 = (TPCZSHDRV2*)hdr;
160 if (hdr2->flags & TPCZSHDRV2::ZSFlags::nTimeBinSpanBit8) {
161 nTimeBinSpan += 256;
162 }
163 }
164 uint32_t timeBin = (hdr->timeOffset + (o2::raw::RDHUtils::getHeartBeatOrbit(*rdh) - firstHBF) * o2::constants::lhc::LHCMaxBunches) / LHCBCPERTIMEBIN + nTimeBinSpan;
165 if (timeBin > retVal) {
166 retVal = timeBin;
167 }
168 }
169 }
170 }
171 }
172 return ceil(retVal);
173}
174
175// ------------------------------------------------- TPC ZS -------------------------------------------------
176
177#ifdef GPUCA_TPC_GEOMETRY_O2
178namespace o2::gpu
179{
180namespace // anonymous
181{
182
183// ------------------------------------------------- TPC ZS General -------------------------------------------------
184
185typedef std::array<int64_t, TPCZSHDR::TPC_ZS_PAGE_SIZE / sizeof(int64_t)> zsPage;
186
187struct zsEncoder {
188 int32_t curRegion = 0, outputRegion = 0;
189 uint32_t encodeBits = 0;
190 uint32_t zsVersion = 0;
191 uint32_t iSector = 0;
192 o2::raw::RawFileWriter* raw = nullptr;
193 const o2::InteractionRecord* ir = nullptr;
194 const GPUParam* param = nullptr;
195 bool padding = false;
196 int32_t lastEndpoint = -2, lastTime = -1, lastRow = GPUCA_ROW_COUNT;
197 int32_t endpoint = 0, outputEndpoint = 0;
198 int64_t hbf = -1, nexthbf = 0;
199 zsPage* page = nullptr;
200 uint8_t* pagePtr = nullptr;
201 int32_t bcShiftInFirstHBF = 0;
202 int32_t firstTimebinInPage = -1;
203 float encodeBitsFactor = 0;
204 bool needAnotherPage = false;
205 uint32_t packetCounter = 0;
206 uint32_t pageCounter = 0;
207 void ZSfillEmpty(void* ptr, int32_t shift, uint32_t feeId, int32_t orbit, int32_t linkid);
208 static void ZSstreamOut(uint16_t* bufIn, uint32_t& lenIn, uint8_t* bufOut, uint32_t& lenOut, uint32_t nBits);
209 int64_t getHbf(int64_t timestamp) { return (timestamp * LHCBCPERTIMEBIN + bcShiftInFirstHBF) / o2::constants::lhc::LHCMaxBunches; }
210};
211
212inline void zsEncoder::ZSfillEmpty(void* ptr, int32_t shift, uint32_t feeId, int32_t orbit, int32_t linkid)
213{
216 o2::raw::RDHUtils::setHeartBeatBC(*rdh, shift);
218 o2::raw::RDHUtils::setVersion(*rdh, o2::raw::RDHUtils::getVersion<o2::header::RAWDataHeader>());
219 o2::raw::RDHUtils::setFEEID(*rdh, feeId);
221 o2::raw::RDHUtils::setLinkID(*rdh, linkid);
222 o2::raw::RDHUtils::setPacketCounter(*rdh, packetCounter++);
223 o2::raw::RDHUtils::setPageCounter(*rdh, pageCounter++);
224}
225
226inline void zsEncoder::ZSstreamOut(uint16_t* bufIn, uint32_t& lenIn, uint8_t* bufOut, uint32_t& lenOut, uint32_t nBits)
227{
228 uint32_t byte = 0, bits = 0;
229 uint32_t mask = (1 << nBits) - 1;
230 for (uint32_t i = 0; i < lenIn; i++) {
231 byte |= (bufIn[i] & mask) << bits;
232 bits += nBits;
233 while (bits >= 8) {
234 bufOut[lenOut++] = (uint8_t)(byte & 0xFF);
235 byte = byte >> 8;
236 bits -= 8;
237 }
238 }
239 if (bits) {
240 bufOut[lenOut++] = byte;
241 }
242 lenIn = 0;
243}
244
245static inline auto ZSEncoderGetDigits(const GPUTrackingInOutDigits& in, int32_t i) { return in.tpcDigits[i]; }
246static inline auto ZSEncoderGetNDigits(const GPUTrackingInOutDigits& in, int32_t i) { return in.nTPCDigits[i]; }
247#ifdef GPUCA_O2_LIB
248using DigitArray = std::array<gsl::span<const o2::tpc::Digit>, o2::tpc::Sector::MAXSECTOR>;
249static inline auto ZSEncoderGetDigits(const DigitArray& in, int32_t i) { return in[i].data(); }
250static inline auto ZSEncoderGetNDigits(const DigitArray& in, int32_t i) { return in[i].size(); }
251#endif // GPUCA_O2_LIB
252
253// ------------------------------------------------- TPC ZS Original Row-based ZS -------------------------------------------------
254
255struct zsEncoderRow : public zsEncoder {
256 std::array<uint16_t, TPCZSHDR::TPC_ZS_PAGE_SIZE> streamBuffer = {};
257 std::array<uint8_t, TPCZSHDR::TPC_ZS_PAGE_SIZE> streamBuffer8 = {};
258 TPCZSHDR* hdr = nullptr;
259 TPCZSTBHDR* curTBHdr = nullptr;
260 uint8_t* nSeq = nullptr;
261 int32_t seqLen = 0;
262 int32_t endpointStart = 0;
263 int32_t nRowsInTB = 0;
264 uint32_t streamSize = 0, streamSize8 = 0;
265 constexpr static int32_t RAWLNK = rdh_utils::UserLogicLinkID;
266
267 bool checkInput(std::vector<o2::tpc::Digit>& tmpBuffer, uint32_t k);
268 bool writeSubPage();
269 void init() { encodeBits = zsVersion == 2 ? TPCZSHDR::TPC_ZS_NBITS_V2 : TPCZSHDR::TPC_ZS_NBITS_V1; }
270 void initPage() {}
271 uint32_t encodeSequence(std::vector<o2::tpc::Digit>& tmpBuffer, uint32_t k);
272
273 bool sort(const o2::tpc::Digit a, const o2::tpc::Digit b);
274 void decodePage(std::vector<o2::tpc::Digit>& outputBuffer, const zsPage* page, uint32_t endpoint, uint32_t firstOrbit, uint32_t triggerBC = 0);
275};
276
277inline bool zsEncoderRow::sort(const o2::tpc::Digit a, const o2::tpc::Digit b)
278{
279 int32_t endpointa = GPUTPCGeometry::GetRegion(a.getRow());
280 int32_t endpointb = GPUTPCGeometry::GetRegion(b.getRow());
281 endpointa = 2 * endpointa + (a.getRow() >= GPUTPCGeometry::GetRegionStart(endpointa) + GPUTPCGeometry::GetRegionRows(endpointa) / 2);
282 endpointb = 2 * endpointb + (b.getRow() >= GPUTPCGeometry::GetRegionStart(endpointb) + GPUTPCGeometry::GetRegionRows(endpointb) / 2);
283 if (endpointa != endpointb) {
284 return endpointa <= endpointb;
285 }
286 if (a.getTimeStamp() != b.getTimeStamp()) {
287 return a.getTimeStamp() < b.getTimeStamp();
288 }
289 if (a.getRow() != b.getRow()) {
290 return a.getRow() < b.getRow();
291 }
292 return a.getPad() < b.getPad();
293}
294
295bool zsEncoderRow::checkInput(std::vector<o2::tpc::Digit>& tmpBuffer, uint32_t k)
296{
297 seqLen = 1;
298 if (lastRow != tmpBuffer[k].getRow()) {
299 endpointStart = GPUTPCGeometry::GetRegionStart(curRegion);
300 endpoint = curRegion * 2;
301 if (tmpBuffer[k].getRow() >= endpointStart + GPUTPCGeometry::GetRegionRows(curRegion) / 2) {
302 endpoint++;
303 endpointStart += GPUTPCGeometry::GetRegionRows(curRegion) / 2;
304 }
305 }
306 for (uint32_t l = k + 1; l < tmpBuffer.size(); l++) {
307 if (tmpBuffer[l].getRow() == tmpBuffer[k].getRow() && tmpBuffer[l].getTimeStamp() == tmpBuffer[k].getTimeStamp() && tmpBuffer[l].getPad() == tmpBuffer[l - 1].getPad() + 1) {
308 seqLen++;
309 } else {
310 break;
311 }
312 }
313 if (lastEndpoint >= 0 && lastTime != -1 && (int32_t)hdr->nTimeBinSpan + tmpBuffer[k].getTimeStamp() - lastTime >= 256) {
314 lastEndpoint = -1;
315 }
316 if (endpoint == lastEndpoint) {
317 uint32_t sizeChk = (uint32_t)(pagePtr - reinterpret_cast<uint8_t*>(page)); // already written
318 sizeChk += 2 * (nRowsInTB + (tmpBuffer[k].getRow() != lastRow && tmpBuffer[k].getTimeStamp() == lastTime)); // TB HDR
319 sizeChk += streamSize8; // in stream buffer
320 sizeChk += (lastTime != tmpBuffer[k].getTimeStamp()) && ((sizeChk + (streamSize * encodeBits + 7) / 8) & 1); // time bin alignment
321 sizeChk += (tmpBuffer[k].getTimeStamp() != lastTime || tmpBuffer[k].getRow() != lastRow) ? 3 : 0; // new row overhead
322 sizeChk += (lastTime != -1 && tmpBuffer[k].getTimeStamp() > lastTime) ? ((tmpBuffer[k].getTimeStamp() - lastTime - 1) * 2) : 0; // empty time bins
323 sizeChk += 2; // sequence metadata
324 const uint32_t streamSizeChkBits = streamSize * encodeBits + ((lastTime != tmpBuffer[k].getTimeStamp() && (streamSize * encodeBits) % 8) ? (8 - (streamSize * encodeBits) % 8) : 0);
325 if (sizeChk + (encodeBits + streamSizeChkBits + 7) / 8 > TPCZSHDR::TPC_ZS_PAGE_SIZE) {
326 lastEndpoint = -1;
327 } else if (sizeChk + (seqLen * encodeBits + streamSizeChkBits + 7) / 8 > TPCZSHDR::TPC_ZS_PAGE_SIZE) {
328 seqLen = ((TPCZSHDR::TPC_ZS_PAGE_SIZE - sizeChk) * 8 - streamSizeChkBits) / encodeBits;
329 }
330 // sizeChk += (seqLen * encodeBits + streamSizeChkBits + 7) / 8;
331 // printf("Endpoint %d (%d), Pos %d, Chk %d, Len %d, rows %d, StreamSize %d %d, time %d (%d), row %d (%d), pad %d\n", endpoint, lastEndpoint, (int32_t) (pagePtr - reinterpret_cast<uint8_t*>(page)), sizeChk, seqLen, nRowsInTB, streamSize8, streamSize, (int32_t)tmpBuffer[k].getTimeStamp(), lastTime, (int32_t)tmpBuffer[k].getRow(), lastRow, tmpBuffer[k].getPad());
332 }
333 return endpoint != lastEndpoint || tmpBuffer[k].getTimeStamp() != lastTime;
334}
335
336bool zsEncoderRow::writeSubPage()
337{
338 if (pagePtr != reinterpret_cast<uint8_t*>(page)) {
339 pagePtr += 2 * nRowsInTB;
340 ZSstreamOut(streamBuffer.data(), streamSize, streamBuffer8.data(), streamSize8, encodeBits);
341 pagePtr = std::copy(streamBuffer8.data(), streamBuffer8.data() + streamSize8, pagePtr);
342 if (pagePtr - reinterpret_cast<uint8_t*>(page) > 8192) {
343 throw std::runtime_error("internal error during ZS encoding");
344 }
345 streamSize8 = 0;
346 for (int32_t l = 1; l < nRowsInTB; l++) {
347 curTBHdr->rowAddr1()[l - 1] += 2 * nRowsInTB;
348 }
349 }
350 return endpoint != lastEndpoint;
351}
352
353uint32_t zsEncoderRow::encodeSequence(std::vector<o2::tpc::Digit>& tmpBuffer, uint32_t k)
354{
355 if (tmpBuffer[k].getTimeStamp() != lastTime) {
356 if (lastTime != -1) {
357 hdr->nTimeBinSpan += tmpBuffer[k].getTimeStamp() - lastTime - 1;
358 pagePtr += (tmpBuffer[k].getTimeStamp() - lastTime - 1) * 2;
359 }
360 hdr->nTimeBinSpan++;
361 if ((pagePtr - reinterpret_cast<uint8_t*>(page)) & 1) {
362 pagePtr++;
363 }
364 curTBHdr = reinterpret_cast<TPCZSTBHDR*>(pagePtr);
365 curTBHdr->rowMask |= (endpoint & 1) << 15;
366 nRowsInTB = 0;
367 lastRow = GPUCA_ROW_COUNT;
368 }
369 if (tmpBuffer[k].getRow() != lastRow) {
370 curTBHdr->rowMask |= 1 << (tmpBuffer[k].getRow() - endpointStart);
371 ZSstreamOut(streamBuffer.data(), streamSize, streamBuffer8.data(), streamSize8, encodeBits);
372 if (nRowsInTB) {
373 curTBHdr->rowAddr1()[nRowsInTB - 1] = (pagePtr - reinterpret_cast<uint8_t*>(page)) + streamSize8;
374 }
375 nRowsInTB++;
376 nSeq = streamBuffer8.data() + streamSize8++;
377 *nSeq = 0;
378 }
379 (*nSeq)++;
380 streamBuffer8[streamSize8++] = tmpBuffer[k].getPad();
381 streamBuffer8[streamSize8++] = streamSize + seqLen;
382 for (int32_t l = 0; l < seqLen; l++) {
383 streamBuffer[streamSize++] = (uint16_t)(tmpBuffer[k + l].getChargeFloat() * encodeBitsFactor + 0.5f);
384 }
385 return seqLen;
386}
387
388void zsEncoderRow::decodePage(std::vector<o2::tpc::Digit>& outputBuffer, const zsPage* decPage, uint32_t decEndpoint, uint32_t firstOrbit, uint32_t triggerBC)
389{
390 const uint8_t* decPagePtr = reinterpret_cast<const uint8_t*>(decPage);
391 const o2::header::RAWDataHeader* rdh = (const o2::header::RAWDataHeader*)decPagePtr;
392 if (o2::raw::RDHUtils::getMemorySize(*rdh) == sizeof(o2::header::RAWDataHeader)) {
393 return;
394 }
395 decPagePtr += sizeof(o2::header::RAWDataHeader);
396 const TPCZSHDR* decHDR = reinterpret_cast<const TPCZSHDR*>(decPagePtr);
397 decPagePtr += sizeof(*decHDR);
398 if (decHDR->version != 1 && decHDR->version != 2) {
399 throw std::runtime_error("invalid ZS version "s + std::to_string(decHDR->version) + " (1 or 2 expected)"s);
400 }
401 const float decodeBitsFactor = 1.f / (1 << (encodeBits - 10));
402 uint32_t mask = (1 << encodeBits) - 1;
403 int32_t cruid = decHDR->cruID;
404 uint32_t sector = cruid / 10;
405 if (sector != iSector) {
406 throw std::runtime_error("invalid TPC sector");
407 }
408 int32_t region = cruid % 10;
409 if ((uint32_t)region != decEndpoint / 2) {
410 throw std::runtime_error("CRU ID / endpoint mismatch");
411 }
412 int32_t nRowsRegion = GPUTPCGeometry::GetRegionRows(region);
413
414 int32_t timeBin = (decHDR->timeOffset + (uint64_t)(o2::raw::RDHUtils::getHeartBeatOrbit(*rdh) - firstOrbit) * o2::constants::lhc::LHCMaxBunches) / LHCBCPERTIMEBIN;
415 for (int32_t l = 0; l < decHDR->nTimeBinSpan; l++) {
416 if ((decPagePtr - reinterpret_cast<const uint8_t*>(decPage)) & 1) {
417 decPagePtr++;
418 }
419 const TPCZSTBHDR* tbHdr = reinterpret_cast<const TPCZSTBHDR*>(decPagePtr);
420 bool upperRows = tbHdr->rowMask & 0x8000;
421 if (tbHdr->rowMask != 0 && ((upperRows) ^ ((decEndpoint & 1) != 0))) {
422 throw std::runtime_error("invalid endpoint");
423 }
424 const int32_t rowOffset = GPUTPCGeometry::GetRegionStart(region) + (upperRows ? (nRowsRegion / 2) : 0);
425 const int32_t nRows = upperRows ? (nRowsRegion - nRowsRegion / 2) : (nRowsRegion / 2);
426 const int32_t nRowsUsed = __builtin_popcount((uint32_t)(tbHdr->rowMask & 0x7FFF));
427 decPagePtr += nRowsUsed ? (2 * nRowsUsed) : 2;
428 int32_t rowPos = 0;
429 for (int32_t m = 0; m < nRows; m++) {
430 if ((tbHdr->rowMask & (1 << m)) == 0) {
431 continue;
432 }
433 const uint8_t* rowData = rowPos == 0 ? decPagePtr : (reinterpret_cast<const uint8_t*>(decPage) + tbHdr->rowAddr1()[rowPos - 1]);
434 const int32_t nSeqRead = *rowData;
435 const uint8_t* adcData = rowData + 2 * nSeqRead + 1;
436 int32_t nADC = (rowData[2 * nSeqRead] * encodeBits + 7) / 8;
437 decPagePtr += 1 + 2 * nSeqRead + nADC;
438 uint32_t byte = 0, bits = 0, posXbits = 0;
439 std::array<uint16_t, TPCZSHDR::TPC_ZS_PAGE_SIZE> decBuffer;
440 for (int32_t n = 0; n < nADC; n++) {
441 byte |= *(adcData++) << bits;
442 bits += 8;
443 while (bits >= encodeBits) {
444 decBuffer[posXbits++] = byte & mask;
445 byte = byte >> encodeBits;
446 bits -= encodeBits;
447 }
448 }
449 posXbits = 0;
450 for (int32_t n = 0; n < nSeqRead; n++) {
451 const int32_t decSeqLen = rowData[(n + 1) * 2] - (n ? rowData[n * 2] : 0);
452 for (int32_t o = 0; o < decSeqLen; o++) {
453 outputBuffer.emplace_back(o2::tpc::Digit{cruid, decBuffer[posXbits++] * decodeBitsFactor, (tpccf::Row)(rowOffset + m), (tpccf::Pad)(rowData[n * 2 + 1] + o), timeBin + l});
454 }
455 }
456 rowPos++;
457 }
458 }
459}
460
461// ------------------------------------------------- TPC ZS Link Based ZS -------------------------------------------------
462
463#ifdef GPUCA_O2_LIB
464struct zsEncoderLinkBased : public zsEncoder {
465 TPCZSHDRV2* hdr = nullptr;
466 TPCZSHDRV2 hdrBuffer;
467 int32_t inverseChannelMapping[5][32];
468 int32_t nSamples = 0;
469 int32_t link = 0;
470 bool finishPage = false;
471 std::vector<uint16_t> adcValues = {};
472 std::bitset<80> bitmask = {};
473
474 void createBitmask(std::vector<o2::tpc::Digit>& tmpBuffer, uint32_t k);
475 void init();
476 bool sort(const o2::tpc::Digit a, const o2::tpc::Digit b);
477};
478
479void zsEncoderLinkBased::init()
480{
481 encodeBits = TPCZSHDRV2::TPC_ZS_NBITS_V34;
482 for (int32_t i = 0; i < 5; i++) {
483 for (int32_t j = 0; j < 32; j++) {
484 inverseChannelMapping[i][j] = -1;
485 }
486 }
487 for (int32_t iCRU = 0; iCRU < 2; iCRU++) {
488 for (int32_t iChannel = 0; iChannel < 80; iChannel++) {
489 int32_t sampaOnFEC = 0, channelOnSAMPA = 0;
490 Mapper::getSampaAndChannelOnFEC(iCRU, iChannel, sampaOnFEC, channelOnSAMPA);
491 if (inverseChannelMapping[sampaOnFEC][channelOnSAMPA] != -1 && inverseChannelMapping[sampaOnFEC][channelOnSAMPA] != iChannel) {
492 GPUError("ERROR: Channel conflict: %d %d: %d vs %d", sampaOnFEC, channelOnSAMPA, inverseChannelMapping[sampaOnFEC][channelOnSAMPA], iChannel);
493 throw std::runtime_error("ZS error");
494 }
495 inverseChannelMapping[sampaOnFEC][channelOnSAMPA] = iChannel;
496 }
497 }
498 for (int32_t i = 0; i < 5; i++) {
499 for (int32_t j = 0; j < 32; j++) {
500 if (inverseChannelMapping[i][j] == -1) {
501 GPUError("ERROR: Map missing for sampa %d channel %d", i, j);
502 throw std::runtime_error("ZS error");
503 }
504 }
505 }
506}
507
508void zsEncoderLinkBased::createBitmask(std::vector<o2::tpc::Digit>& tmpBuffer, uint32_t k)
509{
510 const auto& mapper = Mapper::instance();
511 nSamples = 0;
512 adcValues.clear();
513 bitmask.reset();
514 uint32_t l;
515 for (l = k; l < tmpBuffer.size(); l++) {
516 const auto& a = tmpBuffer[l];
517 int32_t cruinsector = GPUTPCGeometry::GetRegion(a.getRow());
518 o2::tpc::GlobalPadNumber pad = mapper.globalPadNumber(o2::tpc::PadPos(a.getRow(), a.getPad()));
519 o2::tpc::FECInfo fec = mapper.fecInfo(pad);
520 o2::tpc::CRU cru = cruinsector;
521 int32_t fecInPartition = fec.getIndex() - mapper.getPartitionInfo(cru.partition()).getSectorFECOffset();
522 int32_t tmpEndpoint = 2 * cruinsector + (fecInPartition >= (mapper.getPartitionInfo(cru.partition()).getNumberOfFECs() + 1) / 2);
523 if (l == k) {
524 link = fecInPartition;
525 endpoint = tmpEndpoint;
526 } else if (endpoint != tmpEndpoint || link != fecInPartition || tmpBuffer[l].getTimeStamp() != tmpBuffer[k].getTimeStamp()) {
527 break;
528 }
529 int32_t channel = inverseChannelMapping[fec.getSampaChip()][fec.getSampaChannel()];
530 bitmask[channel] = 1;
531 adcValues.emplace_back((uint16_t)(a.getChargeFloat() * encodeBitsFactor + 0.5f));
532 }
533 nSamples = l - k;
534}
535
536bool zsEncoderLinkBased::sort(const o2::tpc::Digit a, const o2::tpc::Digit b)
537{
538 // Fixme: this is blasphemy... one shoult precompute all values and sort an index array
539 int32_t cruinsectora = GPUTPCGeometry::GetRegion(a.getRow());
540 int32_t cruinsectorb = GPUTPCGeometry::GetRegion(b.getRow());
541 if (cruinsectora != cruinsectorb) {
542 return cruinsectora < cruinsectorb;
543 }
544 const auto& mapper = Mapper::instance();
545 o2::tpc::GlobalPadNumber pada = mapper.globalPadNumber(o2::tpc::PadPos(a.getRow(), a.getPad()));
546 o2::tpc::GlobalPadNumber padb = mapper.globalPadNumber(o2::tpc::PadPos(b.getRow(), b.getPad()));
547 o2::tpc::FECInfo feca = mapper.fecInfo(pada);
548 o2::tpc::FECInfo fecb = mapper.fecInfo(padb);
549 o2::tpc::CRU cru = cruinsectora;
550 int32_t fecInPartitiona = feca.getIndex() - mapper.getPartitionInfo(cru.partition()).getSectorFECOffset();
551 int32_t fecInPartitionb = fecb.getIndex() - mapper.getPartitionInfo(cru.partition()).getSectorFECOffset();
552
553 int32_t endpointa = 2 * cruinsectora + (fecInPartitiona >= (mapper.getPartitionInfo(cru.partition()).getNumberOfFECs() + 1) / 2);
554 int32_t endpointb = 2 * cruinsectorb + (fecInPartitionb >= (mapper.getPartitionInfo(cru.partition()).getNumberOfFECs() + 1) / 2);
555 if (endpointa != endpointb) {
556 return endpointa < endpointb;
557 }
558 if (a.getTimeStamp() != b.getTimeStamp()) {
559 return a.getTimeStamp() < b.getTimeStamp();
560 }
561 if (fecInPartitiona != fecInPartitionb) {
562 return fecInPartitiona < fecInPartitionb;
563 }
564 return inverseChannelMapping[feca.getSampaChip()][feca.getSampaChannel()] < inverseChannelMapping[fecb.getSampaChip()][fecb.getSampaChannel()];
565}
566
567// ------------------------------------------------- TPC Improved Link Based ZS -------------------------------------------------
568
569struct zsEncoderImprovedLinkBased : public zsEncoderLinkBased {
570 bool checkInput(std::vector<o2::tpc::Digit>& tmpBuffer, uint32_t k);
571 uint32_t encodeSequence(std::vector<o2::tpc::Digit>& tmpBuffer, uint32_t k);
572 void decodePage(std::vector<o2::tpc::Digit>& outputBuffer, const zsPage* page, uint32_t endpoint, uint32_t firstOrbit, uint32_t triggerBC = 0);
573 bool writeSubPage();
574 void initPage();
575
576 constexpr static int32_t RAWLNK = rdh_utils::ILBZSLinkID;
577};
578
579bool zsEncoderImprovedLinkBased::checkInput(std::vector<o2::tpc::Digit>& tmpBuffer, uint32_t k)
580{
581 createBitmask(tmpBuffer, k);
582 finishPage = endpoint != lastEndpoint;
583 if (firstTimebinInPage != -1 && tmpBuffer[k].getTimeStamp() - firstTimebinInPage >= 1 << (sizeof(hdr->nTimeBinSpan) * 8)) {
584 finishPage = true;
585 }
586 if (!finishPage) {
587 uint32_t sizeChk = (uint32_t)(pagePtr - reinterpret_cast<uint8_t*>(page));
590 sizeChk += (nSamples * TPCZSHDRV2::TPC_ZS_NBITS_V34 + 127) / 128 * 16;
591 } else {
592 sizeChk += (nSamples + 2 * TPCZSHDRV2::SAMPLESPER64BIT - 1) / (2 * TPCZSHDRV2::SAMPLESPER64BIT) * 16;
593 }
594 if (sizeChk > TPCZSHDR::TPC_ZS_PAGE_SIZE) {
595 finishPage = true;
596 }
597 }
598 return finishPage;
599}
600
601uint32_t zsEncoderImprovedLinkBased::encodeSequence(std::vector<o2::tpc::Digit>& tmpBuffer, uint32_t k)
602{
604 pagePtr += sizeof(*tbHdr);
605 tbHdr->bunchCrossing = (tmpBuffer[k].getTimeStamp() - firstTimebinInPage) * LHCBCPERTIMEBIN;
607 tbHdr->bitMaskHigh = (bitmask >> 64).to_ulong();
608 tbHdr->bitMaskLow = (bitmask & std::bitset<80>(0xFFFFFFFFFFFFFFFFlu)).to_ulong();
609 tbHdr->syncOffsetBC = 0;
610 tbHdr->fecInPartition = link;
611 hdr->nTimeBinSpan = tmpBuffer[k].getTimeStamp() - firstTimebinInPage;
612 hdr->nTimebinHeaders++;
614 tbHdr->numWordsPayload = (nSamples * TPCZSHDRV2::TPC_ZS_NBITS_V34 + 127) / 128; // tightly packed ADC samples
615 uint32_t tmp = 0;
616 uint32_t tmpIn = nSamples;
617 ZSstreamOut(adcValues.data(), tmpIn, pagePtr, tmp, encodeBits);
618 } else {
619 tbHdr->numWordsPayload = (nSamples + 2 * TPCZSHDRV2::SAMPLESPER64BIT - 1) / (2 * TPCZSHDRV2::SAMPLESPER64BIT);
620 uint64_t* payloadPtr = (uint64_t*)pagePtr;
621 for (uint32_t i = 0; i < 2 * tbHdr->numWordsPayload; i++) {
622 payloadPtr[i] = 0;
623 }
624 for (uint32_t i = 0; i < nSamples; i++) {
625 payloadPtr[i / TPCZSHDRV2::SAMPLESPER64BIT] |= ((uint64_t)adcValues[i]) << ((i % TPCZSHDRV2::SAMPLESPER64BIT) * TPCZSHDRV2::TPC_ZS_NBITS_V34);
626 }
627 }
628 pagePtr += tbHdr->numWordsPayload * 16;
629 return nSamples;
630}
631
632bool zsEncoderImprovedLinkBased::writeSubPage()
633{
634 return finishPage;
635}
636
637void zsEncoderImprovedLinkBased::initPage()
638{
640 hdr->nTimebinHeaders = 0;
641 hdr->firstZSDataOffset = 0;
642}
643
644void zsEncoderImprovedLinkBased::decodePage(std::vector<o2::tpc::Digit>& outputBuffer, const zsPage* decPage, uint32_t decEndpoint, uint32_t firstOrbit, uint32_t triggerBC)
645{
646 const auto& mapper = Mapper::instance();
647 const uint8_t* decPagePtr = reinterpret_cast<const uint8_t*>(decPage);
648 const o2::header::RAWDataHeader* rdh = (const o2::header::RAWDataHeader*)decPagePtr;
649 if (o2::raw::RDHUtils::getMemorySize(*rdh) == sizeof(o2::header::RAWDataHeader)) {
650 return;
651 }
652 decPagePtr += sizeof(o2::header::RAWDataHeader);
653 const TPCZSHDRV2* decHDR = reinterpret_cast<const TPCZSHDRV2*>(decPagePtr);
654 decPagePtr += sizeof(*decHDR);
655 if (decHDR->version != ZSVersion::ZSVersionLinkBasedWithMeta) {
656 throw std::runtime_error("invalid ZS version "s + std::to_string(decHDR->version) + " ("s + std::to_string(ZSVersion::ZSVersionLinkBasedWithMeta) + " expected)"s);
657 }
659 throw std::runtime_error("Magic word missing");
660 }
661 const float decodeBitsFactor = 1.f / (1 << (encodeBits - 10));
662 uint32_t mask = (1 << encodeBits) - 1;
663 int32_t cruid = decHDR->cruID;
664 uint32_t sector = cruid / 10;
665 if (sector != iSector) {
666 throw std::runtime_error("invalid TPC sector");
667 }
668 int32_t region = cruid % 10;
669 decPagePtr += decHDR->firstZSDataOffset * 16;
670 for (uint32_t i = 0; i < decHDR->nTimebinHeaders; i++) {
672#if 0 // Decoding using the function for the original linkZS
673 o2::tpc::CRU cru = cruid % 10;
674 const int32_t feeLink = tbHdr->fecInPartition - (decEndpoint & 1) * ((mapper.getPartitionInfo(cru.partition()).getNumberOfFECs() + 1) / 2);
675 auto fillADC = [&outputBuffer](int32_t cru, int32_t rowInSector, int32_t padInRow, int32_t timeBin, float adcValue) {
676 outputBuffer.emplace_back(o2::tpc::Digit{cruid, adcValue, rowInSector, padInRow, timeBin});
677 return true;
678 };
679 size_t size = sizeof(*tbHdr) + tbHdr->numWordsPayload * 16;
680 raw_processing_helpersa::processZSdata((const char*)decPagePtr, size, rdh_utils::getFEEID(cruid, decEndpoint & 1, feeLink), o2::raw::RDHUtils::getHeartBeatOrbit(*rdh), firstOrbit, decHDR->timeOffset, fillADC);
681#else // Decoding directly
682 if (!tbHdr->isLinkZS()) {
683 throw std::runtime_error("ZS TB Hdr does not have linkZS magic word");
684 }
685 int32_t timeBin = (int32_t(decHDR->timeOffset) + int32_t(tbHdr->bunchCrossing) + (int32_t)(o2::raw::RDHUtils::getHeartBeatOrbit(*rdh) - firstOrbit) * o2::constants::lhc::LHCMaxBunches - triggerBC) / LHCBCPERTIMEBIN;
686 if (timeBin < 0) {
687 LOGP(debug, "zsEncoderImprovedLinkBased::decodePage skipping digits hdr->tOff {} + hdr->bc {} + (orbit {} - firstOrbit {}) * maxBunch {} - triggerBC {} = {} < 0", decHDR->timeOffset, tbHdr->bunchCrossing, o2::raw::RDHUtils::getHeartBeatOrbit(*rdh), firstOrbit, o2::constants::lhc::LHCMaxBunches, triggerBC, timeBin);
688 continue;
689 }
690 const uint8_t* adcData = (const uint8_t*)(decPagePtr + sizeof(*tbHdr));
691 const auto& bitmask = tbHdr->getChannelBits();
692 int32_t nADC = bitmask.count();
693 std::vector<uint16_t> decBuffer(nADC);
695 uint32_t byte = 0, bits = 0, posXbits = 0;
696 while (posXbits < nADC) {
697 byte |= *(adcData++) << bits;
698 bits += 8;
699 while (bits >= encodeBits) {
700 decBuffer[posXbits++] = byte & mask;
701 byte = byte >> encodeBits;
702 bits -= encodeBits;
703 }
704 }
705 } else {
706 const uint64_t* adcData64 = (const uint64_t*)adcData;
707 for (int32_t j = 0; j < nADC; j++) {
709 }
710 }
711 for (int32_t j = 0, k = 0; j < bitmask.size(); j++) {
712 if (bitmask[j]) {
713 int32_t sampaOnFEC = 0, channelOnSAMPA = 0;
714 mapper.getSampaAndChannelOnFEC(cruid, j, sampaOnFEC, channelOnSAMPA);
715 const auto padSecPos = mapper.padSecPos(cruid, tbHdr->fecInPartition, sampaOnFEC, channelOnSAMPA);
716 const auto& padPos = padSecPos.getPadPos();
717 outputBuffer.emplace_back(o2::tpc::Digit{cruid, decBuffer[k++] * decodeBitsFactor, (tpccf::Row)padPos.getRow(), (tpccf::Pad)padPos.getPad(), timeBin});
718 }
719 }
720#endif
721 decPagePtr += sizeof(*tbHdr) + tbHdr->numWordsPayload * 16;
722 }
723}
724
725// ------------------------------------------------- TPC ZS Dense Link Based ZS -------------------------------------------------
726
727struct zsEncoderDenseLinkBased : public zsEncoderLinkBased {
728 bool checkInput(std::vector<o2::tpc::Digit>& tmpBuffer, uint32_t k);
729 uint32_t encodeSequence(std::vector<o2::tpc::Digit>& tmpBuffer, uint32_t k);
730 void decodePage(std::vector<o2::tpc::Digit>& outputBuffer, const zsPage* page, uint32_t endpoint, uint32_t firstOrbit, uint32_t triggerBC = 0);
731 bool writeSubPage();
732 void initPage();
733 void amendPageErrorMessage(std::ostringstream& oss, const o2::header::RAWDataHeader* rdh, const TPCZSHDRV2* decHDR, const uint8_t* payloadEnd, const uint8_t* decPagePtr, uint32_t nOutput);
734
735 uint16_t curTimeBin = 0;
736 std::vector<uint8_t> sequenceBuffer;
737 std::vector<uint16_t> sequenceBufferADC;
738
739 constexpr static int32_t RAWLNK = rdh_utils::DLBZSLinkID;
740 constexpr static int32_t v2nbits = 10;
741};
742
743bool zsEncoderDenseLinkBased::checkInput(std::vector<o2::tpc::Digit>& tmpBuffer, uint32_t k)
744{
745 createBitmask(tmpBuffer, k);
746 finishPage = endpoint != lastEndpoint;
747 uint16_t newTimeBin = tmpBuffer[k].getTimeStamp() - firstTimebinInPage;
748 bool retVall = finishPage || newTimeBin != curTimeBin;
749 return retVall;
750}
751
752uint32_t zsEncoderDenseLinkBased::encodeSequence(std::vector<o2::tpc::Digit>& tmpBuffer, uint32_t k)
753{
754 if (sequenceBuffer.size() == 0) {
755 uint16_t bc = (int64_t)tmpBuffer[k].getTimeStamp() * LHCBCPERTIMEBIN - (int64_t)hbf * o2::constants::lhc::LHCMaxBunches;
756 if (zsVersion == ZSVersion::ZSVersionDenseLinkBasedV2) {
757 bc &= 0xFFC;
758 }
759 sequenceBuffer.emplace_back(bc << 4);
760 sequenceBuffer.emplace_back(bc >> 4);
761 curTimeBin = tmpBuffer[k].getTimeStamp() - firstTimebinInPage;
762 hdr->nTimeBinSpan = curTimeBin & 0xFF;
763 if (curTimeBin & 0x100) {
764 hdr->flags |= TPCZSHDRV2::ZSFlags::nTimeBinSpanBit8;
765 }
766 hdr->nTimebinHeaders++;
767 }
768 sequenceBuffer[0]++;
769
770 sequenceBuffer.emplace_back(link);
771 uint8_t* plink = &sequenceBuffer.back();
772
773 std::bitset<10> bitmaskL2;
774 for (int32_t i = 9; i >= 0; i--) {
775 bitmaskL2.set(i, ((bitmask >> (i * 8)) & std::bitset<80>(0xFF)).any());
776 }
777 if (bitmaskL2.all()) {
778 *plink |= 0b00100000;
779 } else {
780 *plink |= (bitmaskL2.to_ulong() >> 2) & 0b11000000;
781 sequenceBuffer.emplace_back(bitmaskL2.to_ulong() & 0xFF);
782 }
783
784 for (int32_t i = 0; i < 10; i++) {
785 if (bitmaskL2.test(i)) {
786 sequenceBuffer.emplace_back(((bitmask >> (i * 8)) & std::bitset<80>(0xFF)).to_ulong());
787 }
788 }
789
790 static_assert(TPCZSHDRV2::TPC_ZS_NBITS_V34 == 12);
791 if (nSamples) {
792 sequenceBufferADC.insert(sequenceBufferADC.end(), adcValues.begin(), adcValues.end());
793 }
794
795 return nSamples;
796}
797
798bool zsEncoderDenseLinkBased::writeSubPage()
799{
800 uint32_t offset = sequenceBuffer.size();
801 if (sequenceBufferADC.size()) {
802 bool need12bit = zsVersion != ZSVersion::ZSVersionDenseLinkBasedV2;
803 uint32_t needNow = 0;
804 if (zsVersion == ZSVersion::ZSVersionDenseLinkBasedV2) {
805 for (uint32_t i = 0; i < sequenceBufferADC.size(); i++) {
806 if (sequenceBufferADC[i] >= (1 << v2nbits)) {
807 need12bit = true;
808 break;
809 }
810 }
811 }
812 uint32_t encodeBitsBlock = encodeBits;
813 if (!need12bit) {
814 encodeBitsBlock = v2nbits;
815 sequenceBuffer[0] |= 0x10;
816 }
817 sequenceBuffer.resize(offset + (sequenceBufferADC.size() * encodeBitsBlock + 7) / 8);
818 uint32_t tmp = 0;
819 uint32_t tmpIn = sequenceBufferADC.size();
820 ZSstreamOut(sequenceBufferADC.data(), tmpIn, sequenceBuffer.data() + offset, tmp, encodeBitsBlock);
821 sequenceBufferADC.clear();
822 }
823
824 if (sequenceBuffer.size()) {
825 uint32_t sizeLeft = TPCZSHDR::TPC_ZS_PAGE_SIZE - (pagePtr - (uint8_t*)page) - sizeof(TPCZSHDRV2) - (hdr->flags & TPCZSHDRV2::ZSFlags::TriggerWordPresent ? TPCZSHDRV2::TRIGGER_WORD_SIZE : 0);
826 uint32_t size = sequenceBuffer.size();
827 uint32_t fill = std::min(sizeLeft, size);
828 memcpy(pagePtr, sequenceBuffer.data(), fill);
829 pagePtr += fill;
830 if (size != fill) {
832 sequenceBuffer.erase(sequenceBuffer.begin(), sequenceBuffer.begin() + fill);
833 } else {
834 sequenceBuffer.clear();
835 }
836 finishPage = finishPage || size >= sizeLeft || needAnotherPage;
837 }
838
839 return finishPage;
840}
841
842void zsEncoderDenseLinkBased::initPage()
843{
845 hdr->nTimebinHeaders = 0;
846 memcpy(pagePtr, sequenceBuffer.data(), sequenceBuffer.size());
847 hdr->firstZSDataOffset = sequenceBuffer.size() + sizeof(o2::header::RAWDataHeader);
848 pagePtr += sequenceBuffer.size();
849 sequenceBuffer.clear();
850 hdr->flags = 0;
851}
852
853void zsEncoderDenseLinkBased::decodePage(std::vector<o2::tpc::Digit>& outputBuffer, const zsPage* decPage, uint32_t decEndpoint, uint32_t firstOrbit, uint32_t triggerBC)
854{
855 const auto& mapper = Mapper::instance();
856 const uint8_t* decPagePtr = reinterpret_cast<const uint8_t*>(decPage);
857 const o2::header::RAWDataHeader* rdh = (const o2::header::RAWDataHeader*)decPagePtr;
858 if (o2::raw::RDHUtils::getMemorySize(*rdh) == sizeof(o2::header::RAWDataHeader)) {
859 return;
860 }
861 const TPCZSHDRV2* decHDR = reinterpret_cast<const TPCZSHDRV2*>(decPagePtr + o2::raw::RDHUtils::getMemorySize(*rdh) - sizeof(TPCZSHDRV2));
862 decPagePtr += sizeof(o2::header::RAWDataHeader);
863 if (decHDR->version < ZSVersion::ZSVersionDenseLinkBased || decHDR->version > ZSVersion::ZSVersionDenseLinkBasedV2) {
864 throw std::runtime_error("invalid ZS version "s + std::to_string(decHDR->version) + " ("s + std::to_string(ZSVersion::ZSVersionDenseLinkBased) + " - "s + std::to_string(ZSVersion::ZSVersionDenseLinkBasedV2) + " expected)"s);
865 }
867 throw std::runtime_error("Magic word missing");
868 }
869 const uint8_t* payloadEnd = ((const uint8_t*)decPage) + o2::raw::RDHUtils::getMemorySize(*rdh) - sizeof(TPCZSHDRV2) - ((decHDR->flags & TPCZSHDRV2::ZSFlags::TriggerWordPresent) ? TPCZSHDRV2::TRIGGER_WORD_SIZE : 0);
870 const float decodeBitsFactor = 1.f / (1 << (encodeBits - 10));
871 int32_t cruid = decHDR->cruID;
872 uint32_t sector = cruid / 10;
873 if (sector != iSector) {
874 throw std::runtime_error("invalid TPC sector");
875 }
876 int32_t region = cruid % 10;
877 decPagePtr += decHDR->firstZSDataOffset - sizeof(o2::header::RAWDataHeader);
878 std::vector<uint8_t> tmpBuffer;
879 bool extendFailure = false;
880 uint32_t nOutput = 0;
881 uint32_t minTimeBin = -1, maxTimeBin = 0;
882 for (uint32_t i = 0; i < decHDR->nTimebinHeaders; i++) {
883 int32_t sizeLeftInPage = payloadEnd - decPagePtr;
884 if (sizeLeftInPage <= 0) {
885 throw std::runtime_error("Decoding ran beyond end of page before processing extended timebin");
886 }
888 if (o2::raw::RDHUtils::getMemorySize(*rdh) != TPCZSHDR::TPC_ZS_PAGE_SIZE) {
889 throw std::runtime_error("pageExtends signaled, but current page is not full");
890 }
891
892 const uint8_t* pageNext = ((const uint8_t*)decPage) + TPCZSHDR::TPC_ZS_PAGE_SIZE;
893 const o2::header::RAWDataHeader* rdhNext = (const o2::header::RAWDataHeader*)pageNext;
894
895 if ((uint16_t)(o2::raw::RDHUtils::getPageCounter(*rdh) + 1) != o2::raw::RDHUtils::getPageCounter(*rdhNext)) {
896 GPUError("Incomplete HBF: Payload extended to next page, but next page missing in stream (packet counters %d %d)", (int32_t)o2::raw::RDHUtils::getPageCounter(*rdh), (int32_t)o2::raw::RDHUtils::getPageCounter(*rdhNext));
897 extendFailure = true;
898 decPagePtr = payloadEnd; // Next 8kb page is missing in stream, cannot decode remaining data, skip it
899 break;
900 }
901
902 const TPCZSHDRV2* hdrNext = reinterpret_cast<const TPCZSHDRV2*>(pageNext + o2::raw::RDHUtils::getMemorySize(*rdhNext) - sizeof(TPCZSHDRV2));
903 tmpBuffer.resize(sizeLeftInPage + hdrNext->firstZSDataOffset - sizeof(o2::header::RAWDataHeader));
904 memcpy(tmpBuffer.data(), decPagePtr, sizeLeftInPage);
905 memcpy(tmpBuffer.data() + sizeLeftInPage, pageNext + sizeof(o2::header::RAWDataHeader), hdrNext->firstZSDataOffset - sizeof(o2::header::RAWDataHeader));
906 decPagePtr = tmpBuffer.data();
907 payloadEnd = decPagePtr + tmpBuffer.size();
908 }
909 uint8_t linkCount = *((const uint8_t*)decPagePtr) & 0x0F;
910 uint16_t linkBC = (*((const uint16_t*)decPagePtr) & 0xFFF0) >> 4;
911 bool v2Flag = decHDR->version == ZSVersion::ZSVersionDenseLinkBasedV2 && *((const uint8_t*)decPagePtr) & 0x10;
912 if (decHDR->version == ZSVersion::ZSVersionDenseLinkBasedV2) {
913 linkBC &= 0xFFC;
914 }
915 decPagePtr += sizeof(uint16_t);
916 std::vector<int32_t> links;
917 std::vector<std::bitset<80>> bitmasks;
918 uint32_t nTotalSamples = 0;
919 for (uint32_t l = 0; l < linkCount; l++) {
920 uint8_t decLinkX = *((const uint8_t*)decPagePtr);
921 decPagePtr += sizeof(uint8_t);
922 uint8_t decLink = decLinkX & 0b00011111;
923 std::bitset<10> bitmaskL2;
924 if (decLinkX & 0b00100000) {
925 bitmaskL2.set();
926 } else {
927 bitmaskL2 = std::bitset<10>(((((uint16_t)decLinkX) & 0b11000000) << 2) | (uint16_t)*((const uint8_t*)decPagePtr));
928 decPagePtr += sizeof(uint8_t);
929 }
930
931 std::bitset<80> bitmask(0);
932 for (int32_t i = 0; i < 10; i++) {
933 if (bitmaskL2.test(i)) {
934 bitmask |= std::bitset<80>(*((const uint8_t*)decPagePtr)) << i * 8;
935 decPagePtr += sizeof(uint8_t);
936 }
937 }
938 links.emplace_back(decLink);
939 bitmasks.emplace_back(bitmask);
940 nTotalSamples += bitmask.count();
941 }
942
943 const uint8_t* adcData = (const uint8_t*)decPagePtr;
944 int32_t encodeBitsBlock = v2Flag ? v2nbits : encodeBits;
945 decPagePtr += (nTotalSamples * encodeBitsBlock + 7) / 8;
946
947 // time bin might be smaller 0 due to triggerBC
948 int32_t timeBin = (int32_t(linkBC) + (int32_t)(o2::raw::RDHUtils::getHeartBeatOrbit(*rdh) - firstOrbit) * o2::constants::lhc::LHCMaxBunches - int32_t(triggerBC)) / LHCBCPERTIMEBIN;
949 if (timeBin < 0 || nTotalSamples == 0) {
950 if (timeBin < 0 && nTotalSamples > 0) {
951 LOGP(debug, "zsEncoderDenseLinkBased::decodePage skipping digits (linkBC {} + orbit {} - firstOrbit {}) * maxBunch {} - triggerBC {} = {} < 0, nTotalSamples {}", linkBC, o2::raw::RDHUtils::getHeartBeatOrbit(*rdh), firstOrbit, o2::constants::lhc::LHCMaxBunches, triggerBC, timeBin, nTotalSamples);
952 }
953 continue;
954 }
955 if (timeBin > maxTimeBin) {
956 maxTimeBin = timeBin;
957 }
958 if (timeBin < minTimeBin) {
959 minTimeBin = timeBin;
960 }
961
962 std::vector<uint16_t> samples(nTotalSamples);
963 uint32_t mask = (1 << encodeBitsBlock) - 1;
964 uint32_t byte = 0, bits = 0, posXbits = 0;
965 while (posXbits < nTotalSamples) {
966 byte |= *(adcData++) << bits;
967 bits += 8;
968 while (bits >= encodeBitsBlock && posXbits < nTotalSamples) {
969 samples[posXbits++] = byte & mask;
970 byte = byte >> encodeBitsBlock;
971 bits -= encodeBitsBlock;
972 }
973 }
974 uint32_t samplePos = 0;
975
976 for (uint32_t l = 0; l < linkCount; l++) {
977 uint8_t decLink = links[l];
978 const auto& bitmask = bitmasks[l];
979 int32_t nADC = bitmask.count();
980
981 for (int32_t j = 0; j < bitmask.size(); j++) {
982 if (bitmask[j]) {
983 int32_t sampaOnFEC = 0, channelOnSAMPA = 0;
984 mapper.getSampaAndChannelOnFEC(cruid, j, sampaOnFEC, channelOnSAMPA);
985 const auto padSecPos = mapper.padSecPos(cruid, decLink, sampaOnFEC, channelOnSAMPA);
986 const auto& padPos = padSecPos.getPadPos();
987 outputBuffer.emplace_back(o2::tpc::Digit{cruid, samples[samplePos++] * decodeBitsFactor, (tpccf::Row)padPos.getRow(), (tpccf::Pad)padPos.getPad(), timeBin});
988 nOutput++;
989 }
990 }
991 }
992 }
993
994 int32_t hdrMinTimeBin = (int32_t(decHDR->timeOffset) + int32_t(o2::raw::RDHUtils::getHeartBeatOrbit(*rdh) - firstOrbit) * o2::constants::lhc::LHCMaxBunches - triggerBC);
995 if (triggerBC > 0 && hdrMinTimeBin < 0) {
996 hdrMinTimeBin = 0;
997 }
998 hdrMinTimeBin /= LHCBCPERTIMEBIN;
999 int32_t hdrMaxTimeBin = hdrMinTimeBin + decHDR->nTimeBinSpan + ((decHDR->flags & TPCZSHDRV2::ZSFlags::nTimeBinSpanBit8) ? 256 : 0);
1000
1001 if (!extendFailure && nOutput != decHDR->nADCsamples) {
1002 std::ostringstream oss;
1003 oss << "Number of decoded digits " << nOutput << " does not match value from MetaInfo " << decHDR->nADCsamples;
1004 amendPageErrorMessage(oss, rdh, decHDR, nullptr, nullptr, nOutput);
1005 throw std::runtime_error(oss.str());
1006 }
1007
1008 if (decHDR->nADCsamples && (minTimeBin < hdrMinTimeBin || maxTimeBin > hdrMaxTimeBin)) {
1009 std::ostringstream oss;
1010 oss << "Incorrect time bin range in MetaInfo, header reports " << hdrMinTimeBin << " - " << hdrMaxTimeBin << "(timeOffset: " << decHDR->timeOffset << " + (orbit: " << o2::raw::RDHUtils::getHeartBeatOrbit(*rdh) << " - firstOrbit " << firstOrbit << ") * LHCMaxBunches - triggerBC: " << triggerBC << ", decoded data is " << minTimeBin << " - " << maxTimeBin;
1011 amendPageErrorMessage(oss, rdh, decHDR, payloadEnd, decPagePtr, nOutput);
1012 throw std::runtime_error(oss.str());
1013 }
1014
1015 if (decHDR->nTimebinHeaders && payloadEnd - decPagePtr < 0) {
1016 std::ostringstream oss;
1017 oss << "Decoding ran over end of page";
1018 amendPageErrorMessage(oss, rdh, decHDR, payloadEnd, decPagePtr, nOutput);
1019 throw std::runtime_error(oss.str());
1020 }
1021 if (decHDR->nTimebinHeaders && payloadEnd - decPagePtr >= 2 * o2::raw::RDHUtils::GBTWord128) {
1022 std::ostringstream oss;
1023 oss << "Decoding didn't reach end of page";
1024 amendPageErrorMessage(oss, rdh, decHDR, payloadEnd, decPagePtr, nOutput);
1025 throw std::runtime_error(oss.str());
1026 }
1027}
1028
1029void zsEncoderDenseLinkBased::amendPageErrorMessage(std::ostringstream& oss, const o2::header::RAWDataHeader* rdh, const TPCZSHDRV2* decHDR, const uint8_t* payloadEnd, const uint8_t* decPagePtr, uint32_t nOutput)
1030{
1031 if (payloadEnd && decPagePtr) {
1032 oss << " (payloadEnd " << (void*)payloadEnd << " - decPagePtr " << (void*)decPagePtr << " - " << (payloadEnd - decPagePtr) << " bytes left, " << nOutput << " of " << decHDR->nADCsamples << " digits decoded)\n";
1033 } else {
1034 oss << "\n";
1035 }
1036 constexpr size_t bufferSize = 3 * std::max(sizeof(*rdh), sizeof(*decHDR)) + 1;
1037 char dumpBuffer[bufferSize];
1038 for (size_t i = 0; i < sizeof(*rdh); i++) {
1039 snprintf(dumpBuffer + 3 * i, 4, "%02X ", (int32_t)((uint8_t*)rdh)[i]);
1040 }
1041 oss << "RDH of page: " << dumpBuffer << "\n";
1042 for (size_t i = 0; i < sizeof(*decHDR); i++) {
1043 snprintf(dumpBuffer + 3 * i, 4, "%02X ", (int32_t)((uint8_t*)decHDR)[i]);
1044 }
1045 oss << "Meta header of page: " << dumpBuffer << "\n";
1046}
1047
1048#endif // GPUCA_O2_LIB
1049
1050// ------------------------------------------------- TPC ZS Main Encoder -------------------------------------------------
1051
1052template <class T>
1053struct zsEncoderRun : public T {
1054 uint32_t run(std::vector<zsPage>* buffer, std::vector<o2::tpc::Digit>& tmpBuffer, size_t* totalSize = nullptr);
1055 size_t compare(std::vector<zsPage>* buffer, std::vector<o2::tpc::Digit>& tmpBuffer);
1056
1057 using T::bcShiftInFirstHBF;
1058 using T::checkInput;
1059 using T::curRegion;
1060 using T::decodePage;
1061 using T::encodeBits;
1062 using T::encodeBitsFactor;
1063 using T::encodeSequence;
1064 using T::endpoint;
1065 using T::firstTimebinInPage;
1066 using T::getHbf;
1067 using T::hbf;
1068 using T::hdr;
1069 using T::init;
1070 using T::initPage;
1071 using T::ir;
1072 using T::iSector;
1073 using T::lastEndpoint;
1074 using T::lastRow;
1075 using T::lastTime;
1076 using T::needAnotherPage;
1077 using T::nexthbf;
1078 using T::outputEndpoint;
1079 using T::outputRegion;
1080 using T::packetCounter;
1081 using T::padding;
1082 using T::page;
1083 using T::pageCounter;
1084 using T::pagePtr;
1085 using T::param;
1086 using T::raw;
1087 using T::sort;
1088 using T::writeSubPage;
1089 using T::ZSfillEmpty;
1090 using T::zsVersion;
1091};
1092
1093template <class T>
1094inline uint32_t zsEncoderRun<T>::run(std::vector<zsPage>* buffer, std::vector<o2::tpc::Digit>& tmpBuffer, size_t* totalSize)
1095{
1096 uint32_t totalPages = 0;
1097 zsPage singleBuffer;
1098#ifdef GPUCA_O2_LIB
1099 int32_t maxhbf = 0;
1100 int32_t minhbf = o2::constants::lhc::LHCMaxBunches;
1101#endif
1102 bcShiftInFirstHBF = ir ? ir->bc : 0;
1103 int32_t orbitShift = ir ? ir->orbit : 0;
1104 int32_t rawcru = 0;
1105 int32_t rawendpoint = 0;
1106 (void)(rawcru + rawendpoint); // avoid compiler warning
1107 encodeBitsFactor = (1 << (encodeBits - 10));
1108
1109 std::sort(tmpBuffer.begin(), tmpBuffer.end(), [this](const o2::tpc::Digit a, const o2::tpc::Digit b) { return sort(a, b); });
1110 for (uint32_t k = 0; k <= tmpBuffer.size();) {
1111 bool mustWritePage = false, mustWriteSubPage = false;
1112 if (needAnotherPage) {
1113 needAnotherPage = false;
1114 mustWritePage = true;
1115 } else {
1116 if (k < tmpBuffer.size()) {
1117 if (tmpBuffer[k].getTimeStamp() != lastTime) {
1118 nexthbf = getHbf(tmpBuffer[k].getTimeStamp());
1119 if (nexthbf < 0) {
1120 throw std::runtime_error("Received digit before the defined first orbit");
1121 }
1122 if (hbf != nexthbf) {
1123 lastEndpoint = -2;
1124 mustWritePage = true;
1125 }
1126 }
1127 if (lastRow != tmpBuffer[k].getRow()) {
1128 curRegion = GPUTPCGeometry::GetRegion(tmpBuffer[k].getRow());
1129 }
1130 mustWriteSubPage = checkInput(tmpBuffer, k);
1131 } else {
1132 nexthbf = -1;
1133 mustWritePage = true;
1134 }
1135 }
1136 if (mustWritePage || mustWriteSubPage) {
1137 mustWritePage |= writeSubPage();
1138
1139 if (page && mustWritePage) {
1140 if constexpr (std::is_same_v<T, struct zsEncoderDenseLinkBased>) {
1141 if ((pagePtr - (uint8_t*)page) % o2::raw::RDHUtils::GBTWord128) {
1143 }
1144 uint8_t* triggerWord = nullptr;
1145 if (hbf != nexthbf || endpoint != lastEndpoint) {
1146 if ((pagePtr - (uint8_t*)page) + sizeof(TPCZSHDRV2) + o2::tpc::TPCZSHDRV2::TRIGGER_WORD_SIZE <= TPCZSHDR::TPC_ZS_PAGE_SIZE) {
1147 if ((pagePtr - (uint8_t*)page) % (2 * o2::raw::RDHUtils::GBTWord128)) {
1148 pagePtr += o2::raw::RDHUtils::GBTWord128; // align to 256 bit, size constrained cannot be affected by this
1149 }
1151 } else {
1152 needAnotherPage = true;
1153 }
1154 if (this->sequenceBuffer.size()) {
1155 needAnotherPage = true;
1156 }
1157 }
1158 if (hdr->flags & o2::tpc::TPCZSHDRV2::TriggerWordPresent) {
1159 triggerWord = pagePtr;
1161 }
1162 if ((pagePtr - (uint8_t*)page) % (2 * o2::raw::RDHUtils::GBTWord128) == 0) {
1163 pagePtr += o2::raw::RDHUtils::GBTWord128; // align to 128bit mod 256
1164 }
1165 TPCZSHDRV2* pagehdr = (TPCZSHDRV2*)pagePtr;
1166 pagePtr += sizeof(TPCZSHDRV2);
1167 if (pagePtr - (uint8_t*)page > TPCZSHDR::TPC_ZS_PAGE_SIZE) {
1168 throw std::runtime_error("TPC ZS page overflow");
1169 }
1170 memcpy(pagehdr, hdr, sizeof(*hdr));
1171 if (triggerWord) {
1172 memset(triggerWord, 0, o2::tpc::TPCZSHDRV2::TRIGGER_WORD_SIZE);
1173 }
1174 }
1175 const rdh_utils::FEEIDType rawfeeid = rdh_utils::getFEEID(rawcru, rawendpoint, this->RAWLNK);
1176 if (totalSize) {
1177 *totalSize += !std::is_same_v<T, struct zsEncoderDenseLinkBased> && (lastEndpoint == -1 || hbf == nexthbf) ? TPCZSHDR::TPC_ZS_PAGE_SIZE : (pagePtr - (uint8_t*)page);
1178 }
1179 size_t size = !std::is_same_v<T, struct zsEncoderDenseLinkBased> && (padding || lastEndpoint == -1 || hbf == nexthbf) ? TPCZSHDR::TPC_ZS_PAGE_SIZE : (pagePtr - (uint8_t*)page);
1180 size = CAMath::nextMultipleOf<o2::raw::RDHUtils::GBTWord128>(size);
1181#ifdef GPUCA_O2_LIB
1182 if (raw) {
1183 raw->addData(rawfeeid, rawcru, 0, rawendpoint, *ir + hbf * o2::constants::lhc::LHCMaxBunches, gsl::span<char>((char*)page + sizeof(o2::header::RAWDataHeader), (char*)page + size), true, 0, 2);
1184 maxhbf = std::max<int32_t>(maxhbf, hbf);
1185 minhbf = std::min<int32_t>(minhbf, hbf);
1186 } else
1187#endif
1188 {
1190 o2::raw::RDHUtils::setHeartBeatOrbit(*rdh, hbf + orbitShift);
1191 o2::raw::RDHUtils::setHeartBeatBC(*rdh, bcShiftInFirstHBF);
1193 o2::raw::RDHUtils::setVersion(*rdh, o2::raw::RDHUtils::getVersion<o2::header::RAWDataHeader>());
1194 o2::raw::RDHUtils::setFEEID(*rdh, rawfeeid);
1196 o2::raw::RDHUtils::setLinkID(*rdh, this->RAWLNK);
1197 o2::raw::RDHUtils::setPacketCounter(*rdh, packetCounter++);
1198 o2::raw::RDHUtils::setPageCounter(*rdh, pageCounter++);
1199 }
1200 }
1201 if (k >= tmpBuffer.size() && !needAnotherPage) {
1202 break;
1203 }
1204 }
1205 if (mustWritePage) {
1206 if (!needAnotherPage) {
1207 if (hbf != nexthbf) {
1208 pageCounter = 0;
1209 }
1210 outputRegion = curRegion;
1211 outputEndpoint = endpoint;
1212 hbf = nexthbf;
1213 lastTime = -1;
1214 lastEndpoint = endpoint;
1215 }
1216 if (raw) {
1217 page = &singleBuffer;
1218 } else {
1219 if (buffer[outputEndpoint].size() == 0 && nexthbf > orbitShift) {
1220 buffer[outputEndpoint].emplace_back();
1221 ZSfillEmpty(&buffer[outputEndpoint].back(), bcShiftInFirstHBF, rdh_utils::getFEEID(iSector * 10 + outputEndpoint / 2, outputEndpoint & 1, this->RAWLNK), orbitShift, this->RAWLNK); // Emplace empty page with RDH containing beginning of TF
1222 if (totalSize) {
1223 *totalSize += sizeof(o2::header::RAWDataHeader);
1224 }
1225 totalPages++;
1226 }
1227 buffer[outputEndpoint].emplace_back();
1228 page = &buffer[outputEndpoint].back();
1229 }
1230 pagePtr = reinterpret_cast<uint8_t*>(page);
1231 std::fill(page->begin(), page->end(), 0);
1232 pagePtr += sizeof(o2::header::RAWDataHeader);
1233 if constexpr (std::is_same_v<T, struct zsEncoderDenseLinkBased>) {
1234 hdr = &this->hdrBuffer;
1235 } else {
1236 hdr = reinterpret_cast<decltype(hdr)>(pagePtr);
1237 pagePtr += sizeof(*hdr);
1238 }
1239 hdr->version = zsVersion;
1240 hdr->cruID = iSector * 10 + outputRegion;
1241 hdr->nTimeBinSpan = 0;
1242 hdr->nADCsamples = 0;
1243 rawcru = iSector * 10 + outputRegion;
1244 rawendpoint = outputEndpoint & 1;
1245 hdr->timeOffset = (int64_t)(needAnotherPage ? firstTimebinInPage : tmpBuffer[k].getTimeStamp()) * LHCBCPERTIMEBIN - (int64_t)hbf * o2::constants::lhc::LHCMaxBunches;
1246 firstTimebinInPage = tmpBuffer[k].getTimeStamp();
1247 initPage();
1248 totalPages++;
1249 }
1250 if (needAnotherPage) {
1251 continue;
1252 }
1253 uint32_t nEncoded = encodeSequence(tmpBuffer, k);
1254 lastTime = tmpBuffer[k].getTimeStamp();
1255 lastRow = tmpBuffer[k].getRow();
1256 hdr->nADCsamples += nEncoded;
1257 k += nEncoded;
1258 }
1259 if (raw) {
1260#ifdef GPUCA_O2_LIB
1261 if (iSector == 0) {
1262 for (int32_t i = minhbf; i <= maxhbf; i++) {
1263 raw->addData(46208, 360, rdh_utils::SACLinkID, 0, *ir + i * o2::constants::lhc::LHCMaxBunches, gsl::span<char>((char*)&singleBuffer, (char*)&singleBuffer), true, 0, 4);
1264 }
1265 }
1266#endif
1267 } else {
1268 for (uint32_t j = 0; j < GPUTrackingInOutZS::NENDPOINTS; j++) {
1269 if (buffer[j].size() == 0) {
1270 buffer[j].emplace_back();
1271 ZSfillEmpty(&buffer[j].back(), bcShiftInFirstHBF, rdh_utils::getFEEID(iSector * 10 + j / 2, j & 1, this->RAWLNK), orbitShift, this->RAWLNK);
1272 totalPages++;
1273 }
1274 }
1275 }
1276 return totalPages;
1277}
1278
1279template <class T>
1280size_t zsEncoderRun<T>::compare(std::vector<zsPage>* buffer, std::vector<o2::tpc::Digit>& tmpBuffer)
1281{
1282 size_t nErrors = 0;
1283 std::vector<o2::tpc::Digit> compareBuffer;
1284 compareBuffer.reserve(tmpBuffer.size());
1285 for (uint32_t j = 0; j < GPUTrackingInOutZS::NENDPOINTS; j++) {
1286 uint32_t firstOrbit = ir ? ir->orbit : 0;
1287 for (uint32_t k = 0; k < buffer[j].size(); k++) {
1288 zsPage* decPage = &buffer[j][k];
1289 decodePage(compareBuffer, decPage, j, firstOrbit);
1290 }
1291 }
1292 if (tmpBuffer.size() != compareBuffer.size()) {
1293 nErrors += tmpBuffer.size();
1294 printf("Number of clusters mismatch %d %d\n", (int32_t)tmpBuffer.size(), (int32_t)compareBuffer.size());
1295 } else {
1296 for (uint32_t j = 0; j < tmpBuffer.size(); j++) {
1297 const float decodeBitsFactor = (1 << (encodeBits - 10));
1298 const float c = CAMath::Round(tmpBuffer[j].getChargeFloat() * decodeBitsFactor) / decodeBitsFactor;
1299 int32_t ok = c == compareBuffer[j].getChargeFloat() && (int32_t)tmpBuffer[j].getTimeStamp() == (int32_t)compareBuffer[j].getTimeStamp() && (int32_t)tmpBuffer[j].getPad() == (int32_t)compareBuffer[j].getPad() && (int32_t)tmpBuffer[j].getRow() == (int32_t)compareBuffer[j].getRow();
1300 if (ok) {
1301 continue;
1302 }
1303 nErrors++;
1304 printf("%4u: OK %d: Charge %3d %3d Time %4d %4d Pad %3d %3d Row %3d %3d\n", j, ok,
1305 (int32_t)c, (int32_t)compareBuffer[j].getChargeFloat(), (int32_t)tmpBuffer[j].getTimeStamp(), (int32_t)compareBuffer[j].getTimeStamp(), (int32_t)tmpBuffer[j].getPad(), (int32_t)compareBuffer[j].getPad(), (int32_t)tmpBuffer[j].getRow(), (int32_t)compareBuffer[j].getRow());
1306 }
1307 }
1308 return nErrors;
1309}
1310
1311} // anonymous namespace
1312} // namespace o2::gpu
1313#endif // GPUCA_TPC_GEOMETRY_O2
1314
1315template <class S>
1316void GPUReconstructionConvert::RunZSEncoder(const S& in, std::unique_ptr<uint64_t[]>* outBuffer, uint32_t* outSizes, o2::raw::RawFileWriter* raw, const o2::InteractionRecord* ir, const GPUParam& param, int32_t version, bool verify, float threshold, bool padding, std::function<void(std::vector<o2::tpc::Digit>&)> digitsFilter)
1317{
1318 // Pass in either outBuffer / outSizes, to fill standalone output buffers, or raw to use RawFileWriter
1319 // ir is the interaction record for time bin 0
1320 if (((outBuffer == nullptr) ^ (outSizes == nullptr)) || ((raw != nullptr) && (ir == nullptr)) || !((outBuffer == nullptr) ^ (raw == nullptr)) || (raw && verify)) {
1321 throw std::runtime_error("Invalid parameters");
1322 }
1323#ifdef GPUCA_TPC_GEOMETRY_O2
1324 std::vector<zsPage> buffer[NSECTORS][GPUTrackingInOutZS::NENDPOINTS];
1325 struct tmpReductionResult {
1326 uint32_t totalPages = 0;
1327 size_t totalSize = 0;
1328 size_t nErrors = 0;
1329 size_t digitsInput = 0;
1330 size_t digitsEncoded = 0;
1331 };
1332 auto reduced = tbb::parallel_reduce(tbb::blocked_range<uint32_t>(0, NSECTORS), tmpReductionResult(), [&](const auto range, auto red) {
1333 for (uint32_t i = range.begin(); i < range.end(); i++) {
1334 std::vector<o2::tpc::Digit> tmpBuffer;
1335 red.digitsInput += ZSEncoderGetNDigits(in, i);
1336 tmpBuffer.resize(ZSEncoderGetNDigits(in, i));
1337 if (threshold > 0.f && !digitsFilter) {
1338 auto it = std::copy_if(ZSEncoderGetDigits(in, i), ZSEncoderGetDigits(in, i) + ZSEncoderGetNDigits(in, i), tmpBuffer.begin(), [threshold](auto& v) { return v.getChargeFloat() >= threshold; });
1339 tmpBuffer.resize(std::distance(tmpBuffer.begin(), it));
1340 } else {
1341 std::copy(ZSEncoderGetDigits(in, i), ZSEncoderGetDigits(in, i) + ZSEncoderGetNDigits(in, i), tmpBuffer.begin());
1342 }
1343
1344 if (digitsFilter) {
1345 digitsFilter(tmpBuffer);
1346 if (threshold > 0.f) {
1347 std::vector<o2::tpc::Digit> tmpBuffer2 = std::move(tmpBuffer);
1348 tmpBuffer = std::vector<o2::tpc::Digit>(tmpBuffer2.size());
1349 auto it = std::copy_if(tmpBuffer2.begin(), tmpBuffer2.end(), tmpBuffer.begin(), [threshold](auto& v) { return v.getChargeFloat() >= threshold; });
1350 tmpBuffer.resize(std::distance(tmpBuffer.begin(), it));
1351 }
1352 }
1353 red.digitsEncoded += tmpBuffer.size();
1354
1355 auto runZS = [&](auto& encoder) {
1356 encoder.zsVersion = version;
1357 encoder.init();
1358 red.totalPages += encoder.run(buffer[i], tmpBuffer, &red.totalSize);
1359 if (verify) {
1360 red.nErrors += encoder.compare(buffer[i], tmpBuffer); // Verification
1361 }
1362 };
1363
1364 if (version >= ZSVersion::ZSVersionRowBased10BitADC && version <= ZSVersion::ZSVersionRowBased12BitADC) {
1365 zsEncoderRun<zsEncoderRow> enc{{{.iSector = i, .raw = raw, .ir = ir, .param = &param, .padding = padding}}};
1366 runZS(enc);
1367 } else if (version >= ZSVersion::ZSVersionLinkBasedWithMeta && version <= ZSVersion::ZSVersionDenseLinkBasedV2) {
1368#ifdef GPUCA_O2_LIB
1369 if (version == ZSVersion::ZSVersionLinkBasedWithMeta) {
1370 zsEncoderRun<zsEncoderImprovedLinkBased> enc{{{{.iSector = i, .raw = raw, .ir = ir, .param = &param, .padding = padding}}}};
1371 runZS(enc);
1372 } else if (version >= ZSVersion::ZSVersionDenseLinkBased && version <= ZSVersion::ZSVersionDenseLinkBasedV2) {
1373 zsEncoderRun<zsEncoderDenseLinkBased> enc{{{{.iSector = i, .raw = raw, .ir = ir, .param = &param, .padding = padding}}}};
1374 runZS(enc);
1375 }
1376#else
1377 throw std::runtime_error("Link based ZS encoding not supported in standalone build");
1378#endif
1379 } else {
1380 throw std::runtime_error("Invalid ZS version "s + std::to_string(version) + ", cannot decode"s);
1381 }
1382 }
1383 return red; }, [&](const auto& red1, const auto& red2) {
1384 auto red = red1;
1385 red.totalPages += red2.totalPages;
1386 red.totalSize += red2.totalSize;
1387 red.nErrors += red2.nErrors;
1388 red.digitsInput += red2.digitsInput;
1389 red.digitsEncoded += red2.digitsEncoded;
1390 return red; });
1391
1392 if (outBuffer) {
1393 outBuffer->reset(new uint64_t[reduced.totalPages * TPCZSHDR::TPC_ZS_PAGE_SIZE / sizeof(uint64_t)]);
1394 uint64_t offset = 0;
1395 for (uint32_t i = 0; i < NSECTORS; i++) {
1396 for (uint32_t j = 0; j < GPUTrackingInOutZS::NENDPOINTS; j++) {
1397 memcpy((char*)outBuffer->get() + offset, buffer[i][j].data(), buffer[i][j].size() * TPCZSHDR::TPC_ZS_PAGE_SIZE);
1399 outSizes[i * GPUTrackingInOutZS::NENDPOINTS + j] = buffer[i][j].size();
1400 }
1401 }
1402 }
1403 if (reduced.nErrors) {
1404 GPUError("ERROR: %lu INCORRECT SAMPLES DURING ZS ENCODING VERIFICATION!!!", reduced.nErrors);
1405 } else if (verify) {
1406 GPUInfo("ENCODING VERIFICATION PASSED");
1407 }
1408 GPUInfo("TOTAL ENCODED SIZE: %lu (%lu of %lu digits encoded)", reduced.totalSize, reduced.digitsEncoded, reduced.digitsInput);
1409#endif
1410}
1411
1412template void GPUReconstructionConvert::RunZSEncoder<GPUTrackingInOutDigits>(const GPUTrackingInOutDigits&, std::unique_ptr<uint64_t[]>*, uint32_t*, o2::raw::RawFileWriter*, const o2::InteractionRecord*, const GPUParam&, int32_t, bool, float, bool, std::function<void(std::vector<o2::tpc::Digit>&)> digitsFilter);
1413#ifdef GPUCA_O2_LIB
1414template void GPUReconstructionConvert::RunZSEncoder<DigitArray>(const DigitArray&, std::unique_ptr<uint64_t[]>*, uint32_t*, o2::raw::RawFileWriter*, const o2::InteractionRecord*, const GPUParam&, int32_t, bool, float, bool, std::function<void(std::vector<o2::tpc::Digit>&)> digitsFilter);
1415#endif
1416
1417void GPUReconstructionConvert::RunZSEncoderCreateMeta(const uint64_t* buffer, const uint32_t* sizes, void** ptrs, GPUTrackingInOutZS* out)
1418{
1419 uint64_t offset = 0;
1420 for (uint32_t i = 0; i < NSECTORS; i++) {
1421 for (uint32_t j = 0; j < GPUTrackingInOutZS::NENDPOINTS; j++) {
1422 ptrs[i * GPUTrackingInOutZS::NENDPOINTS + j] = (char*)buffer + offset;
1424 out->sector[i].zsPtr[j] = &ptrs[i * GPUTrackingInOutZS::NENDPOINTS + j];
1426 out->sector[i].count[j] = 1;
1427 }
1428 }
1429}
1430
1431void GPUReconstructionConvert::RunZSFilter(std::unique_ptr<o2::tpc::Digit[]>* buffers, const o2::tpc::Digit* const* ptrs, size_t* nsb, const size_t* ns, const GPUParam& param, bool zs12bit, float threshold)
1432{
1433 for (uint32_t i = 0; i < NSECTORS; i++) {
1434 if (buffers[i].get() != ptrs[i] || nsb != ns) {
1435 throw std::runtime_error("Not owning digits");
1436 }
1437 uint32_t j = 0;
1438 const uint32_t decodeBits = zs12bit ? TPCZSHDR::TPC_ZS_NBITS_V2 : TPCZSHDR::TPC_ZS_NBITS_V1;
1439 const float decodeBitsFactor = (1 << (decodeBits - 10));
1440 for (uint32_t k = 0; k < ns[i]; k++) {
1441 if (buffers[i][k].getChargeFloat() >= threshold) {
1442 if (k > j) {
1443 buffers[i][j] = buffers[i][k];
1444 }
1445 if (zs12bit) {
1446 buffers[i][j].setCharge(CAMath::Round(buffers[i][j].getChargeFloat() * decodeBitsFactor) / decodeBitsFactor);
1447 } else {
1448 buffers[i][j].setCharge(CAMath::Round(buffers[i][j].getChargeFloat()));
1449 }
1450 j++;
1451 }
1452 }
1453 nsb[i] = j;
1454 }
1455}
1456
1457#ifdef GPUCA_O2_LIB
1458namespace o2::gpu::internal
1459{
1460template <class T>
1461static inline auto GetDecoder_internal(const GPUParam* param, int32_t version)
1462{
1463 std::shared_ptr<T> enc = std::make_shared<T>();
1464 if (param == nullptr) {
1465 static GPUParam dummyParam;
1466 param = &dummyParam;
1467 }
1468 enc->param = param;
1469 enc->zsVersion = version;
1470 enc->init();
1471 return [enc](std::vector<o2::tpc::Digit>& outBuffer, const void* page, uint32_t firstTfOrbit, uint32_t triggerBC = 0) {
1472 const o2::header::RAWDataHeader& rdh = *(const o2::header::RAWDataHeader*)page;
1473 if (o2::raw::RDHUtils::getMemorySize(rdh) == sizeof(o2::header::RAWDataHeader)) {
1474 return;
1475 }
1476 if (o2::raw::RDHUtils::getDetectorField(rdh) != 2) {
1477 return;
1478 }
1479 o2::tpc::CRU cru(o2::tpc::rdh_utils::getCRU(rdh));
1480 enc->iSector = cru.sector();
1481 int32_t endpoint = cru.region() * 2 + o2::tpc::rdh_utils::getEndPoint(rdh);
1482 enc->decodePage(outBuffer, (const zsPage*)page, endpoint, firstTfOrbit, triggerBC);
1483 };
1484}
1485} // namespace o2::gpu::internal
1486
1487std::function<void(std::vector<o2::tpc::Digit>&, const void*, uint32_t, uint32_t)> GPUReconstructionConvert::GetDecoder(int32_t version, const GPUParam* param)
1488{
1490 return o2::gpu::internal::GetDecoder_internal<zsEncoderRow>(param, version);
1492 return o2::gpu::internal::GetDecoder_internal<zsEncoderImprovedLinkBased>(param, version);
1494 return o2::gpu::internal::GetDecoder_internal<zsEncoderDenseLinkBased>(param, version);
1495 } else {
1496 throw std::runtime_error("Invalid ZS version "s + std::to_string(version) + ", cannot create decoder"s);
1497 }
1498}
1499#endif
uint16_t padding
Definition of the TPC Digit.
uint64_t orbit
Definition RawEventData.h:6
uint64_t bc
Definition RawEventData.h:5
int32_t i
int32_t retVal
#define GPUCA_ROW_COUNT
Header to collect LHC related constants.
uint32_t j
Definition RawData.h:0
uint8_t endpoint
Definition RawData.h:0
uint32_t c
Definition RawData.h:2
uint32_t version
Definition RawData.h:8
Utility class to write detectors data to (multiple) raw data file(s) respecting CRU format.
Definition of TPCFastTransform class.
TBranch * ptr
std::ostringstream debug
definitions to deal with the link based zero suppression format
Definitions of TPC Zero Suppression Data Headers.
int nClusters
static void RunZSEncoder(const S &in, std::unique_ptr< uint64_t[]> *outBuffer, uint32_t *outSizes, o2::raw::RawFileWriter *raw, const o2::InteractionRecord *ir, const GPUParam &param, int32_t version, bool verify, float threshold=0.f, bool padding=false, std::function< void(std::vector< o2::tpc::Digit > &)> digitsFilter=nullptr)
static void ConvertNativeToClusterData(o2::tpc::ClusterNativeAccess *native, std::unique_ptr< GPUTPCClusterData[]> *clusters, uint32_t *nClusters, const TPCFastTransform *transform, int32_t continuousMaxTimeBin=0)
static void RunZSFilter(std::unique_ptr< o2::tpc::Digit[]> *buffers, const o2::tpc::Digit *const *ptrs, size_t *nsb, const size_t *ns, const GPUParam &param, bool zs12bit, float threshold)
static std::function< void(std::vector< o2::tpc::Digit > &, const void *, uint32_t, uint32_t)> GetDecoder(int32_t version, const GPUParam *param)
static int32_t GetMaxTimeBin(const o2::tpc::ClusterNativeAccess &native)
static void RunZSEncoderCreateMeta(const uint64_t *buffer, const uint32_t *sizes, void **ptrs, GPUTrackingInOutZS *out)
static void ConvertRun2RawToNative(o2::tpc::ClusterNativeAccess &native, std::unique_ptr< o2::tpc::ClusterNative[]> &nativeBuffer, const AliHLTTPCRawCluster **rawClusters, uint32_t *nRawClusters)
int32_t float float float & x
void addData(uint16_t feeid, uint16_t cru, uint8_t lnk, uint8_t endpoint, const IR &ir, const gsl::span< char > data, bool preformatted=false, uint32_t trigger=0, uint32_t detField=0)
unsigned char partition() const
Definition CRU.h:63
unsigned char getSampaChannel() const
Definition FECInfo.h:45
unsigned char getIndex() const
Definition FECInfo.h:41
unsigned char getSampaChip() const
Definition FECInfo.h:44
static Mapper & instance(const std::string mappingDir="")
Definition Mapper.h:44
static constexpr void getSampaAndChannelOnFEC(const int cruID, const size_t rawFECChannel, int &sampaOnFEC, int &channelOnSAMPA)
Definition Mapper.h:275
static constexpr int MAXSECTOR
Definition Sector.h:44
std::array< gsl::span< const o2::tpc::Digit >, Sector::MAXSECTOR > DigitArray
GLdouble n
Definition glcorearb.h:1982
GLint GLenum GLint x
Definition glcorearb.h:403
const GLfloat * m
Definition glcorearb.h:4066
GLuint buffer
Definition glcorearb.h:655
GLsizeiptr size
Definition glcorearb.h:659
const GLdouble * v
Definition glcorearb.h:832
GLuint GLsizei const GLuint const GLintptr const GLsizeiptr * sizes
Definition glcorearb.h:2595
GLsizei samples
Definition glcorearb.h:1309
GLboolean GLboolean GLboolean b
Definition glcorearb.h:1233
GLenum GLint * range
Definition glcorearb.h:1899
GLint y
Definition glcorearb.h:270
GLenum GLint GLenum GLsizei GLsizei GLsizei GLint GLsizei const void * bits
Definition glcorearb.h:4150
GLintptr offset
Definition glcorearb.h:660
typedef void(APIENTRYP PFNGLCULLFACEPROC)(GLenum mode)
GLenum GLfloat param
Definition glcorearb.h:271
GLboolean GLboolean GLboolean GLboolean a
Definition glcorearb.h:1233
GLint GLuint mask
Definition glcorearb.h:291
GLdouble GLdouble GLdouble z
Definition glcorearb.h:843
const GLuint * buffers
Definition glcorearb.h:656
uint8_t itsSharedClusterMap uint8_t
constexpr int LHCMaxBunches
const GBTLinkAttributes links[kNGBTLinks]
Definition RawWriter.h:54
RAWDataHeaderV7 RAWDataHeader
void dumpBuffer(gsl::span< const std::byte > buffer, std::ostream &out=std::cout, size_t maxbytes=std::numeric_limits< size_t >::max())
Definition DumpBuffer.h:139
constexpr int LHCBCPERTIMEBIN
Definition Constants.h:38
uint64_t getTimeStamp(o2::framework::ProcessingContext &pc)
uint16_t FEEIDType
Definition RDHUtils.h:26
Global TPC definitions and constants.
Definition SimTraits.h:168
@ ZSVersionDenseLinkBased
@ ZSVersionLinkBasedWithMeta
@ ZSVersionDenseLinkBasedV2
@ ZSVersionRowBased10BitADC
@ ZSVersionRowBased12BitADC
constexpr std::array< int, nLayers > nRows
Definition Specs.h:56
a couple of static helper functions to create timestamp values for CCDB queries or override obsolete ...
std::string to_string(gsl::span< T, Size > span)
Definition common.h:52
int32_t GetCharge() const
uint16_t GetFlags() const
int32_t GetPadRow() const
uint32_t orbit
LHC orbit.
uint16_t bc
bunch crossing ID of interaction
const o2::tpc::Digit * tpcDigits[NSECTORS]
GPUTrackingInOutZSSector sector[NSECTORS]
static constexpr uint32_t NENDPOINTS
static void setLinkID(H &rdh, uint8_t v, NOTPTR(H))
Definition RDHUtils.h:258
static void setDetectorField(H &rdh, uint32_t v, NOTPTR(H))
Definition RDHUtils.h:584
static constexpr int GBTWord128
Definition RDHUtils.h:54
static void setPageCounter(H &rdh, uint16_t v, NOTPTR(H))
Definition RDHUtils.h:559
static void setMemorySize(H &rdh, uint16_t v, NOTPTR(H))
Definition RDHUtils.h:242
static void setVersion(H &rdh, uint8_t v, NOTPTR(H))
Definition RDHUtils.h:90
static void setPacketCounter(H &rdh, uint8_t v, NOTPTR(H))
Definition RDHUtils.h:274
static void setHeartBeatOrbit(RDHv4 &rdh, uint32_t v)
Definition RDHUtils.h:364
static void setFEEID(RDHv4 &rdh, uint16_t v)
Definition RDHUtils.h:148
unsigned int nClusters[constants::MAXSECTOR][constants::MAXGLOBALPADROW]
const ClusterNative * clusters[constants::MAXSECTOR][constants::MAXGLOBALPADROW]
unsigned int clusterOffset[constants::MAXSECTOR][constants::MAXGLOBALPADROW]
const ClusterNative * clustersLinear
unsigned short nTimebinHeaders
unsigned char magicWord
unsigned short firstZSDataOffset
static constexpr bool TIGHTLY_PACKED_V3
static constexpr unsigned int TPC_ZS_NBITS_V34
static constexpr unsigned int SAMPLESPER64BIT
static constexpr unsigned int TRIGGER_WORD_SIZE
unsigned char nTimeBinSpan
unsigned char version
unsigned short timeOffset
unsigned short cruID
static constexpr unsigned int TPC_ZS_NBITS_V1
static constexpr unsigned int TPC_ZS_NBITS_V2
static constexpr size_t TPC_ZS_PAGE_SIZE
unsigned short nADCsamples
unsigned short rowMask
void compare(std::string_view s1, std::string_view s2)
o2::InteractionRecord ir(0, 0)
std::vector< Cluster > clusters
std::vector< Digit > digits
std::vector< int > row