dc/d65/GPUTPCCFDecodeZS_8h_source.html

// Copyright 2019-2020 CERN and copyright holders of ALICE O2.

// See https://alice-o2.web.cern.ch/copyright for details of the copyright holders.

// All rights not expressly granted are reserved.

//

// This software is distributed under the terms of the GNU General Public

// License v3 (GPL Version 3), copied verbatim in the file "COPYING".

//

// In applying this license CERN does not waive the privileges and immunities

// granted to it by virtue of its status as an Intergovernmental Organization

// or submit itself to any jurisdiction.


#ifndef O2_GPU_DECODE_ZS_H

#define O2_GPU_DECODE_ZS_H


#include "clusterFinderDefs.h"

#include "GPUGeneralKernels.h"

#include "GPUConstantMem.h"

#include "TPCBase/PadPos.h"

#include "DataFormatsTPC/ZeroSuppression.h"

#include "DataFormatsTPC/ZeroSuppressionLinkBased.h"

#include "Headers/RAWDataHeader.h"


namespace o2::gpu

{


// Forward declaration: the declarations visible in this header only use
// GPUTPCClusterFinder through references and pointers.
class GPUTPCClusterFinder;


/// Kernel class for decoding TPC zero-suppressed (ZS) pages for the cluster finder.
///
/// Only `Processor` and `GetRecoStep` are defined in this header; `decode` and
/// `Thread` are declared here and implemented elsewhere.
class GPUTPCCFDecodeZS : public GPUKernelTemplate
{
 public:
  /// State struct handed by reference to `decode` and `Thread`.
  /// Member order is part of the layout and must not be changed.
  struct GPUSharedMemory /*: public GPUKernelTemplate::GPUSharedMemoryScan64<int32_t, GPUCA_WARP_SIZE>*/ {
    // Buffer dimensioned as TPC_ZS_PAGE_SIZE bytes, expressed in 32-bit words.
    CA_SHARED_STORAGE(uint32_t ZSPage[o2::tpc::TPCZSHDR::TPC_ZS_PAGE_SIZE / sizeof(uint32_t)]);
    // One entry per row, up to TPC_MAX_ZS_ROW_IN_ENDPOINT rows.
    uint32_t RowClusterOffset[o2::tpc::TPCZSHDR::TPC_MAX_ZS_ROW_IN_ENDPOINT];
    uint32_t nRowsRegion;
    uint32_t regionStartRow;
    uint32_t nThreadsPerRow;
    uint32_t rowStride;
    // Atomically updated counter (declared through the GPUAtomic macro).
    GPUAtomic(uint32_t) rowOffsetCounter;
  };

  /// Kernel selector values; `decodeZS` is the only kernel of this class.
  enum K : int32_t {
    decodeZS,
  };

  /// Decoding routine (declaration only; the definition is not part of this header).
  static GPUd() void decode(GPUTPCClusterFinder& clusterer, GPUSharedMemory& s, int32_t nBlocks, int32_t nThreads, int32_t iBlock, int32_t iThread, int32_t firstHBF, int32_t tpcTimeBinCut);

  /// Processor type this kernel operates on.
  using processorType = GPUTPCClusterFinder;

  /// Returns the `tpcClusterer` member of the given constant memory.
  GPUhdi() static processorType* Processor(GPUConstantMem& processors)
  {
    return processors.tpcClusterer;
  }

  /// Reports TPCClusterFinding as the reconstruction step of this kernel.
  GPUhdi() constexpr static gpudatatypes::RecoStep GetRecoStep()
  {
    return gpudatatypes::RecoStep::TPCClusterFinding;
  }

  /// Kernel entry point, templated on the kernel id (declaration only).
  template <int32_t iKernel = defaultKernel, typename... Args>
  GPUd() static void Thread(int32_t nBlocks, int32_t nThreads, int32_t iBlock, int32_t iThread, GPUSharedMemory& smem, processorType& clusterer, Args... args);
};


/// Common base of the link-based ZS decoder kernels.
///
/// Provides the processor accessors, the `DecodeCtx` bundle passed to the
/// decoders, and small inline helpers for walking a raw byte page.
class GPUTPCCFDecodeZSLinkBase : public GPUKernelTemplate
{
 public:
  /// Processor type this kernel operates on.
  using processorType = GPUTPCClusterFinder;

  /// Returns the `tpcClusterer` member of the given constant memory.
  GPUhdi() static processorType* Processor(GPUConstantMem& processors)
  {
    return processors.tpcClusterer;
  }

  /// Reports TPCClusterFinding as the reconstruction step of this kernel.
  GPUhdi() constexpr static gpudatatypes::RecoStep GetRecoStep()
  {
    return gpudatatypes::RecoStep::TPCClusterFinding;
  }

  /// Arguments bundled for the per-page decoders.
  /// Member order is kept stable so aggregate initialisation by callers still matches.
  struct DecodeCtx {
    processorType& clusterer;
    const uint8_t* page;
    int32_t iBlock;
    int32_t nThreads;
    int32_t iThread;
    uint32_t pageDigitOffset;
    int32_t firstHBF;
    int32_t tpcTimeBinCut;
  };

  /// Generic decode driver, parameterised on the concrete decoder class
  /// (declaration only; the definition is not part of this header).
  template <class Decoder>
  GPUd() static void Decode(int32_t nBlocks, int32_t nThreads, int32_t iBlock, int32_t iThread, typename Decoder::GPUSharedMemory& smem, processorType& clusterer, int32_t firstHBF, int32_t tpcTimeBinCut);

  // Helpers implemented outside this header.
  GPUd() static o2::tpc::PadPos GetPadAndRowFromFEC(processorType& clusterer, int32_t cru, int32_t rawFecChannel, int32_t fecInPartition);
  GPUd() static void WriteCharge(processorType& clusterer, float charge, o2::tpc::PadPos pos, tpccf::TPCFragmentTime localTime, size_t positionOffset);
  GPUd() static uint16_t FillWithInvalid(processorType& clusterer, int32_t iThread, int32_t nThreads, uint32_t pageDigitOffset, uint16_t nSamples);

  /// Advances `page` by `nbytes` and returns the position it had before the advance.
  GPUdi() static const uint8_t* ConsumeBytes(const uint8_t*& page, size_t nbytes)
  {
    const uint8_t* const start = page;
    page = start + nbytes;
    return start;
  }

  /// Reads the byte at `page` and advances `page` by one.
  GPUdi() static uint8_t ConsumeByte(const uint8_t*& page)
  {
    const uint8_t value = *page;
    ++page;
    return value;
  }

  /// Reinterprets the bytes at `page` as a `T`, then advances `page` by `sizeof(T)`.
  /// Asserts that `page` satisfies the alignment requirement of `T`.
  template <typename T>
  GPUdi() static const T* ConsumeHeader(const uint8_t*& page)
  {
    assert(size_t(page) % alignof(T) == 0);
    const uint8_t* headerStart = ConsumeBytes(page, sizeof(T));
    return reinterpret_cast<const T*>(headerStart);
  }

  /// Returns a `T` view of the bytes at `page + offset` without modifying `page`.
  /// Asserts that the resulting address satisfies the alignment requirement of `T`.
  template <typename T = uint8_t>
  GPUdi() static const T* Peek(const uint8_t* page, ptrdiff_t offset = 0)
  {
    // Debug aid kept from the original, disabled:
    // if ((size_t(page) + offset) % alignof(T) != 0) {
    //   printf("page = %zu, offset = %zu, alignof = %zu\n", size_t(page), offset, alignof(T));
    // }
    assert((size_t(page) + offset) % alignof(T) == 0);
    const uint8_t* target = page + offset;
    return reinterpret_cast<const T*>(target);
  }

  /// Masks `adc` with `decodeMask`, converts to float and scales by `decodeBitsFactor`.
  GPUdi() static float ADCToFloat(uint32_t adc, uint32_t decodeMask, float decodeBitsFactor)
  {
    const uint32_t masked = adc & decodeMask;
    return float(masked) * decodeBitsFactor;
  }
};


/// Link-based ZS decoder kernel built on GPUTPCCFDecodeZSLinkBase.
/// All member functions are declared here and implemented elsewhere.
class GPUTPCCFDecodeZSLink : public GPUTPCCFDecodeZSLinkBase
{
 public:
  // Constants for decoding.
  // Bit width taken from TPCZSHDRV2::TPC_ZS_NBITS_V34.
  static inline constexpr int32_t DECODE_BITS = o2::tpc::TPCZSHDRV2::TPC_ZS_NBITS_V34;
  // Reciprocal of 2^(DECODE_BITS - 10).
  static inline constexpr float DECODE_BITS_FACTOR = 1.f / (1 << (DECODE_BITS - 10));
  // Mask with the lowest DECODE_BITS bits set.
  static inline constexpr uint32_t DECODE_MASK = (1 << DECODE_BITS) - 1;

  /// Shared-memory type of this kernel; adds no members to the warp-scan base.
  struct GPUSharedMemory : GPUKernelTemplate::GPUSharedMemoryWarpScan64<uint8_t, GPUCA_GET_THREAD_COUNT(GPUCA_LB_GPUTPCCFDecodeZSLink)> {
    // CA_SHARED_STORAGE(uint32_t ZSPage[o2::tpc::TPCZSHDR::TPC_ZS_PAGE_SIZE / sizeof(uint32_t)]);
  };

  /// Kernel entry point, templated on the kernel id (declaration only).
  template <int32_t iKernel = defaultKernel, typename... Args>
  GPUd() static void Thread(int32_t nBlocks, int32_t nThreads, int32_t iBlock, int32_t iThread, GPUSharedMemory& smem, processorType& clusterer, Args... args);

  /// Decodes the page referenced by `ctx` (declaration only).
  GPUd() static size_t DecodePage(GPUSharedMemory& smem, DecodeCtx& ctx);

  // Channel bitmask helpers (declarations only).
  GPUd() static void GetChannelBitmask(const tpc::zerosupp_link_based::CommonHeader& tbHdr, uint32_t* chan);
  GPUd() static bool ChannelIsActive(const uint32_t* chan, uint8_t chanIndex);

  /// Decodes one time bin from `adcData` (declaration only).
  GPUd() static void DecodeTB(GPUSharedMemory& smem, DecodeCtx& ctx, const uint8_t* adcData, uint32_t nAdc, const uint32_t* channelMask, int32_t timeBin, int32_t cru, int32_t fecInPartition);
};


/// Dense-link ZS decoder kernel built on GPUTPCCFDecodeZSLinkBase.
/// All member functions are declared here and implemented elsewhere.
class GPUTPCCFDecodeZSDenseLink : public GPUTPCCFDecodeZSLinkBase
{
 public:
  // Constants for decoding.
  // Bit width taken from TPCZSHDRV2::TPC_ZS_NBITS_V34.
  static inline constexpr int32_t DECODE_BITS = o2::tpc::TPCZSHDRV2::TPC_ZS_NBITS_V34;
  // Reciprocal of 2^(DECODE_BITS - 10).
  static inline constexpr float DECODE_BITS_FACTOR = 1.f / (1 << (DECODE_BITS - 10));
  // Mask with the lowest DECODE_BITS bits set.
  static inline constexpr uint32_t DECODE_MASK = (1 << DECODE_BITS) - 1;

  // Capacity of the per-timebin link arrays in GPUSharedMemory.
  static inline constexpr int32_t MaxNLinksPerTimebin = 16;

  /// Shared-memory type of this kernel: the warp-scan base plus per-timebin link bookkeeping.
  /// Member order is part of the layout and must not be changed.
  struct GPUSharedMemory : GPUKernelTemplate::GPUSharedMemoryWarpScan64<uint8_t, GPUCA_GET_THREAD_COUNT(GPUCA_LB_GPUTPCCFDecodeZSDenseLink)> {
    // CA_SHARED_STORAGE(uint32_t ZSPage[o2::tpc::TPCZSHDR::TPC_ZS_PAGE_SIZE / sizeof(uint32_t)]);
    uint16_t samplesPerLinkEnd[MaxNLinksPerTimebin]; // Offset from end of TB link header to first sample not in this link
    uint8_t linkIds[MaxNLinksPerTimebin];
    // NOTE(review): 80 is presumably the number of channels per link - confirm and consider a named constant.
    uint8_t rawFECChannels[MaxNLinksPerTimebin * 80];
  };

  /// Kernel entry point, templated on the kernel id (declaration only).
  template <int32_t iKernel = defaultKernel, typename... Args>
  GPUd() static void Thread(int32_t nBlocks, int32_t nThreads, int32_t iBlock, int32_t iThread, GPUSharedMemory& smem, processorType& clusterer, Args... args);

  /// Decodes the page referenced by `ctx` (declaration only).
  GPUd() static uint32_t DecodePage(GPUSharedMemory& smem, DecodeCtx& ctx);

  /// Channel bitmask query (declaration only).
  GPUd() static bool ChannelIsActive(const uint8_t* chan, uint16_t chanIndex);

  // Decode a single timebin within an 8kb page.
  // Returns the number of samples decoded from the page,
  // or a negative value to indicate an error (no samples are written in this case).
  template <bool PayloadExtendsToNextPage>
  GPUd() static int16_t DecodeTB(GPUSharedMemory& smem, DecodeCtx& ctx, const header::RAWDataHeader* rawDataHeader, int32_t cru, uint16_t nSamplesLeftInPage, const uint8_t* payloadEnd, const uint8_t* nextPage);
};


} // namespace o2::gpu


#endif

charge
int16_t charge
Definition RawEventData.h:5

GPUd
#define GPUd()
Definition GPUCommonDefAPI.h:31

GPUConstantMem.h

GPUGeneralKernels.h

PadPos.h

RAWDataHeader.h
Definition of the RAW Data Header.

pos
uint16_t pos
Definition RawData.h:3

ZeroSuppressionLinkBased.h
definitions to deal with the link based zero suppression format

ZeroSuppression.h
Definitions of TPC Zero Suppression Data Headers.

o2::gpu::GPUKernelTemplate
Definition GPUGeneralKernels.h:41

o2::gpu::GPUKernelTemplate::processors
int32_t int32_t int32_t processorType & processors
Definition GPUGeneralKernels.h:89

o2::gpu::GPUKernelTemplate::defaultKernel
@ defaultKernel
Definition GPUGeneralKernels.h:43

o2::gpu::GPUTPCCFDecodeZSDenseLink
Definition GPUTPCCFDecodeZS.h:155

o2::gpu::GPUTPCCFDecodeZSLinkBase
Definition GPUTPCCFDecodeZS.h:66

o2::gpu::GPUTPCCFDecodeZSLinkBase::oldPage
return oldPage
Definition GPUTPCCFDecodeZS.h:100

o2::gpu::GPUTPCCFDecodeZSLinkBase::processorType
GPUTPCClusterFinder processorType
Definition GPUTPCCFDecodeZS.h:69

o2::gpu::GPUTPCCFDecodeZSLinkBase::GPUdi
GPUdi() static uint8_t ConsumeByte(const uint8_t *&page)
Definition GPUTPCCFDecodeZS.h:103

o2::gpu::GPUTPCCFDecodeZSLinkBase::GPUdi
GPUdi() static const T *Peek(const uint8_t *page

o2::gpu::GPUTPCCFDecodeZSLinkBase::GPUdi
GPUdi() static const T *ConsumeHeader(const uint8_t *&page)
Definition GPUTPCCFDecodeZS.h:109

o2::gpu::GPUTPCCFDecodeZSLinkBase::GPUhdi
GPUhdi() static processorType *Processor(GPUConstantMem &processors)
Definition GPUTPCCFDecodeZS.h:70

o2::gpu::GPUTPCCFDecodeZSLinkBase::GPUhdi
GPUhdi() const expr static gpudatatypes
Definition GPUTPCCFDecodeZS.h:75

o2::gpu::GPUTPCCFDecodeZSLink
Definition GPUTPCCFDecodeZS.h:132

o2::gpu::GPUTPCCFDecodeZS
Definition GPUTPCCFDecodeZS.h:32

o2::gpu::GPUTPCCFDecodeZS::iBlock
static GPUSharedMemory int32_t int32_t int32_t iBlock
Definition GPUTPCCFDecodeZS.h:48

o2::gpu::GPUTPCCFDecodeZS::GPUd
GPUd() static void Thread(int32_t nBlocks

o2::gpu::GPUTPCCFDecodeZS::nBlocks
static GPUSharedMemory int32_t nBlocks
Definition GPUTPCCFDecodeZS.h:48

o2::gpu::GPUTPCCFDecodeZS::GPUhdi
GPUhdi() const expr static gpudatatypes
Definition GPUTPCCFDecodeZS.h:56

o2::gpu::GPUTPCCFDecodeZS::clusterer
int32_t int32_t int32_t GPUSharedMemory processorType & clusterer
Definition GPUTPCCFDecodeZS.h:62

o2::gpu::GPUTPCCFDecodeZS::K
K
Definition GPUTPCCFDecodeZS.h:44

o2::gpu::GPUTPCCFDecodeZS::decodeZS
@ decodeZS
Definition GPUTPCCFDecodeZS.h:45

o2::gpu::GPUTPCCFDecodeZS::nThreads
static GPUSharedMemory int32_t int32_t nThreads
Definition GPUTPCCFDecodeZS.h:48

o2::gpu::GPUTPCCFDecodeZS::iThread
static GPUSharedMemory int32_t int32_t int32_t int32_t iThread
Definition GPUTPCCFDecodeZS.h:48

o2::gpu::GPUTPCCFDecodeZS::firstHBF
static GPUSharedMemory int32_t int32_t int32_t int32_t int32_t firstHBF
Definition GPUTPCCFDecodeZS.h:48

o2::gpu::GPUTPCCFDecodeZS::smem
int32_t int32_t int32_t GPUSharedMemory & smem
Definition GPUTPCCFDecodeZS.h:62

o2::gpu::GPUTPCCFDecodeZS::args
int32_t int32_t int32_t GPUSharedMemory processorType Args args
Definition GPUTPCCFDecodeZS.h:62

o2::gpu::GPUTPCCFDecodeZS::tpcTimeBinCut
static GPUSharedMemory int32_t int32_t int32_t int32_t int32_t int32_t tpcTimeBinCut
Definition GPUTPCCFDecodeZS.h:48

o2::gpu::GPUTPCCFDecodeZS::s
static GPUSharedMemory & s
Definition GPUTPCCFDecodeZS.h:48

o2::gpu::GPUTPCClusterFinder
Definition GPUTPCClusterFinder.h:53

clusterFinderDefs.h

offset
GLintptr offset
Definition glcorearb.h:660

void
typedef void(APIENTRYP PFNGLCULLFACEPROC)(GLenum mode)

o2::gpu::gpudatatypes::RecoStep::TPCClusterFinding
@ TPCClusterFinding

o2::gpu
Definition TrackTRD.h:35

o2::gpu::GPUdi
GPUdi() o2
Definition TrackTRD.h:38

o2
a couple of static helper functions to create timestamp values for CCDB queries or override obsolete ...
Definition FlattenRestore.h:23

o2::gpu::GPUConstantMem
Definition GPUConstantMem.h:41

o2::gpu::GPUKernelTemplate::GPUSharedMemoryWarpScan64
Definition GPUGeneralKernels.h:55

o2::gpu::GPUKernelTemplate::GPUSharedMemory
Definition GPUGeneralKernels.h:51

o2::gpu::GPUTPCCFDecodeZSDenseLink::GPUSharedMemory
Definition GPUTPCCFDecodeZS.h:164

o2::gpu::GPUTPCCFDecodeZSLinkBase::DecodeCtx
Definition GPUTPCCFDecodeZS.h:80

o2::gpu::GPUTPCCFDecodeZSLinkBase::DecodeCtx::iBlock
int32_t iBlock
Definition GPUTPCCFDecodeZS.h:83

o2::gpu::GPUTPCCFDecodeZSLinkBase::DecodeCtx::pageDigitOffset
uint32_t pageDigitOffset
Definition GPUTPCCFDecodeZS.h:84

o2::gpu::GPUTPCCFDecodeZSLinkBase::DecodeCtx::tpcTimeBinCut
int32_t tpcTimeBinCut
Definition GPUTPCCFDecodeZS.h:86

o2::gpu::GPUTPCCFDecodeZSLinkBase::DecodeCtx::firstHBF
int32_t firstHBF
Definition GPUTPCCFDecodeZS.h:85

o2::gpu::GPUTPCCFDecodeZSLinkBase::DecodeCtx::page
const uint8_t * page
Definition GPUTPCCFDecodeZS.h:82

o2::gpu::GPUTPCCFDecodeZSLinkBase::DecodeCtx::clusterer
processorType & clusterer
Definition GPUTPCCFDecodeZS.h:81

o2::gpu::GPUTPCCFDecodeZSLink::GPUSharedMemory
Definition GPUTPCCFDecodeZS.h:139

o2::gpu::GPUTPCCFDecodeZS::GPUSharedMemory
Definition GPUTPCCFDecodeZS.h:34

o2::gpu::GPUTPCCFDecodeZS::GPUSharedMemory::CA_SHARED_STORAGE
CA_SHARED_STORAGE(uint32_t ZSPage[o2::tpc::TPCZSHDR::TPC_ZS_PAGE_SIZE/sizeof(uint32_t)])

o2::gpu::GPUTPCCFDecodeZS::GPUSharedMemory::regionStartRow
uint32_t regionStartRow
Definition GPUTPCCFDecodeZS.h:38

o2::gpu::GPUTPCCFDecodeZS::GPUSharedMemory::nThreadsPerRow
uint32_t nThreadsPerRow
Definition GPUTPCCFDecodeZS.h:39

o2::gpu::GPUTPCCFDecodeZS::GPUSharedMemory::nRowsRegion
uint32_t nRowsRegion
Definition GPUTPCCFDecodeZS.h:37

o2::gpu::GPUTPCCFDecodeZS::GPUSharedMemory::rowStride
uint32_t rowStride
Definition GPUTPCCFDecodeZS.h:40

o2::gpu::GPUTPCCFDecodeZS::GPUSharedMemory::RowClusterOffset
uint32_t RowClusterOffset[o2::tpc::TPCZSHDR::TPC_MAX_ZS_ROW_IN_ENDPOINT]
Definition GPUTPCCFDecodeZS.h:36

o2::gpu::GPUTPCCFDecodeZS::GPUSharedMemory::GPUAtomic
GPUAtomic(uint32_t) rowOffsetCounter

o2::tpc::TPCZSHDRV2::TPC_ZS_NBITS_V34
static constexpr unsigned int TPC_ZS_NBITS_V34
Definition ZeroSuppression.h:56

o2::tpc::TPCZSHDR::TPC_MAX_ZS_ROW_IN_ENDPOINT
static constexpr size_t TPC_MAX_ZS_ROW_IN_ENDPOINT
Definition ZeroSuppression.h:40

o2::tpc::TPCZSHDR::TPC_ZS_PAGE_SIZE
static constexpr size_t TPC_ZS_PAGE_SIZE
Definition ZeroSuppression.h:38

decode
coder decode(ctfImage, triggersD, clustersD)

adc
ArrayADC adc
Definition test_ctf_io_trd.cxx:48