// de/df8/bench__ransDecodeScaling_8cxx_source.html

// Copyright 2019-2023 CERN and copyright holders of ALICE O2.

// See https://alice-o2.web.cern.ch/copyright for details of the copyright holders.

// All rights not expressly granted are reserved.

//

// This software is distributed under the terms of the GNU General Public

// License v3 (GPL Version 3), copied verbatim in the file "COPYING".

//

// In applying this license CERN does not waive the privileges and immunities

// granted to it by virtue of its status as an Intergovernmental Organization

// or submit itself to any jurisdiction.


#include "rANS/internal/common/defines.h"


#include <vector>

#include <cstring>

#include <random>

#include <algorithm>

#ifdef RANS_PARALLEL_STL

#include <execution>

#endif

#include <iterator>


#include <benchmark/benchmark.h>


#include "rANS/factory.h"

#include "rANS/histogram.h"


#ifdef ENABLE_VTUNE_PROFILER

#include <ittnotify.h>

#endif


#include "helpers.h"


using namespace o2::rans;


// Nominal size (2^22) of the benchmarked message. SourceMessageUniform divides this value by
// sizeof(source_T) to obtain the number of symbols, i.e. it is interpreted as a byte count.
inline constexpr size_t MessageSize = 1ull << 22;


/// Reproducible source message filled with uniformly distributed integer symbols.
///
/// The message is generated once in the constructor from a Mersenne Twister with a fixed
/// seed, so two instances built with the same arguments hold identical data.
///
/// @tparam source_T integer type of the generated symbols.
template <typename source_T>
class SourceMessageUniform
{
 public:
  /// Generates the message.
  ///
  /// @param messageSize size of the message in bytes; the message holds
  ///                    `messageSize / sizeof(source_T) + 1` symbols (never empty).
  /// @param max         largest symbol value that may be drawn; symbols lie in `[0, max]`.
  SourceMessageUniform(size_t messageSize, size_t max) : mMax{max}
  {
    // Fixed seed: we always want exactly the same sequence of random numbers.
    std::mt19937 mt(0);
    std::uniform_int_distribution<source_T> dist(0, static_cast<source_T>(max));
    const size_t sourceSize = messageSize / sizeof(source_T) + 1;
    mSourceMessage.resize(sourceSize);
    // Generation is deliberately sequential, even when a parallel STL is available:
    // the generator mutates the shared engine and distribution, so running it under a
    // parallel execution policy would be a data race and would make the resulting
    // sequence depend on thread scheduling instead of only on the seed.
    std::generate(mSourceMessage.begin(), mSourceMessage.end(), [&dist, &mt]() { return dist(mt); });
  }

  /// @return read-only access to the generated symbols.
  const auto& get() const { return mSourceMessage; }

  /// @return the `max` value this message was generated with.
  size_t getMax() const { return mMax; }

 private:
  size_t mMax{};                          // upper bound passed to the constructor
  std::vector<source_T> mSourceMessage{}; // generated symbols
};


// Source message shared between benchmark runs. It starts out as a placeholder built with
// (messageSize = 0, max = 0) and is replaced inside ransDecodeBenchmark whenever the requested
// maximum symbol value differs from the one the current message was generated with.
SourceMessageUniform<uint32_t> sourceMessage{0, 0};


/// Benchmarks rANS decoding of a uniformly distributed message.
///
/// `st.range(0)` is passed through `utils::pow2` to obtain the maximum symbol value of the
/// source message. The message is encoded once up front; only the decoder call is inside
/// the timed loop. Afterwards the decoded data is compared with the input and a set of
/// size/compression counters is attached to the benchmark state.
///
/// @param st Google Benchmark state of the current run.
void ransDecodeBenchmark(benchmark::State& st)
{
  using source_type = uint32_t;

  // Rebuild the shared source message only if the requested symbol range changed.
  const size_t max = utils::pow2(st.range(0));
  if (sourceMessage.getMax() != max) {
    sourceMessage = SourceMessageUniform<source_type>{MessageSize, max};
  }
  const auto& inputData = sourceMessage.get();

  EncodeBuffer<source_type> encodeBuffer{inputData.size()};
  DecodeBuffer<source_type> decodeBuffer{inputData.size()};

  // Symbol statistics of the message, renormed for coder construction.
  const auto histogram = makeDenseHistogram::fromSamples(gsl::span<const source_type>(inputData));
  Metrics<source_type> metrics{histogram};
  const auto renormedHistogram = renorm(histogram, metrics, RenormingPolicy::Auto, 10);

  // Untimed setup: encode the message once so that the decoder has something to work on.
  auto encoder = makeDenseEncoder<>::fromRenormed(renormedHistogram);
  encodeBuffer.encodeBufferEnd = encoder.process(inputData.data(), inputData.data() + inputData.size(), encodeBuffer.buffer.data());

  auto decoder = makeDecoder<>::fromRenormed(renormedHistogram);

#ifdef ENABLE_VTUNE_PROFILER
  __itt_resume();
#endif
  // Timed section.
  for (auto _ : st) {
    decoder.process(encodeBuffer.encodeBufferEnd, decodeBuffer.buffer.data(), inputData.size(), encoder.getNStreams());
  }
#ifdef ENABLE_VTUNE_PROFILER
  __itt_pause();
#endif

  // Report an error if the decoded data does not compare equal to the input.
  if (!(decodeBuffer == inputData)) {
    st.SkipWithError("Missmatch between encoded and decoded Message");
  }

  // Throughput figures.
  const auto nIterations = static_cast<int64_t>(st.iterations());
  st.SetItemsProcessed(static_cast<int64_t>(inputData.size()) * nIterations);
  st.SetBytesProcessed(static_cast<int64_t>(inputData.size()) * sizeof(source_type) * nIterations);

  // Values that several counters are derived from.
  using stream_type = typename decltype(encoder)::stream_type;
  const auto& datasetProperties = metrics.getDatasetProperties();
  const double entropy = datasetProperties.entropy;
  const double sourceSize = static_cast<double>(inputData.size() * sizeof(source_type));
  const double compressedSize = static_cast<double>(std::distance(encodeBuffer.buffer.data(), encodeBuffer.encodeBufferEnd) * sizeof(stream_type));
  const double lowerBound = inputData.size() * (entropy / 8);

  st.counters["AlphabetRangeBits"] = datasetProperties.alphabetRangeBits;
  st.counters["nUsedAlphabetSymbols"] = datasetProperties.nUsedAlphabetSymbols;
  st.counters["SymbolTablePrecision"] = renormedHistogram.getRenormingBits();
  st.counters["Entropy"] = entropy;
  st.counters["ExpectedCodewordLength"] = computeExpectedCodewordLength(histogram, renormedHistogram);
  st.counters["SourceSize"] = sourceSize;
  st.counters["CompressedSize"] = compressedSize;
  st.counters["Compression"] = sourceSize / compressedSize;
  st.counters["LowerBound"] = lowerBound;
  st.counters["CompressionWRTEntropy"] = compressedSize / lowerBound;
}


// Register the decode benchmark with arguments 8 to 27 in steps of 1. ransDecodeBenchmark
// passes the argument to utils::pow2 to obtain the maximum value of the generated symbols.
BENCHMARK(ransDecodeBenchmark)->DenseRange(8, 27, 1);


// Google Benchmark macro that supplies the entry point of the benchmark executable.
BENCHMARK_MAIN();

inputData
std::vector< o2::mid::ColumnData > inputData
Definition bench_Clusterizer.cxx:124

MessageSize
constexpr size_t MessageSize
Definition bench_ransDecodeScaling.cxx:40

BENCHMARK_MAIN
BENCHMARK_MAIN()

ransDecodeBenchmark
void ransDecodeBenchmark(benchmark::State &st)
Definition bench_ransDecodeScaling.cxx:69

sourceMessage
SourceMessageUniform< uint32_t > sourceMessage
Definition bench_ransDecodeScaling.cxx:67

BENCHMARK
BENCHMARK(ransDecodeBenchmark) -> DenseRange(8, 27, 1)

st
benchmark::State & st
Definition bench_ransEncodeImpl.cxx:288

source_type
uint32_t source_type
Definition bench_ransPack.cxx:41

stream_type
uint32_t stream_type
Definition bin-encode-decode.cxx:34

SourceMessageUniform
Definition bench_ransDecodeScaling.cxx:44

SourceMessageUniform::get
const auto & get() const
Definition bench_ransDecodeScaling.cxx:59

SourceMessageUniform::SourceMessageUniform
SourceMessageUniform(size_t messageSize, size_t max)
Definition bench_ransDecodeScaling.cxx:46

SourceMessageUniform::getMax
size_t getMax() const
Definition bench_ransDecodeScaling.cxx:60

o2::rans::Metrics
Definition Metrics.h:37

o2::rans::internal::makeEncoder::fromRenormed
static constexpr decltype(auto) fromRenormed(const RenormedHistogramConcept< container_T > &renormed)
Definition factory.h:106

o2::rans::makeDecoder::fromRenormed
static constexpr decltype(auto) fromRenormed(const RenormedDenseHistogram< source_T > &renormed)
Definition factory.h:195

source_T

defines.h
preprocessor defines to enable features based on CPU architecture

factory.h
static factory classes for building histograms, encoders and decoders.

metrics
GLsizei GLenum const void GLuint GLsizei GLfloat * metrics
Definition glcorearb.h:5500

helpers.h
common functionality for rANS benchmarks.

histogram.h
public interface for building and renorming histograms from source data.

o2::rans
Definition compat.h:42

o2::rans::computeExpectedCodewordLength
double_t computeExpectedCodewordLength(const DenseHistogram< source_T > &histogram, const RenormedDenseHistogram< source_T > &rescaledHistogram)
Definition utils.h:33

o2::rans::renorm
decltype(auto) renorm(histogram_T histogram, size_t newPrecision, RenormingPolicy renormingPolicy=RenormingPolicy::Auto, size_t lowProbabilityCutoffBits=0)
Definition renorm.h:203

DecodeBuffer
Definition helpers.h:302

EncodeBuffer
Definition helpers.h:285

o2::rans::makeDenseHistogram::fromSamples
static decltype(auto) fromSamples(source_IT begin, source_IT end, typename std::iterator_traits< source_IT >::value_type min, typename std::iterator_traits< source_IT >::value_type max)
Definition factory.h:144

decodeBuffer
std::string decodeBuffer(int feeId, gsl::span< const std::byte > buffer)
Definition testUserLogicEndpointDecoder.cxx:165

max
constexpr size_t max
Definition test_Algorithm.cxx:49