test_Parallel.cxx
// Copyright 2019-2020 CERN and copyright holders of ALICE O2.
// See https://alice-o2.web.cern.ch/copyright for details of the copyright holders.
// All rights not expressly granted are reserved.
//
// This software is distributed under the terms of the GNU General Public
// License v3 (GPL Version 3), copied verbatim in the file "COPYING".
//
// In applying this license CERN does not waive the privileges and immunities
// granted to it by virtue of its status as an Intergovernmental Organization
// or submit itself to any jurisdiction.

#include "Framework/InputSpec.h"
// Further Framework headers required by the code below (the include block is
// partially elided in the listing):
#include "Framework/DataProcessorSpec.h"
#include "Framework/DataRefUtils.h"
#include "Framework/DataSpecUtils.h"
#include "Framework/ControlService.h"
#include "Framework/ParallelContext.h"
#include "Framework/Logger.h"
#include "Framework/runDataProcessing.h"

#include <boost/algorithm/string.hpp>
#include <cassert>
#include <cstdlib>
#include <cstring>

using namespace o2::framework;

struct FakeCluster {
  float x;
  float y;
  float z;
  float q;
};

size_t parallelSize = 4;
size_t collectionChunkSize = 1000;
// forward declarations of the algorithms defined at the end of the file
void someDataProducerAlgorithm(ProcessingContext& ctx);
void someProcessingStageAlgorithm(ProcessingContext& ctx);
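
// Workflow overview: parallelSize copies of "dataProducer" each publish
// TPC/CLUSTERS under their own subSpec; a matching copy of "processingStage"
// turns each stream into TPC/CLUSTERS_P; "dataSampler" consumes every stream
// and republishes it with an "_S"-suffixed description; "qcTask" inspects the
// sampled copies, while "sink" drains the processed clusters directly.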
std::vector<DataProcessorSpec> defineDataProcessing(ConfigContext const&)
{
  std::vector<DataProcessorSpec> specs;
  auto dataProducers = parallel(
    DataProcessorSpec{
      "dataProducer",
      Inputs{},
      {OutputSpec{"TPC", "CLUSTERS", 0, Lifetime::Timeframe}},
      AlgorithmSpec{
        (AlgorithmSpec::ProcessCallback)someDataProducerAlgorithm}},
    parallelSize,
    [](DataProcessorSpec& spec, size_t index) {
      // give each producer copy its index as output subSpec
      DataSpecUtils::updateMatchingSubspec(spec.outputs[0], index);
    });
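
  // parallel(spec, maxIndex, amendCallback) clones the given DataProcessorSpec
  // maxIndex times, passing each clone and its index to the callback so the
  // copies can be told apart (here: by their subSpecs).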

  auto processingStages = parallel(
    DataProcessorSpec{
      "processingStage",
      Inputs{
        {"dataTPC", "TPC", "CLUSTERS", 0, Lifetime::Timeframe}},
      Outputs{
        {"TPC", "CLUSTERS_P", 0, Lifetime::Timeframe}},
      AlgorithmSpec{
        // CLion says it's ambiguous without the (AlgorithmSpec::ProcessCallback)
        // cast, but cmake compiles fine anyway.
        (AlgorithmSpec::ProcessCallback)someProcessingStageAlgorithm}},
    parallelSize,
    [](DataProcessorSpec& spec, size_t index) {
      // keep input and output subSpecs in step with the producer copies
      DataSpecUtils::updateMatchingSubspec(spec.inputs[0], index);
      DataSpecUtils::updateMatchingSubspec(spec.outputs[0], index);
    });

  auto inputsDataSampler = mergeInputs(
    {"dataTPC", "TPC", "CLUSTERS", 0, Lifetime::Timeframe},
    parallelSize,
    [](InputSpec& input, size_t index) {
      DataSpecUtils::updateMatchingSubspec(input, index);
    });
  auto inputsTpcProc = mergeInputs(
    {"dataTPC-proc", "TPC", "CLUSTERS_P", 0, Lifetime::Timeframe},
    parallelSize,
    [](InputSpec& input, size_t index) {
      DataSpecUtils::updateMatchingSubspec(input, index);
    });
  inputsDataSampler.insert(std::end(inputsDataSampler), std::begin(inputsTpcProc), std::end(inputsTpcProc));
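
  // mergeInputs(spec, maxIndex, amendCallback), used above, expands a single
  // template InputSpec into maxIndex amended copies, letting one device
  // subscribe to every parallel stream at once.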

  auto dataSampler = DataProcessorSpec{
    "dataSampler",
    inputsDataSampler,
    Outputs{
      {"TPC", "CLUSTERS_S"},
      {"TPC", "CLUSTERS_P_S"}},
    AlgorithmSpec{
      [](ProcessingContext& ctx) {
        InputRecord& inputs = ctx.inputs();

        for (auto& input : inputs) {
          const InputSpec* inputSpec = input.spec;
          auto matcher = DataSpecUtils::asConcreteDataMatcher(*inputSpec);
          o2::header::DataDescription outputDescription = matcher.description;

          // todo: better sampled data flagging
          size_t len = strlen(outputDescription.str);
          if (len < outputDescription.size - 2) {
            outputDescription.str[len] = '_';
            outputDescription.str[len + 1] = 'S';
          }

          Output description{
            matcher.origin,
            outputDescription,
            0,
            inputSpec->lifetime};

          LOG(debug) << "DataSampler sends data from subSpec: " << matcher.subSpec;

          const auto* inputHeader = DataRefUtils::getHeader<o2::header::DataHeader*>(input);
          auto& output = ctx.outputs().make<char>(description, inputHeader->size());

          // todo: use some std function or adopt(), when it is available for POD data
          const char* input_ptr = input.payload;
          for (char& it : output) {
            it = *input_ptr++;
          }
        }
      }}};
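
  // The byte-for-byte copy in dataSampler above could also use the standard
  // library; a minimal sketch (needs <algorithm>, and assumes the char
  // collection returned by make<char>() exposes begin(), which the range-for
  // above already relies on):
  //
  //   std::copy_n(input.payload, inputHeader->size(), output.begin());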

  DataProcessorSpec qcTask{
    "qcTask",
    Inputs{
      {"dataTPC-sampled", "TPC", "CLUSTERS_S"},
      {"dataTPC-proc-sampled", "TPC", "CLUSTERS_P_S"}},
    Outputs{},
    AlgorithmSpec{
      [](ProcessingContext& ctx) {
        const FakeCluster* inputDataTpc = reinterpret_cast<const FakeCluster*>(ctx.inputs().get("dataTPC-sampled").payload);
        const InputSpec* inputSpec = ctx.inputs().get("dataTPC-sampled").spec;
        auto matcher = DataSpecUtils::asConcreteDataMatcher(*inputSpec);
        LOG(debug) << "qcTask received data with subSpec: " << matcher.subSpec;
        (void)inputDataTpc; // fetched only to check that the payload arrives
      }}};

  DataProcessorSpec sink{
    "sink",
    mergeInputs(
      {"dataTPC-proc", "TPC", "CLUSTERS_P"},
      parallelSize,
      [](InputSpec& input, size_t index) {
        DataSpecUtils::updateMatchingSubspec(input, index);
      }),
    Outputs{},
    AlgorithmSpec{
      [](ProcessingContext& ctx) {
        const FakeCluster* inputDataTpc = reinterpret_cast<const FakeCluster*>(ctx.inputs().get("dataTPC-proc").payload);
        (void)inputDataTpc; // the sink merely drains the processed clusters
      }}};
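
  // sink gathers all parallelSize processed-cluster streams into a single,
  // non-parallel consumer via the merged input specs.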

  // error in qcTask:
  specs.swap(dataProducers);
  specs.insert(std::end(specs), std::begin(processingStages), std::end(processingStages));
  specs.push_back(sink);
  specs.push_back(dataSampler);
  specs.push_back(qcTask);

  // no error:
  // specs.swap(dataProducers);
  // specs.insert(std::end(specs), std::begin(processingStages), std::end(processingStages));
  // specs.push_back(dataSampler);
  // specs.push_back(qcTask);
  // specs.push_back(sink);
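
  // The two orderings differ only in where sink is pushed relative to
  // dataSampler and qcTask; the first is kept active to reproduce the
  // qcTask error noted above.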

  return specs;
}

void someDataProducerAlgorithm(ProcessingContext& ctx)
{
  size_t index = ctx.services().get<ParallelContext>().index1D();
  // Creates a new message of size collectionChunkSize which
  // has "TPC" as data origin and "CLUSTERS" as data description.
  auto& tpcClusters = ctx.outputs().make<FakeCluster>(
    Output{"TPC", "CLUSTERS", static_cast<o2::header::DataHeader::SubSpecificationType>(index)},
    collectionChunkSize);
  int i = 0;

  for (auto& cluster : tpcClusters) {
    assert(i < collectionChunkSize);
    cluster.x = index;
    cluster.y = i;
    cluster.z = i;
    cluster.q = rand() % 1000;
    i++;
  }
  ctx.services().get<ControlService>().endOfStream();
}
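
// Each producer instance stamps its ParallelContext::index1D() into its output
// subSpec; together with the amend callbacks in defineDataProcessing, this is
// what pairs producer i with processingStage i.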

void someProcessingStageAlgorithm(ProcessingContext& ctx)
{
  size_t index = ctx.services().get<ParallelContext>().index1D();

  const FakeCluster* inputDataTpc = reinterpret_cast<const FakeCluster*>(ctx.inputs().get("dataTPC").payload);

  auto& processedTpcClusters = ctx.outputs().make<FakeCluster>(
    Output{"TPC", "CLUSTERS_P", static_cast<o2::header::DataHeader::SubSpecificationType>(index)},
    collectionChunkSize);

  int i = 0;
  for (auto& cluster : processedTpcClusters) {
    assert(i < collectionChunkSize);
    cluster.x = -inputDataTpc[i].x;
    cluster.y = 2 * inputDataTpc[i].y;
    cluster.z = inputDataTpc[i].z * inputDataTpc[i].q;
    cluster.q = inputDataTpc[i].q;
    i++;
  }
}