Project
Loading...
Searching...
No Matches
WorkflowSpec.cxx
Go to the documentation of this file.
1// Copyright 2019-2020 CERN and copyright holders of ALICE O2.
2// See https://alice-o2.web.cern.ch/copyright for details of the copyright holders.
3// All rights not expressly granted are reserved.
4//
5// This software is distributed under the terms of the GNU General Public
6// License v3 (GPL Version 3), copied verbatim in the file "COPYING".
7//
8// In applying this license CERN does not waive the privileges and immunities
9// granted to it by virtue of its status as an Intergovernmental Organization
10// or submit itself to any jurisdiction.
15
#include <algorithm>
#include <cstddef>
#include <functional>
#include <stdexcept>
#include <string>

20namespace o2::framework
21{
22
24 size_t maxIndex,
25 std::function<void(DataProcessorSpec&, size_t)> amendCallback)
26{
27 WorkflowSpec results;
28 results.reserve(maxIndex);
29 for (size_t i = 0; i < maxIndex; ++i) {
30 results.push_back(original);
31 results.back().name = original.name + "_" + std::to_string(i);
32 results.back().rank = i;
33 results.back().nSlots = maxIndex;
34 amendCallback(results.back(), i);
35 }
36 return results;
37}
38
40 size_t maxIndex,
41 std::function<void(DataProcessorSpec&, size_t)> amendCallback)
42{
43 WorkflowSpec results;
44 results.reserve(specs.size() * maxIndex);
45 for (auto& spec : specs) {
46 auto result = parallel(spec, maxIndex, amendCallback);
47 results.insert(results.end(), result.begin(), result.end());
48 }
49
50 return results;
51}
52
54 size_t nPipelines,
55 std::function<size_t()> getNumberOfSubspecs,
56 std::function<size_t(size_t)> getSubSpec)
57{
59 size_t numberOfSubspecs = getNumberOfSubspecs();
60 if (numberOfSubspecs < nPipelines) {
61 // no need to create more pipelines than the number of parallel Ids, in that case
62 // each pipeline serves one id
63 nPipelines = numberOfSubspecs;
64 }
65 for (auto process : specs) {
66 size_t channels = numberOfSubspecs;
67 size_t inputMultiplicity = numberOfSubspecs / nPipelines;
68 if (numberOfSubspecs % nPipelines) {
69 // some processes will get one more channel to handle all channels
70 inputMultiplicity += 1;
71 }
72 auto amendProcess = [numberOfSubspecs, nPipelines, &channels, &inputMultiplicity, getSubSpec](DataProcessorSpec& spec, size_t pipeline) {
73 auto inputs = std::move(spec.inputs);
74 auto outputs = std::move(spec.outputs);
75 spec.inputs.reserve(inputMultiplicity);
76 spec.outputs.reserve(inputMultiplicity);
77 for (size_t inputNo = 0; inputNo < inputMultiplicity; ++inputNo) {
78 for (auto& input : inputs) {
79 spec.inputs.push_back(input);
80 spec.inputs.back().binding += std::to_string(inputNo);
81 DataSpecUtils::updateMatchingSubspec(spec.inputs.back(), getSubSpec(pipeline + inputNo * nPipelines));
82 }
83 for (auto& output : outputs) {
84 spec.outputs.push_back(output);
85 spec.outputs.back().binding.value += std::to_string(inputNo);
86 // FIXME: this will be unneeded once we have a subSpec-less variant...
87 DataSpecUtils::updateMatchingSubspec(spec.outputs.back(), getSubSpec(pipeline + inputNo * nPipelines));
88 }
89 }
90 channels -= inputMultiplicity;
91 if (inputMultiplicity > numberOfSubspecs / nPipelines &&
92 (channels % (nPipelines - (pipeline + 1))) == 0) {
93 // if the remaining ids can be distributed equally among the remaining pipelines
94 // we can decrease multiplicity
95 inputMultiplicity = numberOfSubspecs / nPipelines;
96 }
97 };
98
99 if (nPipelines > 1) {
100 // add multiple processes and distribute inputs among them
101 auto amendedProcessors = parallel(process, nPipelines, amendProcess);
102 result.insert(result.end(), amendedProcessors.begin(), amendedProcessors.end());
103 } else if (nPipelines == 1) {
104 // add one single process with all the inputs
105 amendProcess(process, 0);
106 result.push_back(process);
107 }
108 }
109 return result;
110}
111
113 size_t maxIndex,
114 std::function<void(InputSpec&, size_t)> amendCallback)
115{
116 Inputs results;
117 results.reserve(maxIndex);
118 for (size_t i = 0; i < maxIndex; ++i) {
119 results.push_back(original);
120 amendCallback(results.back(), i);
121 }
122 return results;
123}
124
126 size_t maxIndex,
127 std::function<void(InputSpec&, size_t)> amendCallback)
128{
129 Inputs results;
130 results.reserve(inputs.size() * maxIndex);
131 for (size_t i = 0; i < maxIndex; ++i) {
132 for (auto const& original : inputs) {
133 results.push_back(original);
134 amendCallback(results.back(), i);
135 }
136 }
137 return results;
138}
139
141 size_t count)
142{
143 if (original.maxInputTimeslices != 1) {
144 std::runtime_error("You can time slice only once");
145 }
146 original.maxInputTimeslices = count;
147 return original;
148}
149
152std::vector<InputSpec> select(const char* matcher)
153{
154 return DataDescriptorQueryBuilder::parse(matcher);
155}
156
157namespace workflow
158{
159WorkflowSpec combine(char const* name, std::vector<DataProcessorSpec> const& specs, bool doIt)
160{
161 if (!doIt) {
162 return specs;
163 }
164
165 DataProcessorSpec combined;
166 combined.name = name;
167 // add all the inputs to combined
168 for (auto& spec : specs) {
169 for (auto& input : spec.inputs) {
170 combined.inputs.push_back(input);
171 }
172 for (auto& output : spec.outputs) {
173 combined.outputs.push_back(output);
174 }
175 for (auto& option : spec.options) {
176 combined.options.push_back(option);
177 }
178 for (auto& label : spec.labels) {
179 combined.labels.push_back(label);
180 }
181 for (auto& metadatum : spec.metadata) {
182 combined.metadata.push_back(metadatum);
183 }
184 for (auto& service : spec.requiredServices) {
185 // Insert in the final list of services
186 // only if a spec with the same name is not there
187 // already.
188 bool found = false;
189 for (auto& existing : combined.requiredServices) {
190 if (existing.name == service.name) {
191 found = true;
192 break;
193 }
194 }
195 if (!found) {
196 combined.requiredServices.push_back(service);
197 }
198 }
199 }
200
201 combined.algorithm = AlgorithmSpec{[specs](InitContext& ctx) {
202 std::vector<AlgorithmSpec::ProcessCallback> callbacks;
203 for (auto& spec : specs) {
204 if (spec.algorithm.onInit) {
205 callbacks.push_back(spec.algorithm.onInit(ctx));
206 } else if (spec.algorithm.onProcess) {
207 callbacks.push_back(spec.algorithm.onProcess);
208 }
209 }
210 return [callbacks](ProcessingContext& context) {
211 for (auto& callback : callbacks) {
212 callback(context);
213 }
214 };
215 }};
216 return {combined};
217}
218} // namespace workflow
219
220} // namespace o2::framework
int32_t i
void output(const std::map< std::string, ChannelStat > &channels)
Definition rawdump.cxx:197
GLint GLsizei count
Definition glcorearb.h:399
GLuint64EXT * result
Definition glcorearb.h:5662
GLuint const GLchar * name
Definition glcorearb.h:781
GLuint GLsizei const GLchar * label
Definition glcorearb.h:2519
WorkflowSpec combine(const char *name, std::vector< DataProcessorSpec > const &specs, bool doIt)
Defining PrimaryVertex explicitly as messageable.
Definition TFIDInfo.h:20
WorkflowSpec parallelPipeline(const WorkflowSpec &specs, size_t nPipelines, std::function< size_t()> getNumberOfSubspecs, std::function< size_t(size_t)> getSubSpec)
WorkflowSpec parallel(DataProcessorSpec original, size_t maxIndex, std::function< void(DataProcessorSpec &, size_t id)> amendCallback)
Inputs mergeInputs(InputSpec original, size_t maxIndex, std::function< void(InputSpec &, size_t)> amendCallback)
std::vector< DataProcessorSpec > WorkflowSpec
DataProcessorSpec timePipeline(DataProcessorSpec original, size_t count)
std::vector< InputSpec > select(char const *matcher="")
std::vector< InputSpec > Inputs
std::string to_string(gsl::span< T, Size > span)
Definition common.h:52
static std::vector< InputSpec > parse(const char *s="")
std::vector< DataProcessorMetadata > metadata
std::vector< ServiceSpec > requiredServices
std::vector< DataProcessorLabel > labels
static void updateMatchingSubspec(InputSpec &in, header::DataHeader::SubSpecificationType subSpec)
size_t nPipelines
std::vector< ChannelData > channels