// Per-route bookkeeping, held in function-local statics so the storage is reused between calls.
242 static std::vector<bool> present;
243 static std::vector<bool> ignored;
244 static std::vector<size_t> dataSizes;
245 static std::vector<bool> showSize;
// Give every vector one slot per route. resize() only initialises the slots it adds;
// any reset of already-existing slots is not visible in this excerpt.
247 present.resize(routes.size(),
false);
249 ignored.resize(routes.size(),
false);
251 dataSizes.resize(routes.size(), 0);
253 showSize.resize(routes.size(),
false);
// Indices of routes that end up neither present nor ignored; emptied at the start of every call.
255 static std::vector<size_t> unmatchedDescriptions;
256 unmatchedDescriptions.clear();
// Counter that the alarm message further down reports as the expected number of data specs.
262 size_t expectedDataSpecs = 0;
263 for (
size_t pi = 0; pi < present.size(); ++pi) {
264 auto& spec = routes[pi].matcher;
269 if (routes[pi].timeslice == 0) {
274 size_t foundDataSpecs = 0;
275 bool skipAsAllFound =
false;
// Visit the message parts two at a time; msgidx addresses the part the headers are read from.
276 for (
int msgidx = 0; msgidx < parts.Size(); msgidx += 2) {
277 bool allFound =
true;
// Look up the DataHeader and the SourceInfoHeader in this part's buffer.
// NOTE(review): parts.At(msgidx) is dereferenced here, before the nullptr test on the same
// part a few lines below — confirm the ordering; the test looks like it should come first.
279 const auto dh = o2::header::get<DataHeader*>(parts.At(msgidx)->GetData());
280 auto const sih = o2::header::get<SourceInfoHeader*>(parts.At(msgidx)->GetData());
281 if (sih !=
nullptr) {
285 if (parts.At(msgidx).get() ==
nullptr) {
286 LOG(error) <<
"unexpected nullptr found. Skipping message pair.";
290 LOG(error) <<
"data on input " << msgidx <<
" does not follow the O2 data model, DataHeader missing";
// firstDH is tested for being unset; the assignment itself is outside this excerpt
// (presumably it records the first DataHeader seen — TODO confirm).
296 if (firstDH ==
nullptr) {
// True when size printing is enabled and tfCounter is not a multiple of doPrintSizes.
298 if (doPrintSizes && firstDH->
tfCounter % doPrintSizes != 0) {
// The DataProcessingHeader is fetched only once, from the first message that reaches this point.
// NOTE(review): dph is dereferenced right below with no nullptr check visible in this excerpt.
303 if (dph ==
nullptr) {
304 dph = o2::header::get<DataProcessingHeader*>(parts.At(msgidx)->GetData());
// Compare each route's timeslice with startTime modulo that route's maxTimeslices;
// what happens on a mismatch is outside this excerpt.
305 for (
size_t pi = 0; pi < present.size(); ++pi) {
306 if (routes[pi].timeslice != (dph->
startTime % routes[pi].maxTimeslices)) {
// Try to match the current DataHeader against every route.
311 for (
size_t pi = 0; pi < present.size(); ++pi) {
// Routes already marked present or ignored are only of interest when sizes are printed.
312 if ((present[pi] || ignored[pi]) && !doPrintSizes) {
316 if (routes[pi].timeslice != (dph->
startTime % routes[pi].maxTimeslices)) {
321 auto& spec = routes[pi].matcher;
// Query built from origin, description and sub-specification of the incoming header.
322 OutputSpec query{dh->dataOrigin, dh->dataDescription, dh->subSpecification};
324 if (!present[pi] && !ignored[pi]) {
// Accumulate payload sizes for the route selected by addToSize (a negative value means none).
334 if (addToSize >= 0) {
// Step 1 when splitPayloadParts > 0 and equals splitPayloadIndex, otherwise step 2
// (presumably one header followed by several payloads vs. header/payload pairs — TODO confirm).
335 int increment = (dh->splitPayloadParts > 0 && dh->splitPayloadParts == dh->splitPayloadIndex) ? 1 : 2;
336 for (
int msgidx2 = msgidx + 1; msgidx2 < msgidxLast; msgidx2 += increment) {
337 dataSizes[addToSize] += parts.At(msgidx2)->GetSize();
// Position msgidx so that the loop's own += 2 continues at msgidxLast.
341 msgidx = msgidxLast - 2;
342 if (allFound && !doPrintSizes) {
343 skipAsAllFound =
true;
// Final pass over the routes: anything neither present nor ignored is recorded as unmatched.
349 for (
size_t pi = 0; pi < present.size(); ++pi) {
350 if (present[pi] && !ignored[pi]) {
353 if (!present[pi] && !ignored[pi]) {
355 unmatchedDescriptions.push_back(pi);
// 0 for an empty timeframe, -1 when at least one route is unmatched, 1 otherwise.
// The cast to void marks the value as intentionally unused here.
358 int timeframeCompleteness = emptyTf ? 0 : (unmatchedDescriptions.size() ? -1 : 1);
359 (
void)timeframeCompleteness;
// Condition for the case where skipAsAllFound was set in the matching loop and no size report
// is wanted; the action taken is outside this excerpt.
361 if (skipAsAllFound && !doPrintSizes) {
// Size report: requires a first DataHeader and size printing to be enabled.
365 if (firstDH && doPrintSizes) {
366 std::string
sizes =
"";
367 size_t totalSize = 0;
// Sum the per-route payload sizes gathered in dataSizes.
368 for (
size_t pi = 0; pi < present.size(); ++pi) {
370 totalSize += dataSizes[pi];
371 auto& spec = routes[pi].matcher;
// One log line per report: tfCounter, the per-spec size text and the digit-grouped total.
375 LOGP(important,
"RAW {} size report:{}- Total:{}", firstDH->
tfCounter,
sizes, fmt::group_digits(totalSize));
// Injection of placeholder messages for unmatched routes. Everything below is conditional on
// doInjectMissingData; the statement guarded by this test is outside this excerpt.
378 if (!doInjectMissingData) {
382 if (unmatchedDescriptions.size() > 0) {
385 LOG(error) <<
"Received an EndOfStream message together with data. This should not happen.";
387 LOG(detail) <<
"This is an End Of Stream message. Not injecting anything.";
// A DataHeader and a DataProcessingHeader from the received data are both required;
// each missing one is reported as an error.
390 if (firstDH ==
nullptr) {
391 LOG(error) <<
"Input proxy received incomplete data without any data header. This should not happen! Cannot inject missing data as requsted.";
394 if (dph ==
nullptr) {
// Fixed wording: the original text said "This should happen!", contradicting the error level
// and the parallel DataHeader message above.
395 LOG(error) <<
"Input proxy received incomplete data without any data processing header. This should not happen! Cannot inject missing data as requsted.";
398 std::string missing =
"";
399 bool showAlarm =
false;
// Append one header/payload pair to parts for every unmatched route.
400 for (
auto mi : unmatchedDescriptions) {
401 auto& spec = routes[mi].matcher;
// Routes without a sub-specification get the 0xDEADBEEF marker. The value is assigned to the
// optional itself: writing through *subSpec while it holds no value is undefined behaviour
// and would leave the optional disengaged for the read below.
407 if (subSpec == std::nullopt) {
408 subSpec = 0xDEADBEEF;
413 dh.subSpecification = *subSpec;
// The injected header is marked as not being part of a split payload.
415 dh.splitPayloadParts = 0;
416 dh.splitPayloadIndex = 0;
// The message is created for the channel this route points to, using that channel's transport.
419 auto& channelName = routes[mi].channel;
420 auto& channelInfo = device.GetChannel(channelName);
421 auto channelAlloc = o2::pmr::getTransportAllocator(channelInfo.Transport());
423 parts.AddPart(std::move(headerMessage));
// Second part of the pair (presumably an empty payload — TODO confirm NewMessageFor arguments).
425 parts.AddPart(device.NewMessageFor(channelName, 0, 0));
// Rate limiting: the alarm is raised for the first maxWarn occurrences only; the counters are
// function-local statics and therefore persist across calls.
430 static int maxWarn = 10;
431 static int contDeadBeef = 0;
432 if (showAlarm && ++contDeadBeef <= maxWarn) {
433 LOGP(alarm,
"Found {}/{} data specs, missing data specs: {}, injecting 0xDEADBEEF{}", foundDataSpecs, expectedDataSpecs, missing, contDeadBeef == maxWarn ?
" - disabling alarm now to stop flooding the log" :
"");
// Collects the descriptions of data specs that were dropped, all in one string
// (each entry is appended on its own line), and can log them as a single warning.
442 class DroppedDataSpecs
445 DroppedDataSpecs() =
default;
// Returns true when desc occurs anywhere in the accumulated text.
// NOTE(review): this is a substring search, so a description that is a substring of an
// already stored one is also reported as found — confirm this is acceptable.
451 [[nodiscard]]
bool find(std::string
const& desc)
const
453 return descriptions.find(desc) != std::string::npos;
// Appends desc to the accumulated text, preceded by a newline and a space.
456 void add(std::string
const& desc)
458 descriptions +=
"\n " + desc;
// Emits the warning only when at least one description has been recorded.
463 if (not descriptions.empty()) {
464 LOG(warning) <<
"Some input data could not be matched by filter rules to output specs\n"
465 <<
"Active rules: " << descriptions <<
"\n"
466 <<
"DROPPING OF THESE MESSAGES HAS BEEN ENABLED BY CONFIGURATION";
// Accumulated descriptions, one per line.
471 std::string descriptions;
// Returns the converter callback. It owns the filter specs (moved in), a copy of the
// throwOnUnmatchedInputs flag, and a shared DroppedDataSpecs instance created here.
474 return [filterSpecs = std::move(filterSpecs), throwOnUnmatchedInputs, droppedDataSpecs = std::make_shared<DroppedDataSpecs>()](
TimingInfo& timingInfo,
ServiceRegistryRef const& services, fair::mq::Parts& parts,
ChannelRetriever channelRetriever,
size_t newTimesliceId,
bool& stop) {
// Parts collected per output channel name, and descriptions of inputs no rule matched.
476 std::unordered_map<std::string, fair::mq::Parts> outputs;
477 std::vector<std::string> unmatchedDescriptions;
// Evaluated once: true when the environment variable DPL_RAWPROXY_OVERRIDE_ORBITRESET is set
// (the pointer returned by getenv is converted to bool).
480 static bool override_creation_env = getenv(
"DPL_RAWPROXY_OVERRIDE_ORBITRESET");
481 bool override_creation =
false;
482 uint64_t creationVal = 0;
483 if (override_creation_env) {
// Parsed once and cached; std::stoul throws if the variable does not hold a number.
484 static uint64_t creationValBase = std::stoul(getenv(
"DPL_RAWPROXY_OVERRIDE_ORBITRESET"));
485 creationVal = creationValBase;
486 override_creation =
true;
// Alternative source: the "orbit-reset-time" device property (default is a CCDB URL).
488 auto orbitResetTimeUrl = device->fConfig->GetProperty<std::string>(
"orbit-reset-time",
"ccdb://CTP/Calib/OrbitResetTime");
// The property overrides the creation time only if the whole string parses as a
// non-zero decimal number (err points at the terminating NUL).
490 creationVal = std::strtoll(orbitResetTimeUrl.c_str(), &err, 10);
491 if (err && *err == 0 && creationVal) {
492 override_creation =
true;
// Run number from the "runNumber" device property; atoi yields 0 for a non-numeric or empty string.
496 int fmqRunNumber = -1;
498 fmqRunNumber = atoi(device->fConfig->GetProperty<std::string>(
"runNumber",
"").c_str());
// Walk the incoming parts two at a time; msgidx addresses the part the headers are read from.
502 for (
int msgidx = 0; msgidx < parts.Size(); msgidx += 2) {
// The part is tested for nullptr before anything is read from it.
503 if (parts.At(msgidx).get() ==
nullptr) {
504 LOG(error) <<
"unexpected nullptr found. Skipping message pair.";
507 const auto dh = o2::header::get<DataHeader*>(parts.At(msgidx)->GetData());
509 LOG(error) <<
"data on input " << msgidx <<
" does not follow the O2 data model, DataHeader missing";
515 auto dph = o2::header::get<DataProcessingHeader*>(parts.At(msgidx)->GetData());
517 LOG(error) <<
"data on input " << msgidx <<
" does not follow the O2 data model, DataProcessingHeader missing";
// Branch on the creation-time override determined earlier; its body is outside this excerpt.
521 if (override_creation) {
// Copy timing information from the two headers into the TimingInfo passed by the caller.
525 timingInfo.creation = dph->creation;
526 timingInfo.firstTForbit = dh->firstTForbit;
527 timingInfo.runNumber = dh->runNumber;
528 timingInfo.tfCounter = dh->tfCounter;
// NOTE(review): the log statements below read parts.At(msgidx + 1); no check that this index
// is within parts.Size() is visible in this excerpt.
529 LOG(
debug) << msgidx <<
": " <<
DataSpecUtils::describe(
OutputSpec{dh->dataOrigin, dh->dataDescription, dh->subSpecification}) <<
" part " << dh->splitPayloadIndex <<
" of " << dh->splitPayloadParts <<
" payload " << parts.At(msgidx + 1)->GetSize();
// Report headers with a zero run number or tfCounter, or a run number that differs from the
// one configured on the device (only when that one is positive).
530 if (dh->runNumber == 0 || dh->tfCounter == 0 || (fmqRunNumber > 0 && fmqRunNumber != dh->runNumber)) {
531 LOG(error) <<
"INVALID runNumber / tfCounter: runNumber " << dh->runNumber
532 <<
", tfCounter " << dh->tfCounter <<
", FMQ runNumber " << fmqRunNumber
533 <<
" for msgidx " << msgidx <<
": " <<
DataSpecUtils::describe(
OutputSpec{dh->dataOrigin, dh->dataDescription, dh->subSpecification}) <<
" part " << dh->splitPayloadIndex <<
" of " << dh->splitPayloadParts <<
" payload " << parts.At(msgidx + 1)->GetSize();
// Query used to match this message against the filter specs and to pick the output channel.
536 OutputSpec query{dh->dataOrigin, dh->dataDescription, dh->subSpecification};
537 LOG(
debug) <<
"processing " <<
DataSpecUtils::describe(
OutputSpec{dh->dataOrigin, dh->dataDescription, dh->subSpecification}) <<
" time slice " << dph->startTime <<
" part " << dh->splitPayloadIndex <<
" of " << dh->splitPayloadParts;
538 int finalBlockIndex = 0;
539 std::string channelName =
"";
541 for (
auto const& spec : filterSpecs) {
// The channel is resolved from the query and the message's start time.
545 channelName = channelRetriever(query, dph->startTime);
// Guard against a block end index that lies beyond the available parts.
554 if (finalBlockIndex > parts.Size()) {
560 if (!channelName.empty()) {
574 LOGP(
debug,
"associating {} part(s) at index {} to channel {} ({})", finalBlockIndex - msgidx, msgidx, channelName, outputs[channelName].
Size());
// Move all parts of this block into the per-channel output container.
575 for (; msgidx < finalBlockIndex; ++msgidx) {
576 outputs[channelName].AddPart(std::move(parts.At(msgidx)));
// Position msgidx so that the outer loop's += 2 continues at finalBlockIndex.
580 msgidx = finalBlockIndex - 2;
// Send what was collected, channel by channel; channels with no parts are tested for separately.
587 bool didSendParts =
false;
588 for (
auto& [channelName, channelParts] : outputs) {
589 if (channelParts.Size() == 0) {
593 sendOnChannel(*device, channelParts, channelName, newTimesliceId);
// Inputs that no filter rule matched either raise an exception or are recorded as dropped,
// depending on throwOnUnmatchedInputs.
595 if (not unmatchedDescriptions.empty()) {
596 if (throwOnUnmatchedInputs) {
// Build the list of unmatched descriptions, one per line, for the exception text.
597 std::string descriptions;
598 for (
auto const& desc : unmatchedDescriptions) {
599 descriptions +=
"\n " + desc;
601 throw std::runtime_error(
"No matching filter rule for input data " + descriptions +
602 "\n Add appropriate matcher(s) to dataspec definition or allow to drop unmatched data");
// Dropping path: descriptions not yet known to droppedDataSpecs are added to it.
604 bool changed =
false;
605 for (
auto const& desc : unmatchedDescriptions) {
606 if (not droppedDataSpecs->find(desc)) {
608 droppedDataSpecs->add(desc);
613 droppedDataSpecs->warning();
// Fragment of the proxy factory's parameter list (the start of the signature is outside this excerpt).
654 std::vector<OutputSpec>
const& outputs,
655 char const* defaultChannelConfig,
659 bool doInjectMissingData,
660 unsigned int doPrintSizes)
// Function-local statics shared by the callbacks defined below. The two counter vectors are
// constructed from channels.size() while channels is still empty, so they start empty as well
// and are sized later, once the channel list has been filled.
666 static std::vector<std::string>
channels;
667 static std::vector<int> numberOfEoS(
channels.size(), 0);
668 static std::vector<int> eosPeersCount(
channels.size(), 0);
// Copy of the output channel list from the device spec.
676 auto outputChannels = ctx.services().get<
RawDeviceService>().spec().outputChannels;
// Callback that rebuilds the channel bookkeeping from the device's current channels.
685 auto channelConfigurationChecker = [device, deviceName, services = ctx.services()]() {
689 eosPeersCount.clear();
690 for (
auto& [channelName, _] : services.get<
RawDeviceService>().device()->GetChannels()) {
// True when the channel name starts with the device name (prefix comparison).
692 if (strncmp(channelName.c_str(), deviceName.c_str(), deviceName.size()) == 0) {
697 LOGP(detail,
"Injecting channel '{}' into DPL configuration", channel);
// Sub-channel 0 of the named channel is what gets registered.
699 auto& channelPtr = services.get<
RawDeviceService>().device()->GetChannel(channel, 0);
702 .hasPendingEvents =
false,
704 .channel = &channelPtr,
// Resize both EoS counters to one entry per channel; entries added by resize start at 0.
709 numberOfEoS.resize(
channels.size(), 0);
710 eosPeersCount.resize(
channels.size(), 0);
// State-change handling used for draining input while the device is in Ready after having run.
// wasRunning is a function-local static, so it persists between invocations.
718 static bool wasRunning =
false;
719 if (fair::mq::State{
state} == fair::mq::State::Running) {
// Anything other than "Ready after having been Running" is tested for here; the action is
// outside this excerpt.
722 if (fair::mq::State{
state} != fair::mq::State::Ready || !wasRunning) {
725 uv_update_time(deviceState.loop);
// Snapshot of the cleanup counter, compared again below to detect a change.
730 int64_t cleanupCount = deviceState.cleanupCount.load();
// Keep draining only while no state change is pending and the cleanup counter is unchanged.
735 doDrain = device->NewStatePending() ==
false && deviceState.cleanupCount == cleanupCount;
736 fair::mq::Parts parts;
// Receive from every input channel with a timeout argument of 10; the received parts are
// not used further in the visible code.
737 for (
size_t ci = 0; ci < deviceState.inputChannelInfos.size(); ++ci) {
738 auto& info = deviceState.inputChannelInfos[ci];
743 info.channel->Receive(parts, 10);
// Run one non-blocking iteration of the libuv loop.
746 uv_run(deviceState.loop, UV_RUN_NOWAIT);
// The channel checker runs on Start; the drain handler is registered only when the
// "ready-state-policy" option equals "drain".
750 ctx.services().get<
CallbackService>().set<CallbackService::Id::Start>(channelConfigurationChecker);
751 if (ctx.options().get<std::string>(
"ready-state-policy") ==
"drain") {
752 LOG(info) <<
"Drain mode requested while in Ready state";
753 ctx.services().get<
CallbackService>().set<CallbackService::Id::DeviceStateChanged>(drainMessages);
// Helper returning an int computed from the given parts. It inspects every second part
// (index msgidx * 2) and looks for a SourceInfoHeader in it; the counting logic itself is
// outside this excerpt.
756 static auto countEoS = [](fair::mq::Parts& inputs) ->
int {
758 for (
int msgidx = 0; msgidx < inputs.Size() / 2; ++msgidx) {
// The part is tested for nullptr before it is dereferenced.
761 if (inputs.At(msgidx * 2).get() ==
nullptr) {
764 auto const sih = o2::header::get<SourceInfoHeader*>(inputs.At(msgidx * 2)->GetData());
// Handler for one set of received parts: end-of-stream accounting, optional injection of
// missing data, conversion, and end-of-stream forwarding.
773 auto dataHandler = [converter, doInjectMissingData, doPrintSizes,
774 outputRoutes = std::move(outputRoutes),
// Channel lookup: the first route whose matcher matches the query and whose timeslice equals
// timeslice modulo maxTimeslices determines the channel.
782 static std::string emptyChannel =
"";
783 for (
auto& route : outputRoutes) {
785 if (
DataSpecUtils::match(route.matcher, query) && ((timeslice % route.maxTimeslices) == route.timeslice)) {
786 return route.channel;
792 std::string
const& channel =
channels[ci];
// Number of end-of-stream markers found in this set of parts.
794 int nEos = countEoS(inputs);
// Both counters are zeroed here; the condition guarding this reset is outside this excerpt.
796 std::fill(numberOfEoS.begin(), numberOfEoS.end(), 0);
797 std::fill(eosPeersCount.begin(), eosPeersCount.end(), 0);
// Once a channel has seen an EoS, remember the largest number of connected peers observed for it.
799 numberOfEoS[ci] += nEos;
800 if (numberOfEoS[ci]) {
801 eosPeersCount[ci] = std::max<int>(eosPeersCount[ci], device->GetNumberOfConnectedPeers(channel));
804 bool shouldstop =
false;
805 if (doInjectMissingData) {
806 injectMissingData(*device, inputs, outputRoutes, doInjectMissingData, doPrintSizes);
// The converter receives shouldstop by reference and may set it.
808 bool didSendParts = converter(timingInfo,
ref, inputs, channelRetriever, timesliceIndex->getOldestPossibleOutput().timeslice.value, shouldstop);
// Decide whether every channel has delivered its end-of-stream: a channel with fewer EoS
// than connected peers is tested for in the loop below.
816 bool everyEoS = shouldstop;
817 if (!shouldstop && nEos) {
819 for (
unsigned int i = 0;
i < numberOfEoS.size();
i++) {
820 if (numberOfEoS[
i] < eosPeersCount[
i]) {
828 LOG(info) <<
"Received (on channel " << ci <<
") " << numberOfEoS[ci] <<
" end-of-stream from " << eosPeersCount[ci] <<
" peers, forwarding end-of-stream (shouldstop " << (
int)shouldstop <<
", nEos " << nEos <<
", newRun " << (
int)newRun <<
")";
830 for (
auto& info : deviceState->inputChannelInfos) {
// Reset the counters, then signal end-of-stream through the control service.
833 std::fill(numberOfEoS.begin(), numberOfEoS.end(), 0);
834 std::fill(eosPeersCount.begin(), eosPeersCount.end(), 0);
835 control->endOfStream();
// Receive loop state. -1 converts to the largest size_t value and is used as the
// "no run number seen yet" sentinel in the comparisons below.
842 static size_t currentRunNumber = -1;
843 static bool inStopTransition =
false;
// The rate limit is read from the "timeframes-rate-limit" configuration value on every call.
846 if (limiter.
check(ctx, std::stoi(device->fConfig->GetValue<std::string>(
"timeframes-rate-limit")), minSHM)) {
847 inStopTransition =
true;
850 bool didSendParts =
false;
// Poll every configured channel in turn.
851 for (
size_t ci = 0; ci <
channels.size(); ++ci) {
852 std::string
const& channel =
channels[ci];
// With a single channel the wait time is -1, otherwise 1
// (presumably -1 blocks until data arrives — TODO confirm against FairMQ Receive).
853 int waitTime =
channels.size() == 1 ? -1 : 1;
// At most maxRead receive attempts per channel and call.
855 while (maxRead-- > 0) {
856 fair::mq::Parts parts;
857 auto res = device->Receive(parts, channel, 0, waitTime);
858 if (
res == (
size_t)fair::mq::TransferCode::error) {
859 LOGP(error,
"Error while receiving on channel {}", channel);
862 unsigned int nReceived = parts.Size();
863 if (nReceived != 0) {
// NOTE(review): dh is dereferenced below with no nullptr check visible in this excerpt,
// whereas dph is checked before use — confirm the first part always carries a DataHeader.
864 auto const dh = o2::header::get<DataHeader*>(parts.At(0)->GetData());
865 auto& timingInfo = ctx.services().get<
TimingInfo>();
// A non-zero run number that differs from the current one ends the stop transition.
867 if (currentRunNumber != -1 && dh->runNumber != 0 && dh->runNumber != currentRunNumber) {
869 inStopTransition =
false;
871 if (currentRunNumber == -1 || dh->runNumber != 0) {
// Timing information is taken from the headers of the first part.
874 timingInfo.runNumber = dh->runNumber;
875 timingInfo.firstTForbit = dh->firstTForbit;
876 timingInfo.tfCounter = dh->tfCounter;
878 auto const dph = o2::header::get<DataProcessingHeader*>(parts.At(0)->GetData());
879 if (dph !=
nullptr) {
880 timingInfo.timeslice = dph->startTime;
881 timingInfo.creation = dph->creation;
// Received data is handed to the data handler only outside a stop transition.
883 if (!inStopTransition) {
884 didSendParts |= dataHandler(ctx.services(), timingInfo, parts, 0, ci, newRun);
// Publish the tfCounter as the "df-sent" metric, tagged with the DPL subsystem.
887 ctx.services().get<o2::monitoring::Monitoring>().send(o2::monitoring::Metric{(uint64_t)timingInfo.tfCounter,
"df-sent"}.addTag(o2::monitoring::tags::Key::Subsystem, o2::monitoring::tags::Value::DPL));
// Tested when nothing was received or only one channel exists; the action is outside this excerpt.
890 if (nReceived == 0 ||
channels.size() == 1) {
903 decongestion.nextEnumerationTimeslice -= 1;
// Build the default channel configuration string: when defaultChannelConfig contains no
// "name=" entry, "name=<name>," is put in front of it. strdup makes a heap copy so the
// pointer stays valid after the temporary std::string is destroyed.
// NOTE(review): no matching free() is visible in this excerpt — confirm the copy is meant to
// live for the rest of the process.
909 const char* d = strdup(((std::string(defaultChannelConfig).find(
"name=") == std::string::npos ? (std::string(
"name=") +
name +
",") :
"") + std::string(defaultChannelConfig)).c_str());
// Fragment of the output proxy factory (the start of the signature is outside this excerpt).
924 const char* defaultChannelConfig)
// The output channel name is extracted from the "channel-config" option: the regex captures
// the text following "name=" up to the next comma.
935 auto channelConfig = options.
get<std::string>(
"channel-config");
936 std::regex
r{R
"(name=([^,]*))"};
// Collect capture group 1 of every match.
937 std::vector<std::string> values{std::sregex_token_iterator{std::begin(channelConfig), std::end(channelConfig), r, 1},
938 std::sregex_token_iterator{}};
940 throw std::runtime_error(
"failed to extract channel name from channel configuration parameter '" + channelConfig +
"'");
// The first extracted name is used as the output channel.
942 std::string outputChannelName =
values[0];
944 auto* device = rds.
device();
// Callback that verifies the device actually has a channel with the extracted name and
// throws otherwise.
948 auto channelConfigurationChecker = [inputSpecs = std::move(inputSpecs), device, outputChannelName]() {
949 LOG(info) <<
"checking channel configuration";
950 if (device->GetChannels().count(outputChannelName) == 0) {
951 throw std::runtime_error(
"no corresponding output channel found for input '" + outputChannelName +
"'");
// Shared header object, constructed with (0, 0) and updated as data is processed, so that
// the end-of-stream callback can read the most recent timing values.
955 auto lastDataProcessingHeader = std::make_shared<DataProcessingHeader>(0, 0);
// The device spec is received as const; constness is cast away so forwarding routes can be added.
// NOTE(review): this is only well-defined if the referenced DeviceSpec object is not itself const.
957 auto& spec =
const_cast<DeviceSpec&
>(deviceSpec);
// One forwarding route per input spec, all pointing at the single output channel.
959 for (
auto const& inputSpec : inputSpecs) {
965 .matcher = inputSpec,
966 .channel = outputChannelName,
968 spec.forwards.emplace_back(route);
// End-of-stream callback: iterates over the device's channels, compares each name with the
// output channel name, and appends a header part followed by a second part to the outgoing
// message (the send itself is outside this excerpt).
971 auto forwardEos = [device, lastDataProcessingHeader, outputChannelName](
EndOfStreamContext&) {
975 for (
auto& channelInfo : device->GetChannels()) {
976 auto& channelName = channelInfo.first;
977 if (channelName != outputChannelName) {
// The allocator comes from the transport of the channel's first sub-channel.
991 auto channelAlloc = o2::pmr::getTransportAllocator(channelInfo.second[0].Transport());
994 out.AddPart(std::move(headerMessage));
996 out.AddPart(device->NewMessageFor(channelName, 0, 0));
// Visit every part of every input and copy the timing fields of its DataProcessingHeader into
// the shared lastDataProcessingHeader; after the loops it holds the values of the last part visited.
1003 for (
size_t ii = 0; ii != inputs.
size(); ++ii) {
1004 for (
size_t pi = 0; pi < inputs.
getNofParts(ii); ++pi) {
1005 auto part = inputs.
getByPos(ii, pi);
1006 const auto* dph = o2::header::get<DataProcessingHeader*>(part.header);
1009 lastDataProcessingHeader->startTime = dph->startTime;
1010 lastDataProcessingHeader->duration = dph->duration;
1011 lastDataProcessingHeader->creation = dph->creation;
// Build the default channel configuration string: when defaultChannelConfig contains no
// "name=" entry, "name=<name>," is put in front of it. strdup makes a heap copy so the
// pointer stays valid after the temporary std::string is destroyed.
// NOTE(review): no matching free() is visible in this excerpt.
1017 const char* d = strdup(((std::string(defaultChannelConfig).find(
"name=") == std::string::npos ? (std::string(
"name=") +
name +
",") :
"") + std::string(defaultChannelConfig)).c_str());
// Fragment of the multi-output proxy factory (the start of the signature is outside this excerpt).
1026 Inputs const& inputSpecs,
1027 const char* defaultChannelConfig,
1034 spec.
inputs = inputSpecs;
1037 auto device = rds.
device();
// Channel names chosen for the inputs; shared between the initializer and the end-of-stream callback.
1042 auto channelNames = std::make_shared<std::vector<std::string>>();
// Initializer callback: selects a channel for every input spec, verifies it exists on the
// device, registers a forwarding route and records the channel name.
// NOTE(review): proxy and deviceSpec are captured by reference — they must outlive this callback.
1043 auto channelConfigurationInitializer = [&proxy, inputSpecs = std::move(inputSpecs), device, channelSelector, &deviceSpec, channelNames]() {
1044 channelNames->clear();
1045 auto& mutableDeviceSpec =
const_cast<DeviceSpec&
>(deviceSpec);
1046 for (
auto const& spec : inputSpecs) {
1047 auto channel = channelSelector(spec, device->GetChannels());
1048 if (device->GetChannels().count(channel) == 0) {
1049 throw std::runtime_error(
"no corresponding output channel found for input '" + channel +
"'");
1062 mutableDeviceSpec.forwards.emplace_back(route);
// channel is moved into the list; it must not be used after this line.
1064 channelNames->emplace_back(std::move(channel));
// Bind the proxy to the device using the updated outputs, inputs and forwards.
1066 proxy.
bind(mutableDeviceSpec.outputs, mutableDeviceSpec.inputs, mutableDeviceSpec.forwards, *device);
// Disposer callback: removes all forwarding routes from the device spec again.
1069 auto channelConfigurationDisposer = [&deviceSpec]() {
1070 auto& mutableDeviceSpec =
const_cast<DeviceSpec&
>(deviceSpec);
1071 mutableDeviceSpec.
forwards.clear();
// Shared header object, constructed with (0, 0) and updated as data is processed.
1076 auto lastDataProcessingHeader = std::make_shared<DataProcessingHeader>(0, 0);
// End-of-stream callback: iterates over the device's channels and, for those accepted by
// checkChannel, builds an outgoing message consisting of a header part and a second part.
1077 auto forwardEos = [device, lastDataProcessingHeader, channelNames](
EndOfStreamContext&) {
1081 for (
auto& channelInfo : device->GetChannels()) {
1082 auto& channelName = channelInfo.first;
// The name list is captured by reference. The previous capture moved the shared vector into
// the closure, which emptied it after the first loop iteration, so every later channel (and
// every later end-of-stream) was checked against an empty list. The closure is only used
// inside this iteration, so a reference is safe.
1083 auto checkChannel = [&channelNames = *channelNames](std::string
const&
name) ->
bool {
1084 for (
auto const&
n : channelNames) {
1091 if (!checkChannel(channelName)) {
// The allocator comes from the transport of the channel's first sub-channel.
1105 auto channelAlloc = o2::pmr::getTransportAllocator(channelInfo.second[0].Transport());
1107 fair::mq::Parts out;
1108 out.AddPart(std::move(headerMessage));
// Second part of the pair (presumably an empty payload — TODO confirm NewMessageFor arguments).
1110 out.AddPart(device->NewMessageFor(channelName, 0, 0));
1111 LOGP(detail,
"Forwarding EoS to {}", channelName);
// Visit every part of every input and copy the timing fields of its DataProcessingHeader into
// the shared lastDataProcessingHeader; after the loops it holds the values of the last part visited.
1121 for (
size_t ii = 0; ii != inputs.
size(); ++ii) {
1122 for (
size_t pi = 0; pi < inputs.
getNofParts(ii); ++pi) {
1123 auto part = inputs.
getByPos(ii, pi);
1124 const auto* dph = o2::header::get<DataProcessingHeader*>(part.header);
1127 lastDataProcessingHeader->startTime = dph->startTime;
1128 lastDataProcessingHeader->duration = dph->duration;
1129 lastDataProcessingHeader->creation = dph->creation;
// Build the default channel configuration string: when defaultChannelConfig contains no
// "name=" entry, "name=<name>," is put in front of it. strdup makes a heap copy so the
// pointer stays valid after the temporary std::string is destroyed.
// NOTE(review): no matching free() is visible in this excerpt.
1135 const char* d = strdup(((std::string(defaultChannelConfig).find(
"name=") == std::string::npos ? (std::string(
"name=") +
name +
",") :
"") + std::string(defaultChannelConfig)).c_str());