Project
Loading...
Searching...
No Matches
DataDescriptorQueryBuilder.cxx
Go to the documentation of this file.
1// Copyright 2019-2020 CERN and copyright holders of ALICE O2.
2// See https://alice-o2.web.cern.ch/copyright for details of the copyright holders.
3// All rights not expressly granted are reserved.
4//
5// This software is distributed under the terms of the GNU General Public
6// License v3 (GPL Version 3), copied verbatim in the file "COPYING".
7//
8// In applying this license CERN does not waive the privileges and immunities
9// granted to it by virtue of its status as an Intergovernmental Organization
10// or submit itself to any jurisdiction.
11
14#include "Framework/InputSpec.h"
15
16#include <memory>
17#include <optional>
18#include <string>
19#include <vector>
20#include <regex>
21#include <iostream>
22
23using namespace o2::framework::data_matcher;
24
25namespace o2::framework
26{
27
54
55std::vector<InputSpec> DataDescriptorQueryBuilder::parse(char const* config)
56{
57 std::vector<QueryBuilderState> states;
58 states.push_back(IN_BEGIN_QUERY);
59
60 std::vector<InputSpec> result;
61 char const* next = config;
62 char const* cur = config;
63 char const* expectedSeparators;
64 char* endptr;
65 std::string errorString;
66 std::unique_ptr<DataDescriptorMatcher> currentMatcher;
67 std::vector<data_matcher::Node> nodes;
68 std::optional<std::string> currentBinding;
69 std::optional<std::string> currentOrigin;
70 std::optional<std::string> currentDescription;
71 std::optional<std::string> currentKey;
72 std::optional<std::string> currentValue;
73 std::optional<header::DataHeader::SubSpecificationType> currentSubSpec;
74 std::optional<uint64_t> currentTimeModulo;
75 Lifetime currentLifetime = Lifetime::Timeframe;
76 size_t currentNumber;
77
78 auto error = [&errorString, &states](std::string const& s) {
79 errorString = s;
80 states.push_back(IN_ERROR);
81 };
82
83 auto pushState = [&states](QueryBuilderState state) {
84 states.push_back(state);
85 };
86
87 auto checkModifier = [&states, &cur, &next, &error](QueryBuilderState state, const char* mod) {
88 const char* modifier = nullptr;
89 if (mod[0] != '\0' && (modifier = strpbrk(cur, mod)) != nullptr) {
90 switch (*modifier) {
91 case '!':
92 states.push_back(IN_NEGATION);
93 break;
94 default:
95 error("invalid modifier '" + std::string(modifier, 1) + "'");
96 return;
97 }
98 next = ++cur;
99 }
100 states.push_back(state);
101 };
102
103 auto token = [&states, &expectedSeparators](QueryBuilderState state, char const* sep) {
104 states.push_back(state);
105 expectedSeparators = sep;
106 };
107
108 auto assignLastStringMatch = [&next, &cur, &error, &pushState](std::string const& what, int maxSize, std::optional<std::string>& s, QueryBuilderState nextState) {
109 if ((next - cur == 0) || (next - cur > maxSize)) {
110 error(what + " needs to be between 1 and " + std::to_string(maxSize) + " char long");
111 return false;
112 }
113 s = std::string(cur, next - cur);
114 if (memchr("\0;", *next, 2)) {
115 pushState(IN_END_MATCHER);
116 cur = next;
117 return true;
118 }
119 pushState(nextState);
120 cur = next + 1;
121 return true;
122 };
123
124 auto assignLastNumericMatch = [&next, &cur, &error, &pushState, &currentNumber](std::string const&, auto& value,
125 QueryBuilderState nextState) {
126 if ((next - cur == 0)) {
127 error("number expected");
128 return false;
129 }
130 value = currentNumber;
131 if (memchr("\0;", *next, 2)) {
132 pushState(IN_END_MATCHER);
133 cur = next;
134 return true;
135 }
136 pushState(nextState);
137 cur = next + 1;
138 return true;
139 };
140
141 std::vector<ConfigParamSpec> attributes;
142
143 auto buildMatchingTree = [&nodes](std::string const& binding, std::vector<ConfigParamSpec> attributes) -> InputSpec {
144 auto lastMatcher =
145 std::make_unique<DataDescriptorMatcher>(DataDescriptorMatcher::Op::Just,
147 for (size_t ni = 0, ne = nodes.size(); ni < ne; ++ni) {
148 auto& node = nodes[nodes.size() - 1 - ni];
149 auto tmp = std::make_unique<DataDescriptorMatcher>(DataDescriptorMatcher::Op::And,
150 std::move(node),
151 std::move(lastMatcher));
152 assert(lastMatcher.get() == nullptr);
153 lastMatcher = std::move(tmp);
154 }
155 Lifetime lifetime = Lifetime::Timeframe;
156 for (auto& attribute : attributes) {
157 if (attribute.name == "lifetime" && attribute.defaultValue.get<std::string>() == "condition") {
158 lifetime = Lifetime::Condition;
159 }
160 if (attribute.name == "lifetime" && attribute.defaultValue.get<std::string>() == "sporadic") {
161 lifetime = Lifetime::Sporadic;
162 }
163 }
164 return InputSpec{binding, std::move(*lastMatcher.release()), lifetime, attributes};
165 };
166
167 auto pushMatcher = [&nodes, &states](auto&& matcher) {
168 if (states.empty() == false && states.back() == IN_NEGATION) {
169 states.pop_back();
170 auto notMatcher = std::make_unique<DataDescriptorMatcher>(DataDescriptorMatcher::Op::Xor,
171 std::move(matcher),
173 nodes.push_back(std::move(notMatcher));
174 } else {
175 nodes.push_back(std::move(matcher));
176 }
177 };
178
179 while (states.empty() == false) {
180 auto const state = states.back();
181 states.pop_back();
182
183 switch (state) {
184 case IN_STRING: {
185 next = strpbrk(cur, expectedSeparators);
186 if (next == nullptr) {
187 next = cur + strlen(cur);
188 }
189 } break;
190 case IN_NUMBER: {
191 currentNumber = strtoll(cur, &endptr, 0);
192 if (endptr == cur) {
193 error("Expected a number");
194 }
195 next = endptr;
196 } break;
197 case IN_BEGIN_QUERY: {
198 (*cur == 0) ? pushState(IN_END_QUERY)
199 : pushState(IN_BEGIN_MATCHER);
200 } break;
201 case IN_BEGIN_MATCHER: {
202 nodes.clear();
203 attributes.clear();
204 pushState(IN_BEGIN_BINDING);
205 } break;
206 case IN_BEGIN_BINDING: {
207 pushState(IN_END_BINDING);
208 token(IN_STRING, ":/;,");
209 } break;
210 case IN_END_BINDING: {
211 // We are at the end of the string already.
212 // This is really an origin...
213 if (strchr("\0/;", *next)) {
214 pushState(IN_END_ORIGIN);
215 continue;
216 }
217 if (next - cur == 0) {
218 error("empty binding string");
219 continue;
220 }
221 currentBinding = std::string(cur, next - cur);
222 pushState(IN_BEGIN_ORIGIN);
223 cur = next + 1;
224 } break;
225 case IN_BEGIN_ORIGIN: {
226 pushState(IN_END_ORIGIN);
227 token(IN_STRING, "/;?");
228 } break;
229 case IN_END_ORIGIN: {
230 if (*next == '/' && assignLastStringMatch("origin", 4, currentOrigin, IN_BEGIN_DESCRIPTION)) {
231 nodes.push_back(OriginValueMatcher{*currentOrigin});
232 } else if (*next == ';' && assignLastStringMatch("origin", 4, currentOrigin, IN_END_MATCHER)) {
233 nodes.push_back(OriginValueMatcher{*currentOrigin});
234 } else if (*next == '?' && assignLastStringMatch("origin", 4, currentOrigin, IN_BEGIN_ATTRIBUTES)) {
235 nodes.push_back(OriginValueMatcher{*currentOrigin});
236 } else if (*next == '\0' && assignLastStringMatch("origin", 4, currentOrigin, IN_END_MATCHER)) {
237 nodes.push_back(OriginValueMatcher{*currentOrigin});
238 } else {
239 error("origin needs to be between 1 and 4 char long");
240 }
241 } break;
243 pushState(IN_END_DESCRIPTION);
244 token(IN_STRING, "/;?");
245 } break;
246 case IN_END_DESCRIPTION: {
247 if (*next == '/' && assignLastStringMatch("description", 16, currentDescription, IN_BEGIN_SUBSPEC)) {
248 nodes.push_back(DescriptionValueMatcher{*currentDescription});
249 } else if (*next == ';' && assignLastStringMatch("description", 16, currentDescription, IN_END_MATCHER)) {
250 nodes.push_back(DescriptionValueMatcher{*currentDescription});
251 } else if (*next == '?' && assignLastStringMatch("description", 16, currentDescription, IN_BEGIN_ATTRIBUTES)) {
252 nodes.push_back(DescriptionValueMatcher{*currentDescription});
253 } else if (*next == '\0' && assignLastStringMatch("description", 16, currentDescription, IN_END_MATCHER)) {
254 nodes.push_back(DescriptionValueMatcher{*currentDescription});
255 } else {
256 error("description needs to be between 1 and 16 char long");
257 }
258 } break;
259 case IN_BEGIN_SUBSPEC: {
260 checkModifier(IN_END_SUBSPEC, "!");
261 token(IN_NUMBER, ";%?");
262 } break;
263 case IN_END_SUBSPEC: {
264 if (*next == '%' && assignLastNumericMatch("subspec", currentSubSpec, IN_BEGIN_TIMEMODULO)) {
265 } else if (*next == '?' && assignLastNumericMatch("subspec", currentSubSpec, IN_BEGIN_ATTRIBUTES)) {
266 } else if (*next == ';' && assignLastNumericMatch("subspec", currentSubSpec, IN_END_MATCHER)) {
267 } else if (*next == '\0' && assignLastNumericMatch("subspec", currentSubSpec, IN_END_MATCHER)) {
268 } else {
269 error("Expected a number");
270 break;
271 }
272 auto backup = states.back();
273 states.pop_back();
274 pushMatcher(SubSpecificationTypeValueMatcher{*currentSubSpec});
275 states.push_back(backup);
276 } break;
277 case IN_BEGIN_TIMEMODULO: {
278 pushState(IN_END_TIMEMODULO);
279 token(IN_NUMBER, ";?");
280 } break;
281 case IN_END_TIMEMODULO: {
282 assignLastNumericMatch("timemodulo", currentTimeModulo, IN_ERROR);
283 } break;
284 case IN_END_MATCHER: {
285 if (*cur == ';' && *(cur + 1) == '\0') {
286 error("Remove trailing ;");
287 continue;
288 }
289 result.push_back(buildMatchingTree(*currentBinding, attributes));
290 if (*cur == '\0') {
291 pushState(IN_END_QUERY);
292 } else if (*cur == ';') {
293 cur += 1;
294 pushState(IN_BEGIN_MATCHER);
295 } else {
296 error("Unexpected character " + std::string(cur, 1));
297 }
298 } break;
299 case IN_BEGIN_ATTRIBUTES: {
300 pushState(IN_BEGIN_KEY);
301 } break;
302 case IN_BEGIN_KEY: {
303 pushState(IN_END_KEY);
304 token(IN_STRING, "=");
305 } break;
306 case IN_END_KEY: {
307 if (*next == '=') {
308 assignLastStringMatch("key", 1000, currentKey, IN_BEGIN_VALUE);
309 } else {
310 error("missing value for attribute key");
311 }
312 } break;
313 case IN_BEGIN_VALUE: {
314 pushState(IN_END_VALUE);
315 token(IN_STRING, "&;");
316 } break;
317 case IN_END_VALUE: {
318 if (*next == '&') {
319 assignLastStringMatch("value", 1000, currentValue, IN_BEGIN_KEY);
320 if (*currentKey == "lifetime" && currentValue == "condition") {
321 currentLifetime = Lifetime::Condition;
322 }
323 if (*currentKey == "ccdb-run-dependent") {
324 int val = currentValue == "false" ? 0 : (currentValue == "true" ? 1 : std::stoi(*currentValue));
325 attributes.push_back(ConfigParamSpec{*currentKey, VariantType::Int, val, {}});
326 } else {
327 attributes.push_back(ConfigParamSpec{*currentKey, VariantType::String, *currentValue, {}});
328 }
329 } else if (*next == ';') {
330 assignLastStringMatch("value", 1000, currentValue, IN_END_ATTRIBUTES);
331 if (*currentKey == "lifetime" && currentValue == "condition") {
332 currentLifetime = Lifetime::Condition;
333 }
334 if (*currentKey == "ccdb-run-dependent") {
335 int val = currentValue == "false" ? 0 : (currentValue == "true" ? 1 : std::stoi(*currentValue));
336 attributes.push_back(ConfigParamSpec{*currentKey, VariantType::Int, val, {}});
337 } else {
338 attributes.push_back(ConfigParamSpec{*currentKey, VariantType::String, *currentValue, {}});
339 }
340 } else if (*next == '\0') {
341 assignLastStringMatch("value", 1000, currentValue, IN_END_ATTRIBUTES);
342 if (*currentKey == "lifetime" && currentValue == "condition") {
343 currentLifetime = Lifetime::Condition;
344 }
345 if (*currentKey == "ccdb-run-dependent") {
346 int val = currentValue == "false" ? 0 : (currentValue == "true" ? 1 : std::stoi(*currentValue));
347 attributes.push_back(ConfigParamSpec{*currentKey, VariantType::Int, val, {}});
348 } else {
349 attributes.push_back(ConfigParamSpec{*currentKey, VariantType::String, *currentValue, {}});
350 }
351 } else {
352 error("missing value for string value");
353 }
354 } break;
355 case IN_END_ATTRIBUTES: {
356 pushState(IN_END_MATCHER);
357 } break;
358 case IN_NEGATION: {
359 error("property modifiers should have been handled before when inserting previous matcher");
360 } break;
361 case IN_ERROR: {
362 throw std::runtime_error("Parse error: " + errorString);
363 } break;
364 case IN_END_QUERY: {
365 } break;
366 default: {
367 error("Unhandled state");
368 } break;
369 }
370 }
371 return std::move(result);
372}
373
375{
376 static const std::regex delim(",");
377
378 std::sregex_token_iterator end;
379 std::sregex_token_iterator iter(config.begin(),
380 config.end(),
381 delim,
382 -1);
383
384 std::unique_ptr<DataDescriptorMatcher> next, result;
385
386 for (; iter != end; ++iter) {
387 std::smatch m;
388 auto s = iter->str();
389 auto newNode = buildNode(s);
390
391 if (result.get() == nullptr) {
392 result = std::move(newNode);
393 } else {
394 next = std::move(std::make_unique<DataDescriptorMatcher>(DataDescriptorMatcher::Op::Or,
395 std::move(result),
396 std::move(newNode)));
397 result = std::move(next);
398 }
399 }
400
401 return std::move(DataDescriptorQuery{{}, std::move(result)});
402}
403
405{
406 static const std::regex delim1(",");
407 static const std::regex delim2(":");
408
409 std::sregex_token_iterator end;
410 std::sregex_token_iterator iter1(config.begin(),
411 config.end(),
412 delim1,
413 -1);
414
415 std::unique_ptr<DataDescriptorMatcher> next, result;
416
417 // looping over ','-separated items
418 for (; iter1 != end; ++iter1) {
419 auto s = iter1->str();
420
421 // get first part of item
422 std::sregex_token_iterator iter2(s.begin(),
423 s.end(),
424 delim2,
425 -1);
426 if (iter2 == end) {
427 continue;
428 }
429 s = iter2->str();
430
431 // create the corresponding DataDescriptorMatcher
432 std::smatch m;
433 auto newNode = buildNode(s);
434
435 if (result.get() == nullptr) {
436 result = std::move(newNode);
437 } else {
438 next = std::move(std::make_unique<DataDescriptorMatcher>(DataDescriptorMatcher::Op::Or,
439 std::move(result),
440 std::move(newNode)));
441 result = std::move(next);
442 }
443 }
444
445 return std::move(DataDescriptorQuery{{}, std::move(result)});
446}
447
448std::unique_ptr<DataDescriptorMatcher> DataDescriptorQueryBuilder::buildNode(std::string const& nodeString)
449{
450
451 auto m = getTokens(nodeString);
452
453 std::unique_ptr<DataDescriptorMatcher> next;
454 auto newNode = std::make_unique<DataDescriptorMatcher>(
455 DataDescriptorMatcher::Op::And,
457 std::make_unique<DataDescriptorMatcher>(
458 DataDescriptorMatcher::Op::And,
461
462 return newNode;
463}
464
465std::vector<std::string> DataDescriptorQueryBuilder::getTokens(std::string const& nodeString)
466{
467
468 static const std::regex specTokenRE(R"re((\w{1,4})/(\w{1,16})/(\d*))re");
469 std::smatch match;
470
471 std::regex_match(nodeString, match, specTokenRE);
472
473 std::vector<std::string> result;
474 for (size_t i = 0; i < 4; ++i) {
475 result.push_back(match[i].str());
476 }
477 return result;
478}
479
480} // namespace o2::framework
benchmark::State & state
int32_t i
std::string currentKey
Something which can be matched against a header::DataDescription.
Something which can be matched against a header::DataOrigin.
Matcher on actual time, as reported in the DataProcessingHeader.
Something which can be matched against a header::SubSpecificationType.
bool match(const std::vector< std::string > &queries, const char *pattern)
Definition dcs-ccdb.cxx:229
const GLfloat * m
Definition glcorearb.h:4066
GLuint64EXT * result
Definition glcorearb.h:5662
GLuint GLuint end
Definition glcorearb.h:469
GLsizei const GLfloat * value
Definition glcorearb.h:819
GLuint GLfloat * val
Definition glcorearb.h:1582
GLuint * states
Definition glcorearb.h:4932
Defining PrimaryVertex explicitly as messageable.
Definition TFIDInfo.h:20
Lifetime
Possible Lifetime of objects being exchanged by the DPL.
Definition Lifetime.h:18
std::string to_string(gsl::span< T, Size > span)
Definition common.h:52
static std::vector< InputSpec > parse(const char *s="")
static std::unique_ptr< data_matcher::DataDescriptorMatcher > buildNode(std::string const &nodeString)
static DataDescriptorQuery buildFromExtendedKeepConfig(std::string const &config)
deprecated?
static std::vector< std::string > getTokens(std::string const &nodeString)
static DataDescriptorQuery buildFromKeepConfig(std::string const &config)
A typesafe reference to an element of the context.
const std::string str