Project
Loading...
Searching...
No Matches
TableBuilder.h
Go to the documentation of this file.
1// Copyright 2019-2020 CERN and copyright holders of ALICE O2.
2// See https://alice-o2.web.cern.ch/copyright for details of the copyright holders.
3// All rights not expressly granted are reserved.
4//
5// This software is distributed under the terms of the GNU General Public
6// License v3 (GPL Version 3), copied verbatim in the file "COPYING".
7//
8// In applying this license CERN does not waive the privileges and immunities
9// granted to it by virtue of its status as an Intergovernmental Organization
10// or submit itself to any jurisdiction.
11
12#ifndef O2_FRAMEWORK_TABLEBUILDER_H_
13#define O2_FRAMEWORK_TABLEBUILDER_H_
14
15#include "Framework/ASoA.h"
18#include "arrow/type_traits.h"
19
20// Apparently needs to be on top of the arrow includes.
21#include <sstream>
22
23#include <arrow/chunked_array.h>
24#include <arrow/status.h>
25#include <arrow/memory_pool.h>
26#include <arrow/stl.h>
27#include <arrow/type_traits.h>
28#include <arrow/table.h>
29#include <arrow/builder.h>
30
31#include <vector>
32#include <string>
33#include <memory>
34#include <tuple>
35#include <type_traits>
36#include <concepts>
37
38namespace arrow
39{
40class ArrayBuilder;
41class Table;
42class Array;
43} // namespace arrow
44
45template <typename T>
46struct BulkInfo {
47 const T ptr;
48 size_t size;
49};
50
51namespace o2::framework
52{
53namespace detail
54{
56template <typename T>
58};
59
60template <typename T, int N>
61struct ConversionTraits<T (&)[N]> {
62 using ArrowType = ::arrow::FixedSizeListType;
63};
64
65template <typename T, int N>
66struct ConversionTraits<T[N]> {
67 using ArrowType = ::arrow::FixedSizeListType;
68};
69
70template <typename T, int N>
71struct ConversionTraits<std::array<T, N>> {
72 using ArrowType = ::arrow::FixedSizeListType;
73};
74
75template <typename T>
76struct ConversionTraits<std::vector<T>> {
77 using ArrowType = ::arrow::ListType;
78};
79
80#define O2_ARROW_STL_CONVERSION(c_type, ArrowType_) \
81 template <> \
82 struct ConversionTraits<c_type> { \
83 using ArrowType = ::arrow::ArrowType_; \
84 };
85
86// FIXME: for now we use Int8 to store booleans
87O2_ARROW_STL_CONVERSION(bool, BooleanType)
88O2_ARROW_STL_CONVERSION(int8_t, Int8Type)
89O2_ARROW_STL_CONVERSION(int16_t, Int16Type)
90O2_ARROW_STL_CONVERSION(int32_t, Int32Type)
91O2_ARROW_STL_CONVERSION(long long, Int64Type)
92O2_ARROW_STL_CONVERSION(long, Int64Type)
93O2_ARROW_STL_CONVERSION(uint8_t, UInt8Type)
94O2_ARROW_STL_CONVERSION(uint16_t, UInt16Type)
95O2_ARROW_STL_CONVERSION(uint32_t, UInt32Type)
96O2_ARROW_STL_CONVERSION(long long unsigned, UInt64Type)
97O2_ARROW_STL_CONVERSION(long unsigned, UInt64Type)
98O2_ARROW_STL_CONVERSION(float, FloatType)
99O2_ARROW_STL_CONVERSION(double, DoubleType)
100O2_ARROW_STL_CONVERSION(std::string, StringType)
101} // namespace detail
102
103void addLabelToSchema(std::shared_ptr<arrow::Schema>& schema, const char* label);
104
106 template <typename T>
107 static arrow::Status appendToList(std::unique_ptr<arrow::FixedSizeListBuilder>& builder, T* data, int size = 1)
108 {
109 using ArrowType = typename detail::ConversionTraits<std::decay_t<T>>::ArrowType;
110 using BuilderType = typename arrow::TypeTraits<ArrowType>::BuilderType;
111 size_t numElements = static_cast<const arrow::FixedSizeListType*>(builder->type().get())->list_size();
112
113 auto status = builder->AppendValues(size);
114 auto ValueBuilder = static_cast<BuilderType*>(builder->value_builder());
115 status &= ValueBuilder->AppendValues(data, numElements * size, nullptr);
116
117 return status;
118 }
119
120 template <typename HolderType, typename T>
121 static arrow::Status append(HolderType& holder, T value)
122 {
123 return static_cast<typename HolderType::Policy&>(holder).append(holder.builder, value);
124 }
125
126 template <typename HolderType>
127 static arrow::Status flush(HolderType& holder)
128 {
129 return static_cast<typename HolderType::Policy&>(holder).flush(holder.builder);
130 }
131
135 template <typename HolderType, typename T>
136 static arrow::Status append(HolderType& holder, T* data)
137 {
138 if constexpr (std::is_same_v<decltype(holder.builder), std::unique_ptr<arrow::FixedSizeListBuilder>>) {
139 return appendToList<T>(holder.builder, data);
140 } else {
141 return holder.builder->Append(reinterpret_cast<const uint8_t*>(data));
142 }
143 }
145 template <typename HolderType, typename T, int N>
146 static arrow::Status append(HolderType& holder, T (&data)[N])
147 {
148 return holder.builder->Append(reinterpret_cast<const uint8_t*>(data));
149 }
150
152 template <typename HolderType, typename T, int N>
153 static arrow::Status append(HolderType& holder, std::array<T, N> const& data)
154 {
155 return holder.builder->Append(reinterpret_cast<const uint8_t*>(data.data()));
156 }
157
159 template <typename HolderType, typename T>
160 static arrow::Status append(HolderType& holder, std::vector<T> const& data)
161 {
162 using ArrowType = typename detail::ConversionTraits<T>::ArrowType;
163 using ValueBuilderType = typename arrow::TypeTraits<ArrowType>::BuilderType;
164 auto status = holder.builder->Reserve(data.size());
165 status &= holder.builder->Append();
166 auto vbuilder = static_cast<ValueBuilderType*>(holder.builder->value_builder());
167 status &= vbuilder->AppendValues(data.begin(), data.end());
168
169 return status;
170 }
171
172 template <typename HolderType, typename T>
173 static void unsafeAppend(HolderType& holder, std::vector<T> const& value)
174 {
175 auto status = append(holder, value);
176 if (!status.ok()) {
177 throw runtime_error("Unable to append to column");
178 }
179 }
180
181 template <typename HolderType, typename T>
182 static void unsafeAppend(HolderType& holder, T value)
183 {
184 return holder.builder->UnsafeAppend(value);
185 }
186
187 template <typename HolderType, typename T>
188 static void unsafeAppend(HolderType& holder, T* value)
189 {
190 if constexpr (std::is_same_v<decltype(holder.builder), std::unique_ptr<arrow::FixedSizeListBuilder>>) {
191 auto status = appendToList<T>(holder.builder, value);
192 } else {
193 return holder.builder->UnsafeAppend(reinterpret_cast<const uint8_t*>(value));
194 }
195 }
196
197 template <typename HolderType, typename PTR>
198 static arrow::Status bulkAppend(HolderType& holder, size_t bulkSize, const PTR ptr)
199 {
200 return holder.builder->AppendValues(ptr, bulkSize, nullptr);
201 }
202
203 template <typename HolderType, typename PTR>
204 static arrow::Status bulkAppendChunked(HolderType& holder, BulkInfo<PTR> info)
205 {
206 // Appending nullptr is a no-op.
207 if (info.ptr == nullptr) {
208 return arrow::Status::OK();
209 }
210 if constexpr (std::is_same_v<decltype(holder.builder), std::unique_ptr<arrow::FixedSizeListBuilder>>) {
211 if (appendToList<std::remove_pointer_t<decltype(info.ptr)>>(holder.builder, info.ptr, info.size).ok() == false) {
212 throw runtime_error("Unable to append to column");
213 } else {
214 return arrow::Status::OK();
215 }
216 } else {
217 if (holder.builder->AppendValues(info.ptr, info.size, nullptr).ok() == false) {
218 throw runtime_error("Unable to append to column");
219 } else {
220 return arrow::Status::OK();
221 }
222 }
223 }
224
225 template <typename HolderType, typename ITERATOR>
226 static arrow::Status append(HolderType& holder, std::pair<ITERATOR, ITERATOR> ip)
227 {
229 using ValueBuilderType = typename arrow::TypeTraits<ArrowType>::BuilderType;
230 // FIXME: for the moment we do not fill things.
231 auto status = holder.builder->Append();
232 auto valueBuilder = reinterpret_cast<ValueBuilderType*>(holder.builder->value_builder());
233 return status & valueBuilder->AppendValues(&*ip.first, std::distance(ip.first, ip.second));
234 }
235
236 // Lists do not have UnsafeAppend so we need to use the slow path in any case.
237 template <typename HolderType, typename ITERATOR>
238 static void unsafeAppend(HolderType& holder, std::pair<ITERATOR, ITERATOR> ip)
239 {
241 using ValueBuilderType = typename arrow::TypeTraits<ArrowType>::BuilderType;
242 // FIXME: for the moment we do not fill things.
243 auto status = holder.builder->Append();
244 auto valueBuilder = reinterpret_cast<ValueBuilderType*>(holder.builder->value_builder());
245 status &= valueBuilder->AppendValues(&*ip.first, std::distance(ip.first, ip.second));
246 if (!status.ok()) {
247 throw runtime_error("Unable to append values to valueBuilder!");
248 }
249 return;
250 }
251};
252
253template <typename T>
255 using FillType = T;
256 using STLValueType = T;
258 using BuilderType = typename arrow::TypeTraits<ArrowType>::BuilderType;
259
260 static std::unique_ptr<BuilderType> make(arrow::MemoryPool* pool)
261 {
262 return std::make_unique<BuilderType>(pool);
263 }
264
265 static std::shared_ptr<arrow::DataType> make_datatype()
266 {
267 return arrow::TypeTraits<ArrowType>::type_singleton();
268 }
269
270 static arrow::Status append(BuilderType& builder, T value)
271 {
272 return builder.Append(value);
273 }
274
275 template <int N>
276 static arrow::Status append(BuilderType& builder, std::array<T, N>& value)
277 {
278 return builder.Append(value);
279 }
280};
281
282template <>
283struct BuilderMaker<bool> {
284 using FillType = bool;
285 using STLValueType = bool;
287 using BuilderType = typename arrow::TypeTraits<ArrowType>::BuilderType;
288
289 static std::unique_ptr<BuilderType> make(arrow::MemoryPool* pool)
290 {
291 return std::make_unique<BuilderType>(pool);
292 }
293
294 static std::shared_ptr<arrow::DataType> make_datatype()
295 {
296 return arrow::TypeTraits<ArrowType>::type_singleton();
297 }
298
299 static arrow::Status append(BuilderType& builder, bool value)
300 {
301 return builder.Append(value);
302 }
303};
304
305template <typename ITERATOR>
306struct BuilderMaker<std::pair<ITERATOR, ITERATOR>> {
307 using FillType = std::pair<ITERATOR, ITERATOR>;
308 using STLValueType = typename ITERATOR::value_type;
309 using ArrowType = arrow::ListType;
311 using BuilderType = arrow::ListBuilder;
312 using ValueBuilder = typename arrow::TypeTraits<ValueType>::BuilderType;
313
314 static std::unique_ptr<BuilderType> make(arrow::MemoryPool* pool)
315 {
316 auto valueBuilder = std::make_shared<ValueBuilder>(pool);
317 return std::make_unique<arrow::ListBuilder>(pool, valueBuilder);
318 }
319
320 static std::shared_ptr<arrow::DataType> make_datatype()
321 {
322 return arrow::list(arrow::TypeTraits<ValueType>::type_singleton());
323 }
324};
325
326template <typename T, int N>
327struct BuilderMaker<T (&)[N]> {
328 using FillType = T*;
329 using STLValueType = T;
330 using BuilderType = arrow::FixedSizeListBuilder;
331 using ArrowType = arrow::FixedSizeListType;
333
334 static std::unique_ptr<BuilderType> make(arrow::MemoryPool* pool)
335 {
336 std::unique_ptr<arrow::ArrayBuilder> valueBuilder;
337 auto status =
338 arrow::MakeBuilder(pool, arrow::TypeTraits<ElementType>::type_singleton(), &valueBuilder);
339 return std::make_unique<BuilderType>(pool, std::move(valueBuilder), N);
340 }
341
342 static std::shared_ptr<arrow::DataType> make_datatype()
343 {
344 return arrow::fixed_size_list(arrow::TypeTraits<ElementType>::type_singleton(), N);
345 }
346};
347
348template <typename T, int N>
349struct BuilderMaker<T[N]> {
350 using FillType = T*;
351 using BuilderType = arrow::FixedSizeListBuilder;
352 using ArrowType = arrow::FixedSizeListType;
354
355 static std::unique_ptr<BuilderType> make(arrow::MemoryPool* pool)
356 {
357 std::unique_ptr<arrow::ArrayBuilder> valueBuilder;
358 auto status =
359 arrow::MakeBuilder(pool, arrow::TypeTraits<ElementType>::type_singleton(), &valueBuilder);
360 return std::make_unique<BuilderType>(pool, std::move(valueBuilder), N);
361 }
362
363 static std::shared_ptr<arrow::DataType> make_datatype()
364 {
365 return arrow::fixed_size_list(arrow::TypeTraits<ElementType>::type_singleton(), N);
366 }
367};
368
369template <typename T, int N>
370struct BuilderMaker<std::array<T, N>> {
371 using FillType = T*;
372 using BuilderType = arrow::FixedSizeListBuilder;
373 using ArrowType = arrow::FixedSizeListType;
375
376 static std::unique_ptr<BuilderType> make(arrow::MemoryPool* pool)
377 {
378 std::unique_ptr<arrow::ArrayBuilder> valueBuilder;
379 auto status =
380 arrow::MakeBuilder(pool, arrow::TypeTraits<ElementType>::type_singleton(), &valueBuilder);
381 return std::make_unique<BuilderType>(pool, std::move(valueBuilder), N);
382 }
383
384 static std::shared_ptr<arrow::DataType> make_datatype()
385 {
386 return arrow::fixed_size_list(arrow::TypeTraits<ElementType>::type_singleton(), N);
387 }
388};
389
390template <typename T>
391struct BuilderMaker<std::vector<T>> {
392 using FillType = std::vector<T>;
393 using BuilderType = arrow::ListBuilder;
394 using ArrowType = arrow::ListType;
396
397 static std::unique_ptr<BuilderType> make(arrow::MemoryPool* pool)
398 {
399 std::unique_ptr<arrow::ArrayBuilder> valueBuilder;
400 auto status =
401 arrow::MakeBuilder(pool, arrow::TypeTraits<ElementType>::type_singleton(), &valueBuilder);
402 return std::make_unique<BuilderType>(pool, std::move(valueBuilder));
403 }
404
405 static std::shared_ptr<arrow::DataType> make_datatype()
406 {
407 return arrow::list(arrow::TypeTraits<ElementType>::type_singleton());
408 }
409};
410
411template <typename... ARGS>
413{
414 return std::make_tuple(std::make_unique<ARGS>()...);
415}
416
417template <typename T>
420 using BuilderType = typename arrow::TypeTraits<ArrowType>::BuilderType;
421};
422
423// Support for building tables where each entry is an iterator pair.
424// We map them to an arrow::list for now.
425template <typename ITERATOR>
426struct BuilderTraits<std::pair<ITERATOR, ITERATOR>> {
427 using ArrowType = arrow::ListType;
428 using BuilderType = arrow::ListBuilder;
429};
430
431// Support for building array columns
432// FIXME: move to use FixedSizeList<T> once we move to 0.16.1
433template <typename T, int N>
434struct BuilderTraits<T[N]> {
435 using ArrowType = arrow::FixedSizeListType;
436 using BuilderType = arrow::FixedSizeListBuilder;
437};
438
439template <typename T>
440struct BuilderTraits<std::vector<T>> {
441 using ArrowType = arrow::ListType;
442 using BuilderType = arrow::ListBuilder;
443};
444
445template <typename T>
447 template <typename BUILDER>
448 arrow::Status append(BUILDER& builder, T value)
449 {
450 return builder->Append(value);
451 }
452
453 template <typename BUILDER>
454 arrow::Status flush(BUILDER&)
455 {
456 return arrow::Status::OK();
457 }
458};
459
460template <typename T>
462 static constexpr int CHUNK_SIZE = 256;
463
464 template <typename BUILDER>
465 arrow::Status append(BUILDER& builder, T value)
466 {
468 ++pos;
469 if (pos % CHUNK_SIZE == 0) {
470 return builder->AppendValues(cache, CHUNK_SIZE, nullptr);
471 }
472 return arrow::Status::OK();
473 }
474
475 template <typename BUILDER>
476 arrow::Status flush(BUILDER& builder)
477 {
478 if (pos % CHUNK_SIZE != 0) {
479 return builder->AppendValues(cache, pos % CHUNK_SIZE, nullptr);
480 }
481 return arrow::Status::OK();
482 }
484 int pos = 0;
485};
486
487template <size_t I, typename T, typename P>
488struct BuilderHolder : P {
489 static constexpr size_t index = I;
490 using Policy = P;
492 using BuilderType = typename arrow::TypeTraits<ArrowType>::BuilderType;
493
494 BuilderHolder(arrow::MemoryPool* pool, size_t nRows = 0)
495 : builder{BuilderMaker<T>::make(pool)}
496 {
497 if (nRows > 0) {
498 auto s = builder->Reserve(nRows);
499 if (!s.ok()) {
500 throw runtime_error_f("Unable to reserve %ll rows", nRows);
501 }
502 }
503 }
504
505 std::unique_ptr<BuilderType> builder;
506};
507
509 template <typename... ARGS, size_t NCOLUMNS>
510 static std::array<arrow::DataType, NCOLUMNS> makeArrowColumnTypes()
511 {
513 }
514
515 template <typename... ARGS, size_t NCOLUMNS = sizeof...(ARGS)>
516 static std::vector<std::shared_ptr<arrow::Field>> makeFields(std::array<char const*, NCOLUMNS> const& names)
517 {
518 char const* const* names_ptr = names.data();
519 return {
520 std::make_shared<arrow::Field>(*names_ptr++, BuilderMaker<ARGS>::make_datatype(), true, nullptr)...};
521 }
522
524 template <typename... Ts, typename VALUES>
525 static bool append(std::tuple<Ts...>& holders, VALUES&& values)
526 {
527 return (BuilderUtils::append(std::get<Ts::index>(holders), std::get<Ts::index>(values)).ok() && ...);
528 }
529
533 template <typename... Ts, typename VALUES>
534 static void unsafeAppend(std::tuple<Ts...>& holders, VALUES&& values)
535 {
536 (BuilderUtils::unsafeAppend(std::get<Ts::index>(holders), std::get<Ts::index>(values)), ...);
537 }
538
539 template <typename... Ts, typename PTRS>
540 static bool bulkAppend(std::tuple<Ts...>& holders, size_t bulkSize, PTRS ptrs)
541 {
542 return (BuilderUtils::bulkAppend(std::get<Ts::index>(holders), bulkSize, std::get<Ts::index>(ptrs)).ok() && ...);
543 }
544
546 template <typename... Ts, typename INFOS>
547 static bool bulkAppendChunked(std::tuple<Ts...>& holders, INFOS infos)
548 {
549 return (BuilderUtils::bulkAppendChunked(std::get<Ts::index>(holders), std::get<Ts::index>(infos)).ok() && ...);
550 }
551
553 template <typename... Ts>
554 static bool finalize(std::vector<std::shared_ptr<arrow::Array>>& arrays, std::tuple<Ts...>& holders)
555 {
556 return (finalize(arrays[Ts::index], std::get<Ts::index>(holders)) && ...);
557 }
558
559 template <typename HOLDER>
560 static bool finalize(std::shared_ptr<arrow::Array>& array, HOLDER& holder)
561 {
562 return BuilderUtils::flush(holder).ok() && holder.builder->Finish(&array).ok();
563 }
564};
565
566template <typename... ARGS>
567constexpr auto tuple_to_pack(std::tuple<ARGS...>&&)
568{
569 return framework::pack<ARGS...>{};
570}
571
572template <typename T>
573concept BulkInsertable = (std::integral<std::decay<T>> && !std::same_as<bool, std::decay_t<T>>);
574
575template <typename T>
577 static consteval DirectInsertion<T> policy()
578 requires(!BulkInsertable<T>);
579 static consteval CachedInsertion<T> policy()
580 requires(BulkInsertable<T>);
581 using Policy = decltype(policy());
582};
583
586template <class T>
587auto constexpr to_tuple(T&& object) noexcept
588{
589 using type = std::decay_t<T>;
591 auto&& [p0, p1, p2, p3] = object;
592 return std::make_tuple(p0, p1, p2, p3);
594 auto&& [p0, p1, p2] = object;
595 return std::make_tuple(p0, p1, p2);
597 auto&& [p0, p1] = object;
598 return std::make_tuple(p0, p1);
599 } else if constexpr (is_braces_constructible<type, any_type>{}) {
600 auto&& [p0] = object;
601 return std::make_tuple(p0);
602 } else {
603 return std::make_tuple();
604 }
605}
606
607template <typename... ARGS>
608constexpr auto makeHolderTypes()
609{
610 return []<std::size_t... Is>(std::index_sequence<Is...>) {
611 return std::tuple(BuilderHolder<Is, ARGS, typename InsertionTrait<ARGS>::Policy>(arrow::default_memory_pool())...);
612 }(std::make_index_sequence<sizeof...(ARGS)>{});
613}
614
615template <typename... ARGS>
616auto makeHolders(arrow::MemoryPool* pool, size_t nRows)
617{
618 return [pool, nRows]<std::size_t... Is>(std::index_sequence<Is...>) {
619 return new std::tuple(BuilderHolder<Is, ARGS, typename InsertionTrait<ARGS>::Policy>(pool, nRows)...);
620 }(std::make_index_sequence<sizeof...(ARGS)>{});
621}
622
623template <typename... ARGS>
624using IndexedHoldersTuple = decltype(makeHolderTypes<ARGS...>());
625
626template <typename T>
627concept ShouldNotDeconstruct = std::is_bounded_array_v<T> || std::is_arithmetic_v<T> || framework::is_base_of_template_v<std::vector, T>;
628
633{
634 static void throwError(RuntimeErrorRef const& ref);
635
636 template <typename... ARGS>
637 using HoldersTuple = typename std::tuple<BuilderHolder<0, ARGS, typename InsertionTrait<ARGS>::Policy>...>;
638
639 template <typename... ARGS>
640 using HoldersTupleIndexed = decltype(makeHolderTypes<ARGS...>());
641
644 template <typename... ARGS>
645 auto getBuilders(o2::framework::pack<ARGS...>)
646 {
647 return (HoldersTupleIndexed<ARGS...>*)mHolders;
648 }
649
650 void validate() const;
651
652 template <typename... ARGS, size_t I = sizeof...(ARGS)>
653 auto makeBuilders(std::array<char const*, I> const& columnNames, size_t nRows)
654 {
655 mSchema = std::make_shared<arrow::Schema>(TableBuilderHelpers::makeFields<ARGS...>(columnNames));
656
657 mHolders = makeHolders<ARGS...>(mMemoryPool, nRows);
658 mFinalizer = [](std::vector<std::shared_ptr<arrow::Array>>& arrays, void* holders) -> bool {
659 return TableBuilderHelpers::finalize(arrays, *(HoldersTupleIndexed<ARGS...>*)holders);
660 };
661 mDestructor = [](void* holders) mutable -> void {
662 delete (HoldersTupleIndexed<ARGS...>*)holders;
663 };
664 }
665
666 public:
667 template <typename ARG0, typename... ARGS>
668 requires(sizeof...(ARGS) == 0) && (!ShouldNotDeconstruct<ARG0>)
669 static constexpr int countColumns()
670 {
671 using argsPack_t = decltype(tuple_to_pack(framework::to_tuple(std::declval<ARG0>())));
672 return framework::pack_size(argsPack_t{});
673 }
674
675 template <typename ARG0, typename... ARGS>
676 requires(sizeof...(ARGS) > 0) || ShouldNotDeconstruct<ARG0>
677 static constexpr int countColumns()
678 {
679 return 1 + sizeof...(ARGS);
680 }
681
682 void setLabel(const char* label);
683
684 TableBuilder(arrow::MemoryPool* pool = arrow::default_memory_pool())
685 : mHolders{nullptr},
686 mMemoryPool{pool}
687 {
688 }
689
691 {
692 mDestructor(mHolders);
693 }
694
697 template <typename ARG0, typename... ARGS>
698 requires(sizeof...(ARGS) > 0) || ShouldNotDeconstruct<ARG0>
699 auto persist(std::array<char const*, sizeof...(ARGS) + 1> const& columnNames)
700 {
701 auto persister = persistTuple(framework::pack<ARG0, ARGS...>{}, columnNames);
702 // Callback used to fill the builders
703 return [persister = persister](unsigned int slot, typename BuilderMaker<ARG0>::FillType const& arg, typename BuilderMaker<ARGS>::FillType... args) -> void {
704 persister(slot, std::forward_as_tuple(arg, args...));
705 };
706 }
707
708 // Special case for a single parameter to handle the serialization of struct
709 // which can be decomposed
710 template <typename ARG0, typename... ARGS>
711 requires(sizeof...(ARGS) == 0) && (!ShouldNotDeconstruct<ARG0>)
712 auto persist(std::array<char const*, countColumns<ARG0, ARGS...>()> const& columnNames)
713 {
714 using argsPack_t = decltype(tuple_to_pack(framework::to_tuple(std::declval<ARG0>())));
715 auto persister = persistTuple(argsPack_t{}, columnNames);
716 return [persister = persister](unsigned int slot, ARG0 const& obj) -> void {
717 auto t = to_tuple(obj);
718 persister(slot, t);
719 };
720 }
721
723 template <typename... ARGS>
724 auto persistTuple(framework::pack<ARGS...>, std::array<char const*, sizeof...(ARGS)> const& columnNames)
725 {
726 constexpr int nColumns = sizeof...(ARGS);
727 validate();
728 mArrays.resize(nColumns);
729 makeBuilders<ARGS...>(columnNames, 10);
730
731 // Callback used to fill the builders
732 using FillTuple = std::tuple<typename BuilderMaker<ARGS>::FillType...>;
733 return [holders = mHolders](unsigned int /*slot*/, FillTuple const& t) -> void {
734 auto status = TableBuilderHelpers::append(*(HoldersTupleIndexed<ARGS...>*)holders, t);
735 if (status == false) {
736 throwError(runtime_error("Unable to append"));
737 }
738 };
739 }
740
741 // Same as above, but starting from a o2::soa::Table, which has all the
742 // information already available.
743 template <typename T>
744 auto cursor()
745 {
746 return [this]<typename... Cs>(pack<Cs...>) {
747 return this->template persist<typename Cs::type...>({Cs::columnLabel()...});
748 }(typename T::table_t::persistent_columns_t{});
749 }
750
751 template <typename... Cs>
753 {
754 return this->template persist<typename Cs::type...>({Cs::columnLabel()...});
755 }
756
757 template <typename T, typename E>
758 auto cursor()
759 {
760 return [this]<typename... Cs>(pack<Cs...>) {
761 return this->template persist<E>({Cs::columnLabel()...});
762 }(typename T::table_t::persistent_columns_t{});
763 }
764
765 template <typename... ARGS, size_t NCOLUMNS = sizeof...(ARGS)>
766 auto preallocatedPersist(std::array<char const*, NCOLUMNS> const& columnNames, int nRows)
767 {
768 constexpr size_t nColumns = NCOLUMNS;
769 validate();
770 mArrays.resize(nColumns);
771 makeBuilders<ARGS...>(columnNames, nRows);
772
773 // Callback used to fill the builders
774 return [holders = mHolders](unsigned int /*slot*/, typename BuilderMaker<ARGS>::FillType... args) -> void {
775 TableBuilderHelpers::unsafeAppend(*(HoldersTupleIndexed<ARGS...>*)holders, std::forward_as_tuple(args...));
776 };
777 }
778
779 template <typename... ARGS, size_t NCOLUMNS = sizeof...(ARGS)>
780 auto bulkPersist(std::array<char const*, NCOLUMNS> const& columnNames, size_t nRows)
781 {
782 validate();
783 // Should not be called more than once
784 mArrays.resize(NCOLUMNS);
785 makeBuilders<ARGS...>(columnNames, nRows);
786
787 return [holders = mHolders](unsigned int /*slot*/, size_t batchSize, typename BuilderMaker<ARGS>::FillType const*... args) -> void {
788 TableBuilderHelpers::bulkAppend(*(HoldersTupleIndexed<ARGS...>*)holders, batchSize, std::forward_as_tuple(args...));
789 };
790 }
791
792 template <typename... ARGS, size_t NCOLUMNS = sizeof...(ARGS)>
793 auto bulkPersistChunked(std::array<char const*, NCOLUMNS> const& columnNames, size_t nRows)
794 {
795 validate();
796 mArrays.resize(NCOLUMNS);
797 makeBuilders<ARGS...>(columnNames, nRows);
798
799 return [holders = mHolders](unsigned int /*slot*/, BulkInfo<typename BuilderMaker<ARGS>::STLValueType const*>... args) -> bool {
800 return TableBuilderHelpers::bulkAppendChunked(*(HoldersTupleIndexed<ARGS...>*)holders, std::forward_as_tuple(args...));
801 };
802 }
803
805 template <typename... Ts>
806 auto reserveArrays(std::tuple<Ts...>& holders, int s)
807 {
808 return (std::get<Ts::index>(holders).builder->Reserve(s).ok() && ...);
809 }
810
811 template <typename... ARGS>
813 {
814 reserveArrays(*(HoldersTupleIndexed<ARGS...>*)mHolders, s);
815 }
816
818 void extracted(bool& status);
819 std::shared_ptr<arrow::Table> finalize();
820
821 private:
822 bool (*mFinalizer)(std::vector<std::shared_ptr<arrow::Array>>& arrays, void* holders);
823 void (*mDestructor)(void* holders);
824 void* mHolders;
825 arrow::MemoryPool* mMemoryPool;
826 std::shared_ptr<arrow::Schema> mSchema;
827 std::vector<std::shared_ptr<arrow::Array>> mArrays;
828};
829
830template <typename T>
831auto makeEmptyTable(const char* name)
832{
834 [[maybe_unused]] auto writer = b.cursor<T>();
835 b.setLabel(name);
836 return b.finalize();
837}
838
839template <soa::TableRef R>
841{
843 [[maybe_unused]] auto writer = b.cursor(typename aod::MetadataTrait<aod::Hash<R.desc_hash>>::metadata::persistent_columns_t{});
844 b.setLabel(aod::label<R>());
845 return b.finalize();
846}
847
848template <typename... Cs>
850{
852 [[maybe_unused]] auto writer = b.cursor(p);
853 b.setLabel(name);
854 return b.finalize();
855}
856
857std::shared_ptr<arrow::Table> spawnerHelper(std::shared_ptr<arrow::Table> const& fullTable, std::shared_ptr<arrow::Schema> newSchema, size_t nColumns,
858 expressions::Projector* projectors, std::vector<std::shared_ptr<arrow::Field>> const& fields, const char* name);
859
861template <aod::is_aod_hash D>
862auto spawner(std::vector<std::shared_ptr<arrow::Table>>&& tables, const char* name)
863{
864 using expression_pack_t = typename o2::aod::MetadataTrait<D>::metadata::expression_pack_t;
865 auto fullTable = soa::ArrowHelpers::joinTables(std::move(tables));
866 if (fullTable->num_rows() == 0) {
867 return makeEmptyTable(name, expression_pack_t{});
868 }
869 static auto fields = o2::soa::createFieldsFromColumns(expression_pack_t{});
870 static auto new_schema = std::make_shared<arrow::Schema>(fields);
871 auto projectors = []<typename... C>(framework::pack<C...>) -> std::array<expressions::Projector, sizeof...(C)>
872 {
873 return {{std::move(C::Projector())...}};
874 }
875 (expression_pack_t{});
876
877 return spawnerHelper(fullTable, new_schema, framework::pack_size(expression_pack_t{}), projectors.data(), fields, name);
878}
879
880template <aod::is_aod_hash D>
881auto spawner(std::shared_ptr<arrow::Table> const& fullTable, const char* name)
882{
883 using expression_pack_t = typename o2::aod::MetadataTrait<D>::metadata::expression_pack_t;
884 if (fullTable->num_rows() == 0) {
885 return makeEmptyTable(name, expression_pack_t{});
886 }
887 static auto fields = o2::soa::createFieldsFromColumns(expression_pack_t{});
888 static auto new_schema = std::make_shared<arrow::Schema>(fields);
889 auto projectors = []<typename... C>(framework::pack<C...>) -> std::array<expressions::Projector, sizeof...(C)>
890 {
891 return {{std::move(C::Projector())...}};
892 }
893 (expression_pack_t{});
894
895 return spawnerHelper(fullTable, new_schema, framework::pack_size(expression_pack_t{}), projectors.data(), fields, name);
896}
897
898// template <soa::OriginEnc ORIGIN, typename... C>
899// auto spawner(framework::pack<C...> columns, std::vector<std::shared_ptr<arrow::Table>>&& tables, const char* name)
900// {
901// auto fullTable = soa::ArrowHelpers::joinTables(std::move(tables));
902// if (fullTable->num_rows() == 0) {
903// return makeEmptyTable<soa::Table<ORIGIN, C...>>(name);
904// }
905// static auto fields = o2::soa::createFieldsFromColumns(columns);
906// static auto new_schema = std::make_shared<arrow::Schema>(fields);
907// std::array<expressions::Projector, sizeof...(C)> projectors{{std::move(C::Projector())...}};
908// return spawnerHelper(fullTable, new_schema, sizeof...(C), projectors.data(), fields, name);
909// }
910
911template <typename... C>
912auto spawner(framework::pack<C...> columns, std::vector<std::shared_ptr<arrow::Table>>&& tables, const char* name)
913{
914 auto fullTable = soa::ArrowHelpers::joinTables(std::move(tables));
915 if (fullTable->num_rows() == 0) {
917 }
918 static auto fields = o2::soa::createFieldsFromColumns(columns);
919 static auto new_schema = std::make_shared<arrow::Schema>(fields);
920 std::array<expressions::Projector, sizeof...(C)> projectors{{std::move(C::Projector())...}};
921 return spawnerHelper(fullTable, new_schema, sizeof...(C), projectors.data(), fields, name);
922}
923
924template <typename... T>
925using iterator_tuple_t = std::tuple<typename T::iterator...>;
926} // namespace o2::framework
927#endif // FRAMEWORK_TABLEBUILDER_H
constexpr int p2()
constexpr int p1()
constexpr to accelerate the coordinates changing
TBranch * ptr
#define O2_ARROW_STL_CONVERSION(c_type, ArrowType_)
auto cursor(framework::pack< Cs... >)
auto persist(std::array< char const *, countColumns< ARG0, ARGS... >()> const &columnNames)
auto persistTuple(framework::pack< ARGS... >, std::array< char const *, sizeof...(ARGS)> const &columnNames)
Same a the above, but use a tuple to persist stuff.
void setLabel(const char *label)
static constexpr int countColumns()
auto bulkPersistChunked(std::array< char const *, NCOLUMNS > const &columnNames, size_t nRows)
auto bulkPersist(std::array< char const *, NCOLUMNS > const &columnNames, size_t nRows)
void extracted(bool &status)
Actually creates the arrow::Table from the builders.
static constexpr int countColumns()
auto reserve(o2::framework::pack< ARGS... > &&, int s)
TableBuilder(arrow::MemoryPool *pool=arrow::default_memory_pool())
auto reserveArrays(std::tuple< Ts... > &holders, int s)
Reserve method to expand the columns as needed.
auto persist(std::array< char const *, sizeof...(ARGS)+1 > const &columnNames)
std::shared_ptr< arrow::Table > finalize()
auto preallocatedPersist(std::array< char const *, NCOLUMNS > const &columnNames, int nRows)
GLsizeiptr size
Definition glcorearb.h:659
GLenum array
Definition glcorearb.h:4274
GLuint index
Definition glcorearb.h:781
GLuint const GLchar * name
Definition glcorearb.h:781
GLboolean GLboolean GLboolean b
Definition glcorearb.h:1233
GLsizei const GLfloat * value
Definition glcorearb.h:819
GLint GLint GLsizei GLint GLenum GLenum type
Definition glcorearb.h:275
GLenum GLsizei GLsizei GLint * values
Definition glcorearb.h:1576
GLboolean * data
Definition glcorearb.h:298
GLuint GLsizei const GLchar * label
Definition glcorearb.h:2519
typedef void(APIENTRYP PFNGLCULLFACEPROC)(GLenum mode)
GLuint object
Definition glcorearb.h:4041
const GLuint * arrays
Definition glcorearb.h:1314
Defining PrimaryVertex explicitly as messageable.
Definition TFIDInfo.h:20
void addLabelToSchema(std::shared_ptr< arrow::Schema > &schema, const char *label)
RuntimeErrorRef runtime_error(const char *)
constexpr auto makeHolderTypes()
auto constexpr to_tuple(T &&object) noexcept
std::shared_ptr< arrow::Table > spawnerHelper(std::shared_ptr< arrow::Table > const &fullTable, std::shared_ptr< arrow::Schema > newSchema, size_t nColumns, expressions::Projector *projectors, std::vector< std::shared_ptr< arrow::Field > > const &fields, const char *name)
constexpr auto tuple_to_pack(std::tuple< ARGS... > &&)
auto spawner(std::vector< std::shared_ptr< arrow::Table > > &&tables, const char *name)
Expression-based column generator to materialize columns.
auto makeEmptyTable()
auto makeHolders(arrow::MemoryPool *pool, size_t nRows)
constexpr std::size_t pack_size(pack< Ts... > const &)
template function to determine number of types in a pack
Definition Pack.h:28
decltype(makeHolderTypes< ARGS... >()) IndexedHoldersTuple
auto make_builders()
RuntimeErrorRef runtime_error_f(const char *,...)
std::tuple< typename T::iterator... > iterator_tuple_t
auto createFieldsFromColumns(framework::pack< C... >)
Definition ASoA.h:406
Defining DataPointCompositeObject explicitly as copiable.
size_t size
const T ptr
BuilderHolder(arrow::MemoryPool *pool, size_t nRows=0)
std::unique_ptr< BuilderType > builder
typename arrow::TypeTraits< ArrowType >::BuilderType BuilderType
typename detail::ConversionTraits< T >::ArrowType ArrowType
typename detail::ConversionTraits< T >::ArrowType ElementType
static std::unique_ptr< BuilderType > make(arrow::MemoryPool *pool)
arrow::FixedSizeListBuilder BuilderType
arrow::FixedSizeListType ArrowType
static std::shared_ptr< arrow::DataType > make_datatype()
static std::unique_ptr< BuilderType > make(arrow::MemoryPool *pool)
typename detail::ConversionTraits< T >::ArrowType ElementType
arrow::FixedSizeListType ArrowType
static std::shared_ptr< arrow::DataType > make_datatype()
arrow::FixedSizeListBuilder BuilderType
typename arrow::TypeTraits< ArrowType >::BuilderType BuilderType
static arrow::Status append(BuilderType &builder, bool value)
static std::unique_ptr< BuilderType > make(arrow::MemoryPool *pool)
static std::shared_ptr< arrow::DataType > make_datatype()
typename detail::ConversionTraits< bool >::ArrowType ArrowType
typename detail::ConversionTraits< T >::ArrowType ElementType
static std::unique_ptr< BuilderType > make(arrow::MemoryPool *pool)
static std::shared_ptr< arrow::DataType > make_datatype()
static std::unique_ptr< BuilderType > make(arrow::MemoryPool *pool)
typename detail::ConversionTraits< typename ITERATOR::value_type >::ArrowType ValueType
typename arrow::TypeTraits< ValueType >::BuilderType ValueBuilder
static std::shared_ptr< arrow::DataType > make_datatype()
static std::unique_ptr< BuilderType > make(arrow::MemoryPool *pool)
typename detail::ConversionTraits< T >::ArrowType ElementType
static std::shared_ptr< arrow::DataType > make_datatype()
typename arrow::TypeTraits< ArrowType >::BuilderType BuilderType
static arrow::Status append(BuilderType &builder, std::array< T, N > &value)
static arrow::Status append(BuilderType &builder, T value)
typename detail::ConversionTraits< T >::ArrowType ArrowType
static std::unique_ptr< BuilderType > make(arrow::MemoryPool *pool)
static std::shared_ptr< arrow::DataType > make_datatype()
arrow::FixedSizeListBuilder BuilderType
arrow::FixedSizeListType ArrowType
typename arrow::TypeTraits< ArrowType >::BuilderType BuilderType
typename detail::ConversionTraits< T >::ArrowType ArrowType
static arrow::Status bulkAppend(HolderType &holder, size_t bulkSize, const PTR ptr)
static arrow::Status append(HolderType &holder, std::vector< T > const &data)
Appender for the vector case.
static arrow::Status appendToList(std::unique_ptr< arrow::FixedSizeListBuilder > &builder, T *data, int size=1)
static arrow::Status flush(HolderType &holder)
static arrow::Status append(HolderType &holder, T value)
static arrow::Status append(HolderType &holder, T(&data)[N])
Appender for the array case.
static arrow::Status append(HolderType &holder, T *data)
static void unsafeAppend(HolderType &holder, std::vector< T > const &value)
static arrow::Status append(HolderType &holder, std::pair< ITERATOR, ITERATOR > ip)
static void unsafeAppend(HolderType &holder, T *value)
static void unsafeAppend(HolderType &holder, std::pair< ITERATOR, ITERATOR > ip)
static arrow::Status append(HolderType &holder, std::array< T, N > const &data)
Appender for the array case.
static arrow::Status bulkAppendChunked(HolderType &holder, BulkInfo< PTR > info)
static void unsafeAppend(HolderType &holder, T value)
static constexpr int CHUNK_SIZE
arrow::Status append(BUILDER &builder, T value)
arrow::Status flush(BUILDER &builder)
arrow::Status append(BUILDER &builder, T value)
arrow::Status flush(BUILDER &)
static consteval DirectInsertion< T > policy()
static consteval CachedInsertion< T > policy()
static bool bulkAppendChunked(std::tuple< Ts... > &holders, INFOS infos)
Return true if all columns are done.
static bool finalize(std::shared_ptr< arrow::Array > &array, HOLDER &holder)
static bool append(std::tuple< Ts... > &holders, VALUES &&values)
Invokes the append method for each entry in the tuple.
static std::array< arrow::DataType, NCOLUMNS > makeArrowColumnTypes()
static bool finalize(std::vector< std::shared_ptr< arrow::Array > > &arrays, std::tuple< Ts... > &holders)
Invokes the append method for each entry in the tuple.
static bool bulkAppend(std::tuple< Ts... > &holders, size_t bulkSize, PTRS ptrs)
static void unsafeAppend(std::tuple< Ts... > &holders, VALUES &&values)
static std::vector< std::shared_ptr< arrow::Field > > makeFields(std::array< char const *, NCOLUMNS > const &names)
FIXME: adapt type conversion to new arrow.
A struct, containing the root of the expression tree.
static std::shared_ptr< arrow::Table > joinTables(std::vector< std::shared_ptr< arrow::Table > > &&tables)
Definition ASoA.cxx:67