userver: userver/storages/clickhouse/io/columns/array_column.hpp Source File
Loading...
Searching...
No Matches
array_column.hpp
Go to the documentation of this file.
1#pragma once
2
3/// @file userver/storages/clickhouse/io/columns/array_column.hpp
4/// @brief Array column support
5/// @ingroup userver_clickhouse_types
6
7#include <userver/utils/assert.hpp>
8
9#include <userver/storages/clickhouse/io/columns/column_includes.hpp>
10#include <userver/storages/clickhouse/io/columns/common_columns.hpp>
11
12USERVER_NAMESPACE_BEGIN
13
14namespace storages::clickhouse::io::columns {
15
16struct ArrayColumnMeta final {
17 ColumnRef data;
18 ColumnRef offsets;
19};
20
21ColumnRef ConvertMetaToColumn(ArrayColumnMeta&& meta);
22ColumnRef ExtractArrayItem(const ColumnRef& column, std::size_t ind);
23
24/// @brief Represents ClickHouse Array(T) column,
25/// where T is a ClickhouseColumn as well
26template <typename T>
27class ArrayColumn final : public ClickhouseColumn<ArrayColumn<T>> {
28public:
29 using cpp_type = std::vector<typename T::cpp_type>;
30 using container_type = std::vector<cpp_type>;
31
32 ArrayColumn(ColumnRef column);
33
34 class ArrayDataHolder final {
35 public:
36 ArrayDataHolder() = default;
37 ArrayDataHolder(typename ColumnIterator<ArrayColumn<T>>::IteratorPosition iter_position, ColumnRef&& column);
38
39 ArrayDataHolder operator++(int);
40 ArrayDataHolder& operator++();
41 cpp_type& UpdateValue();
42
43 bool operator==(const ArrayDataHolder& other) const;
44
45 private:
46 ColumnRef inner_{};
47 std::size_t ind_{0};
48 std::optional<cpp_type> current_value_ = std::nullopt;
49 };
50 using iterator_data = ArrayDataHolder;
51
52 static ColumnRef Serialize(const container_type& from);
53 static cpp_type RetrieveElement(const ColumnRef& ref, std::size_t ind);
54};
55
56template <typename T>
57ArrayColumn<T>::ArrayDataHolder::ArrayDataHolder(
58 typename ColumnIterator<ArrayColumn<T>>::IteratorPosition iter_position,
59 ColumnRef&& column
60)
61 : inner_{std::move(column)},
62 ind_(iter_position == decltype(iter_position)::kEnd ? GetColumnSize(inner_) : 0)
63{}
64
65template <typename T>
66typename ArrayColumn<T>::ArrayDataHolder ArrayColumn<T>::ArrayDataHolder::operator++(int) {
67 ArrayDataHolder old{};
68 old.inner_ = inner_;
69 old.ind_ = ind_++;
70 old.current_value_ = std::move_if_noexcept(current_value_);
71 current_value_.reset();
72
73 return old;
74}
75
76template <typename T>
77typename ArrayColumn<T>::ArrayDataHolder& ArrayColumn<T>::ArrayDataHolder::operator++() {
78 ++ind_;
79 current_value_.reset();
80
81 return *this;
82}
83
84template <typename T>
85typename ArrayColumn<T>::cpp_type& ArrayColumn<T>::ArrayDataHolder::UpdateValue() {
86 UASSERT(ind_ < GetColumnSize(inner_));
87 if (!current_value_.has_value()) {
88 cpp_type item = RetrieveElement(inner_, ind_);
89 current_value_.emplace(std::move(item));
90 }
91
92 return *current_value_;
93}
94
95template <typename T>
96bool ArrayColumn<T>::ArrayDataHolder::operator==(const ArrayDataHolder& other) const {
97 return inner_.get() == other.inner_.get() && ind_ == other.ind_;
98}
99
100template <typename T>
101ArrayColumn<T>::ArrayColumn(ColumnRef column)
102 : ClickhouseColumn<ArrayColumn>{std::move(column)}
103{}
104
105template <typename T>
106ColumnRef ArrayColumn<T>::Serialize(const container_type& from) {
107 uint64_t cumulative_offset = 0;
108 std::vector<uint64_t> offsets;
109 offsets.reserve(from.size());
110
111 for (const auto& value : from) {
112 cumulative_offset += value.size();
113 offsets.push_back(cumulative_offset);
114 }
115 typename T::container_type values;
116 values.reserve(cumulative_offset);
117
118 for (const auto& value : from) {
119 for (const auto& item : value) {
120 values.push_back(item);
121 }
122 }
123
124 ArrayColumnMeta array_meta;
125 array_meta.offsets = UInt64Column::Serialize(offsets);
126 array_meta.data = T::Serialize(values);
127
128 return ConvertMetaToColumn(std::move(array_meta));
129}
130
131template <typename T>
132typename ArrayColumn<T>::cpp_type ArrayColumn<T>::RetrieveElement(const ColumnRef& ref, std::size_t ind) {
133 auto array_item = ExtractArrayItem(ref, ind);
134 T typed_column(array_item);
135
136 cpp_type result;
137 result.reserve(GetColumnSize(array_item));
138 for (auto it = typed_column.begin(); it != typed_column.end(); ++it) {
139 result.push_back(std::move(*it));
140 }
141 return result;
142}
143
144} // namespace storages::clickhouse::io::columns
145
146USERVER_NAMESPACE_END