be/src/exec/pipeline/dependency.h
Line | Count | Source |
1 | | // Licensed to the Apache Software Foundation (ASF) under one |
2 | | // or more contributor license agreements. See the NOTICE file |
3 | | // distributed with this work for additional information |
4 | | // regarding copyright ownership. The ASF licenses this file |
5 | | // to you under the Apache License, Version 2.0 (the |
6 | | // "License"); you may not use this file except in compliance |
7 | | // with the License. You may obtain a copy of the License at |
8 | | // |
9 | | // http://www.apache.org/licenses/LICENSE-2.0 |
10 | | // |
11 | | // Unless required by applicable law or agreed to in writing, |
12 | | // software distributed under the License is distributed on an |
13 | | // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
14 | | // KIND, either express or implied. See the License for the |
15 | | // specific language governing permissions and limitations |
16 | | // under the License. |
17 | | |
18 | | #pragma once |
19 | | |
20 | | #ifdef __APPLE__ |
21 | | #include <netinet/in.h> |
22 | | #include <sys/_types/_u_int.h> |
23 | | #endif |
24 | | |
25 | | #include <concurrentqueue.h> |
26 | | #include <gen_cpp/Partitions_types.h> |
27 | | #include <gen_cpp/internal_service.pb.h> |
28 | | #include <sqltypes.h> |
29 | | |
30 | | #include <atomic> |
31 | | #include <functional> |
32 | | #include <memory> |
33 | | #include <mutex> |
34 | | #include <thread> |
35 | | #include <utility> |
36 | | |
37 | | #include "common/config.h" |
38 | | #include "common/logging.h" |
39 | | #include "common/thread_safety_annotations.h" |
40 | | #include "core/block/block.h" |
41 | | #include "core/types.h" |
42 | | #include "exec/common/agg_utils.h" |
43 | | #include "exec/common/join_utils.h" |
44 | | #include "exec/common/set_utils.h" |
45 | | #include "exec/operator/data_queue.h" |
46 | | #include "exec/operator/join/process_hash_table_probe.h" |
47 | | #include "exec/sort/partition_sorter.h" |
48 | | #include "exec/sort/sorter.h" |
49 | | #include "exec/spill/spill_file.h" |
50 | | #include "runtime/runtime_profile_counter_names.h" |
51 | | #include "util/brpc_closure.h" |
52 | | #include "util/stack_util.h" |
53 | | |
54 | | namespace doris { |
55 | | class AggFnEvaluator; |
56 | | class VSlotRef; |
57 | | } // namespace doris |
58 | | |
59 | | namespace doris { |
60 | | class Dependency; |
61 | | class PipelineTask; |
62 | | struct BasicSharedState; |
63 | | using DependencySPtr = std::shared_ptr<Dependency>; |
64 | | class LocalExchangeSourceLocalState; |
65 | | |
// Time thresholds used when reporting dependencies that stay blocked for a long time.
// NOTE(review): the magnitudes (60e9 / 30e9) suggest 60 s and 30 s expressed in
// nanoseconds - confirm against the code that compares them with the watcher time.
static constexpr auto SLOW_DEPENDENCY_THRESHOLD = 60L * 1000 * 1000 * 1000;
static constexpr auto TIME_UNIT_DEPENDENCY_LOG = 30L * 1000 * 1000 * 1000;
// The logging unit has to be strictly smaller than the slow threshold.
static_assert(TIME_UNIT_DEPENDENCY_LOG < SLOW_DEPENDENCY_THRESHOLD);
69 | | |
70 | | struct BasicSharedState { |
71 | | ENABLE_FACTORY_CREATOR(BasicSharedState) |
72 | | |
73 | | template <class TARGET> |
74 | 2.46M | TARGET* cast() { |
75 | 18.4E | DCHECK(dynamic_cast<TARGET*>(this)) |
76 | 18.4E | << " Mismatch type! Current type is " << typeid(*this).name() |
77 | 18.4E | << " and expect type is" << typeid(TARGET).name(); |
78 | 2.46M | return reinterpret_cast<TARGET*>(this); |
79 | 2.46M | } _ZN5doris16BasicSharedState4castINS_19HashJoinSharedStateEEEPT_v Line | Count | Source | 74 | 183k | TARGET* cast() { | 75 | 18.4E | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 18.4E | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 18.4E | << " and expect type is" << typeid(TARGET).name(); | 78 | 183k | return reinterpret_cast<TARGET*>(this); | 79 | 183k | } |
_ZN5doris16BasicSharedState4castINS_30PartitionedHashJoinSharedStateEEEPT_v Line | Count | Source | 74 | 3 | TARGET* cast() { | 75 | 3 | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 0 | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 0 | << " and expect type is" << typeid(TARGET).name(); | 78 | 3 | return reinterpret_cast<TARGET*>(this); | 79 | 3 | } |
_ZN5doris16BasicSharedState4castINS_15SortSharedStateEEEPT_v Line | Count | Source | 74 | 481k | TARGET* cast() { | 75 | 18.4E | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 18.4E | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 18.4E | << " and expect type is" << typeid(TARGET).name(); | 78 | 481k | return reinterpret_cast<TARGET*>(this); | 79 | 481k | } |
_ZN5doris16BasicSharedState4castINS_20SpillSortSharedStateEEEPT_v Line | Count | Source | 74 | 55 | TARGET* cast() { | 75 | 55 | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 0 | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 0 | << " and expect type is" << typeid(TARGET).name(); | 78 | 55 | return reinterpret_cast<TARGET*>(this); | 79 | 55 | } |
_ZN5doris16BasicSharedState4castINS_25NestedLoopJoinSharedStateEEEPT_v Line | Count | Source | 74 | 19.1k | TARGET* cast() { | 75 | 18.4E | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 18.4E | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 18.4E | << " and expect type is" << typeid(TARGET).name(); | 78 | 19.1k | return reinterpret_cast<TARGET*>(this); | 79 | 19.1k | } |
_ZN5doris16BasicSharedState4castINS_19AnalyticSharedStateEEEPT_v Line | Count | Source | 74 | 14.0k | TARGET* cast() { | 75 | 18.4E | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 18.4E | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 18.4E | << " and expect type is" << typeid(TARGET).name(); | 78 | 14.0k | return reinterpret_cast<TARGET*>(this); | 79 | 14.0k | } |
_ZN5doris16BasicSharedState4castINS_14AggSharedStateEEEPT_v Line | Count | Source | 74 | 293k | TARGET* cast() { | 75 | 18.4E | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 18.4E | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 18.4E | << " and expect type is" << typeid(TARGET).name(); | 78 | 293k | return reinterpret_cast<TARGET*>(this); | 79 | 293k | } |
_ZN5doris16BasicSharedState4castINS_22BucketedAggSharedStateEEEPT_v Line | Count | Source | 74 | 775 | TARGET* cast() { | 75 | 18.4E | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 18.4E | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 18.4E | << " and expect type is" << typeid(TARGET).name(); | 78 | 775 | return reinterpret_cast<TARGET*>(this); | 79 | 775 | } |
_ZN5doris16BasicSharedState4castINS_25PartitionedAggSharedStateEEEPT_v Line | Count | Source | 74 | 237 | TARGET* cast() { | 75 | 18.4E | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 18.4E | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 18.4E | << " and expect type is" << typeid(TARGET).name(); | 78 | 237 | return reinterpret_cast<TARGET*>(this); | 79 | 237 | } |
_ZN5doris16BasicSharedState4castINS_16UnionSharedStateEEEPT_v Line | Count | Source | 74 | 10.2k | TARGET* cast() { | 75 | 18.4E | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 18.4E | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 18.4E | << " and expect type is" << typeid(TARGET).name(); | 78 | 10.2k | return reinterpret_cast<TARGET*>(this); | 79 | 10.2k | } |
_ZN5doris16BasicSharedState4castINS_28PartitionSortNodeSharedStateEEEPT_v Line | Count | Source | 74 | 1.28k | TARGET* cast() { | 75 | 18.4E | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 18.4E | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 18.4E | << " and expect type is" << typeid(TARGET).name(); | 78 | 1.28k | return reinterpret_cast<TARGET*>(this); | 79 | 1.28k | } |
_ZN5doris16BasicSharedState4castINS_20MultiCastSharedStateEEEPT_v Line | Count | Source | 74 | 14.0k | TARGET* cast() { | 75 | 18.4E | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 18.4E | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 18.4E | << " and expect type is" << typeid(TARGET).name(); | 78 | 14.0k | return reinterpret_cast<TARGET*>(this); | 79 | 14.0k | } |
_ZN5doris16BasicSharedState4castINS_14SetSharedStateEEEPT_v Line | Count | Source | 74 | 17.0k | TARGET* cast() { | 75 | 18.4E | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 18.4E | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 18.4E | << " and expect type is" << typeid(TARGET).name(); | 78 | 17.0k | return reinterpret_cast<TARGET*>(this); | 79 | 17.0k | } |
_ZN5doris16BasicSharedState4castINS_24LocalExchangeSharedStateEEEPT_v Line | Count | Source | 74 | 934k | TARGET* cast() { | 75 | 18.4E | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 18.4E | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 18.4E | << " and expect type is" << typeid(TARGET).name(); | 78 | 934k | return reinterpret_cast<TARGET*>(this); | 79 | 934k | } |
_ZN5doris16BasicSharedState4castIS0_EEPT_v Line | Count | Source | 74 | 498k | TARGET* cast() { | 75 | 18.4E | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 18.4E | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 18.4E | << " and expect type is" << typeid(TARGET).name(); | 78 | 498k | return reinterpret_cast<TARGET*>(this); | 79 | 498k | } |
_ZN5doris16BasicSharedState4castINS_20DataQueueSharedStateEEEPT_v Line | Count | Source | 74 | 34 | TARGET* cast() { | 75 | 34 | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 0 | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 0 | << " and expect type is" << typeid(TARGET).name(); | 78 | 34 | return reinterpret_cast<TARGET*>(this); | 79 | 34 | } |
_ZN5doris16BasicSharedState4castINS_17RecCTESharedStateEEEPT_v Line | Count | Source | 74 | 489 | TARGET* cast() { | 75 | 489 | DCHECK(dynamic_cast<TARGET*>(this)) | 76 | 0 | << " Mismatch type! Current type is " << typeid(*this).name() | 77 | 0 | << " and expect type is" << typeid(TARGET).name(); | 78 | 489 | return reinterpret_cast<TARGET*>(this); | 79 | 489 | } |
|
80 | | template <class TARGET> |
81 | | const TARGET* cast() const { |
82 | | DCHECK(dynamic_cast<const TARGET*>(this)) |
83 | | << " Mismatch type! Current type is " << typeid(*this).name() |
84 | | << " and expect type is" << typeid(TARGET).name(); |
85 | | return reinterpret_cast<const TARGET*>(this); |
86 | | } |
87 | | std::vector<DependencySPtr> source_deps; |
88 | | std::vector<DependencySPtr> sink_deps; |
89 | | int id = 0; |
90 | | std::set<int> related_op_ids; |
91 | | |
92 | 1.80M | virtual ~BasicSharedState() = default; |
93 | | |
94 | | void create_source_dependencies(int num_sources, int operator_id, int node_id, |
95 | | const std::string& name); |
96 | | Dependency* create_source_dependency(int operator_id, int node_id, const std::string& name); |
97 | | |
98 | | Dependency* create_sink_dependency(int dest_id, int node_id, const std::string& name); |
99 | 701k | std::vector<DependencySPtr> get_dep_by_channel_id(int channel_id) { |
100 | 701k | DCHECK_LT(channel_id, source_deps.size()); |
101 | 701k | return {source_deps[channel_id]}; |
102 | 701k | } |
103 | | }; |
104 | | |
105 | | class Dependency : public std::enable_shared_from_this<Dependency> { |
106 | | public: |
107 | | ENABLE_FACTORY_CREATOR(Dependency); |
108 | | Dependency(int id, int node_id, std::string name, bool ready = false) |
109 | 6.43M | : _id(id), _node_id(node_id), _name(std::move(name)), _ready(ready) {} |
110 | 6.46M | virtual ~Dependency() = default; |
111 | | |
112 | 0 | [[nodiscard]] int id() const { return _id; } |
113 | 7.96M | [[nodiscard]] virtual std::string name() const { return _name; } |
114 | 275k | BasicSharedState* shared_state() { return _shared_state; } |
115 | 2.39M | void set_shared_state(BasicSharedState* shared_state) { _shared_state = shared_state; } |
116 | | virtual std::string debug_string(int indentation_level = 0); |
117 | 1.02G | bool ready() const { return _ready; } |
118 | | |
119 | | // Start the watcher. We use it to count how long this dependency block the current pipeline task. |
120 | 5.02M | void start_watcher() { _watcher.start(); } |
121 | 8.80M | [[nodiscard]] int64_t watcher_elapse_time() { return _watcher.elapsed_time(); } |
122 | | |
123 | | // Which dependency current pipeline task is blocked by. `nullptr` if this dependency is ready. |
124 | | [[nodiscard]] Dependency* is_blocked_by(std::shared_ptr<PipelineTask> task = nullptr); |
125 | | // Notify downstream pipeline tasks this dependency is ready. |
126 | | void set_ready(); |
127 | 514k | void set_ready_to_read(int channel_id = 0) { |
128 | 514k | DCHECK_LT(channel_id, _shared_state->source_deps.size()) << debug_string(); |
129 | 514k | _shared_state->source_deps[channel_id]->set_ready(); |
130 | 514k | } |
131 | 816 | void set_ready_to_write() { |
132 | 816 | DCHECK_EQ(_shared_state->sink_deps.size(), 1) << debug_string(); |
133 | 816 | _shared_state->sink_deps.front()->set_ready(); |
134 | 816 | } |
135 | | |
136 | | // Notify downstream pipeline tasks this dependency is blocked. |
137 | 1.82M | void block() { |
138 | 1.82M | if (_always_ready) { |
139 | 319k | return; |
140 | 319k | } |
141 | 1.50M | std::unique_lock<std::mutex> lc(_always_ready_lock); |
142 | 1.50M | if (_always_ready) { |
143 | 0 | return; |
144 | 0 | } |
145 | 1.50M | _ready = false; |
146 | 1.50M | } |
147 | | |
148 | 4.04M | void set_always_ready() { |
149 | 4.04M | if (_always_ready) { |
150 | 1.83M | return; |
151 | 1.83M | } |
152 | 2.21M | std::unique_lock<std::mutex> lc(_always_ready_lock); |
153 | 2.21M | if (_always_ready) { |
154 | 0 | return; |
155 | 0 | } |
156 | 2.21M | _always_ready = true; |
157 | 2.21M | set_ready(); |
158 | 2.21M | } |
159 | | |
160 | | protected: |
161 | | void _add_block_task(std::shared_ptr<PipelineTask> task); |
162 | | |
163 | | const int _id; |
164 | | const int _node_id; |
165 | | const std::string _name; |
166 | | std::atomic<bool> _ready; |
167 | | |
168 | | BasicSharedState* _shared_state = nullptr; |
169 | | MonotonicStopWatch _watcher; |
170 | | |
171 | | std::mutex _task_lock; |
172 | | std::vector<std::weak_ptr<PipelineTask>> _blocked_task; |
173 | | |
174 | | // If `_always_ready` is true, `block()` will never block tasks. |
175 | | std::atomic<bool> _always_ready = false; |
176 | | std::mutex _always_ready_lock; |
177 | | }; |
178 | | |
179 | | struct FakeSharedState final : public BasicSharedState { |
180 | | ENABLE_FACTORY_CREATOR(FakeSharedState) |
181 | | }; |
182 | | |
183 | | class CountedFinishDependency final : public Dependency { |
184 | | public: |
185 | | using SharedState = FakeSharedState; |
186 | | CountedFinishDependency(int id, int node_id, std::string name) |
187 | 145k | : Dependency(id, node_id, std::move(name), true) {} |
188 | | |
189 | 1.74k | void add(uint32_t count = 1) { |
190 | 1.74k | std::unique_lock<std::mutex> l(_mtx); |
191 | 1.74k | if (!_counter) { |
192 | 1.74k | block(); |
193 | 1.74k | } |
194 | 1.74k | _counter += count; |
195 | 1.74k | } |
196 | | |
197 | 1.74k | void sub() { |
198 | 1.74k | std::unique_lock<std::mutex> l(_mtx); |
199 | | // _counter is unsigned: a stray sub() when counter is already 0 would |
200 | | // underflow to UINT32_MAX and the dependency would never become ready, |
201 | | // hanging the query forever. Fail loudly instead. |
202 | 1.74k | if (_counter == 0) [[unlikely]] { |
203 | 2 | throw Exception(ErrorCode::INTERNAL_ERROR, |
204 | 2 | "CountedFinishDependency::sub() underflow on {}", debug_string()); |
205 | 2 | } |
206 | 1.74k | _counter--; |
207 | 1.74k | if (!_counter) { |
208 | 1.74k | set_ready(); |
209 | 1.74k | } |
210 | 1.74k | } |
211 | | |
212 | | std::string debug_string(int indentation_level = 0) override; |
213 | | |
214 | | private: |
215 | | std::mutex _mtx; |
216 | | uint32_t _counter = 0; |
217 | | }; |
218 | | |
219 | | struct RuntimeFilterTimerQueue; |
220 | | class RuntimeFilterTimer { |
221 | | public: |
222 | | RuntimeFilterTimer(int64_t registration_time, int32_t wait_time_ms, |
223 | | std::shared_ptr<Dependency> parent, bool force_wait_timeout = false) |
224 | 15.9k | : _parent(std::move(parent)), |
225 | 15.9k | _registration_time(registration_time), |
226 | 15.9k | _wait_time_ms(wait_time_ms), |
227 | 15.9k | _force_wait_timeout(force_wait_timeout) {} |
228 | | |
229 | | // Called by runtime filter producer. |
230 | | void call_ready(); |
231 | | |
232 | | // Called by RuntimeFilterTimerQueue which is responsible for checking if this rf is timeout. |
233 | | void call_timeout(); |
234 | | |
235 | 5.26M | int64_t registration_time() const { return _registration_time; } |
236 | 5.26M | int32_t wait_time_ms() const { return _wait_time_ms; } |
237 | | |
238 | | void set_local_runtime_filter_dependencies( |
239 | 5.58k | const std::vector<std::shared_ptr<Dependency>>& deps) { |
240 | 5.58k | _local_runtime_filter_dependencies = deps; |
241 | 5.58k | } |
242 | | |
243 | | bool should_be_check_timeout(); |
244 | | |
245 | 5.28M | bool force_wait_timeout() { return _force_wait_timeout; } |
246 | | |
247 | | private: |
248 | | friend struct RuntimeFilterTimerQueue; |
249 | | std::shared_ptr<Dependency> _parent = nullptr; |
250 | | std::vector<std::shared_ptr<Dependency>> _local_runtime_filter_dependencies; |
251 | | std::mutex _lock; |
252 | | int64_t _registration_time; |
253 | | const int32_t _wait_time_ms; |
254 | | // true only for group_commit_scan_operator |
255 | | bool _force_wait_timeout; |
256 | | }; |
257 | | |
258 | | struct RuntimeFilterTimerQueue { |
259 | | constexpr static int64_t interval = 10; |
260 | 9 | void run() { _thread.detach(); } |
261 | | void start(); |
262 | | |
263 | 3 | void stop() { |
264 | 3 | _stop = true; |
265 | 3 | cv.notify_all(); |
266 | 3 | wait_for_shutdown(); |
267 | 3 | } |
268 | | |
269 | 3 | void wait_for_shutdown() const { |
270 | 6 | while (!_shutdown) { |
271 | 3 | std::this_thread::sleep_for(std::chrono::milliseconds(interval)); |
272 | 3 | } |
273 | 3 | } |
274 | | |
275 | 3 | ~RuntimeFilterTimerQueue() = default; |
276 | 9 | RuntimeFilterTimerQueue() { _thread = std::thread(&RuntimeFilterTimerQueue::start, this); } |
277 | 8.36k | void push_filter_timer(std::vector<std::shared_ptr<RuntimeFilterTimer>>&& filter) { |
278 | 8.36k | std::unique_lock<std::mutex> lc(_que_lock); |
279 | 8.36k | _que.insert(_que.end(), filter.begin(), filter.end()); |
280 | 8.36k | cv.notify_all(); |
281 | 8.36k | } |
282 | | |
283 | | std::thread _thread; |
284 | | std::condition_variable cv; |
285 | | std::mutex cv_m; |
286 | | std::mutex _que_lock; |
287 | | std::atomic_bool _stop = false; |
288 | | std::atomic_bool _shutdown = false; |
289 | | std::list<std::shared_ptr<RuntimeFilterTimer>> _que; |
290 | | }; |
291 | | |
292 | | struct AggSharedState : public BasicSharedState { |
293 | | ENABLE_FACTORY_CREATOR(AggSharedState) |
294 | | public: |
295 | 147k | AggSharedState() { agg_data = std::make_unique<AggregatedDataVariants>(); } |
296 | 147k | ~AggSharedState() override { |
297 | 147k | if (!probe_expr_ctxs.empty()) { |
298 | 44.5k | _close_with_serialized_key(); |
299 | 102k | } else { |
300 | 102k | _close_without_key(); |
301 | 102k | } |
302 | 147k | } |
303 | | |
304 | | Status reset_hash_table(); |
305 | | |
306 | | bool do_limit_filter(Block* block, size_t num_rows, const std::vector<int>* key_locs = nullptr); |
307 | | void build_limit_heap(size_t hash_table_size); |
308 | | |
309 | | // We should call this function only at 1st phase. |
310 | | // 1st phase: is_merge=true, only have one SlotRef. |
311 | | // 2nd phase: is_merge=false, maybe have multiple exprs. |
312 | | static int get_slot_column_id(const AggFnEvaluator* evaluator); |
313 | | |
314 | | AggregatedDataVariantsUPtr agg_data = nullptr; |
315 | | std::unique_ptr<AggregateDataContainer> aggregate_data_container; |
316 | | std::vector<AggFnEvaluator*> aggregate_evaluators; |
317 | | // group by k1,k2 |
318 | | VExprContextSPtrs probe_expr_ctxs; |
319 | | size_t input_num_rows = 0; |
320 | | std::vector<AggregateDataPtr> values; |
321 | | /// The total size of the row from the aggregate functions. |
322 | | size_t total_size_of_aggregate_states = 0; |
323 | | size_t align_aggregate_states = 1; |
324 | | /// The offset to the n-th aggregate function in a row of aggregate functions. |
325 | | Sizes offsets_of_aggregate_states; |
326 | | std::vector<size_t> make_nullable_keys; |
327 | | |
328 | | bool agg_data_created_without_key = false; |
329 | | bool enable_spill = false; |
330 | | bool reach_limit = false; |
331 | | |
332 | | bool use_simple_count = false; |
333 | | int64_t limit = -1; |
334 | | bool do_sort_limit = false; |
335 | | MutableColumns limit_columns; |
336 | | int limit_columns_min = -1; |
337 | | PaddedPODArray<uint8_t> need_computes; |
338 | | std::vector<uint8_t> cmp_res; |
339 | | std::vector<int> order_directions; |
340 | | std::vector<int> null_directions; |
341 | | |
342 | | struct HeapLimitCursor { |
343 | | HeapLimitCursor(int row_id, MutableColumns& limit_columns, |
344 | | std::vector<int>& order_directions, std::vector<int>& null_directions) |
345 | 28.6k | : _row_id(row_id), |
346 | 28.6k | _limit_columns(limit_columns), |
347 | 28.6k | _order_directions(order_directions), |
348 | 28.6k | _null_directions(null_directions) {} |
349 | | |
350 | | HeapLimitCursor(const HeapLimitCursor& other) = default; |
351 | | |
352 | | HeapLimitCursor(HeapLimitCursor&& other) noexcept |
353 | 184k | : _row_id(other._row_id), |
354 | 184k | _limit_columns(other._limit_columns), |
355 | 184k | _order_directions(other._order_directions), |
356 | 184k | _null_directions(other._null_directions) {} |
357 | | |
358 | 0 | HeapLimitCursor& operator=(const HeapLimitCursor& other) noexcept { |
359 | 0 | _row_id = other._row_id; |
360 | 0 | return *this; |
361 | 0 | } |
362 | | |
363 | 302k | HeapLimitCursor& operator=(HeapLimitCursor&& other) noexcept { |
364 | 302k | _row_id = other._row_id; |
365 | 302k | return *this; |
366 | 302k | } |
367 | | |
368 | 276k | bool operator<(const HeapLimitCursor& rhs) const { |
369 | 326k | for (int i = 0; i < _limit_columns.size(); ++i) { |
370 | 326k | const auto& _limit_column = _limit_columns[i]; |
371 | 326k | auto res = _limit_column->compare_at(_row_id, rhs._row_id, *_limit_column, |
372 | 326k | _null_directions[i]) * |
373 | 326k | _order_directions[i]; |
374 | 326k | if (res < 0) { |
375 | 134k | return true; |
376 | 191k | } else if (res > 0) { |
377 | 146k | return false; |
378 | 146k | } |
379 | 326k | } |
380 | 18.4E | return false; |
381 | 276k | } |
382 | | |
383 | | int _row_id; |
384 | | MutableColumns& _limit_columns; |
385 | | std::vector<int>& _order_directions; |
386 | | std::vector<int>& _null_directions; |
387 | | }; |
388 | | |
389 | | std::priority_queue<HeapLimitCursor> limit_heap; |
390 | | |
391 | | // Refresh the top limit heap with a new row |
392 | | void refresh_top_limit(size_t row_id, const ColumnRawPtrs& key_columns); |
393 | | |
394 | | Arena agg_arena_pool; |
395 | | Arena agg_profile_arena; |
396 | | |
397 | | private: |
398 | | MutableColumns _get_keys_hash_table(); |
399 | | |
400 | 44.5k | void _close_with_serialized_key() { |
401 | 44.5k | std::visit(Overload {[&](std::monostate& arg) -> void { |
402 | | // Do nothing |
403 | 0 | }, |
404 | 44.5k | [&](auto& agg_method) -> void { |
405 | 44.5k | if (use_simple_count) { |
406 | | // Inline count: mapped slots hold UInt64, |
407 | | // not real agg state pointers. Skip destroy. |
408 | 3.71k | return; |
409 | 3.71k | } |
410 | 40.8k | auto& data = *agg_method.hash_table; |
411 | 1.28M | data.for_each_mapped([&](auto& mapped) { |
412 | 1.29M | if (mapped) { |
413 | 1.29M | _destroy_agg_status(mapped); |
414 | 1.29M | mapped = nullptr; |
415 | 1.29M | } |
416 | 1.28M | }); _ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapIN4wide7integerILm256EjEEPc9HashCRC32IS9_EEEEEEvS2_ENKUlS2_E_clISA_EEDaS2_ Line | Count | Source | 411 | 4.93k | data.for_each_mapped([&](auto& mapped) { | 412 | 4.93k | if (mapped) { | 413 | 4.93k | _destroy_agg_status(mapped); | 414 | 4.93k | mapped = nullptr; | 415 | 4.93k | } | 416 | 4.93k | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapINS_7UInt136EPc9HashCRC32IS7_EEEEEEvS2_ENKUlS2_E_clIS8_EEDaS2_ Line | Count | Source | 411 | 2.08k | data.for_each_mapped([&](auto& mapped) { | 412 | 2.08k | if (mapped) { | 413 | 2.08k | _destroy_agg_status(mapped); | 414 | 2.08k | mapped = nullptr; | 415 | 2.08k | } | 416 | 2.08k | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapIN4wide7integerILm128EjEEPc9HashCRC32IS9_EEEEEEvS2_ENKUlS2_E_clISA_EEDaS2_ Line | Count | Source | 411 | 13.9k | data.for_each_mapped([&](auto& mapped) { | 412 | 13.9k | if (mapped) { | 413 | 13.9k | _destroy_agg_status(mapped); | 414 | 13.9k | mapped = nullptr; | 415 | 13.9k | } | 416 | 13.9k | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapINS_7UInt104EPc9HashCRC32IS7_EEEEEEvS2_ENKUlS2_E_clIS8_EEDaS2_ Line | Count | Source | 411 | 545 | data.for_each_mapped([&](auto& mapped) { | 412 | 545 | if (mapped) { | 413 | 545 | _destroy_agg_status(mapped); | 414 | 545 | mapped = nullptr; | 415 | 545 | } | 416 | 545 | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapINS_6UInt96EPc9HashCRC32IS7_EEEEEEvS2_ENKUlS2_E_clIS8_EEDaS2_ Line | Count | Source | 411 | 7.70k | data.for_each_mapped([&](auto& mapped) { | 412 | 7.70k | if (mapped) { | 413 | 7.70k | _destroy_agg_status(mapped); | 414 | 7.70k | mapped = nullptr; | 415 | 7.70k | } | 416 | 7.70k | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapINS_6UInt72EPc9HashCRC32IS7_EEEEEEvS2_ENKUlS2_E_clIS8_EEDaS2_ Line | Count | Source | 411 | 745 | data.for_each_mapped([&](auto& mapped) { | 412 | 745 | if (mapped) { | 413 | 745 | _destroy_agg_status(mapped); | 414 | 745 | mapped = nullptr; | 415 | 745 | } | 416 | 745 | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapImPc9HashCRC32ImEEEEEEvS2_ENKUlS2_E_clIS7_EEDaS2_ Line | Count | Source | 411 | 111k | data.for_each_mapped([&](auto& mapped) { | 412 | 111k | if (mapped) { | 413 | 111k | _destroy_agg_status(mapped); | 414 | 111k | mapped = nullptr; | 415 | 111k | } | 416 | 111k | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_19MethodStringNoCacheINS_15DataWithNullKeyINS_13StringHashMapIPcNS_9AllocatorILb1ELb1ELb0ENS_22DefaultMemoryAllocatorELb1EEEEEEEEEEEEEvS2_ENKUlS2_E_clIS9_EEDaS2_ Line | Count | Source | 411 | 3.58k | data.for_each_mapped([&](auto& mapped) { | 412 | 3.58k | if (mapped) { | 413 | 3.58k | _destroy_agg_status(mapped); | 414 | 3.58k | mapped = nullptr; | 415 | 3.58k | } | 416 | 3.58k | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIN4wide7integerILm256EjEENS_15DataWithNullKeyI9PHHashMapIS9_Pc9HashCRC32IS9_EEEEEEEEEEvS2_ENKUlS2_E_clISC_EEDaS2_ Line | Count | Source | 411 | 9 | data.for_each_mapped([&](auto& mapped) { | 412 | 9 | if (mapped) { | 413 | 9 | _destroy_agg_status(mapped); | 414 | 9 | mapped = nullptr; | 415 | 9 | } | 416 | 9 | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIN4wide7integerILm128EjEENS_15DataWithNullKeyI9PHHashMapIS9_Pc9HashCRC32IS9_EEEEEEEEEEvS2_ENKUlS2_E_clISC_EEDaS2_ Line | Count | Source | 411 | 328 | data.for_each_mapped([&](auto& mapped) { | 412 | 328 | if (mapped) { | 413 | 328 | _destroy_agg_status(mapped); | 414 | 328 | mapped = nullptr; | 415 | 328 | } | 416 | 328 | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberImNS_15DataWithNullKeyI9PHHashMapImPc14HashMixWrapperIm9HashCRC32ImEEEEEEEEEEEvS2_ENKUlS2_E_clIS9_EEDaS2_ Line | Count | Source | 411 | 143k | data.for_each_mapped([&](auto& mapped) { | 412 | 143k | if (mapped) { | 413 | 143k | _destroy_agg_status(mapped); | 414 | 143k | mapped = nullptr; | 415 | 143k | } | 416 | 143k | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIjNS_15DataWithNullKeyI9PHHashMapIjPc14HashMixWrapperIj9HashCRC32IjEEEEEEEEEEEvS2_ENKUlS2_E_clIS9_EEDaS2_ Line | Count | Source | 411 | 147k | data.for_each_mapped([&](auto& mapped) { | 412 | 147k | if (mapped) { | 413 | 147k | _destroy_agg_status(mapped); | 414 | 147k | mapped = nullptr; | 415 | 147k | } | 416 | 147k | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberImNS_15DataWithNullKeyI9PHHashMapImPc9HashCRC32ImEEEEEEEEEEvS2_ENKUlS2_E_clIS9_EEDaS2_ Line | Count | Source | 411 | 347 | data.for_each_mapped([&](auto& mapped) { | 412 | 347 | if (mapped) { | 413 | 347 | _destroy_agg_status(mapped); | 414 | 347 | mapped = nullptr; | 415 | 347 | } | 416 | 347 | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIjNS_15DataWithNullKeyI9PHHashMapIjPc9HashCRC32IjEEEEEEEEEEvS2_ENKUlS2_E_clIS9_EEDaS2_ Line | Count | Source | 411 | 529 | data.for_each_mapped([&](auto& mapped) { | 412 | 529 | if (mapped) { | 413 | 529 | _destroy_agg_status(mapped); | 414 | 529 | mapped = nullptr; | 415 | 529 | } | 416 | 529 | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberItNS_15DataWithNullKeyI9PHHashMapItPc9HashCRC32ItEEEEEEEEEEvS2_ENKUlS2_E_clIS9_EEDaS2_ Line | Count | Source | 411 | 931 | data.for_each_mapped([&](auto& mapped) { | 412 | 931 | if (mapped) { | 413 | 931 | _destroy_agg_status(mapped); | 414 | 931 | mapped = nullptr; | 415 | 931 | } | 416 | 931 | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIhNS_15DataWithNullKeyI9PHHashMapIhPc9HashCRC32IhEEEEEEEEEEvS2_ENKUlS2_E_clIS9_EEDaS2_ Line | Count | Source | 411 | 2.41k | data.for_each_mapped([&](auto& mapped) { | 412 | 2.41k | if (mapped) { | 413 | 2.41k | _destroy_agg_status(mapped); | 414 | 2.41k | mapped = nullptr; | 415 | 2.41k | } | 416 | 2.41k | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodOneNumberIm9PHHashMapImPc14HashMixWrapperIm9HashCRC32ImEEEEEEEvS2_ENKUlS2_E_clIS7_EEDaS2_ Line | Count | Source | 411 | 55.8k | data.for_each_mapped([&](auto& mapped) { | 412 | 55.8k | if (mapped) { | 413 | 55.8k | _destroy_agg_status(mapped); | 414 | 55.8k | mapped = nullptr; | 415 | 55.8k | } | 416 | 55.8k | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodOneNumberIj9PHHashMapIjPc14HashMixWrapperIj9HashCRC32IjEEEEEEEvS2_ENKUlS2_E_clIS7_EEDaS2_ Line | Count | Source | 411 | 687k | data.for_each_mapped([&](auto& mapped) { | 412 | 688k | if (mapped) { | 413 | 688k | _destroy_agg_status(mapped); | 414 | 688k | mapped = nullptr; | 415 | 688k | } | 416 | 687k | }); |
Unexecuted instantiation: _ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodOneNumberIN4wide7integerILm256EjEE9PHHashMapIS8_Pc9HashCRC32IS8_EEEEEEvS2_ENKUlS2_E_clISA_EEDaS2_ _ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodOneNumberIN4wide7integerILm128EjEE9PHHashMapIS8_Pc9HashCRC32IS8_EEEEEEvS2_ENKUlS2_E_clISA_EEDaS2_ Line | Count | Source | 411 | 172 | data.for_each_mapped([&](auto& mapped) { | 412 | 172 | if (mapped) { | 413 | 172 | _destroy_agg_status(mapped); | 414 | 172 | mapped = nullptr; | 415 | 172 | } | 416 | 172 | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_19MethodStringNoCacheINS_13StringHashMapIPcNS_9AllocatorILb1ELb1ELb0ENS_22DefaultMemoryAllocatorELb1EEEEEEEEEvS2_ENKUlS2_E_clIS7_EEDaS2_ Line | Count | Source | 411 | 1.15k | data.for_each_mapped([&](auto& mapped) { | 412 | 1.15k | if (mapped) { | 413 | 1.15k | _destroy_agg_status(mapped); | 414 | 1.15k | mapped = nullptr; | 415 | 1.15k | } | 416 | 1.15k | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodOneNumberIm9PHHashMapImPc9HashCRC32ImEEEEEEvS2_ENKUlS2_E_clIS7_EEDaS2_ Line | Count | Source | 411 | 179 | data.for_each_mapped([&](auto& mapped) { | 412 | 179 | if (mapped) { | 413 | 179 | _destroy_agg_status(mapped); | 414 | 179 | mapped = nullptr; | 415 | 179 | } | 416 | 179 | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodOneNumberIj9PHHashMapIjPc9HashCRC32IjEEEEEEvS2_ENKUlS2_E_clIS7_EEDaS2_ Line | Count | Source | 411 | 28.8k | data.for_each_mapped([&](auto& mapped) { | 412 | 28.8k | if (mapped) { | 413 | 28.8k | _destroy_agg_status(mapped); | 414 | 28.8k | mapped = nullptr; | 415 | 28.8k | } | 416 | 28.8k | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodOneNumberIt9PHHashMapItPc9HashCRC32ItEEEEEEvS2_ENKUlS2_E_clIS7_EEDaS2_ Line | Count | Source | 411 | 27 | data.for_each_mapped([&](auto& mapped) { | 412 | 27 | if (mapped) { | 413 | 27 | _destroy_agg_status(mapped); | 414 | 27 | mapped = nullptr; | 415 | 27 | } | 416 | 27 | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodOneNumberIh9PHHashMapIhPc9HashCRC32IhEEEEEEvS2_ENKUlS2_E_clIS7_EEDaS2_ Line | Count | Source | 411 | 703 | data.for_each_mapped([&](auto& mapped) { | 412 | 704 | if (mapped) { | 413 | 704 | _destroy_agg_status(mapped); | 414 | 704 | mapped = nullptr; | 415 | 704 | } | 416 | 703 | }); |
_ZZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_16MethodSerializedI9PHHashMapINS_9StringRefEPc11DefaultHashIS7_vEEEEEEvS2_ENKUlS2_E_clIS8_EEDaS2_ Line | Count | Source | 411 | 74.6k | data.for_each_mapped([&](auto& mapped) { | 412 | 74.6k | if (mapped) { | 413 | 74.6k | _destroy_agg_status(mapped); | 414 | 74.6k | mapped = nullptr; | 415 | 74.6k | } | 416 | 74.6k | }); |
|
417 | 40.8k | if (data.has_null_key_data()) { |
418 | 1.18k | _destroy_agg_status( |
419 | 1.18k | data.template get_null_key_data<AggregateDataPtr>()); |
420 | 1.18k | } |
421 | 40.8k | }}, _ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapIN4wide7integerILm256EjEEPc9HashCRC32IS9_EEEEEEvS2_ Line | Count | Source | 404 | 3.13k | [&](auto& agg_method) -> void { | 405 | 3.13k | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 22 | return; | 409 | 22 | } | 410 | 3.11k | auto& data = *agg_method.hash_table; | 411 | 3.11k | data.for_each_mapped([&](auto& mapped) { | 412 | 3.11k | if (mapped) { | 413 | 3.11k | _destroy_agg_status(mapped); | 414 | 3.11k | mapped = nullptr; | 415 | 3.11k | } | 416 | 3.11k | }); | 417 | 3.11k | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 3.11k | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapINS_7UInt136EPc9HashCRC32IS7_EEEEEEvS2_ Line | Count | Source | 404 | 1.59k | [&](auto& agg_method) -> void { | 405 | 1.59k | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 63 | return; | 409 | 63 | } | 410 | 1.53k | auto& data = *agg_method.hash_table; | 411 | 1.53k | data.for_each_mapped([&](auto& mapped) { | 412 | 1.53k | if (mapped) { | 413 | 1.53k | _destroy_agg_status(mapped); | 414 | 1.53k | mapped = nullptr; | 415 | 1.53k | } | 416 | 1.53k | }); | 417 | 1.53k | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 1.53k | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapIN4wide7integerILm128EjEEPc9HashCRC32IS9_EEEEEEvS2_ Line | Count | Source | 404 | 101 | [&](auto& agg_method) -> void { | 405 | 101 | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 20 | return; | 409 | 20 | } | 410 | 81 | auto& data = *agg_method.hash_table; | 411 | 81 | data.for_each_mapped([&](auto& mapped) { | 412 | 81 | if (mapped) { | 413 | 81 | _destroy_agg_status(mapped); | 414 | 81 | mapped = nullptr; | 415 | 81 | } | 416 | 81 | }); | 417 | 81 | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 81 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapINS_7UInt104EPc9HashCRC32IS7_EEEEEEvS2_ Line | Count | Source | 404 | 597 | [&](auto& agg_method) -> void { | 405 | 597 | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 13 | return; | 409 | 13 | } | 410 | 584 | auto& data = *agg_method.hash_table; | 411 | 584 | data.for_each_mapped([&](auto& mapped) { | 412 | 584 | if (mapped) { | 413 | 584 | _destroy_agg_status(mapped); | 414 | 584 | mapped = nullptr; | 415 | 584 | } | 416 | 584 | }); | 417 | 584 | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 584 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapINS_6UInt96EPc9HashCRC32IS7_EEEEEEvS2_ Line | Count | Source | 404 | 618 | [&](auto& agg_method) -> void { | 405 | 618 | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 0 | return; | 409 | 0 | } | 410 | 618 | auto& data = *agg_method.hash_table; | 411 | 618 | data.for_each_mapped([&](auto& mapped) { | 412 | 618 | if (mapped) { | 413 | 618 | _destroy_agg_status(mapped); | 414 | 618 | mapped = nullptr; | 415 | 618 | } | 416 | 618 | }); | 417 | 618 | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 618 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapINS_6UInt72EPc9HashCRC32IS7_EEEEEEvS2_ Line | Count | Source | 404 | 917 | [&](auto& agg_method) -> void { | 405 | 917 | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 97 | return; | 409 | 97 | } | 410 | 820 | auto& data = *agg_method.hash_table; | 411 | 820 | data.for_each_mapped([&](auto& mapped) { | 412 | 820 | if (mapped) { | 413 | 820 | _destroy_agg_status(mapped); | 414 | 820 | mapped = nullptr; | 415 | 820 | } | 416 | 820 | }); | 417 | 820 | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 820 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapImPc9HashCRC32ImEEEEEEvS2_ Line | Count | Source | 404 | 1.03k | [&](auto& agg_method) -> void { | 405 | 1.03k | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 64 | return; | 409 | 64 | } | 410 | 973 | auto& data = *agg_method.hash_table; | 411 | 973 | data.for_each_mapped([&](auto& mapped) { | 412 | 973 | if (mapped) { | 413 | 973 | _destroy_agg_status(mapped); | 414 | 973 | mapped = nullptr; | 415 | 973 | } | 416 | 973 | }); | 417 | 973 | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 973 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_19MethodStringNoCacheINS_15DataWithNullKeyINS_13StringHashMapIPcNS_9AllocatorILb1ELb1ELb0ENS_22DefaultMemoryAllocatorELb1EEEEEEEEEEEEEvS2_ Line | Count | Source | 404 | 2.84k | [&](auto& agg_method) -> void { | 405 | 2.84k | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 643 | return; | 409 | 643 | } | 410 | 2.20k | auto& data = *agg_method.hash_table; | 411 | 2.20k | data.for_each_mapped([&](auto& mapped) { | 412 | 2.20k | if (mapped) { | 413 | 2.20k | _destroy_agg_status(mapped); | 414 | 2.20k | mapped = nullptr; | 415 | 2.20k | } | 416 | 2.20k | }); | 417 | 2.20k | if (data.has_null_key_data()) { | 418 | 53 | _destroy_agg_status( | 419 | 53 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 53 | } | 421 | 2.20k | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIN4wide7integerILm256EjEENS_15DataWithNullKeyI9PHHashMapIS9_Pc9HashCRC32IS9_EEEEEEEEEEvS2_ Line | Count | Source | 404 | 10 | [&](auto& agg_method) -> void { | 405 | 10 | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 0 | return; | 409 | 0 | } | 410 | 10 | auto& data = *agg_method.hash_table; | 411 | 10 | data.for_each_mapped([&](auto& mapped) { | 412 | 10 | if (mapped) { | 413 | 10 | _destroy_agg_status(mapped); | 414 | 10 | mapped = nullptr; | 415 | 10 | } | 416 | 10 | }); | 417 | 10 | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 10 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIN4wide7integerILm128EjEENS_15DataWithNullKeyI9PHHashMapIS9_Pc9HashCRC32IS9_EEEEEEEEEEvS2_ Line | Count | Source | 404 | 414 | [&](auto& agg_method) -> void { | 405 | 414 | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 18 | return; | 409 | 18 | } | 410 | 396 | auto& data = *agg_method.hash_table; | 411 | 396 | data.for_each_mapped([&](auto& mapped) { | 412 | 396 | if (mapped) { | 413 | 396 | _destroy_agg_status(mapped); | 414 | 396 | mapped = nullptr; | 415 | 396 | } | 416 | 396 | }); | 417 | 396 | if (data.has_null_key_data()) { | 418 | 5 | _destroy_agg_status( | 419 | 5 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 5 | } | 421 | 396 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberImNS_15DataWithNullKeyI9PHHashMapImPc14HashMixWrapperIm9HashCRC32ImEEEEEEEEEEEvS2_ Line | Count | Source | 404 | 4.68k | [&](auto& agg_method) -> void { | 405 | 4.68k | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 630 | return; | 409 | 630 | } | 410 | 4.05k | auto& data = *agg_method.hash_table; | 411 | 4.05k | data.for_each_mapped([&](auto& mapped) { | 412 | 4.05k | if (mapped) { | 413 | 4.05k | _destroy_agg_status(mapped); | 414 | 4.05k | mapped = nullptr; | 415 | 4.05k | } | 416 | 4.05k | }); | 417 | 4.05k | if (data.has_null_key_data()) { | 418 | 152 | _destroy_agg_status( | 419 | 152 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 152 | } | 421 | 4.05k | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIjNS_15DataWithNullKeyI9PHHashMapIjPc14HashMixWrapperIj9HashCRC32IjEEEEEEEEEEEvS2_ Line | Count | Source | 404 | 11.4k | [&](auto& agg_method) -> void { | 405 | 11.4k | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 824 | return; | 409 | 824 | } | 410 | 10.5k | auto& data = *agg_method.hash_table; | 411 | 10.5k | data.for_each_mapped([&](auto& mapped) { | 412 | 10.5k | if (mapped) { | 413 | 10.5k | _destroy_agg_status(mapped); | 414 | 10.5k | mapped = nullptr; | 415 | 10.5k | } | 416 | 10.5k | }); | 417 | 10.5k | if (data.has_null_key_data()) { | 418 | 419 | _destroy_agg_status( | 419 | 419 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 419 | } | 421 | 10.5k | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberImNS_15DataWithNullKeyI9PHHashMapImPc9HashCRC32ImEEEEEEEEEEvS2_ Line | Count | Source | 404 | 255 | [&](auto& agg_method) -> void { | 405 | 255 | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 8 | return; | 409 | 8 | } | 410 | 247 | auto& data = *agg_method.hash_table; | 411 | 247 | data.for_each_mapped([&](auto& mapped) { | 412 | 247 | if (mapped) { | 413 | 247 | _destroy_agg_status(mapped); | 414 | 247 | mapped = nullptr; | 415 | 247 | } | 416 | 247 | }); | 417 | 247 | if (data.has_null_key_data()) { | 418 | 33 | _destroy_agg_status( | 419 | 33 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 33 | } | 421 | 247 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIjNS_15DataWithNullKeyI9PHHashMapIjPc9HashCRC32IjEEEEEEEEEEvS2_ Line | Count | Source | 404 | 912 | [&](auto& agg_method) -> void { | 405 | 912 | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 64 | return; | 409 | 64 | } | 410 | 848 | auto& data = *agg_method.hash_table; | 411 | 848 | data.for_each_mapped([&](auto& mapped) { | 412 | 848 | if (mapped) { | 413 | 848 | _destroy_agg_status(mapped); | 414 | 848 | mapped = nullptr; | 415 | 848 | } | 416 | 848 | }); | 417 | 848 | if (data.has_null_key_data()) { | 418 | 11 | _destroy_agg_status( | 419 | 11 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 11 | } | 421 | 848 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberItNS_15DataWithNullKeyI9PHHashMapItPc9HashCRC32ItEEEEEEEEEEvS2_ Line | Count | Source | 404 | 365 | [&](auto& agg_method) -> void { | 405 | 365 | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 7 | return; | 409 | 7 | } | 410 | 358 | auto& data = *agg_method.hash_table; | 411 | 358 | data.for_each_mapped([&](auto& mapped) { | 412 | 358 | if (mapped) { | 413 | 358 | _destroy_agg_status(mapped); | 414 | 358 | mapped = nullptr; | 415 | 358 | } | 416 | 358 | }); | 417 | 358 | if (data.has_null_key_data()) { | 418 | 12 | _destroy_agg_status( | 419 | 12 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 12 | } | 421 | 358 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIhNS_15DataWithNullKeyI9PHHashMapIhPc9HashCRC32IhEEEEEEEEEEvS2_ Line | Count | Source | 404 | 2.41k | [&](auto& agg_method) -> void { | 405 | 2.41k | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 300 | return; | 409 | 300 | } | 410 | 2.11k | auto& data = *agg_method.hash_table; | 411 | 2.11k | data.for_each_mapped([&](auto& mapped) { | 412 | 2.11k | if (mapped) { | 413 | 2.11k | _destroy_agg_status(mapped); | 414 | 2.11k | mapped = nullptr; | 415 | 2.11k | } | 416 | 2.11k | }); | 417 | 2.11k | if (data.has_null_key_data()) { | 418 | 502 | _destroy_agg_status( | 419 | 502 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 502 | } | 421 | 2.11k | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodOneNumberIm9PHHashMapImPc14HashMixWrapperIm9HashCRC32ImEEEEEEEvS2_ Line | Count | Source | 404 | 732 | [&](auto& agg_method) -> void { | 405 | 732 | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 153 | return; | 409 | 153 | } | 410 | 579 | auto& data = *agg_method.hash_table; | 411 | 579 | data.for_each_mapped([&](auto& mapped) { | 412 | 579 | if (mapped) { | 413 | 579 | _destroy_agg_status(mapped); | 414 | 579 | mapped = nullptr; | 415 | 579 | } | 416 | 579 | }); | 417 | 579 | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 579 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodOneNumberIj9PHHashMapIjPc14HashMixWrapperIj9HashCRC32IjEEEEEEEvS2_ Line | Count | Source | 404 | 5.01k | [&](auto& agg_method) -> void { | 405 | 5.01k | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 186 | return; | 409 | 186 | } | 410 | 4.82k | auto& data = *agg_method.hash_table; | 411 | 4.82k | data.for_each_mapped([&](auto& mapped) { | 412 | 4.82k | if (mapped) { | 413 | 4.82k | _destroy_agg_status(mapped); | 414 | 4.82k | mapped = nullptr; | 415 | 4.82k | } | 416 | 4.82k | }); | 417 | 4.82k | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 4.82k | }}, |
Unexecuted instantiation: _ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodOneNumberIN4wide7integerILm256EjEE9PHHashMapIS8_Pc9HashCRC32IS8_EEEEEEvS2_ _ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodOneNumberIN4wide7integerILm128EjEE9PHHashMapIS8_Pc9HashCRC32IS8_EEEEEEvS2_ Line | Count | Source | 404 | 185 | [&](auto& agg_method) -> void { | 405 | 185 | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 17 | return; | 409 | 17 | } | 410 | 168 | auto& data = *agg_method.hash_table; | 411 | 168 | data.for_each_mapped([&](auto& mapped) { | 412 | 168 | if (mapped) { | 413 | 168 | _destroy_agg_status(mapped); | 414 | 168 | mapped = nullptr; | 415 | 168 | } | 416 | 168 | }); | 417 | 168 | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 168 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_19MethodStringNoCacheINS_13StringHashMapIPcNS_9AllocatorILb1ELb1ELb0ENS_22DefaultMemoryAllocatorELb1EEEEEEEEEvS2_ Line | Count | Source | 404 | 495 | [&](auto& agg_method) -> void { | 405 | 495 | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 112 | return; | 409 | 112 | } | 410 | 383 | auto& data = *agg_method.hash_table; | 411 | 383 | data.for_each_mapped([&](auto& mapped) { | 412 | 383 | if (mapped) { | 413 | 383 | _destroy_agg_status(mapped); | 414 | 383 | mapped = nullptr; | 415 | 383 | } | 416 | 383 | }); | 417 | 383 | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 383 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodOneNumberIm9PHHashMapImPc9HashCRC32ImEEEEEEvS2_ Line | Count | Source | 404 | 119 | [&](auto& agg_method) -> void { | 405 | 119 | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 24 | return; | 409 | 24 | } | 410 | 95 | auto& data = *agg_method.hash_table; | 411 | 95 | data.for_each_mapped([&](auto& mapped) { | 412 | 95 | if (mapped) { | 413 | 95 | _destroy_agg_status(mapped); | 414 | 95 | mapped = nullptr; | 415 | 95 | } | 416 | 95 | }); | 417 | 95 | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 95 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodOneNumberIj9PHHashMapIjPc9HashCRC32IjEEEEEEvS2_ Line | Count | Source | 404 | 261 | [&](auto& agg_method) -> void { | 405 | 261 | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 15 | return; | 409 | 15 | } | 410 | 246 | auto& data = *agg_method.hash_table; | 411 | 246 | data.for_each_mapped([&](auto& mapped) { | 412 | 246 | if (mapped) { | 413 | 246 | _destroy_agg_status(mapped); | 414 | 246 | mapped = nullptr; | 415 | 246 | } | 416 | 246 | }); | 417 | 246 | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 246 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodOneNumberIt9PHHashMapItPc9HashCRC32ItEEEEEEvS2_ Line | Count | Source | 404 | 25 | [&](auto& agg_method) -> void { | 405 | 25 | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 0 | return; | 409 | 0 | } | 410 | 25 | auto& data = *agg_method.hash_table; | 411 | 25 | data.for_each_mapped([&](auto& mapped) { | 412 | 25 | if (mapped) { | 413 | 25 | _destroy_agg_status(mapped); | 414 | 25 | mapped = nullptr; | 415 | 25 | } | 416 | 25 | }); | 417 | 25 | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 25 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_15MethodOneNumberIh9PHHashMapIhPc9HashCRC32IhEEEEEEvS2_ Line | Count | Source | 404 | 499 | [&](auto& agg_method) -> void { | 405 | 499 | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 9 | return; | 409 | 9 | } | 410 | 490 | auto& data = *agg_method.hash_table; | 411 | 490 | data.for_each_mapped([&](auto& mapped) { | 412 | 490 | if (mapped) { | 413 | 490 | _destroy_agg_status(mapped); | 414 | 490 | mapped = nullptr; | 415 | 490 | } | 416 | 490 | }); | 417 | 490 | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 490 | }}, |
_ZZN5doris14AggSharedState26_close_with_serialized_keyEvENKUlRT_E_clINS_16MethodSerializedI9PHHashMapINS_9StringRefEPc11DefaultHashIS7_vEEEEEEvS2_ Line | Count | Source | 404 | 5.91k | [&](auto& agg_method) -> void { | 405 | 5.91k | if (use_simple_count) { | 406 | | // Inline count: mapped slots hold UInt64, | 407 | | // not real agg state pointers. Skip destroy. | 408 | 423 | return; | 409 | 423 | } | 410 | 5.49k | auto& data = *agg_method.hash_table; | 411 | 5.49k | data.for_each_mapped([&](auto& mapped) { | 412 | 5.49k | if (mapped) { | 413 | 5.49k | _destroy_agg_status(mapped); | 414 | 5.49k | mapped = nullptr; | 415 | 5.49k | } | 416 | 5.49k | }); | 417 | 5.49k | if (data.has_null_key_data()) { | 418 | 0 | _destroy_agg_status( | 419 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 420 | 0 | } | 421 | 5.49k | }}, |
|
422 | 44.5k | agg_data->method_variant); |
423 | 44.5k | } |
424 | | |
425 | 102k | void _close_without_key() {
426 | | // Destroys the without-key aggregate state, but only if it was actually created.
427 | | // Prepare may have failed before the agg data was created, yet close is still called
428 | | // to destroy it; destroying uninitialized state (e.g. one holding a bitmapValue) would core dump.
429 | 102k | if (agg_data_created_without_key) {
430 | 102k | _destroy_agg_status(agg_data->without_key);
431 | 102k | agg_data_created_without_key = false; // so a repeated call does not destroy it again
432 | 102k | }
433 | 102k | }
434 | | void _destroy_agg_status(AggregateDataPtr data); |
435 | | }; |
436 | | |
437 | | static constexpr int BUCKETED_AGG_NUM_BUCKETS = 256; // bucket count: sizes PerInstanceData::bucket_agg_data and bucket_states
438 | | |
439 | | /// Shared state for BucketedAggSinkOperatorX / BucketedAggSourceOperatorX. |
440 | | /// |
441 | | /// Each sink pipeline instance owns 256 per-bucket hash tables (two-level hash table |
442 | | /// approach, inspired by ClickHouse). During sink, each row is routed to bucket |
443 | | /// (hash >> 24) & 0xFF. |
444 | | /// |
445 | | /// Source-side merge is pipelined with sink completion: as each sink instance finishes, |
446 | | /// it unblocks all source dependencies. Source instances scan buckets and merge data |
447 | | /// from finished sink instances into the merge target (the first sink to finish). |
448 | | /// Each bucket has a CAS lock so only one source works on a bucket at a time. |
449 | | /// After all sinks finish and all buckets are merged + output, one source handles |
450 | | /// null key merge and the pipeline completes. |
451 | | /// |
452 | | /// Thread safety model: |
453 | | /// - Sink phase: each instance writes only to its own per_instance_data[task_idx]. No locking. |
454 | | /// - Source phase: per-bucket CAS lock (merge_in_progress). Under the lock, a source |
455 | | /// scans all finished sink instances and merges their bucket data into the merge |
456 | | /// target's bucket. Already-merged entries are nulled out to prevent re-processing. |
457 | | /// Output is only done when all sinks have finished and the bucket is fully merged. |
458 | | struct BucketedAggSharedState : public BasicSharedState { |
459 | | ENABLE_FACTORY_CREATOR(BucketedAggSharedState) |
460 | | public: |
461 | 64 | BucketedAggSharedState() = default;
462 | 64 | ~BucketedAggSharedState() override { _close(); } // _close() walks every instance's bucket hash tables
463 | | |
464 | | /// Per-instance data. One per sink pipeline instance. |
465 | | /// Each instance has 256 bucket hash tables + 1 shared arena. |
466 | | struct PerInstanceData {
467 | | /// 256 per-bucket hash tables. Each bucket has its own BucketedAggDataVariants.
468 | | /// Uses PHHashMap<StringRef> for string keys instead of StringHashMap.
469 | | std::vector<BucketedAggDataVariantsUPtr> bucket_agg_data;
470 | | ArenaUPtr arena; // one Arena per instance, created in the constructor
471 | |
472 | 401 | PerInstanceData() : arena(std::make_unique<Arena>()) { // eagerly builds all buckets
473 | 401 | bucket_agg_data.resize(BUCKETED_AGG_NUM_BUCKETS);
474 | 102k | for (auto& p : bucket_agg_data) {
475 | 102k | p = std::make_unique<BucketedAggDataVariants>(); // default-constructed variant per bucket
476 | 102k | }
477 | 401 | }
478 | | };
479 | | |
480 | | /// Per-bucket merge state for pipelined source-side processing. |
481 | | struct BucketMergeState { // one entry per bucket; held in bucket_states
482 | | /// CAS lock: only one source instance can merge/output this bucket at a time.
483 | | std::atomic<bool> merge_in_progress {false};
484 | | /// Set to true once the bucket is fully merged and all rows have been output.
485 | | std::atomic<bool> output_done {false};
486 | | /// Tracks which sink instances have been merged into the merge target
487 | | /// for this bucket. Accessed only under merge_in_progress CAS lock.
488 | | /// Element i is true when instance i's data for this bucket has been merged.
489 | | /// Sized to num_sink_instances in init_instances().
490 | | std::vector<bool> merged_instances;
491 | | };
492 | | |
493 | | std::vector<PerInstanceData> per_instance_data; // resized to num_instances in init_instances()
494 | | int num_sink_instances = 0; // assigned once, inside init_instances()
495 | | |
496 | | /// Tracks how many sinks have finished. Incremented by each sink on EOS. |
497 | | std::atomic<int> num_sinks_finished = 0; |
498 | | |
499 | | /// Per-sink completion flags. Set to true when each sink instance finishes. |
500 | | /// Source instances read these to know which sinks' data is safe to merge. |
501 | | std::unique_ptr<std::atomic<bool>[]> sink_finished; |
502 | | |
503 | | /// Index of the first sink instance to finish. Its bucket hash tables serve |
504 | | /// as the merge target — all other sinks' data is merged into it. |
505 | | /// Initialized to -1; the first sink to finish CAS-sets it to its instance idx. |
506 | | std::atomic<int> merge_target_instance = -1; |
507 | | |
508 | | /// Per-bucket merge state. Indexed by bucket id [0, 256). |
509 | | std::array<BucketMergeState, BUCKETED_AGG_NUM_BUCKETS> bucket_states; |
510 | | |
511 | | // Aggregate function metadata (shared, read-only after init). |
512 | | std::vector<AggFnEvaluator*> aggregate_evaluators; |
513 | | VExprContextSPtrs probe_expr_ctxs; |
514 | | size_t total_size_of_aggregate_states = 0; |
515 | | size_t align_aggregate_states = 1; |
516 | | Sizes offsets_of_aggregate_states; |
517 | | std::vector<size_t> make_nullable_keys; |
518 | | |
519 | | std::atomic<size_t> input_num_rows {0}; |
520 | | |
521 | | /// When true, the aggregate has exactly one COUNT(*) function with no args. |
522 | | /// In this case, mapped values in the hash table store a UInt64 counter |
523 | | /// directly (reinterpret_cast<AggregateDataPtr>) instead of a pointer to |
524 | | /// allocated aggregate state. This eliminates create/merge/destroy overhead. |
525 | | bool use_simple_count = false; |
526 | | |
527 | | // ---- Source-side fields ---- |
528 | | |
529 | | // Null key handling: null keys are stored separately (not in any bucket). |
530 | | // After all buckets are processed, one source instance merges and outputs |
531 | | // all null key data. This atomic ensures exactly one source instance does it. |
532 | | std::atomic<bool> null_key_output_claimed {false}; |
533 | | |
534 | | /// Monotonically increasing counter bumped on every state change (bucket lock |
535 | | /// release, sink finish). Used by source instances to detect missed wakeups: |
536 | | /// if the generation changed between scan start and post-block() re-check, |
537 | | /// something happened and the source should unblock immediately. |
538 | | std::atomic<uint64_t> state_generation {0}; |
539 | | |
540 | | /// Initialize per-instance data and optionally run a metadata init callback. |
541 | | /// The callback runs exactly once (under std::call_once), must return Status, |
542 | | /// and should populate shared metadata like probe_expr_ctxs, aggregate_evaluators, etc. |
543 | | /// All threads observe the same init status via _init_status. |
544 | | template <typename Func>
545 | 401 | Status init_instances(int num_instances, Func&& metadata_init) {
546 | 401 | std::call_once(_init_once, [&]() { // body runs for the first caller only
547 | 64 | num_sink_instances = num_instances; // first caller's value wins; later callers' num_instances is ignored
548 | 64 | per_instance_data.resize(num_instances);
549 | 64 | sink_finished = std::make_unique<std::atomic<bool>[]>(num_instances);
550 | 465 | for (int i = 0; i < num_instances; ++i) {
551 | 401 | sink_finished[i].store(false, std::memory_order_relaxed);
552 | 401 | }
553 | 16.3k | for (auto& bs : bucket_states) {
554 | 16.3k | bs.merged_instances.resize(num_instances, false); // nothing merged yet
555 | 16.3k | }
556 | 64 | _init_status = std::forward<Func>(metadata_init)(); // cached for every caller
557 | 64 | });
558 | 401 | return _init_status; // same status for the first and all later callers
559 | 401 | }
560 | | |
561 | | private: |
562 | | std::once_flag _init_once; // guards the one-time body of init_instances()
563 | | Status _init_status; // result of the metadata_init callback; returned by every init_instances() call
564 | | |
565 | 64 | void _close() { // called from the destructor
566 | 401 | for (auto& inst : per_instance_data) {
567 | 102k | for (auto& bucket_data : inst.bucket_agg_data) {
568 | 102k | _close_one_agg_data(*bucket_data); // every bucket of every sink instance
569 | 102k | }
570 | 401 | }
571 | 64 | }
572 | | |
573 | 102k | void _close_one_agg_data(BucketedAggDataVariants& agg_data) { |
574 | 102k | std::visit( |
575 | 102k | Overload {[&](std::monostate& arg) -> void { |
576 | | // Do nothing |
577 | 0 | }, |
578 | 102k | [&](auto& agg_method) -> void { |
579 | 102k | if (use_simple_count) { |
580 | | // simple_count: mapped slots hold UInt64 counters, |
581 | | // not real agg state pointers. Skip destroy. |
582 | 8.70k | return; |
583 | 8.70k | } |
584 | 93.9k | auto& data = *agg_method.hash_table; |
585 | 93.9k | data.for_each_mapped([&](auto& mapped) { |
586 | 52.2k | if (mapped) { |
587 | 30.9k | _destroy_agg_status(mapped); |
588 | 30.9k | mapped = nullptr; |
589 | 30.9k | } |
590 | 52.2k | }); _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapIN4wide7integerILm256EjEEPc9HashCRC32ISB_EEEEEEvS4_ENKUlS4_E_clISC_EEDaS4_ Line | Count | Source | 585 | 69 | data.for_each_mapped([&](auto& mapped) { | 586 | 69 | if (mapped) { | 587 | 36 | _destroy_agg_status(mapped); | 588 | 36 | mapped = nullptr; | 589 | 36 | } | 590 | 69 | }); |
_ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapINS_7UInt136EPc9HashCRC32IS9_EEEEEEvS4_ENKUlS4_E_clISA_EEDaS4_ Line | Count | Source | 585 | 53 | data.for_each_mapped([&](auto& mapped) { | 586 | 53 | if (mapped) { | 587 | 28 | _destroy_agg_status(mapped); | 588 | 28 | mapped = nullptr; | 589 | 28 | } | 590 | 53 | }); |
Unexecuted instantiation: _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapIN4wide7integerILm128EjEEPc9HashCRC32ISB_EEEEEEvS4_ENKUlS4_E_clISC_EEDaS4_ Unexecuted instantiation: _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapINS_7UInt104EPc9HashCRC32IS9_EEEEEEvS4_ENKUlS4_E_clISA_EEDaS4_ Unexecuted instantiation: _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapINS_6UInt96EPc9HashCRC32IS9_EEEEEEvS4_ENKUlS4_E_clISA_EEDaS4_ Unexecuted instantiation: _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapINS_6UInt72EPc9HashCRC32IS9_EEEEEEvS4_ENKUlS4_E_clISA_EEDaS4_ Unexecuted instantiation: _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapImPc9HashCRC32ImEEEEEEvS4_ENKUlS4_E_clIS9_EEDaS4_ _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_19MethodStringNoCacheINS_15DataWithNullKeyI9PHHashMapINS_9StringRefEPc11DefaultHashISB_vEEEEEEEEEEvS4_ENKUlS4_E_clISC_EEDaS4_ Line | Count | Source | 585 | 443 | data.for_each_mapped([&](auto& mapped) { | 586 | 443 | if (mapped) { | 587 | 443 | _destroy_agg_status(mapped); | 588 | 443 | mapped = nullptr; | 589 | 443 | } | 590 | 443 | }); |
Unexecuted instantiation: _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIN4wide7integerILm256EjEENS_15DataWithNullKeyI9PHHashMapISB_Pc9HashCRC32ISB_EEEEEEEEEEvS4_ENKUlS4_E_clISE_EEDaS4_ Unexecuted instantiation: _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIN4wide7integerILm128EjEENS_15DataWithNullKeyI9PHHashMapISB_Pc9HashCRC32ISB_EEEEEEEEEEvS4_ENKUlS4_E_clISE_EEDaS4_ Unexecuted instantiation: _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberImNS_15DataWithNullKeyI9PHHashMapImPc14HashMixWrapperIm9HashCRC32ImEEEEEEEEEEEvS4_ENKUlS4_E_clISB_EEDaS4_ Unexecuted instantiation: _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIjNS_15DataWithNullKeyI9PHHashMapIjPc14HashMixWrapperIj9HashCRC32IjEEEEEEEEEEEvS4_ENKUlS4_E_clISB_EEDaS4_ _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberImNS_15DataWithNullKeyI9PHHashMapImPc9HashCRC32ImEEEEEEEEEEvS4_ENKUlS4_E_clISB_EEDaS4_ Line | Count | Source | 585 | 37 | data.for_each_mapped([&](auto& mapped) { | 586 | 37 | if (mapped) { | 587 | 20 | _destroy_agg_status(mapped); | 588 | 20 | mapped = nullptr; | 589 | 20 | } | 590 | 37 | }); |
_ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIjNS_15DataWithNullKeyI9PHHashMapIjPc9HashCRC32IjEEEEEEEEEEvS4_ENKUlS4_E_clISB_EEDaS4_ Line | Count | Source | 585 | 59 | data.for_each_mapped([&](auto& mapped) { | 586 | 59 | if (mapped) { | 587 | 32 | _destroy_agg_status(mapped); | 588 | 32 | mapped = nullptr; | 589 | 32 | } | 590 | 59 | }); |
_ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberItNS_15DataWithNullKeyI9PHHashMapItPc9HashCRC32ItEEEEEEEEEEvS4_ENKUlS4_E_clISB_EEDaS4_ Line | Count | Source | 585 | 12 | data.for_each_mapped([&](auto& mapped) { | 586 | 12 | if (mapped) { | 587 | 2 | _destroy_agg_status(mapped); | 588 | 2 | mapped = nullptr; | 589 | 2 | } | 590 | 12 | }); |
Unexecuted instantiation: _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIhNS_15DataWithNullKeyI9PHHashMapIhPc9HashCRC32IhEEEEEEEEEEvS4_ENKUlS4_E_clISB_EEDaS4_ Unexecuted instantiation: _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodOneNumberIm9PHHashMapImPc14HashMixWrapperIm9HashCRC32ImEEEEEEEvS4_ENKUlS4_E_clIS9_EEDaS4_ Unexecuted instantiation: _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodOneNumberIj9PHHashMapIjPc14HashMixWrapperIj9HashCRC32IjEEEEEEEvS4_ENKUlS4_E_clIS9_EEDaS4_ Unexecuted instantiation: _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodOneNumberIN4wide7integerILm256EjEE9PHHashMapISA_Pc9HashCRC32ISA_EEEEEEvS4_ENKUlS4_E_clISC_EEDaS4_ Unexecuted instantiation: _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodOneNumberIN4wide7integerILm128EjEE9PHHashMapISA_Pc9HashCRC32ISA_EEEEEEvS4_ENKUlS4_E_clISC_EEDaS4_ _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_19MethodStringNoCacheI9PHHashMapINS_9StringRefEPc11DefaultHashIS9_vEEEEEEvS4_ENKUlS4_E_clISA_EEDaS4_ Line | Count | Source | 585 | 125 | data.for_each_mapped([&](auto& mapped) { | 586 | 125 | if (mapped) { | 587 | 17 | _destroy_agg_status(mapped); | 588 | 17 | mapped = nullptr; | 589 | 17 | } | 590 | 125 | }); |
Unexecuted instantiation: _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodOneNumberIm9PHHashMapImPc9HashCRC32ImEEEEEEvS4_ENKUlS4_E_clIS9_EEDaS4_ _ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodOneNumberIj9PHHashMapIjPc9HashCRC32IjEEEEEEvS4_ENKUlS4_E_clIS9_EEDaS4_ Line | Count | Source | 585 | 50.0k | data.for_each_mapped([&](auto& mapped) { | 586 | 50.0k | if (mapped) { | 587 | 30.0k | _destroy_agg_status(mapped); | 588 | 30.0k | mapped = nullptr; | 589 | 30.0k | } | 590 | 50.0k | }); |
_ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodOneNumberIt9PHHashMapItPc9HashCRC32ItEEEEEEvS4_ENKUlS4_E_clIS9_EEDaS4_ Line | Count | Source | 585 | 24 | data.for_each_mapped([&](auto& mapped) { | 586 | 24 | if (mapped) { | 587 | 6 | _destroy_agg_status(mapped); | 588 | 6 | mapped = nullptr; | 589 | 6 | } | 590 | 24 | }); |
_ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodOneNumberIh9PHHashMapIhPc9HashCRC32IhEEEEEEvS4_ENKUlS4_E_clIS9_EEDaS4_ Line | Count | Source | 585 | 6 | data.for_each_mapped([&](auto& mapped) { | 586 | 6 | if (mapped) { | 587 | 2 | _destroy_agg_status(mapped); | 588 | 2 | mapped = nullptr; | 589 | 2 | } | 590 | 6 | }); |
_ZZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_16MethodSerializedI9PHHashMapINS_9StringRefEPc11DefaultHashIS9_vEEEEEEvS4_ENKUlS4_E_clISA_EEDaS4_ Line | Count | Source | 585 | 1.35k | data.for_each_mapped([&](auto& mapped) { | 586 | 1.35k | if (mapped) { | 587 | 381 | _destroy_agg_status(mapped); | 588 | 381 | mapped = nullptr; | 589 | 381 | } | 590 | 1.35k | }); |
|
591 | | if constexpr (std::is_assignable_v<decltype(data.has_null_key_data()), |
592 | 22.7k | bool>) { |
593 | 22.7k | if (data.has_null_key_data()) { |
594 | 2 | _destroy_agg_status( |
595 | 2 | data.template get_null_key_data<AggregateDataPtr>()); |
596 | 2 | } |
597 | 22.7k | } |
598 | 93.9k | }}, _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapIN4wide7integerILm256EjEEPc9HashCRC32ISB_EEEEEEvS4_ Line | Count | Source | 578 | 4.60k | [&](auto& agg_method) -> void { | 579 | 4.60k | if (use_simple_count) { | 580 | | // simple_count: mapped slots hold UInt64 counters, | 581 | | // not real agg state pointers. Skip destroy. | 582 | 0 | return; | 583 | 0 | } | 584 | 4.60k | auto& data = *agg_method.hash_table; | 585 | 4.60k | data.for_each_mapped([&](auto& mapped) { | 586 | 4.60k | if (mapped) { | 587 | 4.60k | _destroy_agg_status(mapped); | 588 | 4.60k | mapped = nullptr; | 589 | 4.60k | } | 590 | 4.60k | }); | 591 | | if constexpr (std::is_assignable_v<decltype(data.has_null_key_data()), | 592 | | bool>) { | 593 | | if (data.has_null_key_data()) { | 594 | | _destroy_agg_status( | 595 | | data.template get_null_key_data<AggregateDataPtr>()); | 596 | | } | 597 | | } | 598 | 4.60k | }}, |
_ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapINS_7UInt136EPc9HashCRC32IS9_EEEEEEvS4_ Line | Count | Source | 578 | 28.9k | [&](auto& agg_method) -> void { | 579 | 28.9k | if (use_simple_count) { | 580 | | // simple_count: mapped slots hold UInt64 counters, | 581 | | // not real agg state pointers. Skip destroy. | 582 | 0 | return; | 583 | 0 | } | 584 | 28.9k | auto& data = *agg_method.hash_table; | 585 | 28.9k | data.for_each_mapped([&](auto& mapped) { | 586 | 28.9k | if (mapped) { | 587 | 28.9k | _destroy_agg_status(mapped); | 588 | 28.9k | mapped = nullptr; | 589 | 28.9k | } | 590 | 28.9k | }); | 591 | | if constexpr (std::is_assignable_v<decltype(data.has_null_key_data()), | 592 | | bool>) { | 593 | | if (data.has_null_key_data()) { | 594 | | _destroy_agg_status( | 595 | | data.template get_null_key_data<AggregateDataPtr>()); | 596 | | } | 597 | | } | 598 | 28.9k | }}, |
Unexecuted instantiation: _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapIN4wide7integerILm128EjEEPc9HashCRC32ISB_EEEEEEvS4_ Unexecuted instantiation: _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapINS_7UInt104EPc9HashCRC32IS9_EEEEEEvS4_ _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapINS_6UInt96EPc9HashCRC32IS9_EEEEEEvS4_ Line | Count | Source | 578 | 256 | [&](auto& agg_method) -> void { | 579 | 256 | if (use_simple_count) { | 580 | | // simple_count: mapped slots hold UInt64 counters, | 581 | | // not real agg state pointers. Skip destroy. | 582 | 0 | return; | 583 | 0 | } | 584 | 256 | auto& data = *agg_method.hash_table; | 585 | 256 | data.for_each_mapped([&](auto& mapped) { | 586 | 256 | if (mapped) { | 587 | 256 | _destroy_agg_status(mapped); | 588 | 256 | mapped = nullptr; | 589 | 256 | } | 590 | 256 | }); | 591 | | if constexpr (std::is_assignable_v<decltype(data.has_null_key_data()), | 592 | | bool>) { | 593 | | if (data.has_null_key_data()) { | 594 | | _destroy_agg_status( | 595 | | data.template get_null_key_data<AggregateDataPtr>()); | 596 | | } | 597 | | } | 598 | 256 | }}, |
Unexecuted instantiation: _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapINS_6UInt72EPc9HashCRC32IS9_EEEEEEvS4_ Unexecuted instantiation: _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodKeysFixedI9PHHashMapImPc9HashCRC32ImEEEEEEvS4_ _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_19MethodStringNoCacheINS_15DataWithNullKeyI9PHHashMapINS_9StringRefEPc11DefaultHashISB_vEEEEEEEEEEvS4_ Line | Count | Source | 578 | 1.79k | [&](auto& agg_method) -> void { | 579 | 1.79k | if (use_simple_count) { | 580 | | // simple_count: mapped slots hold UInt64 counters, | 581 | | // not real agg state pointers. Skip destroy. | 582 | 1.53k | return; | 583 | 1.53k | } | 584 | 256 | auto& data = *agg_method.hash_table; | 585 | 256 | data.for_each_mapped([&](auto& mapped) { | 586 | 256 | if (mapped) { | 587 | 256 | _destroy_agg_status(mapped); | 588 | 256 | mapped = nullptr; | 589 | 256 | } | 590 | 256 | }); | 591 | | if constexpr (std::is_assignable_v<decltype(data.has_null_key_data()), | 592 | 256 | bool>) { | 593 | 256 | if (data.has_null_key_data()) { | 594 | 0 | _destroy_agg_status( | 595 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 596 | 0 | } | 597 | 256 | } | 598 | 256 | }}, |
Unexecuted instantiation: _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIN4wide7integerILm256EjEENS_15DataWithNullKeyI9PHHashMapISB_Pc9HashCRC32ISB_EEEEEEEEEEvS4_ Unexecuted instantiation: _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIN4wide7integerILm128EjEENS_15DataWithNullKeyI9PHHashMapISB_Pc9HashCRC32ISB_EEEEEEEEEEvS4_ Unexecuted instantiation: _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberImNS_15DataWithNullKeyI9PHHashMapImPc14HashMixWrapperIm9HashCRC32ImEEEEEEEEEEEvS4_ Unexecuted instantiation: _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIjNS_15DataWithNullKeyI9PHHashMapIjPc14HashMixWrapperIj9HashCRC32IjEEEEEEEEEEEvS4_ _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberImNS_15DataWithNullKeyI9PHHashMapImPc9HashCRC32ImEEEEEEEEEEvS4_ Line | Count | Source | 578 | 7.16k | [&](auto& agg_method) -> void { | 579 | 7.16k | if (use_simple_count) { | 580 | | // simple_count: mapped slots hold UInt64 counters, | 581 | | // not real agg state pointers. Skip destroy. 
| 582 | 1.53k | return; | 583 | 1.53k | } | 584 | 5.63k | auto& data = *agg_method.hash_table; | 585 | 5.63k | data.for_each_mapped([&](auto& mapped) { | 586 | 5.63k | if (mapped) { | 587 | 5.63k | _destroy_agg_status(mapped); | 588 | 5.63k | mapped = nullptr; | 589 | 5.63k | } | 590 | 5.63k | }); | 591 | | if constexpr (std::is_assignable_v<decltype(data.has_null_key_data()), | 592 | 5.63k | bool>) { | 593 | 5.63k | if (data.has_null_key_data()) { | 594 | 2 | _destroy_agg_status( | 595 | 2 | data.template get_null_key_data<AggregateDataPtr>()); | 596 | 2 | } | 597 | 5.63k | } | 598 | 5.63k | }}, |
_ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIjNS_15DataWithNullKeyI9PHHashMapIjPc9HashCRC32IjEEEEEEEEEEvS4_ Line | Count | Source | 578 | 15.3k | [&](auto& agg_method) -> void { | 579 | 15.3k | if (use_simple_count) { | 580 | | // simple_count: mapped slots hold UInt64 counters, | 581 | | // not real agg state pointers. Skip destroy. | 582 | 0 | return; | 583 | 0 | } | 584 | 15.3k | auto& data = *agg_method.hash_table; | 585 | 15.3k | data.for_each_mapped([&](auto& mapped) { | 586 | 15.3k | if (mapped) { | 587 | 15.3k | _destroy_agg_status(mapped); | 588 | 15.3k | mapped = nullptr; | 589 | 15.3k | } | 590 | 15.3k | }); | 591 | | if constexpr (std::is_assignable_v<decltype(data.has_null_key_data()), | 592 | 15.3k | bool>) { | 593 | 15.3k | if (data.has_null_key_data()) { | 594 | 0 | _destroy_agg_status( | 595 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 596 | 0 | } | 597 | 15.3k | } | 598 | 15.3k | }}, |
_ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberItNS_15DataWithNullKeyI9PHHashMapItPc9HashCRC32ItEEEEEEEEEEvS4_ Line | Count | Source | 578 | 1.53k | [&](auto& agg_method) -> void { | 579 | 1.53k | if (use_simple_count) { | 580 | | // simple_count: mapped slots hold UInt64 counters, | 581 | | // not real agg state pointers. Skip destroy. | 582 | 0 | return; | 583 | 0 | } | 584 | 1.53k | auto& data = *agg_method.hash_table; | 585 | 1.53k | data.for_each_mapped([&](auto& mapped) { | 586 | 1.53k | if (mapped) { | 587 | 1.53k | _destroy_agg_status(mapped); | 588 | 1.53k | mapped = nullptr; | 589 | 1.53k | } | 590 | 1.53k | }); | 591 | | if constexpr (std::is_assignable_v<decltype(data.has_null_key_data()), | 592 | 1.53k | bool>) { | 593 | 1.53k | if (data.has_null_key_data()) { | 594 | 0 | _destroy_agg_status( | 595 | 0 | data.template get_null_key_data<AggregateDataPtr>()); | 596 | 0 | } | 597 | 1.53k | } | 598 | 1.53k | }}, |
Unexecuted instantiation: _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_26MethodSingleNullableColumnINS_15MethodOneNumberIhNS_15DataWithNullKeyI9PHHashMapIhPc9HashCRC32IhEEEEEEEEEEvS4_ Unexecuted instantiation: _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodOneNumberIm9PHHashMapImPc14HashMixWrapperIm9HashCRC32ImEEEEEEEvS4_ Unexecuted instantiation: _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodOneNumberIj9PHHashMapIjPc14HashMixWrapperIj9HashCRC32IjEEEEEEEvS4_ Unexecuted instantiation: _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodOneNumberIN4wide7integerILm256EjEE9PHHashMapISA_Pc9HashCRC32ISA_EEEEEEvS4_ Unexecuted instantiation: _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodOneNumberIN4wide7integerILm128EjEE9PHHashMapISA_Pc9HashCRC32ISA_EEEEEEvS4_ _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_19MethodStringNoCacheI9PHHashMapINS_9StringRefEPc11DefaultHashIS9_vEEEEEEvS4_ Line | Count | Source | 578 | 12.0k | [&](auto& agg_method) -> void { | 579 | 12.0k | if (use_simple_count) { | 580 | | // simple_count: mapped slots hold UInt64 counters, | 581 | | // not real agg state pointers. Skip destroy. 
| 582 | 4.09k | return; | 583 | 4.09k | } | 584 | 7.93k | auto& data = *agg_method.hash_table; | 585 | 7.93k | data.for_each_mapped([&](auto& mapped) { | 586 | 7.93k | if (mapped) { | 587 | 7.93k | _destroy_agg_status(mapped); | 588 | 7.93k | mapped = nullptr; | 589 | 7.93k | } | 590 | 7.93k | }); | 591 | | if constexpr (std::is_assignable_v<decltype(data.has_null_key_data()), | 592 | | bool>) { | 593 | | if (data.has_null_key_data()) { | 594 | | _destroy_agg_status( | 595 | | data.template get_null_key_data<AggregateDataPtr>()); | 596 | | } | 597 | | } | 598 | 7.93k | }}, |
Unexecuted instantiation: _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodOneNumberIm9PHHashMapImPc9HashCRC32ImEEEEEEvS4_ _ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodOneNumberIj9PHHashMapIjPc9HashCRC32IjEEEEEEvS4_ Line | Count | Source | 578 | 2.81k | [&](auto& agg_method) -> void { | 579 | 2.81k | if (use_simple_count) { | 580 | | // simple_count: mapped slots hold UInt64 counters, | 581 | | // not real agg state pointers. Skip destroy. | 582 | 1.53k | return; | 583 | 1.53k | } | 584 | 1.28k | auto& data = *agg_method.hash_table; | 585 | 1.28k | data.for_each_mapped([&](auto& mapped) { | 586 | 1.28k | if (mapped) { | 587 | 1.28k | _destroy_agg_status(mapped); | 588 | 1.28k | mapped = nullptr; | 589 | 1.28k | } | 590 | 1.28k | }); | 591 | | if constexpr (std::is_assignable_v<decltype(data.has_null_key_data()), | 592 | | bool>) { | 593 | | if (data.has_null_key_data()) { | 594 | | _destroy_agg_status( | 595 | | data.template get_null_key_data<AggregateDataPtr>()); | 596 | | } | 597 | | } | 598 | 1.28k | }}, |
_ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodOneNumberIt9PHHashMapItPc9HashCRC32ItEEEEEEvS4_ Line | Count | Source | 578 | 7.68k | [&](auto& agg_method) -> void { | 579 | 7.68k | if (use_simple_count) { | 580 | | // simple_count: mapped slots hold UInt64 counters, | 581 | | // not real agg state pointers. Skip destroy. | 582 | 0 | return; | 583 | 0 | } | 584 | 7.68k | auto& data = *agg_method.hash_table; | 585 | 7.68k | data.for_each_mapped([&](auto& mapped) { | 586 | 7.68k | if (mapped) { | 587 | 7.68k | _destroy_agg_status(mapped); | 588 | 7.68k | mapped = nullptr; | 589 | 7.68k | } | 590 | 7.68k | }); | 591 | | if constexpr (std::is_assignable_v<decltype(data.has_null_key_data()), | 592 | | bool>) { | 593 | | if (data.has_null_key_data()) { | 594 | | _destroy_agg_status( | 595 | | data.template get_null_key_data<AggregateDataPtr>()); | 596 | | } | 597 | | } | 598 | 7.68k | }}, |
_ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_15MethodOneNumberIh9PHHashMapIhPc9HashCRC32IhEEEEEEvS4_ Line | Count | Source | 578 | 8.19k | [&](auto& agg_method) -> void { | 579 | 8.19k | if (use_simple_count) { | 580 | | // simple_count: mapped slots hold UInt64 counters, | 581 | | // not real agg state pointers. Skip destroy. | 582 | 0 | return; | 583 | 0 | } | 584 | 8.19k | auto& data = *agg_method.hash_table; | 585 | 8.19k | data.for_each_mapped([&](auto& mapped) { | 586 | 8.19k | if (mapped) { | 587 | 8.19k | _destroy_agg_status(mapped); | 588 | 8.19k | mapped = nullptr; | 589 | 8.19k | } | 590 | 8.19k | }); | 591 | | if constexpr (std::is_assignable_v<decltype(data.has_null_key_data()), | 592 | | bool>) { | 593 | | if (data.has_null_key_data()) { | 594 | | _destroy_agg_status( | 595 | | data.template get_null_key_data<AggregateDataPtr>()); | 596 | | } | 597 | | } | 598 | 8.19k | }}, |
_ZZN5doris22BucketedAggSharedState19_close_one_agg_dataERNS_23BucketedAggDataVariantsEENKUlRT_E_clINS_16MethodSerializedI9PHHashMapINS_9StringRefEPc11DefaultHashIS9_vEEEEEEvS4_ Line | Count | Source | 578 | 12.2k | [&](auto& agg_method) -> void { | 579 | 12.2k | if (use_simple_count) { | 580 | | // simple_count: mapped slots hold UInt64 counters, | 581 | | // not real agg state pointers. Skip destroy. | 582 | 0 | return; | 583 | 0 | } | 584 | 12.2k | auto& data = *agg_method.hash_table; | 585 | 12.2k | data.for_each_mapped([&](auto& mapped) { | 586 | 12.2k | if (mapped) { | 587 | 12.2k | _destroy_agg_status(mapped); | 588 | 12.2k | mapped = nullptr; | 589 | 12.2k | } | 590 | 12.2k | }); | 591 | | if constexpr (std::is_assignable_v<decltype(data.has_null_key_data()), | 592 | | bool>) { | 593 | | if (data.has_null_key_data()) { | 594 | | _destroy_agg_status( | 595 | | data.template get_null_key_data<AggregateDataPtr>()); | 596 | | } | 597 | | } | 598 | 12.2k | }}, |
|
599 | 102k | agg_data.method_variant); |
600 | 102k | } |
601 | | |
602 | | void _destroy_agg_status(AggregateDataPtr data); |
603 | | }; |
604 | | |
605 | | struct PartitionedAggSharedState : public BasicSharedState, |
606 | | public std::enable_shared_from_this<PartitionedAggSharedState> { |
607 | | ENABLE_FACTORY_CREATOR(PartitionedAggSharedState) |
608 | | |
609 | 148 | PartitionedAggSharedState() = default; |
610 | 148 | ~PartitionedAggSharedState() override { close(); } |
611 | | |
612 | | void close(); |
613 | | |
614 | | AggSharedState* _in_mem_shared_state = nullptr; |
615 | | std::shared_ptr<BasicSharedState> _in_mem_shared_state_sptr; |
616 | | |
617 | | // partition count is no longer stored in shared state; operators maintain their own |
618 | | std::atomic<bool> _is_spilled = false; |
619 | | // This state is shared by the partitioned agg sink and source pipelines. Spill files left |
620 | | // here are owned by the shared state until the source moves them into its local queue, so the |
621 | | // cleanup must be tied to the shared state's lifetime and must be idempotent. |
622 | | std::atomic_bool is_closed = false; |
623 | | std::deque<SpillFileSPtr> _spill_partitions; |
624 | | }; |
625 | | |
626 | | struct SortSharedState : public BasicSharedState { |
627 | | ENABLE_FACTORY_CREATOR(SortSharedState) |
628 | | public: |
629 | | std::shared_ptr<Sorter> sorter; |
630 | | }; |
631 | | |
632 | | struct SpillSortSharedState : public BasicSharedState, |
633 | | public std::enable_shared_from_this<SpillSortSharedState> { |
634 | | ENABLE_FACTORY_CREATOR(SpillSortSharedState) |
635 | | |
636 | 33 | SpillSortSharedState() = default; |
637 | 33 | ~SpillSortSharedState() override = default; |
638 | | |
639 | 587 | void update_spill_block_batch_row_count(RuntimeState* state, const Block* block) { |
640 | 587 | auto rows = block->rows(); |
641 | 587 | if (rows > 0 && 0 == avg_row_bytes) { |
642 | 19 | avg_row_bytes = std::max((std::size_t)1, block->bytes() / rows); |
643 | 19 | spill_block_batch_row_count = |
644 | 19 | (state->spill_buffer_size_bytes() + avg_row_bytes - 1) / avg_row_bytes; |
645 | 19 | LOG(INFO) << "spill sort block batch row count: " << spill_block_batch_row_count; |
646 | 19 | } |
647 | 587 | } |
648 | | |
649 | | void close(); |
650 | | |
651 | | SortSharedState* in_mem_shared_state = nullptr; |
652 | | bool enable_spill = false; |
653 | | bool is_spilled = false; |
654 | | int64_t limit = -1; |
655 | | int64_t offset = 0; |
656 | | std::atomic_bool is_closed = false; |
657 | | std::shared_ptr<BasicSharedState> in_mem_shared_state_sptr; |
658 | | |
659 | | std::deque<SpillFileSPtr> sorted_spill_groups; |
660 | | size_t avg_row_bytes = 0; |
661 | | size_t spill_block_batch_row_count; |
662 | | }; |
663 | | |
664 | | struct UnionSharedState : public BasicSharedState { |
665 | | ENABLE_FACTORY_CREATOR(UnionSharedState) |
666 | | |
667 | | public: |
668 | 3.23k | UnionSharedState(int child_count = 1) : data_queue(child_count), _child_count(child_count) {}; |
669 | 0 | int child_count() const { return _child_count; } |
670 | | DataQueue data_queue; |
671 | | const int _child_count; |
672 | | }; |
673 | | |
674 | | struct DataQueueSharedState : public BasicSharedState { |
675 | | ENABLE_FACTORY_CREATOR(DataQueueSharedState) |
676 | | public: |
677 | | DataQueue data_queue; |
678 | | }; |
679 | | |
680 | | class MultiCastDataStreamer; |
681 | | |
682 | | struct MultiCastSharedState : public BasicSharedState, |
683 | | public std::enable_shared_from_this<MultiCastSharedState> { |
684 | | MultiCastSharedState(ObjectPool* pool, int cast_sender_count, int node_id); |
685 | | |
686 | | std::unique_ptr<MultiCastDataStreamer> multi_cast_data_streamer; |
687 | | }; |
688 | | |
689 | | struct AnalyticSharedState : public BasicSharedState { |
690 | | ENABLE_FACTORY_CREATOR(AnalyticSharedState) |
691 | | |
692 | | public: |
693 | 7.06k | AnalyticSharedState() = default; |
694 | | std::queue<Block> blocks_buffer GUARDED_BY(buffer_mutex); |
695 | | AnnotatedMutex buffer_mutex; |
696 | | bool sink_eos GUARDED_BY(sink_eos_lock) = false; |
697 | | AnnotatedMutex sink_eos_lock; |
698 | | Arena agg_arena_pool; |
699 | | }; |
700 | | |
701 | | struct JoinSharedState : public BasicSharedState { |
702 | | // For some join cases, we can apply a short-circuit strategy: |
703 | | // 1. _has_null_in_build_side = true |
704 | | // 2. the build side is empty and the join op is one of: inner join/right outer join/left semi/right semi/right anti |
705 | | bool _has_null_in_build_side = false; |
706 | | bool short_circuit_for_probe = false; |
707 | | // For some joins, when the build side is empty, we can return directly by adding some additional null data to the probe table. |
708 | | bool empty_right_table_need_probe_dispose = false; |
709 | | JoinOpVariants join_op_variants; |
710 | | }; |
711 | | |
712 | | struct HashJoinSharedState : public JoinSharedState { |
713 | | ENABLE_FACTORY_CREATOR(HashJoinSharedState) |
714 | 97.5k | HashJoinSharedState() { |
715 | 97.5k | hash_table_variant_vector.push_back(std::make_shared<JoinDataVariants>()); |
716 | 97.5k | } |
717 | 5.09k | HashJoinSharedState(int num_instances) { |
718 | 5.09k | source_deps.resize(num_instances, nullptr); |
719 | 5.09k | hash_table_variant_vector.resize(num_instances, nullptr); |
720 | 24.2k | for (int i = 0; i < num_instances; i++) { |
721 | 19.1k | hash_table_variant_vector[i] = std::make_shared<JoinDataVariants>(); |
722 | 19.1k | } |
723 | 5.09k | } |
724 | | std::shared_ptr<Arena> arena = std::make_shared<Arena>(); |
725 | | |
726 | | const std::vector<TupleDescriptor*> build_side_child_desc; |
727 | | size_t build_exprs_size = 0; |
728 | | std::shared_ptr<Block> build_block; |
729 | | std::shared_ptr<std::vector<uint32_t>> build_indexes_null; |
730 | | |
731 | | // Used by shared hash table |
732 | | // For the probe operator, the hash table in _hash_table_variants is read-only if the visited |
733 | | // flags are not used. (Visited flags are used only in right / full outer joins.) |
734 | | // |
735 | | // For broadcast join, although the hash table is read-only, some states in `_hash_table_variants` |
736 | | // can still be written. For example, serialized keys will be written to a contiguous |
737 | | // memory region in `_hash_table_variants`. So before execution, we should use a local _hash_table_variants |
738 | | // which has a shared hash table in it. |
739 | | std::vector<std::shared_ptr<JoinDataVariants>> hash_table_variant_vector; |
740 | | |
741 | | // Whether left semi join can return directly. |
742 | | // If the runtime filters contain a local IN filter, we can be sure all input rows are matched: |
743 | | // the local filter will always be applied, and an IN filter guarantees precise filtering. |
744 | | // ATTN: we should disable the always_true logic for the IN filter when we set this flag. |
745 | | bool left_semi_direct_return = false; |
746 | | |
747 | | // ASOF JOIN specific fields |
748 | | // Whether the inequality is >= or > (true) vs <= or < (false) |
749 | | bool asof_inequality_is_greater = true; |
750 | | // Whether the inequality is strict (> or <) vs non-strict (>= or <=) |
751 | | bool asof_inequality_is_strict = false; |
752 | | |
753 | | // ASOF JOIN pre-sorted index with inline values for O(log K) branchless lookup |
754 | | // Typed AsofIndexGroups stored in a variant (uint32_t for DateV2, uint64_t for DateTimeV2/TimestampTZ) |
755 | | AsofIndexVariant asof_index_groups; |
756 | | // build_row_index -> bucket_id for O(1) reverse lookup |
757 | | std::vector<uint32_t> asof_build_row_to_bucket; |
758 | | }; |
759 | | |
760 | | struct PartitionedHashJoinSharedState |
761 | | : public HashJoinSharedState, |
762 | | public std::enable_shared_from_this<PartitionedHashJoinSharedState> { |
763 | | ENABLE_FACTORY_CREATOR(PartitionedHashJoinSharedState) |
764 | | |
765 | | std::unique_ptr<RuntimeState> _inner_runtime_state; |
766 | | std::shared_ptr<HashJoinSharedState> _inner_shared_state; |
767 | | std::vector<std::unique_ptr<MutableBlock>> _partitioned_build_blocks; |
768 | | std::vector<SpillFileSPtr> _spilled_build_groups; |
769 | | std::atomic<bool> _is_spilled = false; |
770 | | }; |
771 | | |
772 | | struct NestedLoopJoinSharedState : public JoinSharedState { |
773 | | ENABLE_FACTORY_CREATOR(NestedLoopJoinSharedState) |
774 | | // if true, probe child has no more rows to process |
775 | | bool probe_side_eos = false; |
776 | | // Visited flags for each row in build side. |
777 | | MutableColumns build_side_visited_flags; |
778 | | // List of build blocks, constructed in prepare() |
779 | | Blocks build_blocks; |
780 | | }; |
781 | | |
782 | | struct PartitionSortNodeSharedState : public BasicSharedState { |
783 | | ENABLE_FACTORY_CREATOR(PartitionSortNodeSharedState) |
784 | | public: |
785 | | std::queue<Block> blocks_buffer GUARDED_BY(buffer_mutex); |
786 | | AnnotatedMutex buffer_mutex; |
787 | | std::vector<std::unique_ptr<PartitionSorter>> partition_sorts; |
788 | | bool sink_eos GUARDED_BY(sink_eos_lock) = false; |
789 | | AnnotatedMutex sink_eos_lock; |
790 | | AnnotatedMutex prepared_finish_lock; |
791 | | }; |
792 | | |
793 | | struct SetSharedState : public BasicSharedState { |
794 | | ENABLE_FACTORY_CREATOR(SetSharedState) |
795 | | public: |
796 | | /// default init |
797 | | Block build_block; // build to source |
798 | | //record element size in hashtable |
799 | | int64_t valid_element_in_hash_tbl = 0; |
800 | | //first: idx mapped to column types |
801 | | //second: column_id, could point to origin column or cast column |
802 | | std::unordered_map<int, int> build_col_idx; |
803 | | |
804 | | //// shared static states (shared, decided in prepare/open...) |
805 | | |
806 | | /// init in setup_local_state |
807 | | std::unique_ptr<SetDataVariants> hash_table_variants = |
808 | | std::make_unique<SetDataVariants>(); // the real data HERE. |
809 | | std::vector<bool> build_not_ignore_null; |
810 | | |
811 | | // The SET operator's child might have different nullable attributes. |
812 | | // If a calculation involves both nullable and non-nullable columns, the final output should be a nullable column |
813 | | Status update_build_not_ignore_null(const VExprContextSPtrs& ctxs); |
814 | | |
815 | | size_t get_hash_table_size() const; |
816 | | /// init in both upstream side. |
817 | | //The i-th result expr list refers to the i-th child. |
818 | | std::vector<VExprContextSPtrs> child_exprs_lists; |
819 | | |
820 | | /// init in build side |
821 | | size_t child_quantity; |
822 | | VExprContextSPtrs build_child_exprs; |
823 | | std::vector<Dependency*> probe_finished_children_dependency; |
824 | | |
825 | | /// init in probe side |
826 | | std::vector<VExprContextSPtrs> probe_child_exprs_lists; |
827 | | |
828 | | std::atomic<bool> ready_for_read = false; |
829 | | |
830 | | Arena arena; |
831 | | |
832 | | /// called in setup_local_state |
833 | | Status hash_table_init(); |
834 | | }; |
835 | | |
836 | 1.21M | inline bool is_shuffled_exchange(TLocalPartitionType::type idx) { |
837 | 1.21M | return idx == TLocalPartitionType::GLOBAL_EXECUTION_HASH_SHUFFLE || |
838 | 1.21M | idx == TLocalPartitionType::LOCAL_EXECUTION_HASH_SHUFFLE || |
839 | 1.21M | idx == TLocalPartitionType::BUCKET_HASH_SHUFFLE; |
840 | 1.21M | } |
841 | | |
842 | 228k | inline std::string get_exchange_type_name(TLocalPartitionType::type idx) { |
843 | 228k | switch (idx) { |
844 | 14 | case TLocalPartitionType::NOOP: |
845 | 14 | return "NOOP"; |
846 | 65 | case TLocalPartitionType::GLOBAL_EXECUTION_HASH_SHUFFLE: |
847 | 65 | return "GLOBAL_HASH_SHUFFLE"; |
848 | 34.0k | case TLocalPartitionType::LOCAL_EXECUTION_HASH_SHUFFLE: |
849 | 34.0k | return "LOCAL_HASH_SHUFFLE"; |
850 | 186k | case TLocalPartitionType::PASSTHROUGH: |
851 | 186k | return "PASSTHROUGH"; |
852 | 982 | case TLocalPartitionType::BUCKET_HASH_SHUFFLE: |
853 | 982 | return "BUCKET_HASH_SHUFFLE"; |
854 | 608 | case TLocalPartitionType::BROADCAST: |
855 | 608 | return "BROADCAST"; |
856 | 1.86k | case TLocalPartitionType::ADAPTIVE_PASSTHROUGH: |
857 | 1.86k | return "ADAPTIVE_PASSTHROUGH"; |
858 | 4.70k | case TLocalPartitionType::PASS_TO_ONE: |
859 | 4.70k | return "PASS_TO_ONE"; |
860 | 0 | case TLocalPartitionType::LOCAL_MERGE_SORT: |
861 | 0 | return "LOCAL_MERGE_SORT"; |
862 | 228k | } |
863 | 0 | throw Exception(Status::FatalError("__builtin_unreachable")); |
864 | 228k | } |
865 | | |
866 | | struct DataDistribution { |
867 | 1.97M | DataDistribution(TLocalPartitionType::type type) : distribution_type(type) {} |
868 | | DataDistribution(TLocalPartitionType::type type, const std::vector<TExpr>& partition_exprs_) |
869 | 73.5k | : distribution_type(type), partition_exprs(partition_exprs_) {} |
870 | 8.13k | DataDistribution(const DataDistribution& other) = default; |
871 | 206k | bool need_local_exchange() const { return distribution_type != TLocalPartitionType::NOOP; } |
872 | 219k | DataDistribution& operator=(const DataDistribution& other) = default; |
873 | | TLocalPartitionType::type distribution_type; |
874 | | std::vector<TExpr> partition_exprs; |
875 | | }; |
876 | | |
877 | | class ExchangerBase; |
878 | | |
879 | | struct LocalExchangeSharedState : public BasicSharedState { |
880 | | public: |
881 | | ENABLE_FACTORY_CREATOR(LocalExchangeSharedState); |
882 | | LocalExchangeSharedState(int num_instances); |
883 | | ~LocalExchangeSharedState() override; |
884 | | std::unique_ptr<ExchangerBase> exchanger {}; |
885 | | std::vector<RuntimeProfile::Counter*> mem_counters; |
886 | | std::atomic<int64_t> mem_usage = 0; |
887 | | std::atomic<size_t> _buffer_mem_limit = config::local_exchange_buffer_mem_limit; |
888 | | // We need to make sure to add mem_usage first and then enqueue, otherwise sub mem_usage may cause negative mem_usage during concurrent dequeue. |
889 | | std::mutex le_lock; |
890 | | void sub_running_sink_operators(); |
891 | | void sub_running_source_operators(); |
892 | 229k | void _set_always_ready() { |
893 | 1.38M | for (auto& dep : source_deps) { |
894 | 1.38M | DCHECK(dep); |
895 | 1.38M | dep->set_always_ready(); |
896 | 1.38M | } |
897 | 229k | for (auto& dep : sink_deps) { |
898 | 229k | DCHECK(dep); |
899 | 229k | dep->set_always_ready(); |
900 | 229k | } |
901 | 229k | } |
902 | | |
903 | 253k | Dependency* get_sink_dep_by_channel_id(int channel_id) { return nullptr; } |
904 | | |
905 | 253k | void set_ready_to_read(int channel_id) { |
906 | 253k | auto& dep = source_deps[channel_id]; |
907 | 18.4E | DCHECK(dep) << channel_id; |
908 | 253k | dep->set_ready(); |
909 | 253k | } |
910 | | |
911 | 253k | void add_mem_usage(int channel_id, size_t delta) { mem_counters[channel_id]->update(delta); } |
912 | | |
913 | 253k | void sub_mem_usage(int channel_id, size_t delta) { |
914 | 253k | mem_counters[channel_id]->update(-(int64_t)delta); |
915 | 253k | } |
916 | | |
917 | 209k | void add_total_mem_usage(size_t delta) { |
918 | 209k | if (cast_set<int64_t>(mem_usage.fetch_add(delta) + delta) > _buffer_mem_limit) { |
919 | 1.06k | sink_deps.front()->block(); |
920 | 1.06k | } |
921 | 209k | } |
922 | | |
923 | 209k | void sub_total_mem_usage(size_t delta) { |
924 | 209k | auto prev_usage = mem_usage.fetch_sub(delta); |
925 | 209k | DCHECK_GE(prev_usage, cast_set<int64_t>(delta)) |
926 | 0 | << "prev_usage: " << prev_usage << " delta: " << delta; |
927 | 209k | if (cast_set<int64_t>(prev_usage - delta) <= _buffer_mem_limit) { |
928 | 208k | sink_deps.front()->set_ready(); |
929 | 208k | } |
930 | 209k | } |
931 | | |
932 | 0 | void set_low_memory_mode(RuntimeState* state) { |
933 | 0 | _buffer_mem_limit = std::min<int64_t>(config::local_exchange_buffer_mem_limit, |
934 | 0 | state->low_memory_mode_buffer_limit()); |
935 | 0 | } |
936 | | }; |
937 | | |
938 | | } // namespace doris |