Coverage Report

Created: 2026-01-23 04:49

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/root/doris/be/src/pipeline/dependency.cpp
Line
Count
Source
1
// Licensed to the Apache Software Foundation (ASF) under one
2
// or more contributor license agreements.  See the NOTICE file
3
// distributed with this work for additional information
4
// regarding copyright ownership.  The ASF licenses this file
5
// to you under the Apache License, Version 2.0 (the
6
// "License"); you may not use this file except in compliance
7
// with the License.  You may obtain a copy of the License at
8
//
9
//   http://www.apache.org/licenses/LICENSE-2.0
10
//
11
// Unless required by applicable law or agreed to in writing,
12
// software distributed under the License is distributed on an
13
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
// KIND, either express or implied.  See the License for the
15
// specific language governing permissions and limitations
16
// under the License.
17
18
#include "dependency.h"
19
20
#include <memory>
21
#include <mutex>
22
23
#include "common/logging.h"
24
#include "exec/rowid_fetcher.h"
25
#include "pipeline/exec/multi_cast_data_streamer.h"
26
#include "pipeline/pipeline_fragment_context.h"
27
#include "pipeline/pipeline_task.h"
28
#include "runtime/exec_env.h"
29
#include "runtime/memory/mem_tracker.h"
30
#include "runtime_filter/runtime_filter_consumer.h"
31
#include "util/brpc_client_cache.h"
32
#include "vec/exec/scan/file_scanner.h"
33
#include "vec/exprs/vectorized_agg_fn.h"
34
#include "vec/exprs/vslot_ref.h"
35
#include "vec/spill/spill_stream_manager.h"
36
#include "vec/utils/util.hpp"
37
38
namespace doris::pipeline {
39
#include "common/compile_check_begin.h"
40
41
// Creates a source-side Dependency named "<name>_DEPENDENCY", appends it to
// `source_deps` and points it back at this shared state.
// Returns a non-owning pointer; the shared_ptr stored in `source_deps` keeps
// the object alive.
Dependency* BasicSharedState::create_source_dependency(int operator_id, int node_id,
                                                       const std::string& name) {
    auto& new_dep = source_deps.emplace_back(
            std::make_shared<Dependency>(operator_id, node_id, name + "_DEPENDENCY"));
    new_dep->set_shared_state(this);
    return new_dep.get();
}
47
48
void BasicSharedState::create_source_dependencies(int num_sources, int operator_id, int node_id,
49
102k
                                                  const std::string& name) {
50
102k
    source_deps.resize(num_sources, nullptr);
51
633k
    for (auto& source_dep : source_deps) {
52
633k
        source_dep = std::make_shared<Dependency>(operator_id, node_id, name + "_DEPENDENCY");
53
633k
        source_dep->set_shared_state(this);
54
633k
    }
55
102k
}
56
57
// Creates a sink-side Dependency named "<name>_DEPENDENCY" (constructed with
// the extra `true` argument), appends it to `sink_deps` and points it back at
// this shared state.
// Returns a non-owning pointer; the shared_ptr stored in `sink_deps` keeps the
// object alive.
Dependency* BasicSharedState::create_sink_dependency(int dest_id, int node_id,
                                                     const std::string& name) {
    auto& new_dep = sink_deps.emplace_back(
            std::make_shared<Dependency>(dest_id, node_id, name + "_DEPENDENCY", true));
    new_dep->set_shared_state(this);
    return new_dep.get();
}
63
64
3.90M
void Dependency::_add_block_task(std::shared_ptr<PipelineTask> task) {
65
18.4E
    DCHECK(_blocked_task.empty() || _blocked_task[_blocked_task.size() - 1].lock() == nullptr ||
66
18.4E
           _blocked_task[_blocked_task.size() - 1].lock().get() != task.get())
67
18.4E
            << "Duplicate task: " << task->debug_string();
68
3.90M
    _blocked_task.push_back(task);
69
3.90M
}
70
71
14.2M
void Dependency::set_ready() {
72
14.2M
    if (_ready) {
73
10.5M
        return;
74
10.5M
    }
75
3.70M
    std::vector<std::weak_ptr<PipelineTask>> local_block_task {};
76
3.70M
    {
77
3.70M
        std::unique_lock<std::mutex> lc(_task_lock);
78
3.70M
        if (_ready) {
79
1
            return;
80
1
        }
81
3.70M
        _watcher.stop();
82
3.70M
        _ready = true;
83
3.70M
        local_block_task.swap(_blocked_task);
84
3.70M
    }
85
3.91M
    for (auto task : local_block_task) {
86
3.91M
        if (auto t = task.lock()) {
87
3.91M
            std::unique_lock<std::mutex> lc(_task_lock);
88
3.91M
            THROW_IF_ERROR(t->wake_up(this, lc));
89
3.91M
        }
90
3.91M
    }
91
3.70M
}
92
93
30.0M
// Reports whether this dependency currently blocks the caller.
//
// Returns nullptr when the dependency is ready, otherwise `this`. When it is
// not ready and `task` is non-null, the task is additionally recorded as
// blocked, the watcher is started and the task is notified via
// PipelineTask::blocked (errors are raised through THROW_IF_ERROR).
// The whole check runs under `_task_lock`.
Dependency* Dependency::is_blocked_by(std::shared_ptr<PipelineTask> task) {
    std::unique_lock<std::mutex> guard(_task_lock);
    if (_ready.load()) {
        return nullptr;
    }
    if (task) {
        _add_block_task(task);
        start_watcher();
        THROW_IF_ERROR(task->blocked(this, guard));
    }
    return this;
}
103
104
173k
std::string Dependency::debug_string(int indentation_level) {
105
173k
    fmt::memory_buffer debug_string_buffer;
106
173k
    fmt::format_to(debug_string_buffer, "{}{}: id={}, block task = {}, ready={}, _always_ready={}",
107
173k
                   std::string(indentation_level * 2, ' '), _name, _node_id, _blocked_task.size(),
108
173k
                   _ready, _always_ready);
109
173k
    return fmt::to_string(debug_string_buffer);
110
173k
}
111
112
0
std::string CountedFinishDependency::debug_string(int indentation_level) {
113
0
    fmt::memory_buffer debug_string_buffer;
114
0
    fmt::format_to(debug_string_buffer,
115
0
                   "{}{}: id={}, block_task={}, ready={}, _always_ready={}, count={}",
116
0
                   std::string(indentation_level * 2, ' '), _name, _node_id, _blocked_task.size(),
117
0
                   _ready, _always_ready, _counter);
118
0
    return fmt::to_string(debug_string_buffer);
119
0
}
120
121
3.37k
void RuntimeFilterTimer::call_timeout() {
122
3.37k
    _parent->set_ready();
123
3.37k
}
124
125
15.6k
void RuntimeFilterTimer::call_ready() {
126
15.6k
    _parent->set_ready();
127
15.6k
}
128
129
// should check rf timeout in two case:
130
// 1. the rf is ready just remove the wait queue
131
// 2. if the rf have local dependency, the rf should start wait when all local dependency is ready
132
631k
bool RuntimeFilterTimer::should_be_check_timeout() {
133
631k
    if (!_parent->ready() && !_local_runtime_filter_dependencies.empty()) {
134
6.47k
        bool all_ready = true;
135
6.47k
        for (auto& dep : _local_runtime_filter_dependencies) {
136
6.47k
            if (!dep->ready()) {
137
6.32k
                all_ready = false;
138
6.32k
                break;
139
6.32k
            }
140
6.47k
        }
141
6.47k
        if (all_ready) {
142
152
            _local_runtime_filter_dependencies.clear();
143
152
            _registration_time = MonotonicMillis();
144
152
        }
145
6.47k
        return all_ready;
146
6.47k
    }
147
624k
    return true;
148
631k
}
149
150
8
void RuntimeFilterTimerQueue::start() {
151
93.8k
    while (!_stop) {
152
93.8k
        std::unique_lock<std::mutex> lk(cv_m);
153
154
97.9k
        while (_que.empty() && !_stop) {
155
8.26k
            cv.wait_for(lk, std::chrono::seconds(3), [this] { return !_que.empty() || _stop; });
156
4.13k
        }
157
93.8k
        if (_stop) {
158
3
            break;
159
3
        }
160
93.8k
        {
161
93.8k
            std::unique_lock<std::mutex> lc(_que_lock);
162
93.8k
            std::list<std::shared_ptr<pipeline::RuntimeFilterTimer>> new_que;
163
631k
            for (auto& it : _que) {
164
631k
                if (it.use_count() == 1) {
165
                    // `use_count == 1` means this runtime filter has been released
166
631k
                } else if (it->should_be_check_timeout()) {
167
624k
                    if (it->force_wait_timeout() || it->_parent->is_blocked_by()) {
168
                        // This means runtime filter is not ready, so we call timeout or continue to poll this timer.
169
612k
                        int64_t ms_since_registration = MonotonicMillis() - it->registration_time();
170
612k
                        if (ms_since_registration > it->wait_time_ms()) {
171
3.37k
                            it->call_timeout();
172
609k
                        } else {
173
609k
                            new_que.push_back(std::move(it));
174
609k
                        }
175
612k
                    }
176
624k
                } else {
177
6.32k
                    new_que.push_back(std::move(it));
178
6.32k
                }
179
631k
            }
180
93.8k
            new_que.swap(_que);
181
93.8k
        }
182
93.8k
        std::this_thread::sleep_for(std::chrono::milliseconds(interval));
183
93.8k
    }
184
8
    _shutdown = true;
185
8
}
186
187
226k
void LocalExchangeSharedState::sub_running_sink_operators() {
188
226k
    std::unique_lock<std::mutex> lc(le_lock);
189
226k
    if (exchanger->_running_sink_operators.fetch_sub(1) == 1) {
190
98.9k
        _set_always_ready();
191
98.9k
    }
192
226k
}
193
194
616k
void LocalExchangeSharedState::sub_running_source_operators() {
195
616k
    std::unique_lock<std::mutex> lc(le_lock);
196
616k
    if (exchanger->_running_source_operators.fetch_sub(1) == 1) {
197
98.9k
        _set_always_ready();
198
98.9k
        exchanger->finalize();
199
98.9k
    }
200
616k
}
201
202
98.8k
// Sizes the per-instance tables: `mem_counters` and `source_deps` each get
// `num_instances` entries, and entries added by the resize are null.
LocalExchangeSharedState::LocalExchangeSharedState(int num_instances) {
    mem_counters.resize(num_instances, nullptr);
    source_deps.resize(num_instances, nullptr);
}
206
207
290
// Materializes the keys currently stored in the aggregation state into a fresh
// set of key columns.
//
// One empty column is created per entry of `probe_expr_ctxs` (typed after the
// expression root). The keys are then read from `aggregate_data_container` in
// iteration order and written into the columns through the active hash
// method's insert_keys_into_columns(). When the hash table reports null-key
// data, one extra entry is appended to the first key column via
// insert_data(nullptr, 0).
//
// Throws doris::Exception(INTERNAL_ERROR) when the method variant is still
// std::monostate, i.e. no hash table has been initialized.
vectorized::MutableColumns AggSharedState::_get_keys_hash_table() {
    return std::visit(
            vectorized::Overload {
                    [&](std::monostate&) -> vectorized::MutableColumns {
                        throw doris::Exception(ErrorCode::INTERNAL_ERROR, "uninited hash table");
                    },
                    [&](auto&& agg_method) -> vectorized::MutableColumns {
                        vectorized::MutableColumns key_columns;
                        key_columns.reserve(probe_expr_ctxs.size());
                        for (const auto& expr_ctx : probe_expr_ctxs) {
                            key_columns.emplace_back(
                                    expr_ctx->root()->data_type()->create_column());
                        }

                        auto& data = *agg_method.hash_table;
                        const bool has_null_key = data.has_null_key_data();
                        // The key buffer is sized without the null key; that key
                        // is appended separately below.
                        const auto size = data.size() - has_null_key;
                        using KeyType = typename std::decay_t<decltype(agg_method)>::Key;
                        std::vector<KeyType> keys(size);

                        // NOTE(review): assumes the container yields at most
                        // `size` keys; `keys` is indexed without a bounds check.
                        uint32_t num_rows = 0;
                        for (auto iter = aggregate_data_container->begin();
                             iter != aggregate_data_container->end(); ++iter) {
                            keys[num_rows] = iter.get_key<KeyType>();
                            ++num_rows;
                        }

                        agg_method.insert_keys_into_columns(keys, key_columns, num_rows);
                        if (has_null_key) {
                            key_columns[0]->insert_data(nullptr, 0);
                        }
                        return key_columns;
                    }},
            agg_data->method_variant);
}
243
244
290
void AggSharedState::build_limit_heap(size_t hash_table_size) {
245
290
    limit_columns = _get_keys_hash_table();
246
5.76k
    for (size_t i = 0; i < hash_table_size; ++i) {
247
5.47k
        limit_heap.emplace(i, limit_columns, order_directions, null_directions);
248
5.47k
    }
249
4.92k
    while (hash_table_size > limit) {
250
4.63k
        limit_heap.pop();
251
4.63k
        hash_table_size--;
252
4.63k
    }
253
290
    limit_columns_min = limit_heap.top()._row_id;
254
290
}
255
256
bool AggSharedState::do_limit_filter(vectorized::Block* block, size_t num_rows,
257
3.74k
                                     const std::vector<int>* key_locs) {
258
3.74k
    if (num_rows) {
259
3.74k
        cmp_res.resize(num_rows);
260
3.74k
        need_computes.resize(num_rows);
261
3.74k
        memset(need_computes.data(), 0, need_computes.size());
262
3.74k
        memset(cmp_res.data(), 0, cmp_res.size());
263
264
3.74k
        const auto key_size = null_directions.size();
265
13.4k
        for (int i = 0; i < key_size; i++) {
266
9.68k
            block->get_by_position(key_locs ? key_locs->operator[](i) : i)
267
9.68k
                    .column->compare_internal(limit_columns_min, *limit_columns[i],
268
9.68k
                                              null_directions[i], order_directions[i], cmp_res,
269
9.68k
                                              need_computes.data());
270
9.68k
        }
271
272
3.74k
        auto set_computes_arr = [](auto* __restrict res, auto* __restrict computes, size_t rows) {
273
483k
            for (size_t i = 0; i < rows; ++i) {
274
479k
                computes[i] = computes[i] == res[i];
275
479k
            }
276
3.74k
        };
277
3.74k
        set_computes_arr(cmp_res.data(), need_computes.data(), num_rows);
278
279
3.74k
        return std::find(need_computes.begin(), need_computes.end(), 0) != need_computes.end();
280
3.74k
    }
281
282
0
    return false;
283
3.74k
}
284
285
2.88k
Status AggSharedState::reset_hash_table() {
286
2.88k
    return std::visit(
287
2.88k
            vectorized::Overload {
288
2.88k
                    [&](std::monostate& arg) -> Status {
289
0
                        return Status::InternalError("Uninited hash table");
290
0
                    },
291
2.88k
                    [&](auto& agg_method) {
292
2.88k
                        auto& hash_table = *agg_method.hash_table;
293
2.88k
                        using HashTableType = std::decay_t<decltype(hash_table)>;
294
295
2.88k
                        agg_method.arena.clear();
296
2.88k
                        agg_method.inited_iterator = false;
297
298
1.05M
                        hash_table.for_each_mapped([&](auto& mapped) {
299
1.05M
                            if (mapped) {
300
1.05M
                                _destroy_agg_status(mapped);
301
1.05M
                                mapped = nullptr;
302
1.05M
                            }
303
1.05M
                        });
Unexecuted instantiation: dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized16MethodSerializedI9PHHashMapINS_9StringRefEPc11DefaultHashIS7_vEEEEEEDaRT_ENKUlSE_E_clIS8_EEDaSE_
dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodOneNumberIh9PHHashMapIhPc9HashCRC32IhEEEEEEDaRT_ENKUlSD_E_clIS7_EEDaSD_
Line
Count
Source
298
282
                        hash_table.for_each_mapped([&](auto& mapped) {
299
282
                            if (mapped) {
300
282
                                _destroy_agg_status(mapped);
301
282
                                mapped = nullptr;
302
282
                            }
303
282
                        });
Unexecuted instantiation: dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodOneNumberIt9PHHashMapItPc9HashCRC32ItEEEEEEDaRT_ENKUlSD_E_clIS7_EEDaSD_
Unexecuted instantiation: dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodOneNumberIj9PHHashMapIjPc9HashCRC32IjEEEEEEDaRT_ENKUlSD_E_clIS7_EEDaSD_
dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodOneNumberIm9PHHashMapImPc9HashCRC32ImEEEEEEDaRT_ENKUlSD_E_clIS7_EEDaSD_
Line
Count
Source
298
986
                        hash_table.for_each_mapped([&](auto& mapped) {
299
986
                            if (mapped) {
300
986
                                _destroy_agg_status(mapped);
301
986
                                mapped = nullptr;
302
986
                            }
303
986
                        });
Unexecuted instantiation: dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized19MethodStringNoCacheINS_13StringHashMapIPcNS_9AllocatorILb1ELb1ELb0ENS_22DefaultMemoryAllocatorELb1EEEEEEEEEDaRT_ENKUlSE_E_clIS7_EEDaSE_
dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodOneNumberIN4wide7integerILm128EjEE9PHHashMapIS8_Pc9HashCRC32IS8_EEEEEEDaRT_ENKUlSG_E_clISA_EEDaSG_
Line
Count
Source
298
514
                        hash_table.for_each_mapped([&](auto& mapped) {
299
514
                            if (mapped) {
300
514
                                _destroy_agg_status(mapped);
301
514
                                mapped = nullptr;
302
514
                            }
303
514
                        });
Unexecuted instantiation: dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodOneNumberIN4wide7integerILm256EjEE9PHHashMapIS8_Pc9HashCRC32IS8_EEEEEEDaRT_ENKUlSG_E_clISA_EEDaSG_
dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodOneNumberIj9PHHashMapIjPc14HashMixWrapperIj9HashCRC32IjEEEEEEEDaRT_ENKUlSF_E_clIS7_EEDaSF_
Line
Count
Source
298
1.04M
                        hash_table.for_each_mapped([&](auto& mapped) {
299
1.04M
                            if (mapped) {
300
1.04M
                                _destroy_agg_status(mapped);
301
1.04M
                                mapped = nullptr;
302
1.04M
                            }
303
1.04M
                        });
dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodOneNumberIm9PHHashMapImPc14HashMixWrapperIm9HashCRC32ImEEEEEEEDaRT_ENKUlSF_E_clIS7_EEDaSF_
Line
Count
Source
298
2.15k
                        hash_table.for_each_mapped([&](auto& mapped) {
299
2.15k
                            if (mapped) {
300
2.15k
                                _destroy_agg_status(mapped);
301
2.15k
                                mapped = nullptr;
302
2.15k
                            }
303
2.15k
                        });
dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberIhNS4_15DataWithNullKeyI9PHHashMapIhPc9HashCRC32IhEEEEEEEEEEDaRT_ENKUlSH_E_clIS9_EEDaSH_
Line
Count
Source
298
100
                        hash_table.for_each_mapped([&](auto& mapped) {
299
100
                            if (mapped) {
300
100
                                _destroy_agg_status(mapped);
301
100
                                mapped = nullptr;
302
100
                            }
303
100
                        });
Unexecuted instantiation: dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberItNS4_15DataWithNullKeyI9PHHashMapItPc9HashCRC32ItEEEEEEEEEEDaRT_ENKUlSH_E_clIS9_EEDaSH_
dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberIjNS4_15DataWithNullKeyI9PHHashMapIjPc9HashCRC32IjEEEEEEEEEEDaRT_ENKUlSH_E_clIS9_EEDaSH_
Line
Count
Source
298
688
                        hash_table.for_each_mapped([&](auto& mapped) {
299
688
                            if (mapped) {
300
688
                                _destroy_agg_status(mapped);
301
688
                                mapped = nullptr;
302
688
                            }
303
688
                        });
dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberImNS4_15DataWithNullKeyI9PHHashMapImPc9HashCRC32ImEEEEEEEEEEDaRT_ENKUlSH_E_clIS9_EEDaSH_
Line
Count
Source
298
680
                        hash_table.for_each_mapped([&](auto& mapped) {
299
680
                            if (mapped) {
300
680
                                _destroy_agg_status(mapped);
301
680
                                mapped = nullptr;
302
680
                            }
303
680
                        });
dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberIjNS4_15DataWithNullKeyI9PHHashMapIjPc14HashMixWrapperIj9HashCRC32IjEEEEEEEEEEEDaRT_ENKUlSJ_E_clIS9_EEDaSJ_
Line
Count
Source
298
1.29k
                        hash_table.for_each_mapped([&](auto& mapped) {
299
1.29k
                            if (mapped) {
300
1.29k
                                _destroy_agg_status(mapped);
301
1.29k
                                mapped = nullptr;
302
1.29k
                            }
303
1.29k
                        });
dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberImNS4_15DataWithNullKeyI9PHHashMapImPc14HashMixWrapperIm9HashCRC32ImEEEEEEEEEEEDaRT_ENKUlSJ_E_clIS9_EEDaSJ_
Line
Count
Source
298
893
                        hash_table.for_each_mapped([&](auto& mapped) {
299
893
                            if (mapped) {
300
893
                                _destroy_agg_status(mapped);
301
893
                                mapped = nullptr;
302
893
                            }
303
893
                        });
Unexecuted instantiation: dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberIN4wide7integerILm128EjEENS4_15DataWithNullKeyI9PHHashMapIS9_Pc9HashCRC32IS9_EEEEEEEEEEDaRT_ENKUlSK_E_clISC_EEDaSK_
Unexecuted instantiation: dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberIN4wide7integerILm256EjEENS4_15DataWithNullKeyI9PHHashMapIS9_Pc9HashCRC32IS9_EEEEEEEEEEDaRT_ENKUlSK_E_clISC_EEDaSK_
Unexecuted instantiation: dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_19MethodStringNoCacheINS4_15DataWithNullKeyINS_13StringHashMapIPcNS_9AllocatorILb1ELb1ELb0ENS_22DefaultMemoryAllocatorELb1EEEEEEEEEEEEEDaRT_ENKUlSI_E_clIS9_EEDaSI_
Unexecuted instantiation: dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodKeysFixedI9PHHashMapImPc9HashCRC32ImEEEEEEDaRT_ENKUlSD_E_clIS7_EEDaSD_
Unexecuted instantiation: dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodKeysFixedI9PHHashMapINS4_6UInt72EPc9HashCRC32IS7_EEEEEEDaRT_ENKUlSE_E_clIS8_EEDaSE_
Unexecuted instantiation: dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodKeysFixedI9PHHashMapINS4_6UInt96EPc9HashCRC32IS7_EEEEEEDaRT_ENKUlSE_E_clIS8_EEDaSE_
Unexecuted instantiation: dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodKeysFixedI9PHHashMapINS4_7UInt104EPc9HashCRC32IS7_EEEEEEDaRT_ENKUlSE_E_clIS8_EEDaSE_
Unexecuted instantiation: dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodKeysFixedI9PHHashMapIN4wide7integerILm128EjEEPc9HashCRC32IS9_EEEEEEDaRT_ENKUlSG_E_clISA_EEDaSG_
Unexecuted instantiation: dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodKeysFixedI9PHHashMapINS4_7UInt136EPc9HashCRC32IS7_EEEEEEDaRT_ENKUlSE_E_clIS8_EEDaSE_
Unexecuted instantiation: dependency.cpp:_ZZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodKeysFixedI9PHHashMapIN4wide7integerILm256EjEEPc9HashCRC32IS9_EEEEEEDaRT_ENKUlSG_E_clISA_EEDaSG_
304
305
2.88k
                        if (hash_table.has_null_key_data()) {
306
0
                            _destroy_agg_status(hash_table.template get_null_key_data<
307
0
                                                vectorized::AggregateDataPtr>());
308
0
                        }
309
310
2.88k
                        aggregate_data_container.reset(new AggregateDataContainer(
311
2.88k
                                sizeof(typename HashTableType::key_type),
312
2.88k
                                ((total_size_of_aggregate_states + align_aggregate_states - 1) /
313
2.88k
                                 align_aggregate_states) *
314
2.88k
                                        align_aggregate_states));
315
2.88k
                        agg_method.hash_table.reset(new HashTableType());
316
2.88k
                        return Status::OK();
317
2.88k
                    }},
Unexecuted instantiation: dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized16MethodSerializedI9PHHashMapINS_9StringRefEPc11DefaultHashIS7_vEEEEEEDaRT_
dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodOneNumberIh9PHHashMapIhPc9HashCRC32IhEEEEEEDaRT_
Line
Count
Source
291
96
                    [&](auto& agg_method) {
292
96
                        auto& hash_table = *agg_method.hash_table;
293
96
                        using HashTableType = std::decay_t<decltype(hash_table)>;
294
295
96
                        agg_method.arena.clear();
296
96
                        agg_method.inited_iterator = false;
297
298
96
                        hash_table.for_each_mapped([&](auto& mapped) {
299
96
                            if (mapped) {
300
96
                                _destroy_agg_status(mapped);
301
96
                                mapped = nullptr;
302
96
                            }
303
96
                        });
304
305
96
                        if (hash_table.has_null_key_data()) {
306
0
                            _destroy_agg_status(hash_table.template get_null_key_data<
307
0
                                                vectorized::AggregateDataPtr>());
308
0
                        }
309
310
96
                        aggregate_data_container.reset(new AggregateDataContainer(
311
96
                                sizeof(typename HashTableType::key_type),
312
96
                                ((total_size_of_aggregate_states + align_aggregate_states - 1) /
313
96
                                 align_aggregate_states) *
314
96
                                        align_aggregate_states));
315
96
                        agg_method.hash_table.reset(new HashTableType());
316
96
                        return Status::OK();
317
96
                    }},
Unexecuted instantiation: dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodOneNumberIt9PHHashMapItPc9HashCRC32ItEEEEEEDaRT_
Unexecuted instantiation: dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodOneNumberIj9PHHashMapIjPc9HashCRC32IjEEEEEEDaRT_
dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodOneNumberIm9PHHashMapImPc9HashCRC32ImEEEEEEDaRT_
Line
Count
Source
291
282
                    [&](auto& agg_method) {
292
282
                        auto& hash_table = *agg_method.hash_table;
293
282
                        using HashTableType = std::decay_t<decltype(hash_table)>;
294
295
282
                        agg_method.arena.clear();
296
282
                        agg_method.inited_iterator = false;
297
298
282
                        hash_table.for_each_mapped([&](auto& mapped) {
299
282
                            if (mapped) {
300
282
                                _destroy_agg_status(mapped);
301
282
                                mapped = nullptr;
302
282
                            }
303
282
                        });
304
305
282
                        if (hash_table.has_null_key_data()) {
306
0
                            _destroy_agg_status(hash_table.template get_null_key_data<
307
0
                                                vectorized::AggregateDataPtr>());
308
0
                        }
309
310
282
                        aggregate_data_container.reset(new AggregateDataContainer(
311
282
                                sizeof(typename HashTableType::key_type),
312
282
                                ((total_size_of_aggregate_states + align_aggregate_states - 1) /
313
282
                                 align_aggregate_states) *
314
282
                                        align_aggregate_states));
315
282
                        agg_method.hash_table.reset(new HashTableType());
316
282
                        return Status::OK();
317
282
                    }},
Unexecuted instantiation: dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized19MethodStringNoCacheINS_13StringHashMapIPcNS_9AllocatorILb1ELb1ELb0ENS_22DefaultMemoryAllocatorELb1EEEEEEEEEDaRT_
dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodOneNumberIN4wide7integerILm128EjEE9PHHashMapIS8_Pc9HashCRC32IS8_EEEEEEDaRT_
Line
Count
Source
291
150
                    [&](auto& agg_method) {
292
150
                        auto& hash_table = *agg_method.hash_table;
293
150
                        using HashTableType = std::decay_t<decltype(hash_table)>;
294
295
150
                        agg_method.arena.clear();
296
150
                        agg_method.inited_iterator = false;
297
298
150
                        hash_table.for_each_mapped([&](auto& mapped) {
299
150
                            if (mapped) {
300
150
                                _destroy_agg_status(mapped);
301
150
                                mapped = nullptr;
302
150
                            }
303
150
                        });
304
305
150
                        if (hash_table.has_null_key_data()) {
306
0
                            _destroy_agg_status(hash_table.template get_null_key_data<
307
0
                                                vectorized::AggregateDataPtr>());
308
0
                        }
309
310
150
                        aggregate_data_container.reset(new AggregateDataContainer(
311
150
                                sizeof(typename HashTableType::key_type),
312
150
                                ((total_size_of_aggregate_states + align_aggregate_states - 1) /
313
150
                                 align_aggregate_states) *
314
150
                                        align_aggregate_states));
315
150
                        agg_method.hash_table.reset(new HashTableType());
316
150
                        return Status::OK();
317
150
                    }},
Unexecuted instantiation: dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodOneNumberIN4wide7integerILm256EjEE9PHHashMapIS8_Pc9HashCRC32IS8_EEEEEEDaRT_
dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodOneNumberIj9PHHashMapIjPc14HashMixWrapperIj9HashCRC32IjEEEEEEEDaRT_
Line
Count
Source
291
243
                    [&](auto& agg_method) {
292
243
                        auto& hash_table = *agg_method.hash_table;
293
243
                        using HashTableType = std::decay_t<decltype(hash_table)>;
294
295
243
                        agg_method.arena.clear();
296
243
                        agg_method.inited_iterator = false;
297
298
243
                        hash_table.for_each_mapped([&](auto& mapped) {
299
243
                            if (mapped) {
300
243
                                _destroy_agg_status(mapped);
301
243
                                mapped = nullptr;
302
243
                            }
303
243
                        });
304
305
243
                        if (hash_table.has_null_key_data()) {
306
0
                            _destroy_agg_status(hash_table.template get_null_key_data<
307
0
                                                vectorized::AggregateDataPtr>());
308
0
                        }
309
310
243
                        aggregate_data_container.reset(new AggregateDataContainer(
311
243
                                sizeof(typename HashTableType::key_type),
312
243
                                ((total_size_of_aggregate_states + align_aggregate_states - 1) /
313
243
                                 align_aggregate_states) *
314
243
                                        align_aggregate_states));
315
243
                        agg_method.hash_table.reset(new HashTableType());
316
243
                        return Status::OK();
317
243
                    }},
dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodOneNumberIm9PHHashMapImPc14HashMixWrapperIm9HashCRC32ImEEEEEEEDaRT_
Line
Count
Source
291
824
                    [&](auto& agg_method) {
292
824
                        auto& hash_table = *agg_method.hash_table;
293
824
                        using HashTableType = std::decay_t<decltype(hash_table)>;
294
295
824
                        agg_method.arena.clear();
296
824
                        agg_method.inited_iterator = false;
297
298
824
                        hash_table.for_each_mapped([&](auto& mapped) {
299
824
                            if (mapped) {
300
824
                                _destroy_agg_status(mapped);
301
824
                                mapped = nullptr;
302
824
                            }
303
824
                        });
304
305
824
                        if (hash_table.has_null_key_data()) {
306
0
                            _destroy_agg_status(hash_table.template get_null_key_data<
307
0
                                                vectorized::AggregateDataPtr>());
308
0
                        }
309
310
824
                        aggregate_data_container.reset(new AggregateDataContainer(
311
824
                                sizeof(typename HashTableType::key_type),
312
824
                                ((total_size_of_aggregate_states + align_aggregate_states - 1) /
313
824
                                 align_aggregate_states) *
314
824
                                        align_aggregate_states));
315
824
                        agg_method.hash_table.reset(new HashTableType());
316
824
                        return Status::OK();
317
824
                    }},
dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberIhNS4_15DataWithNullKeyI9PHHashMapIhPc9HashCRC32IhEEEEEEEEEEDaRT_
Line
Count
Source
291
72
                    [&](auto& agg_method) {
292
72
                        auto& hash_table = *agg_method.hash_table;
293
72
                        using HashTableType = std::decay_t<decltype(hash_table)>;
294
295
72
                        agg_method.arena.clear();
296
72
                        agg_method.inited_iterator = false;
297
298
72
                        hash_table.for_each_mapped([&](auto& mapped) {
299
72
                            if (mapped) {
300
72
                                _destroy_agg_status(mapped);
301
72
                                mapped = nullptr;
302
72
                            }
303
72
                        });
304
305
72
                        if (hash_table.has_null_key_data()) {
306
0
                            _destroy_agg_status(hash_table.template get_null_key_data<
307
0
                                                vectorized::AggregateDataPtr>());
308
0
                        }
309
310
72
                        aggregate_data_container.reset(new AggregateDataContainer(
311
72
                                sizeof(typename HashTableType::key_type),
312
72
                                ((total_size_of_aggregate_states + align_aggregate_states - 1) /
313
72
                                 align_aggregate_states) *
314
72
                                        align_aggregate_states));
315
72
                        agg_method.hash_table.reset(new HashTableType());
316
72
                        return Status::OK();
317
72
                    }},
Unexecuted instantiation: dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberItNS4_15DataWithNullKeyI9PHHashMapItPc9HashCRC32ItEEEEEEEEEEDaRT_
dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberIjNS4_15DataWithNullKeyI9PHHashMapIjPc9HashCRC32IjEEEEEEEEEEDaRT_
Line
Count
Source
291
190
                    [&](auto& agg_method) {
292
190
                        auto& hash_table = *agg_method.hash_table;
293
190
                        using HashTableType = std::decay_t<decltype(hash_table)>;
294
295
190
                        agg_method.arena.clear();
296
190
                        agg_method.inited_iterator = false;
297
298
190
                        hash_table.for_each_mapped([&](auto& mapped) {
299
190
                            if (mapped) {
300
190
                                _destroy_agg_status(mapped);
301
190
                                mapped = nullptr;
302
190
                            }
303
190
                        });
304
305
190
                        if (hash_table.has_null_key_data()) {
306
0
                            _destroy_agg_status(hash_table.template get_null_key_data<
307
0
                                                vectorized::AggregateDataPtr>());
308
0
                        }
309
310
190
                        aggregate_data_container.reset(new AggregateDataContainer(
311
190
                                sizeof(typename HashTableType::key_type),
312
190
                                ((total_size_of_aggregate_states + align_aggregate_states - 1) /
313
190
                                 align_aggregate_states) *
314
190
                                        align_aggregate_states));
315
190
                        agg_method.hash_table.reset(new HashTableType());
316
190
                        return Status::OK();
317
190
                    }},
dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberImNS4_15DataWithNullKeyI9PHHashMapImPc9HashCRC32ImEEEEEEEEEEDaRT_
Line
Count
Source
291
206
                    [&](auto& agg_method) {
292
206
                        auto& hash_table = *agg_method.hash_table;
293
206
                        using HashTableType = std::decay_t<decltype(hash_table)>;
294
295
206
                        agg_method.arena.clear();
296
206
                        agg_method.inited_iterator = false;
297
298
206
                        hash_table.for_each_mapped([&](auto& mapped) {
299
206
                            if (mapped) {
300
206
                                _destroy_agg_status(mapped);
301
206
                                mapped = nullptr;
302
206
                            }
303
206
                        });
304
305
206
                        if (hash_table.has_null_key_data()) {
306
0
                            _destroy_agg_status(hash_table.template get_null_key_data<
307
0
                                                vectorized::AggregateDataPtr>());
308
0
                        }
309
310
206
                        aggregate_data_container.reset(new AggregateDataContainer(
311
206
                                sizeof(typename HashTableType::key_type),
312
206
                                ((total_size_of_aggregate_states + align_aggregate_states - 1) /
313
206
                                 align_aggregate_states) *
314
206
                                        align_aggregate_states));
315
206
                        agg_method.hash_table.reset(new HashTableType());
316
206
                        return Status::OK();
317
206
                    }},
dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberIjNS4_15DataWithNullKeyI9PHHashMapIjPc14HashMixWrapperIj9HashCRC32IjEEEEEEEEEEEDaRT_
Line
Count
Source
291
422
                    [&](auto& agg_method) {
292
422
                        auto& hash_table = *agg_method.hash_table;
293
422
                        using HashTableType = std::decay_t<decltype(hash_table)>;
294
295
422
                        agg_method.arena.clear();
296
422
                        agg_method.inited_iterator = false;
297
298
422
                        hash_table.for_each_mapped([&](auto& mapped) {
299
422
                            if (mapped) {
300
422
                                _destroy_agg_status(mapped);
301
422
                                mapped = nullptr;
302
422
                            }
303
422
                        });
304
305
422
                        if (hash_table.has_null_key_data()) {
306
0
                            _destroy_agg_status(hash_table.template get_null_key_data<
307
0
                                                vectorized::AggregateDataPtr>());
308
0
                        }
309
310
422
                        aggregate_data_container.reset(new AggregateDataContainer(
311
422
                                sizeof(typename HashTableType::key_type),
312
422
                                ((total_size_of_aggregate_states + align_aggregate_states - 1) /
313
422
                                 align_aggregate_states) *
314
422
                                        align_aggregate_states));
315
422
                        agg_method.hash_table.reset(new HashTableType());
316
422
                        return Status::OK();
317
422
                    }},
dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberImNS4_15DataWithNullKeyI9PHHashMapImPc14HashMixWrapperIm9HashCRC32ImEEEEEEEEEEEDaRT_
Line
Count
Source
291
403
                    [&](auto& agg_method) {
292
403
                        auto& hash_table = *agg_method.hash_table;
293
403
                        using HashTableType = std::decay_t<decltype(hash_table)>;
294
295
403
                        agg_method.arena.clear();
296
403
                        agg_method.inited_iterator = false;
297
298
403
                        hash_table.for_each_mapped([&](auto& mapped) {
299
403
                            if (mapped) {
300
403
                                _destroy_agg_status(mapped);
301
403
                                mapped = nullptr;
302
403
                            }
303
403
                        });
304
305
403
                        if (hash_table.has_null_key_data()) {
306
0
                            _destroy_agg_status(hash_table.template get_null_key_data<
307
0
                                                vectorized::AggregateDataPtr>());
308
0
                        }
309
310
403
                        aggregate_data_container.reset(new AggregateDataContainer(
311
403
                                sizeof(typename HashTableType::key_type),
312
403
                                ((total_size_of_aggregate_states + align_aggregate_states - 1) /
313
403
                                 align_aggregate_states) *
314
403
                                        align_aggregate_states));
315
403
                        agg_method.hash_table.reset(new HashTableType());
316
403
                        return Status::OK();
317
403
                    }},
Unexecuted instantiation: dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberIN4wide7integerILm128EjEENS4_15DataWithNullKeyI9PHHashMapIS9_Pc9HashCRC32IS9_EEEEEEEEEEDaRT_
Unexecuted instantiation: dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberIN4wide7integerILm256EjEENS4_15DataWithNullKeyI9PHHashMapIS9_Pc9HashCRC32IS9_EEEEEEEEEEDaRT_
Unexecuted instantiation: dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized26MethodSingleNullableColumnINS4_19MethodStringNoCacheINS4_15DataWithNullKeyINS_13StringHashMapIPcNS_9AllocatorILb1ELb1ELb0ENS_22DefaultMemoryAllocatorELb1EEEEEEEEEEEEEDaRT_
Unexecuted instantiation: dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodKeysFixedI9PHHashMapImPc9HashCRC32ImEEEEEEDaRT_
Unexecuted instantiation: dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodKeysFixedI9PHHashMapINS4_6UInt72EPc9HashCRC32IS7_EEEEEEDaRT_
Unexecuted instantiation: dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodKeysFixedI9PHHashMapINS4_6UInt96EPc9HashCRC32IS7_EEEEEEDaRT_
Unexecuted instantiation: dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodKeysFixedI9PHHashMapINS4_7UInt104EPc9HashCRC32IS7_EEEEEEDaRT_
Unexecuted instantiation: dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodKeysFixedI9PHHashMapIN4wide7integerILm128EjEEPc9HashCRC32IS9_EEEEEEDaRT_
Unexecuted instantiation: dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodKeysFixedI9PHHashMapINS4_7UInt136EPc9HashCRC32IS7_EEEEEEDaRT_
Unexecuted instantiation: dependency.cpp:_ZZN5doris8pipeline14AggSharedState16reset_hash_tableEvENK3$_1clINS_10vectorized15MethodKeysFixedI9PHHashMapIN4wide7integerILm256EjEEPc9HashCRC32IS9_EEEEEEDaRT_
318
2.88k
            agg_data->method_variant);
319
2.88k
}
320
321
313
void PartitionedAggSharedState::init_spill_params(size_t spill_partition_count) {
322
313
    partition_count = spill_partition_count;
323
313
    max_partition_index = partition_count - 1;
324
325
10.3k
    for (int i = 0; i < partition_count; ++i) {
326
10.0k
        spill_partitions.emplace_back(std::make_shared<AggSpillPartition>());
327
10.0k
    }
328
313
}
329
330
301
void PartitionedAggSharedState::update_spill_stream_profiles(RuntimeProfile* source_profile) {
331
9.63k
    for (auto& partition : spill_partitions) {
332
9.63k
        if (partition->spilling_stream_) {
333
0
            partition->spilling_stream_->update_shared_profiles(source_profile);
334
0
        }
335
9.63k
        for (auto& stream : partition->spill_streams_) {
336
1.84k
            if (stream) {
337
1.84k
                stream->update_shared_profiles(source_profile);
338
1.84k
            }
339
1.84k
        }
340
9.63k
    }
341
301
}
342
343
Status AggSpillPartition::get_spill_stream(RuntimeState* state, int node_id,
344
                                           RuntimeProfile* profile,
345
4.33k
                                           vectorized::SpillStreamSPtr& spill_stream) {
346
4.33k
    if (spilling_stream_) {
347
2.43k
        spill_stream = spilling_stream_;
348
2.43k
        return Status::OK();
349
2.43k
    }
350
1.89k
    RETURN_IF_ERROR(ExecEnv::GetInstance()->spill_stream_mgr()->register_spill_stream(
351
1.89k
            state, spilling_stream_, print_id(state->query_id()), "agg", node_id,
352
1.89k
            std::numeric_limits<int32_t>::max(), std::numeric_limits<size_t>::max(), profile));
353
1.89k
    spill_streams_.emplace_back(spilling_stream_);
354
1.89k
    spill_stream = spilling_stream_;
355
1.89k
    return Status::OK();
356
1.89k
}
357
7.08k
void AggSpillPartition::close() {
358
7.08k
    if (spilling_stream_) {
359
1
        spilling_stream_.reset();
360
1
    }
361
7.08k
    for (auto& stream : spill_streams_) {
362
5
        (void)ExecEnv::GetInstance()->spill_stream_mgr()->delete_spill_stream(stream);
363
5
    }
364
7.08k
    spill_streams_.clear();
365
7.08k
}
366
367
348
void PartitionedAggSharedState::close() {
368
    // need to use CAS instead of only `if (!is_closed)` statement,
369
    // to avoid concurrent entry of close() both pass the if statement
370
348
    bool false_close = false;
371
348
    if (!is_closed.compare_exchange_strong(false_close, true)) {
372
42
        return;
373
42
    }
374
348
    DCHECK(!false_close && is_closed);
375
7.08k
    for (auto partition : spill_partitions) {
376
7.08k
        partition->close();
377
7.08k
    }
378
306
    spill_partitions.clear();
379
306
}
380
381
15
void SpillSortSharedState::update_spill_stream_profiles(RuntimeProfile* source_profile) {
382
28
    for (auto& stream : sorted_streams) {
383
28
        if (stream) {
384
28
            stream->update_shared_profiles(source_profile);
385
28
        }
386
28
    }
387
15
}
388
389
17
void SpillSortSharedState::close() {
390
    // need to use CAS instead of only `if (!is_closed)` statement,
391
    // to avoid concurrent entry of close() both pass the if statement
392
17
    bool false_close = false;
393
17
    if (!is_closed.compare_exchange_strong(false_close, true)) {
394
1
        return;
395
1
    }
396
17
    DCHECK(!false_close && is_closed);
397
16
    for (auto& stream : sorted_streams) {
398
1
        (void)ExecEnv::GetInstance()->spill_stream_mgr()->delete_spill_stream(stream);
399
1
    }
400
16
    sorted_streams.clear();
401
16
}
402
403
MultiCastSharedState::MultiCastSharedState(ObjectPool* pool, int cast_sender_count, int node_id)
404
1.72k
        : multi_cast_data_streamer(std::make_unique<pipeline::MultiCastDataStreamer>(
405
1.72k
                  pool, cast_sender_count, node_id)) {}
406
407
0
void MultiCastSharedState::update_spill_stream_profiles(RuntimeProfile* source_profile) {}
408
409
106k
int AggSharedState::get_slot_column_id(const vectorized::AggFnEvaluator* evaluator) {
410
106k
    auto ctxs = evaluator->input_exprs_ctxs();
411
18.4E
    CHECK(ctxs.size() == 1 && ctxs[0]->root()->is_slot_ref())
412
18.4E
            << "input_exprs_ctxs is invalid, input_exprs_ctx[0]="
413
18.4E
            << ctxs[0]->root()->debug_string();
414
106k
    return ((vectorized::VSlotRef*)ctxs[0]->root().get())->column_id();
415
106k
}
416
417
2.58M
void AggSharedState::_destroy_agg_status(vectorized::AggregateDataPtr data) {
418
5.41M
    for (int i = 0; i < aggregate_evaluators.size(); ++i) {
419
2.82M
        aggregate_evaluators[i]->function()->destroy(data + offsets_of_aggregate_states[i]);
420
2.82M
    }
421
2.58M
}
422
423
98.9k
LocalExchangeSharedState::~LocalExchangeSharedState() = default;
424
425
1.56k
Status SetSharedState::update_build_not_ignore_null(const vectorized::VExprContextSPtrs& ctxs) {
426
1.56k
    if (ctxs.size() > build_not_ignore_null.size()) {
427
0
        return Status::InternalError("build_not_ignore_null not initialized");
428
0
    }
429
430
4.01k
    for (int i = 0; i < ctxs.size(); ++i) {
431
2.44k
        build_not_ignore_null[i] = build_not_ignore_null[i] || ctxs[i]->root()->is_nullable();
432
2.44k
    }
433
434
1.56k
    return Status::OK();
435
1.56k
}
436
437
2.42k
size_t SetSharedState::get_hash_table_size() const {
438
2.42k
    size_t hash_table_size = 0;
439
2.42k
    std::visit(
440
2.42k
            [&](auto&& arg) {
441
2.42k
                using HashTableCtxType = std::decay_t<decltype(arg)>;
442
2.42k
                if constexpr (!std::is_same_v<HashTableCtxType, std::monostate>) {
443
2.42k
                    hash_table_size = arg.hash_table->size();
444
2.42k
                }
445
2.42k
            },
Unexecuted instantiation: dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRSt9monostateEEDaOT_
dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized16MethodSerializedI9PHHashMapINS_9StringRefENS_14RowRefWithFlagE11DefaultHashIS7_vEEEEEEDaOT_
Line
Count
Source
440
1.10k
            [&](auto&& arg) {
441
1.10k
                using HashTableCtxType = std::decay_t<decltype(arg)>;
442
1.10k
                if constexpr (!std::is_same_v<HashTableCtxType, std::monostate>) {
443
1.10k
                    hash_table_size = arg.hash_table->size();
444
1.10k
                }
445
1.10k
            },
dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized19MethodStringNoCacheI9PHHashMapINS_9StringRefENS_14RowRefWithFlagE11DefaultHashIS7_vEEEEEEDaOT_
Line
Count
Source
440
260
            [&](auto&& arg) {
441
260
                using HashTableCtxType = std::decay_t<decltype(arg)>;
442
260
                if constexpr (!std::is_same_v<HashTableCtxType, std::monostate>) {
443
260
                    hash_table_size = arg.hash_table->size();
444
260
                }
445
260
            },
dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberIhNS4_15DataWithNullKeyI9PHHashMapIhNS_14RowRefWithFlagE9HashCRC32IhEEEEEEEEEEDaOT_
Line
Count
Source
440
57
            [&](auto&& arg) {
441
57
                using HashTableCtxType = std::decay_t<decltype(arg)>;
442
57
                if constexpr (!std::is_same_v<HashTableCtxType, std::monostate>) {
443
57
                    hash_table_size = arg.hash_table->size();
444
57
                }
445
57
            },
Unexecuted instantiation: dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberItNS4_15DataWithNullKeyI9PHHashMapItNS_14RowRefWithFlagE9HashCRC32ItEEEEEEEEEEDaOT_
dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberIjNS4_15DataWithNullKeyI9PHHashMapIjNS_14RowRefWithFlagE9HashCRC32IjEEEEEEEEEEDaOT_
Line
Count
Source
440
696
            [&](auto&& arg) {
441
696
                using HashTableCtxType = std::decay_t<decltype(arg)>;
442
696
                if constexpr (!std::is_same_v<HashTableCtxType, std::monostate>) {
443
696
                    hash_table_size = arg.hash_table->size();
444
696
                }
445
696
            },
dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberImNS4_15DataWithNullKeyI9PHHashMapImNS_14RowRefWithFlagE9HashCRC32ImEEEEEEEEEEDaOT_
Line
Count
Source
440
85
            [&](auto&& arg) {
441
85
                using HashTableCtxType = std::decay_t<decltype(arg)>;
442
85
                if constexpr (!std::is_same_v<HashTableCtxType, std::monostate>) {
443
85
                    hash_table_size = arg.hash_table->size();
444
85
                }
445
85
            },
dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberIN4wide7integerILm128EjEENS4_15DataWithNullKeyI9PHHashMapIS9_NS_14RowRefWithFlagE9HashCRC32IS9_EEEEEEEEEEDaOT_
Line
Count
Source
440
12
            [&](auto&& arg) {
441
12
                using HashTableCtxType = std::decay_t<decltype(arg)>;
442
12
                if constexpr (!std::is_same_v<HashTableCtxType, std::monostate>) {
443
12
                    hash_table_size = arg.hash_table->size();
444
12
                }
445
12
            },
Unexecuted instantiation: dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized26MethodSingleNullableColumnINS4_15MethodOneNumberIN4wide7integerILm256EjEENS4_15DataWithNullKeyI9PHHashMapIS9_NS_14RowRefWithFlagE9HashCRC32IS9_EEEEEEEEEEDaOT_
Unexecuted instantiation: dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized15MethodOneNumberIh9PHHashMapIhNS_14RowRefWithFlagE9HashCRC32IhEEEEEEDaOT_
Unexecuted instantiation: dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized15MethodOneNumberIt9PHHashMapItNS_14RowRefWithFlagE9HashCRC32ItEEEEEEDaOT_
dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized15MethodOneNumberIj9PHHashMapIjNS_14RowRefWithFlagE9HashCRC32IjEEEEEEDaOT_
Line
Count
Source
440
30
            [&](auto&& arg) {
441
30
                using HashTableCtxType = std::decay_t<decltype(arg)>;
442
30
                if constexpr (!std::is_same_v<HashTableCtxType, std::monostate>) {
443
30
                    hash_table_size = arg.hash_table->size();
444
30
                }
445
30
            },
dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized15MethodOneNumberIm9PHHashMapImNS_14RowRefWithFlagE9HashCRC32ImEEEEEEDaOT_
Line
Count
Source
440
16
            [&](auto&& arg) {
441
16
                using HashTableCtxType = std::decay_t<decltype(arg)>;
442
16
                if constexpr (!std::is_same_v<HashTableCtxType, std::monostate>) {
443
16
                    hash_table_size = arg.hash_table->size();
444
16
                }
445
16
            },
Unexecuted instantiation: dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized15MethodOneNumberIN4wide7integerILm128EjEE9PHHashMapIS8_NS_14RowRefWithFlagE9HashCRC32IS8_EEEEEEDaOT_
Unexecuted instantiation: dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized15MethodOneNumberIN4wide7integerILm256EjEE9PHHashMapIS8_NS_14RowRefWithFlagE9HashCRC32IS8_EEEEEEDaOT_
dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized15MethodKeysFixedI9PHHashMapImNS_14RowRefWithFlagE9HashCRC32ImEEEEEEDaOT_
Line
Count
Source
440
24
            [&](auto&& arg) {
441
24
                using HashTableCtxType = std::decay_t<decltype(arg)>;
442
24
                if constexpr (!std::is_same_v<HashTableCtxType, std::monostate>) {
443
24
                    hash_table_size = arg.hash_table->size();
444
24
                }
445
24
            },
dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized15MethodKeysFixedI9PHHashMapINS4_6UInt72ENS_14RowRefWithFlagE9HashCRC32IS7_EEEEEEDaOT_
Line
Count
Source
440
21
            [&](auto&& arg) {
441
21
                using HashTableCtxType = std::decay_t<decltype(arg)>;
442
21
                if constexpr (!std::is_same_v<HashTableCtxType, std::monostate>) {
443
21
                    hash_table_size = arg.hash_table->size();
444
21
                }
445
21
            },
dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized15MethodKeysFixedI9PHHashMapINS4_6UInt96ENS_14RowRefWithFlagE9HashCRC32IS7_EEEEEEDaOT_
Line
Count
Source
440
12
            [&](auto&& arg) {
441
12
                using HashTableCtxType = std::decay_t<decltype(arg)>;
442
12
                if constexpr (!std::is_same_v<HashTableCtxType, std::monostate>) {
443
12
                    hash_table_size = arg.hash_table->size();
444
12
                }
445
12
            },
dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized15MethodKeysFixedI9PHHashMapINS4_7UInt104ENS_14RowRefWithFlagE9HashCRC32IS7_EEEEEEDaOT_
Line
Count
Source
440
63
            [&](auto&& arg) {
441
63
                using HashTableCtxType = std::decay_t<decltype(arg)>;
442
63
                if constexpr (!std::is_same_v<HashTableCtxType, std::monostate>) {
443
63
                    hash_table_size = arg.hash_table->size();
444
63
                }
445
63
            },
Unexecuted instantiation: dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized15MethodKeysFixedI9PHHashMapIN4wide7integerILm128EjEENS_14RowRefWithFlagE9HashCRC32IS9_EEEEEEDaOT_
dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized15MethodKeysFixedI9PHHashMapIN4wide7integerILm256EjEENS_14RowRefWithFlagE9HashCRC32IS9_EEEEEEDaOT_
Line
Count
Source
440
4
            [&](auto&& arg) {
441
4
                using HashTableCtxType = std::decay_t<decltype(arg)>;
442
4
                if constexpr (!std::is_same_v<HashTableCtxType, std::monostate>) {
443
4
                    hash_table_size = arg.hash_table->size();
444
4
                }
445
4
            },
dependency.cpp:_ZZNK5doris8pipeline14SetSharedState19get_hash_table_sizeEvENK3$_0clIRNS_10vectorized15MethodKeysFixedI9PHHashMapINS4_7UInt136ENS_14RowRefWithFlagE9HashCRC32IS7_EEEEEEDaOT_
Line
Count
Source
440
38
            [&](auto&& arg) {
441
38
                using HashTableCtxType = std::decay_t<decltype(arg)>;
442
38
                if constexpr (!std::is_same_v<HashTableCtxType, std::monostate>) {
443
38
                    hash_table_size = arg.hash_table->size();
444
38
                }
445
38
            },
446
2.42k
            hash_table_variants->method_variant);
447
2.42k
    return hash_table_size;
448
2.42k
}
449
450
723
Status SetSharedState::hash_table_init() {
451
723
    std::vector<vectorized::DataTypePtr> data_types;
452
1.88k
    for (size_t i = 0; i != child_exprs_lists[0].size(); ++i) {
453
1.15k
        auto& ctx = child_exprs_lists[0][i];
454
1.15k
        auto data_type = ctx->root()->data_type();
455
1.15k
        if (build_not_ignore_null[i]) {
456
993
            data_type = vectorized::make_nullable(data_type);
457
993
        }
458
1.15k
        data_types.emplace_back(std::move(data_type));
459
1.15k
    }
460
723
    return init_hash_method<SetDataVariants>(hash_table_variants.get(), data_types, true);
461
723
}
462
463
void AggSharedState::refresh_top_limit(size_t row_id,
464
553
                                       const vectorized::ColumnRawPtrs& key_columns) {
465
1.79k
    for (int j = 0; j < key_columns.size(); ++j) {
466
1.23k
        limit_columns[j]->insert_from(*key_columns[j], row_id);
467
1.23k
    }
468
553
    limit_heap.emplace(limit_columns[0]->size() - 1, limit_columns, order_directions,
469
553
                       null_directions);
470
471
553
    limit_heap.pop();
472
553
    limit_columns_min = limit_heap.top()._row_id;
473
553
}
474
475
} // namespace doris::pipeline