Coverage Report

Created: 2026-03-30 19:02

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
be/src/runtime/runtime_state.cpp
Line
Count
Source
1
// Licensed to the Apache Software Foundation (ASF) under one
2
// or more contributor license agreements.  See the NOTICE file
3
// distributed with this work for additional information
4
// regarding copyright ownership.  The ASF licenses this file
5
// to you under the Apache License, Version 2.0 (the
6
// "License"); you may not use this file except in compliance
7
// with the License.  You may obtain a copy of the License at
8
//
9
//   http://www.apache.org/licenses/LICENSE-2.0
10
//
11
// Unless required by applicable law or agreed to in writing,
12
// software distributed under the License is distributed on an
13
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
// KIND, either express or implied.  See the License for the
15
// specific language governing permissions and limitations
16
// under the License.
17
// This file is copied from
18
// https://github.com/apache/impala/blob/branch-2.9.0/be/src/runtime/runtime-state.cpp
19
// and modified by Doris
20
21
#include "runtime/runtime_state.h"
22
23
#include <fmt/format.h>
24
#include <gen_cpp/PaloInternalService_types.h>
25
#include <gen_cpp/Types_types.h>
26
#include <glog/logging.h>
27
28
#include <fstream>
29
#include <memory>
30
#include <string>
31
32
#include "cloud/cloud_storage_engine.h"
33
#include "cloud/config.h"
34
#include "common/config.h"
35
#include "common/logging.h"
36
#include "common/object_pool.h"
37
#include "common/status.h"
38
#include "core/value/vdatetime_value.h"
39
#include "exec/operator/operator.h"
40
#include "exec/pipeline/pipeline_fragment_context.h"
41
#include "exec/pipeline/pipeline_task.h"
42
#include "exec/runtime_filter/runtime_filter_consumer.h"
43
#include "exec/runtime_filter/runtime_filter_mgr.h"
44
#include "exec/runtime_filter/runtime_filter_producer.h"
45
#include "exprs/function/cast/cast_to_date_or_datetime_impl.hpp"
46
#include "io/fs/s3_file_system.h"
47
#include "load/load_path_mgr.h"
48
#include "runtime/exec_env.h"
49
#include "runtime/fragment_mgr.h"
50
#include "runtime/memory/mem_tracker_limiter.h"
51
#include "runtime/query_context.h"
52
#include "runtime/thread_context.h"
53
#include "storage/id_manager.h"
54
#include "storage/storage_engine.h"
55
#include "util/timezone_utils.h"
56
#include "util/uid_util.h"
57
58
namespace doris {
59
#include "common/compile_check_begin.h"
60
using namespace ErrorCode;
61
62
RuntimeState::RuntimeState(const TPlanFragmentExecParams& fragment_exec_params,
63
                           const TQueryOptions& query_options, const TQueryGlobals& query_globals,
64
                           ExecEnv* exec_env, QueryContext* ctx,
65
                           const std::shared_ptr<MemTrackerLimiter>& query_mem_tracker)
66
0
        : _profile("Fragment " + print_id(fragment_exec_params.fragment_instance_id)),
67
0
          _load_channel_profile("<unnamed>"),
68
0
          _obj_pool(new ObjectPool()),
69
0
          _unreported_error_idx(0),
70
0
          _query_id(fragment_exec_params.query_id),
71
0
          _per_fragment_instance_idx(0),
72
0
          _num_rows_load_total(0),
73
0
          _num_rows_load_filtered(0),
74
0
          _num_rows_load_unselected(0),
75
0
          _num_print_error_rows(0),
76
0
          _num_bytes_load_total(0),
77
0
          _num_finished_scan_range(0),
78
0
          _query_ctx(ctx) {
79
0
    Status status =
80
0
            init(fragment_exec_params.fragment_instance_id, query_options, query_globals, exec_env);
81
0
    DCHECK(status.ok());
82
0
    _query_mem_tracker = query_mem_tracker;
83
0
    DCHECK(_query_mem_tracker != nullptr);
84
0
}
85
86
RuntimeState::RuntimeState(const TUniqueId& instance_id, const TUniqueId& query_id,
87
                           int32_t fragment_id, const TQueryOptions& query_options,
88
                           const TQueryGlobals& query_globals, ExecEnv* exec_env, QueryContext* ctx)
89
80
        : _profile("Fragment " + print_id(instance_id)),
90
80
          _load_channel_profile("<unnamed>"),
91
80
          _obj_pool(new ObjectPool()),
92
80
          _unreported_error_idx(0),
93
80
          _query_id(query_id),
94
80
          _fragment_id(fragment_id),
95
80
          _per_fragment_instance_idx(0),
96
80
          _num_rows_load_total(0),
97
80
          _num_rows_load_filtered(0),
98
80
          _num_rows_load_unselected(0),
99
80
          _num_rows_filtered_in_strict_mode_partial_update(0),
100
80
          _num_print_error_rows(0),
101
80
          _num_bytes_load_total(0),
102
80
          _num_finished_scan_range(0),
103
80
          _query_ctx(ctx) {
104
80
    [[maybe_unused]] auto status = init(instance_id, query_options, query_globals, exec_env);
105
80
    DCHECK(status.ok());
106
80
    _query_mem_tracker = ctx->query_mem_tracker();
107
80
}
108
109
RuntimeState::RuntimeState(const TUniqueId& query_id, int32_t fragment_id,
110
                           const TQueryOptions& query_options, const TQueryGlobals& query_globals,
111
                           ExecEnv* exec_env, QueryContext* ctx)
112
112
        : _profile(fmt::format("PipelineX(fragment_id={})", fragment_id)),
113
112
          _load_channel_profile("<unnamed>"),
114
112
          _obj_pool(new ObjectPool()),
115
112
          _unreported_error_idx(0),
116
112
          _query_id(query_id),
117
112
          _fragment_id(fragment_id),
118
112
          _per_fragment_instance_idx(0),
119
112
          _num_rows_load_total(0),
120
112
          _num_rows_load_filtered(0),
121
112
          _num_rows_load_unselected(0),
122
112
          _num_rows_filtered_in_strict_mode_partial_update(0),
123
112
          _num_print_error_rows(0),
124
112
          _num_bytes_load_total(0),
125
112
          _num_finished_scan_range(0),
126
112
          _query_ctx(ctx) {
127
    // TODO: do we really need instance id?
128
112
    Status status = init(TUniqueId(), query_options, query_globals, exec_env);
129
112
    DCHECK(status.ok());
130
112
    _query_mem_tracker = ctx->query_mem_tracker();
131
112
}
132
133
RuntimeState::RuntimeState(const TUniqueId& query_id, int32_t fragment_id,
134
                           const TQueryOptions& query_options, const TQueryGlobals& query_globals,
135
                           ExecEnv* exec_env,
136
                           const std::shared_ptr<MemTrackerLimiter>& query_mem_tracker)
137
0
        : _profile(fmt::format("PipelineX(fragment_id={})", fragment_id)),
138
0
          _load_channel_profile("<unnamed>"),
139
0
          _obj_pool(new ObjectPool()),
140
0
          _unreported_error_idx(0),
141
0
          _query_id(query_id),
142
0
          _fragment_id(fragment_id),
143
0
          _per_fragment_instance_idx(0),
144
0
          _num_rows_load_total(0),
145
0
          _num_rows_load_filtered(0),
146
0
          _num_rows_load_unselected(0),
147
0
          _num_rows_filtered_in_strict_mode_partial_update(0),
148
0
          _num_print_error_rows(0),
149
0
          _num_bytes_load_total(0),
150
0
          _num_finished_scan_range(0) {
151
0
    Status status = init(TUniqueId(), query_options, query_globals, exec_env);
152
0
    DCHECK(status.ok());
153
0
    _query_mem_tracker = query_mem_tracker;
154
0
    DCHECK(_query_mem_tracker != nullptr);
155
0
}
156
157
RuntimeState::RuntimeState(const TQueryOptions& query_options, const TQueryGlobals& query_globals)
158
49.3k
        : _profile("<unnamed>"),
159
49.3k
          _load_channel_profile("<unnamed>"),
160
49.3k
          _obj_pool(new ObjectPool()),
161
49.3k
          _unreported_error_idx(0),
162
49.3k
          _per_fragment_instance_idx(0) {
163
49.3k
    Status status = init(TUniqueId(), query_options, query_globals, nullptr);
164
49.3k
    _exec_env = ExecEnv::GetInstance();
165
49.3k
    init_mem_trackers("<unnamed>");
166
49.3k
    DCHECK(status.ok());
167
49.3k
}
168
169
RuntimeState::RuntimeState()
170
130k
        : _profile("<unnamed>"),
171
130k
          _load_channel_profile("<unnamed>"),
172
130k
          _obj_pool(new ObjectPool()),
173
130k
          _unreported_error_idx(0),
174
130k
          _per_fragment_instance_idx(0) {
175
130k
    _query_options.batch_size = DEFAULT_BATCH_SIZE;
176
130k
    _query_options.be_exec_version = BeExecVersionManager::get_newest_version();
177
130k
    _timezone = TimezoneUtils::default_time_zone;
178
130k
    _timestamp_ms = 0;
179
130k
    _nano_seconds = 0;
180
130k
    TimezoneUtils::find_cctz_time_zone(_timezone, _timezone_obj);
181
130k
    _exec_env = ExecEnv::GetInstance();
182
130k
    init_mem_trackers("<unnamed>");
183
130k
}
184
185
179k
RuntimeState::~RuntimeState() {
186
179k
    SCOPED_SWITCH_THREAD_MEM_TRACKER_LIMITER(_query_mem_tracker);
187
    // close error log file
188
179k
    if (_error_log_file != nullptr && _error_log_file->is_open()) {
189
0
        _error_log_file->close();
190
0
    }
191
179k
    _obj_pool->clear();
192
179k
}
193
194
2
const std::set<int>& RuntimeState::get_deregister_runtime_filter() const {
195
2
    return _registered_runtime_filter_ids;
196
2
}
197
198
2
void RuntimeState::merge_register_runtime_filter(const std::set<int>& runtime_filter_ids) {
199
2
    _registered_runtime_filter_ids.insert(runtime_filter_ids.begin(), runtime_filter_ids.end());
200
2
}
201
202
Status RuntimeState::init(const TUniqueId& fragment_instance_id, const TQueryOptions& query_options,
203
49.5k
                          const TQueryGlobals& query_globals, ExecEnv* exec_env) {
204
49.5k
    _fragment_instance_id = fragment_instance_id;
205
49.5k
    _query_options = query_options;
206
49.5k
    _lc_time_names = query_globals.lc_time_names;
207
49.5k
    if (query_globals.__isset.time_zone && query_globals.__isset.nano_seconds) {
208
49.2k
        _timezone = query_globals.time_zone;
209
49.2k
        _timestamp_ms = query_globals.timestamp_ms;
210
49.2k
        _nano_seconds = query_globals.nano_seconds;
211
49.2k
    } else if (query_globals.__isset.time_zone) {
212
0
        _timezone = query_globals.time_zone;
213
0
        _timestamp_ms = query_globals.timestamp_ms;
214
0
        _nano_seconds = 0;
215
313
    } else if (!query_globals.now_string.empty()) {
216
0
        _timezone = TimezoneUtils::default_time_zone;
217
0
        VecDateTimeValue dt;
218
0
        CastParameters params;
219
0
        DORIS_CHECK((CastToDateOrDatetime::from_string_strict_mode<DatelikeParseMode::STRICT,
220
0
                                                                   DatelikeTargetType::DATE_TIME>(
221
0
                {query_globals.now_string.c_str(), query_globals.now_string.size()}, dt, nullptr,
222
0
                params)));
223
0
        int64_t timestamp;
224
0
        dt.unix_timestamp(&timestamp, _timezone);
225
0
        _timestamp_ms = timestamp * 1000;
226
0
        _nano_seconds = 0;
227
313
    } else {
228
        //Unit test may set into here
229
313
        _timezone = TimezoneUtils::default_time_zone;
230
313
        _timestamp_ms = 0;
231
313
        _nano_seconds = 0;
232
313
    }
233
49.5k
    TimezoneUtils::find_cctz_time_zone(_timezone, _timezone_obj);
234
235
49.5k
    if (query_globals.__isset.load_zero_tolerance) {
236
49.5k
        _load_zero_tolerance = query_globals.load_zero_tolerance;
237
49.5k
    }
238
239
49.5k
    _exec_env = exec_env;
240
241
49.5k
    if (_query_options.max_errors <= 0) {
242
        // TODO: fix linker error and uncomment this
243
        //_query_options.max_errors = config::max_errors;
244
49.5k
        _query_options.max_errors = 100;
245
49.5k
    }
246
247
49.5k
    if (_query_options.batch_size <= 0) {
248
49.4k
        _query_options.batch_size = DEFAULT_BATCH_SIZE;
249
49.4k
    }
250
251
49.5k
    _db_name = "insert_stmt";
252
49.5k
    _import_label = print_id(fragment_instance_id);
253
254
49.5k
    _profile_level = query_options.__isset.profile_level ? query_options.profile_level : 2;
255
256
49.5k
    return Status::OK();
257
49.5k
}
258
259
0
std::weak_ptr<QueryContext> RuntimeState::get_query_ctx_weak() {
260
0
    return _exec_env->fragment_mgr()->get_query_ctx(_query_ctx->query_id());
261
0
}
262
263
179k
void RuntimeState::init_mem_trackers(const std::string& name, const TUniqueId& id) {
264
179k
    _query_mem_tracker = MemTrackerLimiter::create_shared(
265
179k
            MemTrackerLimiter::Type::OTHER, fmt::format("{}#Id={}", name, print_id(id)));
266
179k
}
267
268
173
std::shared_ptr<MemTrackerLimiter> RuntimeState::query_mem_tracker() const {
269
173
    CHECK(_query_mem_tracker != nullptr);
270
173
    return _query_mem_tracker;
271
173
}
272
273
11
WorkloadGroupPtr RuntimeState::workload_group() {
274
11
    return _query_ctx->workload_group();
275
11
}
276
277
0
bool RuntimeState::log_error(const std::string& error) {
278
0
    std::lock_guard<std::mutex> l(_error_log_lock);
279
280
0
    if (_error_log.size() < _query_options.max_errors) {
281
0
        _error_log.push_back(error);
282
0
        return true;
283
0
    }
284
285
0
    return false;
286
0
}
287
288
0
void RuntimeState::get_unreported_errors(std::vector<std::string>* new_errors) {
289
0
    std::lock_guard<std::mutex> l(_error_log_lock);
290
291
0
    if (_unreported_error_idx < _error_log.size()) {
292
0
        new_errors->assign(_error_log.begin() + _unreported_error_idx, _error_log.end());
293
0
        _unreported_error_idx = (int)_error_log.size();
294
0
    }
295
0
}
296
297
1.10M
bool RuntimeState::is_cancelled() const {
298
    // Maybe we should just return _is_cancelled.load()
299
1.10M
    return !_exec_status.ok() || (_query_ctx && _query_ctx->is_cancelled());
300
1.10M
}
301
302
0
Status RuntimeState::cancel_reason() const {
303
0
    if (!_exec_status.ok()) {
304
0
        return _exec_status.status();
305
0
    }
306
307
0
    if (_query_ctx) {
308
0
        return _query_ctx->exec_status();
309
0
    }
310
311
0
    return Status::Cancelled("Query cancelled");
312
0
}
313
314
const int64_t MAX_ERROR_NUM = 50;
315
316
0
Status RuntimeState::create_error_log_file() {
317
0
    if (config::save_load_error_log_to_s3 && config::is_cloud_mode()) {
318
0
        _s3_error_fs = std::dynamic_pointer_cast<io::S3FileSystem>(
319
0
                ExecEnv::GetInstance()->storage_engine().to_cloud().latest_fs());
320
0
        if (_s3_error_fs) {
321
0
            std::stringstream ss;
322
            // https://dev.mysql.com/doc/dev/mysql-server/latest/page_protocol_basic_err_packet.html
323
            // shorten the path as much as possible to prevent the length of the presigned URL from
324
            // exceeding the MySQL error packet size limit
325
0
            ss << "error_log/" << std::hex << _fragment_instance_id.lo;
326
0
            _s3_error_log_file_path = ss.str();
327
0
        }
328
0
    }
329
330
0
    static_cast<void>(_exec_env->load_path_mgr()->get_load_error_file_name(
331
0
            _db_name, _import_label, _fragment_instance_id, &_error_log_file_path));
332
0
    std::string error_log_absolute_path =
333
0
            _exec_env->load_path_mgr()->get_load_error_absolute_path(_error_log_file_path);
334
0
    _error_log_file = std::make_unique<std::ofstream>(error_log_absolute_path, std::ifstream::out);
335
0
    if (!_error_log_file->is_open()) {
336
0
        std::stringstream error_msg;
337
0
        error_msg << "Fail to open error file: [" << _error_log_file_path << "].";
338
0
        LOG(WARNING) << error_msg.str();
339
0
        return Status::InternalError(error_msg.str());
340
0
    }
341
0
    LOG(INFO) << "create error log file: " << _error_log_file_path
342
0
              << ", query id: " << print_id(_query_id)
343
0
              << ", fragment instance id: " << print_id(_fragment_instance_id);
344
345
0
    return Status::OK();
346
0
}
347
348
Status RuntimeState::append_error_msg_to_file(std::function<std::string()> line,
349
0
                                              std::function<std::string()> error_msg) {
350
0
    if (query_type() != TQueryType::LOAD) {
351
0
        return Status::OK();
352
0
    }
353
    // If file haven't been opened, open it here
354
0
    if (_error_log_file == nullptr) {
355
0
        Status status = create_error_log_file();
356
0
        if (!status.ok()) {
357
0
            LOG(WARNING) << "Create error file log failed. because: " << status;
358
0
            if (_error_log_file != nullptr) {
359
0
                _error_log_file->close();
360
0
            }
361
0
            return status;
362
0
        }
363
        // record the first error message if the file is just created
364
0
        _first_error_msg = error_msg() + ". Src line: " + line();
365
0
        LOG(INFO) << "The first error message: " << _first_error_msg;
366
0
    }
367
    // If num of printed error row exceeds the limit, don't add error messages to error log file any more
368
0
    if (_num_print_error_rows.fetch_add(1, std::memory_order_relaxed) > MAX_ERROR_NUM) {
369
        // if _load_zero_tolerance, return Error to stop the load process immediately.
370
0
        if (_load_zero_tolerance) {
371
0
            return Status::DataQualityError(
372
0
                    "Encountered unqualified data, stop processing. Please check if the source "
373
0
                    "data matches the schema, and consider disabling strict mode or increasing "
374
0
                    "max_filter_ratio.");
375
0
        }
376
0
        return Status::OK();
377
0
    }
378
379
0
    fmt::memory_buffer out;
380
    // Note: export reason first in case src line too long and be truncated.
381
0
    fmt::format_to(out, "Reason: {}. src line [{}]; ", error_msg(), line());
382
383
0
    size_t error_row_size = out.size();
384
0
    if (error_row_size > 0) {
385
0
        if (error_row_size > config::load_error_log_limit_bytes) {
386
0
            fmt::memory_buffer limit_byte_out;
387
0
            limit_byte_out.append(out.data(), out.data() + config::load_error_log_limit_bytes);
388
0
            (*_error_log_file) << fmt::to_string(limit_byte_out) + "error log is too long"
389
0
                               << std::endl;
390
0
        } else {
391
0
            (*_error_log_file) << fmt::to_string(out) << std::endl;
392
0
        }
393
0
    }
394
395
0
    return Status::OK();
396
0
}
397
398
0
std::string RuntimeState::get_error_log_file_path() {
399
0
    DBUG_EXECUTE_IF("RuntimeState::get_error_log_file_path.block", {
400
0
        if (!_error_log_file_path.empty()) {
401
0
            std::this_thread::sleep_for(std::chrono::seconds(1));
402
0
        }
403
0
    });
404
0
    std::lock_guard<std::mutex> l(_s3_error_log_file_lock);
405
0
    if (_s3_error_fs && _error_log_file && _error_log_file->is_open()) {
406
        // close error log file
407
0
        _error_log_file->close();
408
0
        std::string error_log_absolute_path =
409
0
                _exec_env->load_path_mgr()->get_load_error_absolute_path(_error_log_file_path);
410
        // upload error log file to s3
411
0
        Status st = _s3_error_fs->upload(error_log_absolute_path, _s3_error_log_file_path);
412
0
        if (!st.ok()) {
413
            // upload failed and return local error log file path
414
0
            LOG(WARNING) << "Fail to upload error file to s3, error_log_file_path="
415
0
                         << _error_log_file_path << ", error=" << st;
416
0
            return _error_log_file_path;
417
0
        }
418
        // expiration must be less than a week (in seconds) for presigned url
419
0
        static const unsigned EXPIRATION_SECONDS = 7 * 24 * 60 * 60 - 1;
420
        // Use public or private endpoint based on configuration
421
0
        _error_log_file_path =
422
0
                _s3_error_fs->generate_presigned_url(_s3_error_log_file_path, EXPIRATION_SECONDS,
423
0
                                                     config::use_public_endpoint_for_error_log);
424
0
    }
425
0
    return _error_log_file_path;
426
0
}
427
428
72.3k
void RuntimeState::resize_op_id_to_local_state(int operator_size) {
429
72.3k
    _op_id_to_local_state.resize(-operator_size);
430
72.3k
}
431
432
void RuntimeState::emplace_local_state(int id,
433
24.3k
                                       std::unique_ptr<doris::PipelineXLocalStateBase> state) {
434
24.3k
    id = -id;
435
24.3k
    DCHECK_LT(id, _op_id_to_local_state.size())
436
0
            << state->parent()->get_name() << " node id = " << state->parent()->node_id();
437
24.3k
    DCHECK(!_op_id_to_local_state[id]);
438
24.3k
    _op_id_to_local_state[id] = std::move(state);
439
24.3k
}
440
441
2.82M
doris::PipelineXLocalStateBase* RuntimeState::get_local_state(int id) {
442
2.82M
    DCHECK_GT(_op_id_to_local_state.size(), -id);
443
2.82M
    return _op_id_to_local_state[-id].get();
444
2.82M
}
445
446
24.0k
Result<RuntimeState::LocalState*> RuntimeState::get_local_state_result(int id) {
447
24.0k
    id = -id;
448
24.0k
    if (id >= _op_id_to_local_state.size()) {
449
0
        return ResultError(Status::InternalError("get_local_state out of range size:{} , id:{}",
450
0
                                                 _op_id_to_local_state.size(), id));
451
0
    }
452
24.0k
    if (!_op_id_to_local_state[id]) {
453
0
        return ResultError(Status::InternalError("get_local_state id:{} is null", id));
454
0
    }
455
24.0k
    return _op_id_to_local_state[id].get();
456
24.0k
};
457
458
void RuntimeState::emplace_sink_local_state(
459
72.3k
        int id, std::unique_ptr<doris::PipelineXSinkLocalStateBase> state) {
460
72.3k
    DCHECK(!_sink_local_state) << " id=" << id << " state: " << state->debug_string(0);
461
72.3k
    _sink_local_state = std::move(state);
462
72.3k
}
463
464
440k
doris::PipelineXSinkLocalStateBase* RuntimeState::get_sink_local_state() {
465
440k
    return _sink_local_state.get();
466
440k
}
467
468
1.48M
Result<RuntimeState::SinkLocalState*> RuntimeState::get_sink_local_state_result() {
469
1.48M
    if (!_sink_local_state) {
470
0
        return ResultError(Status::InternalError("_op_id_to_sink_local_state not exist"));
471
0
    }
472
1.48M
    return _sink_local_state.get();
473
1.48M
}
474
475
0
bool RuntimeState::enable_page_cache() const {
476
0
    return !config::disable_storage_page_cache &&
477
0
           (_query_options.__isset.enable_page_cache && _query_options.enable_page_cache);
478
0
}
479
480
60
RuntimeFilterMgr* RuntimeState::global_runtime_filter_mgr() {
481
60
    return _query_ctx->runtime_filter_mgr();
482
60
}
483
484
Status RuntimeState::register_producer_runtime_filter(
485
29
        const TRuntimeFilterDesc& desc, std::shared_ptr<RuntimeFilterProducer>* producer_filter) {
486
29
    _registered_runtime_filter_ids.insert(desc.filter_id);
487
    // Producers are created by local runtime filter mgr and shared by global runtime filter manager.
488
    // When RF is published, consumers in both global and local RF mgr will be found.
489
29
    RETURN_IF_ERROR(local_runtime_filter_mgr()->register_producer_filter(_query_ctx, desc,
490
29
                                                                         producer_filter));
491
    // Stamp the producer with the current recursive CTE stage so that outgoing merge RPCs
492
    // carry the correct round number and stale messages from old rounds are discarded.
493
    // PFC must still be alive: this runs inside a pipeline task, so the execution context
494
    // cannot have expired yet.
495
    // In unit-test scenarios the task execution context is never set (no PipelineFragmentContext
496
    // exists), so skip the stage stamping — the default stage (0) is correct.
497
29
    if (task_execution_context_inited()) {
498
2
        auto pfc = std::static_pointer_cast<PipelineFragmentContext>(
499
2
                get_task_execution_context().lock());
500
2
        DORIS_CHECK(pfc);
501
2
        (*producer_filter)->set_stage(pfc->rec_cte_stage());
502
2
    }
503
29
    RETURN_IF_ERROR(global_runtime_filter_mgr()->register_local_merger_producer_filter(
504
29
            _query_ctx, desc, *producer_filter));
505
29
    return Status::OK();
506
29
}
507
508
Status RuntimeState::register_consumer_runtime_filter(
509
        const TRuntimeFilterDesc& desc, bool need_local_merge, int node_id,
510
6
        std::shared_ptr<RuntimeFilterConsumer>* consumer_filter) {
511
6
    _registered_runtime_filter_ids.insert(desc.filter_id);
512
6
    bool need_merge = desc.has_remote_targets || need_local_merge;
513
6
    RuntimeFilterMgr* mgr = need_merge ? global_runtime_filter_mgr() : local_runtime_filter_mgr();
514
6
    RETURN_IF_ERROR(mgr->register_consumer_filter(this, desc, node_id, consumer_filter));
515
    // Stamp the consumer with the current recursive CTE stage so that incoming publish RPCs
516
    // from old rounds are detected and discarded.
517
    // PFC must still be alive: this runs inside a pipeline task, so the execution context
518
    // cannot have expired yet.
519
    // In unit-test scenarios the task execution context is never set (no PipelineFragmentContext
520
    // exists), so skip the stage stamping — the default stage (0) is correct.
521
6
    if (task_execution_context_inited()) {
522
0
        auto pfc = std::static_pointer_cast<PipelineFragmentContext>(
523
0
                get_task_execution_context().lock());
524
0
        DORIS_CHECK(pfc);
525
0
        (*consumer_filter)->set_stage(pfc->rec_cte_stage());
526
0
    }
527
6
    return Status::OK();
528
6
}
529
530
72
bool RuntimeState::is_nereids() const {
531
72
    return _query_ctx->is_nereids();
532
72
}
533
534
0
std::vector<std::shared_ptr<RuntimeProfile>> RuntimeState::pipeline_id_to_profile() {
535
0
    std::shared_lock lc(_pipeline_profile_lock);
536
0
    return _pipeline_id_to_profile;
537
0
}
538
539
std::vector<std::shared_ptr<RuntimeProfile>> RuntimeState::build_pipeline_profile(
540
0
        std::size_t pipeline_size) {
541
0
    std::unique_lock lc(_pipeline_profile_lock);
542
0
    if (!_pipeline_id_to_profile.empty()) {
543
0
        return _pipeline_id_to_profile;
544
0
    }
545
0
    _pipeline_id_to_profile.resize(pipeline_size);
546
0
    {
547
0
        size_t pip_idx = 0;
548
0
        for (auto& pipeline_profile : _pipeline_id_to_profile) {
549
0
            pipeline_profile =
550
0
                    std::make_shared<RuntimeProfile>(fmt::format("Pipeline(id={})", pip_idx));
551
0
            pip_idx++;
552
0
        }
553
0
    }
554
0
    return _pipeline_id_to_profile;
555
0
}
556
557
916k
bool RuntimeState::low_memory_mode() const {
558
916k
#ifdef BE_TEST
559
916k
    if (!_query_ctx) {
560
0
        return false;
561
0
    }
562
916k
#endif
563
916k
    return _query_ctx->low_memory_mode();
564
916k
}
565
566
0
void RuntimeState::set_id_file_map() {
567
0
    _id_file_map = _exec_env->get_id_manager()->add_id_file_map(_query_id, execution_timeout());
568
0
}
569
#include "common/compile_check_end.h"
570
} // end namespace doris