Coverage Report

Created: 2026-05-21 06:29

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
be/src/exec/exchange/vdata_stream_recvr.cpp
Line
Count
Source
1
// Licensed to the Apache Software Foundation (ASF) under one
2
// or more contributor license agreements.  See the NOTICE file
3
// distributed with this work for additional information
4
// regarding copyright ownership.  The ASF licenses this file
5
// to you under the Apache License, Version 2.0 (the
6
// "License"); you may not use this file except in compliance
7
// with the License.  You may obtain a copy of the License at
8
//
9
//   http://www.apache.org/licenses/LICENSE-2.0
10
//
11
// Unless required by applicable law or agreed to in writing,
12
// software distributed under the License is distributed on an
13
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
// KIND, either express or implied.  See the License for the
15
// specific language governing permissions and limitations
16
// under the License.
17
18
#include "exec/exchange/vdata_stream_recvr.h"
19
20
#include <fmt/format.h>
21
#include <gen_cpp/Metrics_types.h>
22
#include <gen_cpp/Types_types.h>
23
#include <gen_cpp/data.pb.h>
24
25
#include <algorithm>
26
#include <functional>
27
#include <string>
28
29
#include "common/logging.h"
30
#include "core/block/block.h"
31
#include "core/block/materialize_block.h"
32
#include "exec/exchange/vdata_stream_mgr.h"
33
#include "exec/operator/exchange_sink_operator.h"
34
#include "exec/operator/exchange_source_operator.h"
35
#include "exec/sort/sort_cursor.h"
36
#include "exec/sort/vsorted_run_merger.h"
37
#include "runtime/memory/mem_tracker.h"
38
#include "runtime/runtime_state.h"
39
#include "runtime/thread_context.h"
40
#include "util/defer_op.h"
41
#include "util/uid_util.h"
42
43
namespace doris {
44
45
VDataStreamRecvr::SenderQueue::SenderQueue(VDataStreamRecvr* parent_recvr, int num_senders,
46
                                           std::shared_ptr<Dependency> local_channel_dependency)
47
679k
        : _recvr(parent_recvr),
48
679k
          _is_cancelled(false),
49
679k
          _num_remaining_senders(num_senders),
50
679k
          _local_channel_dependency(local_channel_dependency) {
51
679k
    _cancel_status = Status::OK();
52
679k
    _queue_mem_tracker = std::make_unique<MemTracker>("local data queue mem tracker");
53
679k
}
54
55
685k
VDataStreamRecvr::SenderQueue::~SenderQueue() {
56
685k
    run_block_queue_done_callbacks(_block_queue);
57
685k
    _block_queue.clear();
58
685k
}
59
60
1.05M
Status VDataStreamRecvr::SenderQueue::get_batch(Block* block, bool* eos) {
61
1.05M
    BlockItem block_item;
62
1.05M
    {
63
1.05M
        INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
64
1.05M
#ifndef NDEBUG
65
1.06M
        if (!_is_cancelled && _block_queue.empty() && _num_remaining_senders > 0) {
66
0
            throw doris::Exception(ErrorCode::INTERNAL_ERROR,
67
0
                                   "_is_cancelled: {}, _block_queue_empty: {}, "
68
0
                                   "_num_remaining_senders: {}",
69
0
                                   _is_cancelled, _block_queue.empty(), _num_remaining_senders);
70
0
        }
71
1.05M
#endif
72
        //check and get block_item from data_queue
73
1.05M
        if (_is_cancelled) {
74
3
            RETURN_IF_ERROR(_cancel_status);
75
2
            return Status::Cancelled("Cancelled");
76
3
        }
77
78
1.05M
        if (_block_queue.empty()) {
79
669k
            if (_num_remaining_senders != 0) {
80
0
                return Status::InternalError(
81
0
                        "Data queue is empty but there are still remaining senders. "
82
0
                        "_num_remaining_senders: {}",
83
0
                        _num_remaining_senders);
84
0
            }
85
669k
            *eos = true;
86
669k
            return Status::OK();
87
669k
        }
88
89
1.05M
        DCHECK(!_block_queue.empty());
90
389k
        block_item = std::move(_block_queue.front());
91
389k
        _block_queue.pop_front();
92
389k
    }
93
0
    BlockUPtr next_block;
94
389k
    RETURN_IF_ERROR(block_item.get_block(next_block));
95
389k
    size_t block_byte_size = block_item.block_byte_size();
96
389k
    COUNTER_UPDATE(_recvr->_deserialize_row_batch_timer, block_item.deserialize_time());
97
389k
    COUNTER_UPDATE(_recvr->_decompress_timer, block_item.decompress_time());
98
389k
    COUNTER_UPDATE(_recvr->_decompress_bytes, block_item.decompress_bytes());
99
389k
    _recvr->_memory_used_counter->update(-(int64_t)block_byte_size);
100
389k
    INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
101
389k
    sub_blocks_memory_usage(block_byte_size);
102
389k
    if (_block_queue.empty() && _source_dependency) {
103
324k
        if (!_is_cancelled && _num_remaining_senders > 0) {
104
132k
            _source_dependency->block();
105
132k
        }
106
324k
    }
107
108
389k
    block_item.call_done(_recvr);
109
110
389k
    DCHECK(block->empty());
111
389k
    block->swap(*next_block);
112
389k
    *eos = false;
113
389k
    return Status::OK();
114
389k
}
115
116
1.75M
void VDataStreamRecvr::SenderQueue::set_source_ready(std::lock_guard<std::mutex>&) {
117
    // Here, it is necessary to check if _source_dependency is not nullptr.
118
    // This is because the queue might be closed before setting the source dependency.
119
1.75M
    if (!_source_dependency) {
120
46
        return;
121
46
    }
122
1.75M
    const bool should_wait = !_is_cancelled && _block_queue.empty() && _num_remaining_senders > 0;
123
1.75M
    if (!should_wait) {
124
1.75M
        _source_dependency->set_ready();
125
1.75M
    }
126
1.75M
}
127
128
void VDataStreamRecvr::SenderQueue::run_block_queue_done_callbacks(
129
1.37M
        std::list<BlockItem>& block_queue) {
130
1.37M
    for (auto& block_item : block_queue) {
131
1.55k
        block_item.call_done(_recvr);
132
1.55k
    }
133
1.37M
}
134
135
13
std::string VDataStreamRecvr::SenderQueue::debug_string() {
136
13
    std::lock_guard<std::mutex> l(_lock);
137
13
    fmt::memory_buffer debug_string_buffer;
138
13
    fmt::format_to(debug_string_buffer,
139
13
                   "_num_remaining_senders = {}, block_queue size = {}, _is_cancelled: {}, "
140
13
                   "_cancel_status: {}, _sender_eos_set: (",
141
13
                   _num_remaining_senders, _block_queue.size(), _is_cancelled,
142
13
                   _cancel_status.to_string());
143
13
    for (auto& i : _sender_eos_set) {
144
2
        fmt::format_to(debug_string_buffer, "{}, ", i);
145
2
    }
146
13
    fmt::format_to(debug_string_buffer, ")");
147
13
    return fmt::to_string(debug_string_buffer);
148
13
}
149
150
Status VDataStreamRecvr::SenderQueue::add_block(std::unique_ptr<PBlock> pblock, int be_number,
151
                                                int64_t packet_seq,
152
                                                ::google::protobuf::Closure** done,
153
                                                const int64_t wait_for_worker,
154
2.09k
                                                const uint64_t time_to_find_recvr) {
155
2.09k
    {
156
2.09k
        INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
157
2.09k
        if (_is_cancelled) {
158
1.56k
            return Status::OK();
159
1.56k
        }
160
530
        auto iter = _packet_seq_map.find(be_number);
161
530
        if (iter != _packet_seq_map.end()) {
162
525
            if (iter->second >= packet_seq) {
163
0
                return Status::InternalError(
164
0
                        "packet already exist [cur_packet_id= {} receive_packet_id={}]",
165
0
                        iter->second, packet_seq);
166
0
            }
167
525
            iter->second = packet_seq;
168
525
        } else {
169
5
            _packet_seq_map.emplace(be_number, packet_seq);
170
5
        }
171
172
530
        DCHECK(_num_remaining_senders >= 0);
173
530
        if (_num_remaining_senders == 0) {
174
0
            DCHECK(_sender_eos_set.contains(be_number));
175
0
            return Status::OK();
176
0
        }
177
530
    }
178
179
530
    INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
180
530
    if (_is_cancelled) {
181
5
        return Status::OK();
182
5
    }
183
184
525
    const auto block_byte_size = pblock->ByteSizeLong();
185
525
    COUNTER_UPDATE(_recvr->_blocks_produced_counter, 1);
186
525
    if (_recvr->_max_wait_worker_time->value() < wait_for_worker) {
187
0
        _recvr->_max_wait_worker_time->set(wait_for_worker);
188
0
    }
189
190
525
    if (_recvr->_max_find_recvr_time->value() < time_to_find_recvr) {
191
0
        _recvr->_max_find_recvr_time->set((int64_t)time_to_find_recvr);
192
0
    }
193
194
525
    _block_queue.emplace_back(std::move(pblock), block_byte_size);
195
525
    COUNTER_UPDATE(_recvr->_remote_bytes_received_counter, block_byte_size);
196
525
    set_source_ready(l);
197
198
    // if done is nullptr, this function can't delay this response
199
535
    if (done != nullptr && _recvr->exceeds_limit(block_byte_size)) {
200
34
        _block_queue.back().set_done(*done);
201
34
        *done = nullptr;
202
34
    }
203
525
    _recvr->_memory_used_counter->update(block_byte_size);
204
525
    add_blocks_memory_usage(block_byte_size);
205
525
    return Status::OK();
206
530
}
207
208
Status VDataStreamRecvr::SenderQueue::add_blocks(const PTransmitDataParams* request,
209
                                                 ::google::protobuf::Closure** done,
210
                                                 const int64_t wait_for_worker,
211
119k
                                                 const uint64_t time_to_find_recvr) {
212
119k
    {
213
119k
        INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
214
119k
        if (_is_cancelled) {
215
0
            return Status::OK();
216
0
        }
217
119k
        const int be_number = request->be_number();
218
        // In the request, the packet_seq for blocks is [request->packet_seq() - blocks_size(), request->packet_seq())
219
        // Note this is a left-closed, right-open interval; the packet_seq of the last block is request->packet_seq() - 1
220
        // We store the packet_seq of the last block in _packet_seq_map so we can compare it with the packet_seq of the next received packet
221
119k
        const int64_t packet_seq = request->packet_seq() - 1;
222
119k
        auto iter = _packet_seq_map.find(be_number);
223
119k
        if (iter != _packet_seq_map.end()) {
224
20.6k
            if (iter->second > (packet_seq - request->blocks_size())) {
225
0
                return Status::InternalError(
226
0
                        "packet already exist [cur_packet_id= {} receive_packet_id={}]",
227
0
                        iter->second, packet_seq);
228
0
            }
229
20.6k
            iter->second = packet_seq;
230
98.3k
        } else {
231
98.3k
            _packet_seq_map.emplace(be_number, packet_seq);
232
98.3k
        }
233
234
119k
        DCHECK(_num_remaining_senders >= 0);
235
119k
        if (_num_remaining_senders == 0) {
236
0
            DCHECK(_sender_eos_set.end() != _sender_eos_set.find(be_number));
237
0
            return Status::OK();
238
0
        }
239
119k
    }
240
241
119k
    INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
242
119k
    if (_is_cancelled) {
243
0
        return Status::OK();
244
0
    }
245
246
119k
    int64_t total_block_byte_size = 0;
247
238k
    for (int i = 0; i < request->blocks_size(); i++) {
248
119k
        std::unique_ptr<PBlock> pblock = std::make_unique<PBlock>();
249
119k
        pblock->CopyFrom(request->blocks(i));
250
251
119k
        const auto block_byte_size = pblock->ByteSizeLong();
252
119k
        COUNTER_UPDATE(_recvr->_blocks_produced_counter, 1);
253
119k
        if (_recvr->_max_wait_worker_time->value() < wait_for_worker) {
254
1
            _recvr->_max_wait_worker_time->set(wait_for_worker);
255
1
        }
256
257
119k
        if (_recvr->_max_find_recvr_time->value() < time_to_find_recvr) {
258
93.5k
            _recvr->_max_find_recvr_time->set((int64_t)time_to_find_recvr);
259
93.5k
        }
260
261
119k
        _block_queue.emplace_back(std::move(pblock), block_byte_size);
262
119k
        COUNTER_UPDATE(_recvr->_remote_bytes_received_counter, block_byte_size);
263
119k
        total_block_byte_size += block_byte_size;
264
119k
    }
265
266
119k
    set_source_ready(l);
267
268
    // if done is nullptr, this function can't delay this response
269
119k
    if (done != nullptr && _recvr->exceeds_limit(total_block_byte_size)) {
270
1
        _block_queue.back().set_done(*done);
271
1
        *done = nullptr;
272
1
    }
273
119k
    _recvr->_memory_used_counter->update(total_block_byte_size);
274
119k
    add_blocks_memory_usage(total_block_byte_size);
275
119k
    return Status::OK();
276
119k
}
277
278
272k
void VDataStreamRecvr::SenderQueue::add_block(Block* block, bool use_move) {
279
272k
    if (block->rows() == 0) {
280
0
        return;
281
0
    }
282
272k
    {
283
272k
        INJECT_MOCK_SLEEP(std::unique_lock<std::mutex> l(_lock));
284
272k
        if (_is_cancelled) {
285
297
            return;
286
297
        }
287
272k
        DCHECK(_num_remaining_senders >= 0);
288
272k
        if (_num_remaining_senders == 0) {
289
1
            return;
290
1
        }
291
272k
    }
292
272k
    BlockUPtr nblock = Block::create_unique(block->get_columns_with_type_and_name());
293
294
    // local exchange should copy the block contented if use move == false
295
272k
    if (use_move) {
296
264k
        block->clear();
297
264k
    } else {
298
7.56k
        auto rows = block->rows();
299
20.8k
        for (int i = 0; i < nblock->columns(); ++i) {
300
13.2k
            nblock->get_by_position(i).column =
301
13.2k
                    nblock->get_by_position(i).column->clone_resized(rows);
302
13.2k
        }
303
7.56k
    }
304
272k
    materialize_block_inplace(*nblock);
305
306
272k
    auto block_mem_size = nblock->allocated_bytes();
307
272k
    {
308
272k
        INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
309
272k
        if (_is_cancelled) {
310
1
            return;
311
1
        }
312
272k
        _block_queue.emplace_back(std::move(nblock), block_mem_size);
313
272k
        set_source_ready(l);
314
272k
        COUNTER_UPDATE(_recvr->_local_bytes_received_counter, block_mem_size);
315
272k
        _recvr->_memory_used_counter->update(block_mem_size);
316
272k
        add_blocks_memory_usage(block_mem_size);
317
272k
    }
318
272k
}
319
320
3.27M
void VDataStreamRecvr::SenderQueue::decrement_senders(int be_number) {
321
3.27M
    INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
322
3.27M
    if (_sender_eos_set.end() != _sender_eos_set.find(be_number)) {
323
0
        return;
324
0
    }
325
3.27M
    _sender_eos_set.insert(be_number);
326
3.27M
    DCHECK_GT(_num_remaining_senders, 0);
327
3.27M
    _num_remaining_senders--;
328
18.4E
    VLOG_FILE << "decremented senders: fragment_instance_id="
329
18.4E
              << print_id(_recvr->fragment_instance_id()) << " node_id=" << _recvr->dest_node_id()
330
18.4E
              << " #senders=" << _num_remaining_senders;
331
3.27M
    if (_num_remaining_senders == 0) {
332
676k
        set_source_ready(l);
333
676k
    }
334
3.27M
}
335
336
685k
void VDataStreamRecvr::SenderQueue::cancel(Status cancel_status) {
337
685k
    std::list<BlockItem> block_queue;
338
685k
    {
339
685k
        INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
340
686k
        if (_is_cancelled) {
341
686k
            return;
342
686k
        }
343
18.4E
        _is_cancelled = true;
344
18.4E
        _cancel_status = cancel_status;
345
18.4E
        set_source_ready(l);
346
18.4E
        VLOG_QUERY << "cancelled stream: _fragment_instance_id="
347
18.4E
                   << print_id(_recvr->fragment_instance_id())
348
18.4E
                   << " node_id=" << _recvr->dest_node_id();
349
18.4E
        block_queue.splice(block_queue.end(), _block_queue);
350
18.4E
    }
351
0
    run_block_queue_done_callbacks(block_queue);
352
18.4E
}
353
354
685k
void VDataStreamRecvr::SenderQueue::close() {
355
    // If _is_cancelled is not set to true, there may be concurrent send
356
    // which add batch to _block_queue. The batch added after _block_queue
357
    // is clear will be memory leak
358
685k
    std::list<BlockItem> block_queue;
359
685k
    {
360
685k
        INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
361
685k
        _is_cancelled = true;
362
685k
        set_source_ready(l);
363
685k
        block_queue.splice(block_queue.end(), _block_queue);
364
685k
    }
365
    // Release delayed RPC callbacks after the queue state is fully closed.
366
685k
    run_block_queue_done_callbacks(block_queue);
367
685k
}
368
369
VDataStreamRecvr::VDataStreamRecvr(VDataStreamMgr* stream_mgr,
370
                                   RuntimeProfile::HighWaterMarkCounter* memory_used_counter,
371
                                   RuntimeState* state, const TUniqueId& fragment_instance_id,
372
                                   PlanNodeId dest_node_id, int num_senders, bool is_merging,
373
                                   RuntimeProfile* profile, size_t data_queue_capacity)
374
469k
        : HasTaskExecutionCtx(state),
375
469k
          _mgr(stream_mgr),
376
469k
          _memory_used_counter(memory_used_counter),
377
469k
          _resource_ctx(state->get_query_ctx()->resource_ctx()),
378
469k
          _query_context(state->get_query_ctx()->shared_from_this()),
379
469k
          _fragment_instance_id(fragment_instance_id),
380
469k
          _dest_node_id(dest_node_id),
381
469k
          _is_merging(is_merging),
382
469k
          _is_closed(false),
383
469k
          _sender_queue_mem_limit(data_queue_capacity),
384
469k
          _profile(profile) {
385
    // DataStreamRecvr may be destructed after the instance execution thread ends.
386
469k
    _mem_tracker =
387
469k
            std::make_unique<MemTracker>("VDataStreamRecvr:" + print_id(_fragment_instance_id));
388
469k
    SCOPED_CONSUME_MEM_TRACKER(_mem_tracker.get());
389
390
    // Create one queue per sender if is_merging is true.
391
469k
    int num_queues = is_merging ? num_senders : 1;
392
469k
    _sender_to_local_channel_dependency.resize(num_queues);
393
1.15M
    for (size_t i = 0; i < num_queues; i++) {
394
682k
        _sender_to_local_channel_dependency[i] = Dependency::create_shared(
395
682k
                _dest_node_id, _dest_node_id, fmt::format("LocalExchangeChannelDependency_{}", i),
396
682k
                true);
397
682k
    }
398
469k
    _sender_queues.reserve(num_queues);
399
469k
    int num_sender_per_queue = is_merging ? 1 : num_senders;
400
1.15M
    for (int i = 0; i < num_queues; ++i) {
401
682k
        SenderQueue* queue = nullptr;
402
682k
        queue = _sender_queue_pool.add(new SenderQueue(this, num_sender_per_queue,
403
682k
                                                       _sender_to_local_channel_dependency[i]));
404
682k
        _sender_queues.push_back(queue);
405
682k
    }
406
407
    // Initialize the counters
408
469k
    _remote_bytes_received_counter = ADD_COUNTER(_profile, "RemoteBytesReceived", TUnit::BYTES);
409
469k
    _local_bytes_received_counter = ADD_COUNTER(_profile, "LocalBytesReceived", TUnit::BYTES);
410
411
469k
    _deserialize_row_batch_timer = ADD_TIMER(_profile, "DeserializeRowBatchTimer");
412
469k
    _data_arrival_timer = ADD_TIMER(_profile, "DataArrivalWaitTime");
413
469k
    _buffer_full_total_timer = ADD_TIMER(_profile, "SendersBlockedTotalTimer(*)");
414
469k
    _first_batch_wait_total_timer = ADD_TIMER(_profile, "FirstBatchArrivalWaitTime");
415
469k
    _decompress_timer = ADD_TIMER(_profile, "DecompressTime");
416
469k
    _decompress_bytes = ADD_COUNTER(_profile, "DecompressBytes", TUnit::BYTES);
417
469k
    _blocks_produced_counter = ADD_COUNTER(_profile, "BlocksProduced", TUnit::UNIT);
418
469k
    _max_wait_worker_time = ADD_COUNTER(_profile, "MaxWaitForWorkerTime", TUnit::UNIT);
419
469k
    _max_wait_to_process_time = ADD_COUNTER(_profile, "MaxWaitToProcessTime", TUnit::UNIT);
420
469k
    _max_find_recvr_time = ADD_COUNTER(_profile, "MaxFindRecvrTime(NS)", TUnit::UNIT);
421
469k
}
422
423
471k
VDataStreamRecvr::~VDataStreamRecvr() {
424
18.4E
    DCHECK(_mgr == nullptr) << "Must call close()";
425
471k
}
426
427
Status VDataStreamRecvr::create_merger(const VExprContextSPtrs& ordering_expr,
428
                                       const std::vector<bool>& is_asc_order,
429
                                       const std::vector<bool>& nulls_first, size_t batch_size,
430
52.4k
                                       int64_t limit, size_t offset) {
431
52.4k
    DCHECK(_is_merging);
432
52.4k
    SCOPED_CONSUME_MEM_TRACKER(_mem_tracker.get());
433
52.4k
    std::vector<BlockSupplier> child_block_suppliers;
434
    // Create the merger that will a single stream of sorted rows.
435
52.4k
    _merger.reset(new VSortedRunMerger(ordering_expr, is_asc_order, nulls_first, batch_size, limit,
436
52.4k
                                       offset, _profile));
437
438
318k
    for (int i = 0; i < _sender_queues.size(); ++i) {
439
265k
        child_block_suppliers.emplace_back(std::bind(std::mem_fn(&SenderQueue::get_batch),
440
265k
                                                     _sender_queues[i], std::placeholders::_1,
441
265k
                                                     std::placeholders::_2));
442
265k
    }
443
52.4k
    RETURN_IF_ERROR(_merger->prepare(child_block_suppliers));
444
52.4k
    return Status::OK();
445
52.4k
}
446
447
Status VDataStreamRecvr::add_block(std::unique_ptr<PBlock> pblock, int sender_id, int be_number,
448
                                   int64_t packet_seq, ::google::protobuf::Closure** done,
449
                                   const int64_t wait_for_worker,
450
0
                                   const uint64_t time_to_find_recvr) {
451
0
    SCOPED_ATTACH_TASK(_resource_ctx);
452
0
    if (_query_context->low_memory_mode()) {
453
0
        set_low_memory_mode();
454
0
    }
455
456
0
    int use_sender_id = _is_merging ? sender_id : 0;
457
0
    return _sender_queues[use_sender_id]->add_block(std::move(pblock), be_number, packet_seq, done,
458
0
                                                    wait_for_worker, time_to_find_recvr);
459
0
}
460
461
Status VDataStreamRecvr::add_blocks(const PTransmitDataParams* request,
462
                                    ::google::protobuf::Closure** done,
463
                                    const int64_t wait_for_worker,
464
118k
                                    const uint64_t time_to_find_recvr) {
465
118k
    SCOPED_ATTACH_TASK(_resource_ctx);
466
118k
    if (_query_context->low_memory_mode()) {
467
0
        set_low_memory_mode();
468
0
    }
469
118k
    int use_sender_id = _is_merging ? request->sender_id() : 0;
470
118k
    return _sender_queues[use_sender_id]->add_blocks(request, done, wait_for_worker,
471
118k
                                                     time_to_find_recvr);
472
118k
}
473
474
271k
void VDataStreamRecvr::add_block(Block* block, int sender_id, bool use_move) {
475
271k
    if (_query_context->low_memory_mode()) {
476
0
        set_low_memory_mode();
477
0
    }
478
271k
    int use_sender_id = _is_merging ? sender_id : 0;
479
271k
    _sender_queues[use_sender_id]->add_block(block, use_move);
480
271k
}
481
482
11
std::string VDataStreamRecvr::debug_string() {
483
11
    fmt::memory_buffer debug_string_buffer;
484
11
    fmt::format_to(debug_string_buffer,
485
11
                   "fragment_instance_id: {}, _dest_node_id: {}, _is_merging: {}, _is_closed: {}",
486
11
                   print_id(_fragment_instance_id), _dest_node_id, _is_merging, _is_closed);
487
24
    for (size_t i = 0; i < _sender_queues.size(); i++) {
488
13
        fmt::format_to(debug_string_buffer, "No. {} queue: {}", i,
489
13
                       _sender_queues[i]->debug_string());
490
13
    }
491
11
    return fmt::to_string(debug_string_buffer);
492
11
}
493
494
1.91M
std::shared_ptr<Dependency> VDataStreamRecvr::get_local_channel_dependency(int sender_id) {
495
1.91M
    DCHECK(_sender_to_local_channel_dependency[_is_merging ? sender_id : 0] != nullptr);
496
1.91M
    return _sender_to_local_channel_dependency[_is_merging ? sender_id : 0];
497
1.91M
}
498
499
845k
Status VDataStreamRecvr::get_next(Block* block, bool* eos) {
500
845k
    if (!_is_merging) {
501
717k
        block->clear();
502
717k
        return _sender_queues[0]->get_batch(block, eos);
503
717k
    } else {
504
127k
        return _merger->get_next(block, eos);
505
127k
    }
506
845k
}
507
508
3.27M
void VDataStreamRecvr::remove_sender(int sender_id, int be_number, Status exec_status) {
509
3.27M
    if (!exec_status.ok()) {
510
0
        cancel_stream(exec_status);
511
0
        return;
512
0
    }
513
3.27M
    int use_sender_id = _is_merging ? sender_id : 0;
514
3.27M
    _sender_queues[use_sender_id]->decrement_senders(be_number);
515
3.27M
}
516
517
471k
void VDataStreamRecvr::cancel_stream(Status exec_status) {
518
18.4E
    VLOG_QUERY << "cancel_stream: fragment_instance_id=" << print_id(_fragment_instance_id)
519
18.4E
               << exec_status;
520
521
1.15M
    for (int i = 0; i < _sender_queues.size(); ++i) {
522
686k
        _sender_queues[i]->cancel(exec_status);
523
686k
    }
524
471k
}
525
526
391k
void VDataStreamRecvr::SenderQueue::add_blocks_memory_usage(int64_t size) {
527
391k
    DCHECK(size >= 0);
528
391k
    _recvr->_mem_tracker->consume(size);
529
391k
    _queue_mem_tracker->consume(size);
530
391k
    if (_local_channel_dependency && exceeds_limit()) {
531
6.78k
        _local_channel_dependency->block();
532
6.78k
    }
533
391k
}
534
535
390k
void VDataStreamRecvr::SenderQueue::sub_blocks_memory_usage(int64_t size) {
536
390k
    DCHECK(size >= 0);
537
390k
    _recvr->_mem_tracker->release(size);
538
390k
    _queue_mem_tracker->release(size);
539
390k
    if (_local_channel_dependency && (!exceeds_limit())) {
540
389k
        _local_channel_dependency->set_ready();
541
389k
    }
542
390k
}
543
544
782k
bool VDataStreamRecvr::SenderQueue::exceeds_limit() {
545
782k
    const size_t queue_byte_size = _queue_mem_tracker->consumption();
546
782k
    return _recvr->queue_exceeds_limit(queue_byte_size);
547
782k
}
548
549
119k
bool VDataStreamRecvr::exceeds_limit(size_t block_byte_size) {
550
119k
    return _mem_tracker->consumption() + block_byte_size > config::exchg_node_buffer_size_bytes;
551
119k
}
552
553
782k
bool VDataStreamRecvr::queue_exceeds_limit(size_t queue_byte_size) const {
554
782k
    return queue_byte_size >= _sender_queue_mem_limit;
555
782k
}
556
557
940k
void VDataStreamRecvr::close() {
558
940k
    if (_is_closed) {
559
469k
        return;
560
469k
    }
561
470k
    _is_closed = true;
562
685k
    for (auto& it : _sender_to_local_channel_dependency) {
563
685k
        it->set_always_ready();
564
685k
    }
565
1.15M
    for (int i = 0; i < _sender_queues.size(); ++i) {
566
685k
        _sender_queues[i]->close();
567
685k
    }
568
    // Remove this receiver from the DataStreamMgr that created it.
569
    // TODO: log error msg
570
471k
    if (_mgr) {
571
471k
        static_cast<void>(_mgr->deregister_recvr(fragment_instance_id(), dest_node_id()));
572
471k
    }
573
470k
    _mgr = nullptr;
574
575
470k
    _merger.reset();
576
470k
}
577
578
463k
void VDataStreamRecvr::set_sink_dep_always_ready() const {
579
676k
    for (auto dep : _sender_to_local_channel_dependency) {
580
676k
        dep->set_always_ready();
581
676k
    }
582
463k
}
583
584
} // namespace doris