Coverage Report

Created: 2026-04-15 18:56

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
be/src/exec/exchange/vdata_stream_recvr.cpp
Line
Count
Source
1
// Licensed to the Apache Software Foundation (ASF) under one
2
// or more contributor license agreements.  See the NOTICE file
3
// distributed with this work for additional information
4
// regarding copyright ownership.  The ASF licenses this file
5
// to you under the Apache License, Version 2.0 (the
6
// "License"); you may not use this file except in compliance
7
// with the License.  You may obtain a copy of the License at
8
//
9
//   http://www.apache.org/licenses/LICENSE-2.0
10
//
11
// Unless required by applicable law or agreed to in writing,
12
// software distributed under the License is distributed on an
13
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
// KIND, either express or implied.  See the License for the
15
// specific language governing permissions and limitations
16
// under the License.
17
18
#include "exec/exchange/vdata_stream_recvr.h"
19
20
#include <fmt/format.h>
21
#include <gen_cpp/Metrics_types.h>
22
#include <gen_cpp/Types_types.h>
23
#include <gen_cpp/data.pb.h>
24
25
#include <algorithm>
26
#include <functional>
27
#include <string>
28
29
#include "common/logging.h"
30
#include "core/block/block.h"
31
#include "core/block/materialize_block.h"
32
#include "exec/exchange/vdata_stream_mgr.h"
33
#include "exec/operator/exchange_sink_operator.h"
34
#include "exec/operator/exchange_source_operator.h"
35
#include "exec/sort/sort_cursor.h"
36
#include "exec/sort/vsorted_run_merger.h"
37
#include "runtime/memory/mem_tracker.h"
38
#include "runtime/runtime_state.h"
39
#include "runtime/thread_context.h"
40
#include "util/defer_op.h"
41
#include "util/uid_util.h"
42
43
namespace doris {
44
// Constructs one sender queue belonging to `parent_recvr`.
//
// @param parent_recvr              Receiver that owns this queue; kept as a raw pointer in _recvr.
// @param num_senders               Initial value of _num_remaining_senders.
// @param local_channel_dependency  Stored in _local_channel_dependency; it is blocked / set ready
//                                  by add_blocks_memory_usage() / sub_blocks_memory_usage().
//
// The queue starts non-cancelled with an OK _cancel_status and its own MemTracker.
// NOTE(review): the shared_ptr parameter is taken by value and then copied into the member;
// std::move would avoid one reference-count round trip.
45
VDataStreamRecvr::SenderQueue::SenderQueue(VDataStreamRecvr* parent_recvr, int num_senders,
46
                                           std::shared_ptr<Dependency> local_channel_dependency)
47
634k
        : _recvr(parent_recvr),
48
634k
          _is_cancelled(false),
49
634k
          _num_remaining_senders(num_senders),
50
634k
          _local_channel_dependency(local_channel_dependency) {
51
634k
    _cancel_status = Status::OK();
52
634k
    _queue_mem_tracker = std::make_unique<MemTracker>("local data queue mem tracker");
53
634k
}
54
// Destructor: calls call_done(_recvr) on every item still queued, then empties the queue.
// presumably call_done() runs the closure stored with set_done(); BlockItem is defined elsewhere - confirm.
// In this report the loop body has a hit count of 0, i.e. the queue was always empty here.
55
643k
VDataStreamRecvr::SenderQueue::~SenderQueue() {
56
643k
    for (auto& block_item : _block_queue) {
57
0
        block_item.call_done(_recvr);
58
0
    }
59
643k
    _block_queue.clear();
60
643k
}
61
// Removes the next queued item from this sender queue and hands its block to the caller.
//
// @param block  Output. Expected to be empty on entry (DCHECK below); receives the dequeued
//               block through swap().
// @param eos    Output. Set to true when the queue is empty and no senders remain, and to
//               false when a block is returned. Not written on the error paths.
// @return When cancelled: RETURN_IF_ERROR(_cancel_status) first, then Status::Cancelled.
//         InternalError when the queue is empty while senders remain. The status of
//         get_block() if it fails. Otherwise OK.
//
// In builds without NDEBUG, the "not cancelled, empty queue, senders remain" state throws a
// doris::Exception instead of reaching the InternalError return further down.
62
867k
Status VDataStreamRecvr::SenderQueue::get_batch(Block* block, bool* eos) {
63
867k
#ifndef NDEBUG
    // NOTE(review): this check reads _is_cancelled, _block_queue and _num_remaining_senders
    // before _lock is taken below, while other methods modify them under _lock - confirm
    // that this unsynchronized read is intended.
64
867k
    if (!_is_cancelled && _block_queue.empty() && _num_remaining_senders > 0) {
65
0
        throw doris::Exception(ErrorCode::INTERNAL_ERROR,
66
0
                               "_is_cancelled: {}, _block_queue_empty: {}, "
67
0
                               "_num_remaining_senders: {}",
68
0
                               _is_cancelled, _block_queue.empty(), _num_remaining_senders);
69
0
    }
70
867k
#endif
71
867k
    BlockItem block_item;
72
867k
    {
73
867k
        INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
74
        // Under _lock: check for cancellation, then take the front item of _block_queue.
75
867k
        if (_is_cancelled) {
76
1
            RETURN_IF_ERROR(_cancel_status);
77
1
            return Status::Cancelled("Cancelled");
78
1
        }
79
80
867k
        if (_block_queue.empty()) {
81
625k
            if (_num_remaining_senders != 0) {
82
0
                return Status::InternalError(
83
0
                        "Data queue is empty but there are still remaining senders. "
84
0
                        "_num_remaining_senders: {}",
85
0
                        _num_remaining_senders);
86
0
            }
87
625k
            *eos = true;
88
625k
            return Status::OK();
89
625k
        }
90
91
867k
        DCHECK(!_block_queue.empty());
92
241k
        block_item = std::move(_block_queue.front());
93
241k
        _block_queue.pop_front();
94
241k
    }
    // The lock scope above has ended: get_block() and the profile counter updates that
    // follow run without _lock held.
95
0
    BlockUPtr next_block;
96
241k
    RETURN_IF_ERROR(block_item.get_block(next_block));
97
241k
    size_t block_byte_size = block_item.block_byte_size();
98
241k
    COUNTER_UPDATE(_recvr->_deserialize_row_batch_timer, block_item.deserialize_time());
99
241k
    COUNTER_UPDATE(_recvr->_decompress_timer, block_item.decompress_time());
100
241k
    COUNTER_UPDATE(_recvr->_decompress_bytes, block_item.decompress_bytes());
101
241k
    _recvr->_memory_used_counter->update(-(int64_t)block_byte_size);
    // _lock is taken a second time and held until the function returns.
102
241k
    INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
103
241k
    sub_blocks_memory_usage(block_byte_size);
    // If that was the last queued item and senders may still deliver data, block the source
    // dependency; set_source_ready() sets it ready again.
104
241k
    if (_block_queue.empty() && _source_dependency) {
105
193k
        if (!_is_cancelled && _num_remaining_senders > 0) {
106
80.0k
            _source_dependency->block();
107
80.0k
        }
108
193k
    }
109
110
241k
    block_item.call_done(_recvr);
111
112
241k
    DCHECK(block->empty());
113
241k
    block->swap(*next_block);
114
241k
    *eos = false;
115
241k
    return Status::OK();
116
241k
}
117
// Marks _source_dependency ready unless the consumer still has to wait, i.e. unless the queue
// is not cancelled, holds no blocks, and still has remaining senders.
//
// The unnamed std::lock_guard parameter is not used in the body; every call site in this file
// passes the guard it holds on _lock, so it presumably exists to force callers to hold that lock.
118
1.52M
void VDataStreamRecvr::SenderQueue::set_source_ready(std::lock_guard<std::mutex>&) {
119
    // Here, it is necessary to check if _source_dependency is not nullptr.
120
    // This is because the queue might be closed before setting the source dependency.
121
1.52M
    if (!_source_dependency) {
122
11
        return;
123
11
    }
124
1.52M
    const bool should_wait = !_is_cancelled && _block_queue.empty() && _num_remaining_senders > 0;
125
1.52M
    if (!should_wait) {
126
1.52M
        _source_dependency->set_ready();
127
1.52M
    }
128
1.52M
}
129
// Builds a one-line description of this queue: remaining sender count, queue length,
// cancellation flag, cancel status, and the be_numbers recorded in _sender_eos_set.
//
// @return The formatted string.
//
// NOTE(review): the first format_to() reads _num_remaining_senders, _block_queue.size(),
// _is_cancelled and _cancel_status before _lock is acquired two statements later. Other methods
// in this file change those members under _lock, so taking the lock before the first
// format_to() looks safer - confirm.
130
32
std::string VDataStreamRecvr::SenderQueue::debug_string() {
131
32
    fmt::memory_buffer debug_string_buffer;
132
32
    fmt::format_to(debug_string_buffer,
133
32
                   "_num_remaining_senders = {}, block_queue size = {}, _is_cancelled: {}, "
134
32
                   "_cancel_status: {}, _sender_eos_set: (",
135
32
                   _num_remaining_senders, _block_queue.size(), _is_cancelled,
136
32
                   _cancel_status.to_string());
137
32
    std::lock_guard<std::mutex> l(_lock);
138
32
    for (auto& i : _sender_eos_set) {
139
5
        fmt::format_to(debug_string_buffer, "{}, ", i);
140
5
    }
141
32
    fmt::format_to(debug_string_buffer, ")");
142
32
    return fmt::to_string(debug_string_buffer);
143
32
}
144
// Enqueues one serialized block (PBlock) for this queue.
//
// @param pblock              Serialized block; ownership moves into the queued item.
// @param be_number           Key into _packet_seq_map and _sender_eos_set.
// @param packet_seq          Sequence number of this packet; must be greater than the last one
//                            recorded for be_number.
// @param done                Optional closure slot. When non-null and the receiver is over its
//                            buffer limit, the closure is stored on the queued item and *done is
//                            set to nullptr; presumably the response is then sent later through
//                            call_done() - confirm.
// @param wait_for_worker     Raises _max_wait_worker_time when larger than its current value.
// @param time_to_find_recvr  Raises _max_find_recvr_time when larger than its current value.
// @return InternalError when packet_seq is not greater than the recorded one; OK otherwise,
//         including the cases where the block is silently dropped (queue cancelled, or no
//         remaining senders).
145
Status VDataStreamRecvr::SenderQueue::add_block(std::unique_ptr<PBlock> pblock, int be_number,
146
                                                int64_t packet_seq,
147
                                                ::google::protobuf::Closure** done,
148
                                                const int64_t wait_for_worker,
149
500
                                                const uint64_t time_to_find_recvr) {
150
500
    {
151
500
        INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
152
500
        if (_is_cancelled) {
153
0
            return Status::OK();
154
0
        }
155
500
        auto iter = _packet_seq_map.find(be_number);
156
500
        if (iter != _packet_seq_map.end()) {
157
495
            if (iter->second >= packet_seq) {
158
0
                return Status::InternalError(
159
0
                        "packet already exist [cur_packet_id= {} receive_packet_id={}]",
160
0
                        iter->second, packet_seq);
161
0
            }
162
495
            iter->second = packet_seq;
163
495
        } else {
164
5
            _packet_seq_map.emplace(be_number, packet_seq);
165
5
        }
166
167
500
        DCHECK(_num_remaining_senders >= 0);
168
500
        if (_num_remaining_senders == 0) {
169
0
            DCHECK(_sender_eos_set.contains(be_number));
170
0
            return Status::OK();
171
0
        }
172
500
    }
173
    // NOTE(review): _lock is released at the end of the scope above and re-acquired here.
    // _is_cancelled is re-checked after re-locking, _num_remaining_senders is not - confirm
    // the gap is intentional.
174
500
    INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
175
500
    if (_is_cancelled) {
176
0
        return Status::OK();
177
0
    }
178
179
500
    const auto block_byte_size = pblock->ByteSizeLong();
180
500
    COUNTER_UPDATE(_recvr->_blocks_produced_counter, 1);
181
500
    if (_recvr->_max_wait_worker_time->value() < wait_for_worker) {
182
0
        _recvr->_max_wait_worker_time->set(wait_for_worker);
183
0
    }
184
185
500
    if (_recvr->_max_find_recvr_time->value() < time_to_find_recvr) {
186
0
        _recvr->_max_find_recvr_time->set((int64_t)time_to_find_recvr);
187
0
    }
188
189
500
    _block_queue.emplace_back(std::move(pblock), block_byte_size);
190
500
    COUNTER_UPDATE(_recvr->_remote_bytes_received_counter, block_byte_size);
191
500
    set_source_ready(l);
192
193
    // if done is nullptr, this function can't delay this response
    // The limit check runs before this block's bytes are added to the trackers below, which
    // is why block_byte_size is passed to exceeds_limit().
194
502
    if (done != nullptr && _recvr->exceeds_limit(block_byte_size)) {
195
1
        _block_queue.back().set_done(*done);
196
1
        *done = nullptr;
197
1
    }
198
500
    _recvr->_memory_used_counter->update(block_byte_size);
199
500
    add_blocks_memory_usage(block_byte_size);
200
500
    return Status::OK();
201
500
}
202
// Enqueues every block carried by one transmit request.
//
// @param request             Supplies be_number(), packet_seq() and blocks(i); each block is
//                            copied with CopyFrom() into a new PBlock before being queued.
// @param done                Optional closure slot. When non-null and the receiver is over its
//                            buffer limit, the closure is stored on the last queued item and
//                            *done is set to nullptr.
// @param wait_for_worker     Raises _max_wait_worker_time when larger than its current value.
// @param time_to_find_recvr  Raises _max_find_recvr_time when larger than its current value.
// @return InternalError when the request's sequence range overlaps what was already recorded
//         for this be_number; OK otherwise, including when the request is dropped because the
//         queue is cancelled or has no remaining senders.
203
Status VDataStreamRecvr::SenderQueue::add_blocks(const PTransmitDataParams* request,
204
                                                 ::google::protobuf::Closure** done,
205
                                                 const int64_t wait_for_worker,
206
67.5k
                                                 const uint64_t time_to_find_recvr) {
207
67.5k
    {
208
67.5k
        INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
209
67.5k
        if (_is_cancelled) {
210
1
            return Status::OK();
211
1
        }
212
67.5k
        const int be_number = request->be_number();
213
        // In the request, the packet_seq for blocks is [request->packet_seq() - blocks_size(), request->packet_seq())
214
        // Note this is a left-closed, right-open interval; the packet_seq of the last block is request->packet_seq() - 1
215
        // We store the packet_seq of the last block in _packet_seq_map so we can compare it with the packet_seq of the next received packet
216
67.5k
        const int64_t packet_seq = request->packet_seq() - 1;
217
67.5k
        auto iter = _packet_seq_map.find(be_number);
218
67.5k
        if (iter != _packet_seq_map.end()) {
            // packet_seq - blocks_size() is one less than the first block's sequence number,
            // so the request is rejected when the recorded value reaches into its range.
219
6.55k
            if (iter->second > (packet_seq - request->blocks_size())) {
220
0
                return Status::InternalError(
221
0
                        "packet already exist [cur_packet_id= {} receive_packet_id={}]",
222
0
                        iter->second, packet_seq);
223
0
            }
224
6.55k
            iter->second = packet_seq;
225
61.0k
        } else {
226
61.0k
            _packet_seq_map.emplace(be_number, packet_seq);
227
61.0k
        }
228
229
67.5k
        DCHECK(_num_remaining_senders >= 0);
230
67.5k
        if (_num_remaining_senders == 0) {
231
0
            DCHECK(_sender_eos_set.end() != _sender_eos_set.find(be_number));
232
0
            return Status::OK();
233
0
        }
234
67.5k
    }
235
    // NOTE(review): _lock is released above and re-acquired here; only _is_cancelled is
    // re-checked after re-locking.
236
67.5k
    INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
237
67.5k
    if (_is_cancelled) {
238
0
        return Status::OK();
239
0
    }
240
241
67.5k
    int64_t total_block_byte_size = 0;
242
135k
    for (int i = 0; i < request->blocks_size(); i++) {
243
67.5k
        std::unique_ptr<PBlock> pblock = std::make_unique<PBlock>();
244
67.5k
        pblock->CopyFrom(request->blocks(i));
245
246
67.5k
        const auto block_byte_size = pblock->ByteSizeLong();
247
67.5k
        COUNTER_UPDATE(_recvr->_blocks_produced_counter, 1);
248
67.5k
        if (_recvr->_max_wait_worker_time->value() < wait_for_worker) {
249
1
            _recvr->_max_wait_worker_time->set(wait_for_worker);
250
1
        }
251
252
67.5k
        if (_recvr->_max_find_recvr_time->value() < time_to_find_recvr) {
253
50.6k
            _recvr->_max_find_recvr_time->set((int64_t)time_to_find_recvr);
254
50.6k
        }
255
256
67.5k
        _block_queue.emplace_back(std::move(pblock), block_byte_size);
257
67.5k
        COUNTER_UPDATE(_recvr->_remote_bytes_received_counter, block_byte_size);
258
67.5k
        total_block_byte_size += block_byte_size;
259
67.5k
    }
260
261
67.5k
    set_source_ready(l);
262
263
    // if done is nullptr, this function can't delay this response
    // NOTE(review): if the request carries zero blocks, back() below refers to an item queued
    // by an earlier call, or to nothing when the queue is empty - confirm callers never send
    // an empty request.
264
67.6k
    if (done != nullptr && _recvr->exceeds_limit(total_block_byte_size)) {
265
2
        _block_queue.back().set_done(*done);
266
2
        *done = nullptr;
267
2
    }
268
67.5k
    _recvr->_memory_used_counter->update(total_block_byte_size);
269
67.5k
    add_blocks_memory_usage(total_block_byte_size);
270
67.5k
    return Status::OK();
271
67.5k
}
272
// Enqueues an in-memory Block (the local, non-serialized path).
//
// @param block     Source block. Returns immediately when it has zero rows.
// @param use_move  When true the source block is cleared after its columns were handed to the
//                  new block; when false every column of the new block is replaced by
//                  clone_resized(rows), leaving the source block as it was.
//
// The block is dropped without error when the queue is cancelled (checked both before and after
// the copy) or when no senders remain (checked only before the copy).
273
175k
void VDataStreamRecvr::SenderQueue::add_block(Block* block, bool use_move) {
274
175k
    if (block->rows() == 0) {
275
0
        return;
276
0
    }
277
175k
    {
278
175k
        INJECT_MOCK_SLEEP(std::unique_lock<std::mutex> l(_lock));
279
175k
        if (_is_cancelled) {
280
297
            return;
281
297
        }
282
175k
        DCHECK(_num_remaining_senders >= 0);
283
175k
        if (_num_remaining_senders == 0) {
284
1
            return;
285
1
        }
286
175k
    }
    // The block construction, copy and materialization below run without _lock held.
287
175k
    BlockUPtr nblock = Block::create_unique(block->get_columns_with_type_and_name());
288
289
    // Local exchange must copy the block contents when use_move == false.
290
175k
    if (use_move) {
291
163k
        block->clear();
292
163k
    } else {
293
11.3k
        auto rows = block->rows();
294
37.3k
        for (int i = 0; i < nblock->columns(); ++i) {
295
25.9k
            nblock->get_by_position(i).column =
296
25.9k
                    nblock->get_by_position(i).column->clone_resized(rows);
297
25.9k
        }
298
11.3k
    }
299
175k
    materialize_block_inplace(*nblock);
300
301
175k
    auto block_mem_size = nblock->allocated_bytes();
302
175k
    {
303
175k
        INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
304
175k
        if (_is_cancelled) {
305
4
            return;
306
4
        }
307
175k
        _block_queue.emplace_back(std::move(nblock), block_mem_size);
308
175k
        set_source_ready(l);
309
175k
        COUNTER_UPDATE(_recvr->_local_bytes_received_counter, block_mem_size);
310
175k
        _recvr->_memory_used_counter->update(block_mem_size);
311
175k
        add_blocks_memory_usage(block_mem_size);
312
175k
    }
313
175k
}
314
// Records that the sender identified by `be_number` has finished.
//
// @param be_number  Sender identifier; a be_number already present in _sender_eos_set is
//                   ignored, so repeated calls for the same sender decrement only once.
//
// Runs entirely under _lock. When the remaining-sender count reaches zero, the source
// dependency is signalled through set_source_ready().
315
4.12M
void VDataStreamRecvr::SenderQueue::decrement_senders(int be_number) {
316
4.12M
    INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
317
4.12M
    if (_sender_eos_set.end() != _sender_eos_set.find(be_number)) {
318
0
        return;
319
0
    }
320
4.12M
    _sender_eos_set.insert(be_number);
321
4.12M
    DCHECK_GT(_num_remaining_senders, 0);
322
4.12M
    _num_remaining_senders--;
323
18.4E
    VLOG_FILE << "decremented senders: fragment_instance_id="
324
18.4E
              << print_id(_recvr->fragment_instance_id()) << " node_id=" << _recvr->dest_node_id()
325
18.4E
              << " #senders=" << _num_remaining_senders;
326
4.12M
    if (_num_remaining_senders == 0) {
327
634k
        set_source_ready(l);
328
634k
    }
329
4.12M
}
330
// Cancels this queue with the given status.
//
// @param cancel_status  Stored in _cancel_status; get_batch() hands it to RETURN_IF_ERROR
//                       once the queue is cancelled.
//
// A queue that is already cancelled is left untouched. Otherwise, under _lock, the flag and
// status are set and the source dependency is signalled; then, in a second lock scope,
// call_done(_recvr) is invoked on every queued item and the queue is cleared.
// NOTE(review): the 18.4E counts on the rows after the early return look like a wrapped
// counter rather than a real hit count - confirm against the raw profile data.
331
644k
void VDataStreamRecvr::SenderQueue::cancel(Status cancel_status) {
332
644k
    {
333
644k
        INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
334
644k
        if (_is_cancelled) {
335
644k
            return;
336
644k
        }
337
18.4E
        _is_cancelled = true;
338
18.4E
        _cancel_status = cancel_status;
339
18.4E
        set_source_ready(l);
340
18.4E
        VLOG_QUERY << "cancelled stream: _fragment_instance_id="
341
18.4E
                   << print_id(_recvr->fragment_instance_id())
342
18.4E
                   << " node_id=" << _recvr->dest_node_id();
343
18.4E
    }
344
0
    {
345
18.4E
        INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
346
18.4E
        for (auto& block_item : _block_queue) {
347
0
            block_item.call_done(_recvr);
348
0
        }
349
18.4E
        _block_queue.clear();
350
18.4E
    }
351
18.4E
}
352
// Closes this queue: under _lock it marks the queue cancelled, signals the source dependency,
// invokes call_done(_recvr) on every queued item, and clears the queue.
// Unlike cancel(), it does not touch _cancel_status and does not return early when the queue
// is already cancelled.
353
643k
void VDataStreamRecvr::SenderQueue::close() {
354
    // If _is_cancelled were not set to true, a concurrent sender could still
355
    // add a batch to _block_queue. A batch added after _block_queue has been
356
    // cleared would be leaked.
357
643k
    INJECT_MOCK_SLEEP(std::lock_guard<std::mutex> l(_lock));
358
643k
    _is_cancelled = true;
359
643k
    set_source_ready(l);
360
361
643k
    for (auto& block_item : _block_queue) {
362
1.57k
        block_item.call_done(_recvr);
363
1.57k
    }
364
    // Delete any batches queued in _block_queue
365
643k
    _block_queue.clear();
366
643k
}
367
// Constructs a receiver and its sender queues.
//
// @param stream_mgr            Manager stored in _mgr; close() deregisters from it.
// @param memory_used_counter   Counter updated as blocks are queued and dequeued.
// @param state                 Source of the query context and resource context.
// @param fragment_instance_id  Stored in _fragment_instance_id; used in the MemTracker label.
// @param dest_node_id          Stored in _dest_node_id; passed twice to each dependency.
// @param num_senders           Number of senders feeding this receiver.
// @param is_merging            When true one queue is created per sender (one sender each);
//                              otherwise a single queue serves all senders.
// @param profile               Profile on which the counters and timers below are registered.
// @param data_queue_capacity   Stored in _sender_queue_mem_limit; used by queue_exceeds_limit().
368
VDataStreamRecvr::VDataStreamRecvr(VDataStreamMgr* stream_mgr,
369
                                   RuntimeProfile::HighWaterMarkCounter* memory_used_counter,
370
                                   RuntimeState* state, const TUniqueId& fragment_instance_id,
371
                                   PlanNodeId dest_node_id, int num_senders, bool is_merging,
372
                                   RuntimeProfile* profile, size_t data_queue_capacity)
373
435k
        : HasTaskExecutionCtx(state),
374
435k
          _mgr(stream_mgr),
375
435k
          _memory_used_counter(memory_used_counter),
376
435k
          _resource_ctx(state->get_query_ctx()->resource_ctx()),
377
435k
          _query_context(state->get_query_ctx()->shared_from_this()),
378
435k
          _fragment_instance_id(fragment_instance_id),
379
435k
          _dest_node_id(dest_node_id),
380
435k
          _is_merging(is_merging),
381
435k
          _is_closed(false),
382
435k
          _sender_queue_mem_limit(data_queue_capacity),
383
435k
          _profile(profile) {
384
    // DataStreamRecvr may be destructed after the instance execution thread ends.
385
435k
    _mem_tracker =
386
435k
            std::make_unique<MemTracker>("VDataStreamRecvr:" + print_id(_fragment_instance_id));
387
435k
    SCOPED_CONSUME_MEM_TRACKER(_mem_tracker.get());
388
389
    // Create one queue per sender if is_merging is true.
390
435k
    int num_queues = is_merging ? num_senders : 1;
391
435k
    _sender_to_local_channel_dependency.resize(num_queues);
    // NOTE(review): this loop compares a size_t index with the int num_queues, while the
    // second loop below uses an int index - consider one consistent index type.
392
1.07M
    for (size_t i = 0; i < num_queues; i++) {
393
637k
        _sender_to_local_channel_dependency[i] = Dependency::create_shared(
394
637k
                _dest_node_id, _dest_node_id, fmt::format("LocalExchangeChannelDependency_{}", i),
395
637k
                true);
396
637k
    }
397
435k
    _sender_queues.reserve(num_queues);
398
435k
    int num_sender_per_queue = is_merging ? 1 : num_senders;
399
1.07M
    for (int i = 0; i < num_queues; ++i) {
400
637k
        SenderQueue* queue = nullptr;
        // presumably _sender_queue_pool takes ownership of the new SenderQueue - the pool
        // type is declared elsewhere, confirm.
401
637k
        queue = _sender_queue_pool.add(new SenderQueue(this, num_sender_per_queue,
402
637k
                                                       _sender_to_local_channel_dependency[i]));
403
637k
        _sender_queues.push_back(queue);
404
637k
    }
405
406
    // Initialize the counters
407
435k
    _remote_bytes_received_counter = ADD_COUNTER(_profile, "RemoteBytesReceived", TUnit::BYTES);
408
435k
    _local_bytes_received_counter = ADD_COUNTER(_profile, "LocalBytesReceived", TUnit::BYTES);
409
410
435k
    _deserialize_row_batch_timer = ADD_TIMER(_profile, "DeserializeRowBatchTimer");
411
435k
    _data_arrival_timer = ADD_TIMER(_profile, "DataArrivalWaitTime");
412
435k
    _buffer_full_total_timer = ADD_TIMER(_profile, "SendersBlockedTotalTimer(*)");
413
435k
    _first_batch_wait_total_timer = ADD_TIMER(_profile, "FirstBatchArrivalWaitTime");
414
435k
    _decompress_timer = ADD_TIMER(_profile, "DecompressTime");
415
435k
    _decompress_bytes = ADD_COUNTER(_profile, "DecompressBytes", TUnit::BYTES);
416
435k
    _blocks_produced_counter = ADD_COUNTER(_profile, "BlocksProduced", TUnit::UNIT);
417
435k
    _max_wait_worker_time = ADD_COUNTER(_profile, "MaxWaitForWorkerTime", TUnit::UNIT);
418
435k
    _max_wait_to_process_time = ADD_COUNTER(_profile, "MaxWaitToProcessTime", TUnit::UNIT);
419
435k
    _max_find_recvr_time = ADD_COUNTER(_profile, "MaxFindRecvrTime(NS)", TUnit::UNIT);
420
435k
}
421
// Destructor. Only asserts (DCHECK) that _mgr is already null, which close() guarantees
// because it resets _mgr; it performs no cleanup itself.
422
440k
VDataStreamRecvr::~VDataStreamRecvr() {
423
18.4E
    DCHECK(_mgr == nullptr) << "Must call close()";
424
440k
}
425
// Creates the VSortedRunMerger used by get_next() when this receiver is merging.
//
// @param ordering_expr  Forwarded to the VSortedRunMerger constructor.
// @param is_asc_order   Forwarded to the VSortedRunMerger constructor.
// @param nulls_first    Forwarded to the VSortedRunMerger constructor.
// @param batch_size     Forwarded to the VSortedRunMerger constructor.
// @param limit          Forwarded to the VSortedRunMerger constructor.
// @param offset         Forwarded to the VSortedRunMerger constructor.
// @return The status of _merger->prepare(), or OK.
//
// One block supplier is registered per sender queue; each supplier is bound to the raw
// SenderQueue pointer and calls SenderQueue::get_batch on it.
426
Status VDataStreamRecvr::create_merger(const VExprContextSPtrs& ordering_expr,
427
                                       const std::vector<bool>& is_asc_order,
428
                                       const std::vector<bool>& nulls_first, size_t batch_size,
429
41.4k
                                       int64_t limit, size_t offset) {
430
41.4k
    DCHECK(_is_merging);
431
41.4k
    SCOPED_CONSUME_MEM_TRACKER(_mem_tracker.get());
432
41.4k
    std::vector<BlockSupplier> child_block_suppliers;
433
    // Create the merger that will produce a single stream of sorted rows.
434
41.4k
    _merger.reset(new VSortedRunMerger(ordering_expr, is_asc_order, nulls_first, batch_size, limit,
435
41.4k
                                       offset, _profile));
436
437
285k
    for (int i = 0; i < _sender_queues.size(); ++i) {
438
243k
        child_block_suppliers.emplace_back(std::bind(std::mem_fn(&SenderQueue::get_batch),
439
243k
                                                     _sender_queues[i], std::placeholders::_1,
440
243k
                                                     std::placeholders::_2));
441
243k
    }
442
41.4k
    RETURN_IF_ERROR(_merger->prepare(child_block_suppliers));
443
41.4k
    return Status::OK();
444
41.4k
}
445
// Routes one serialized block to the matching sender queue.
//
// @param pblock              Serialized block; moved into the queue.
// @param sender_id           Index of the queue when merging; ignored (queue 0) otherwise.
// @param be_number           Forwarded to SenderQueue::add_block.
// @param packet_seq          Forwarded to SenderQueue::add_block.
// @param done                Forwarded to SenderQueue::add_block.
// @param wait_for_worker     Forwarded to SenderQueue::add_block.
// @param time_to_find_recvr  Forwarded to SenderQueue::add_block.
// @return The status of SenderQueue::add_block.
//
// Calls set_low_memory_mode() first when the query context reports low memory mode.
// NOTE(review): sender_id indexes _sender_queues without a bounds check - confirm callers
// validate it. Every row of this function has a hit count of 0 in this report.
446
Status VDataStreamRecvr::add_block(std::unique_ptr<PBlock> pblock, int sender_id, int be_number,
447
                                   int64_t packet_seq, ::google::protobuf::Closure** done,
448
                                   const int64_t wait_for_worker,
449
0
                                   const uint64_t time_to_find_recvr) {
450
0
    SCOPED_ATTACH_TASK(_resource_ctx);
451
0
    if (_query_context->low_memory_mode()) {
452
0
        set_low_memory_mode();
453
0
    }
454
455
0
    int use_sender_id = _is_merging ? sender_id : 0;
456
0
    return _sender_queues[use_sender_id]->add_block(std::move(pblock), be_number, packet_seq, done,
457
0
                                                    wait_for_worker, time_to_find_recvr);
458
0
}
459
// Routes all blocks of one transmit request to the matching sender queue.
//
// @param request             Request; its sender_id() selects the queue when merging,
//                            otherwise queue 0 is used.
// @param done                Forwarded to SenderQueue::add_blocks.
// @param wait_for_worker     Forwarded to SenderQueue::add_blocks.
// @param time_to_find_recvr  Forwarded to SenderQueue::add_blocks.
// @return The status of SenderQueue::add_blocks.
//
// Calls set_low_memory_mode() first when the query context reports low memory mode.
// NOTE(review): request->sender_id() indexes _sender_queues without a bounds check - confirm.
460
Status VDataStreamRecvr::add_blocks(const PTransmitDataParams* request,
461
                                    ::google::protobuf::Closure** done,
462
                                    const int64_t wait_for_worker,
463
67.5k
                                    const uint64_t time_to_find_recvr) {
464
67.5k
    SCOPED_ATTACH_TASK(_resource_ctx);
465
67.5k
    if (_query_context->low_memory_mode()) {
466
0
        set_low_memory_mode();
467
0
    }
468
67.5k
    int use_sender_id = _is_merging ? request->sender_id() : 0;
469
67.5k
    return _sender_queues[use_sender_id]->add_blocks(request, done, wait_for_worker,
470
67.5k
                                                     time_to_find_recvr);
471
67.5k
}
472
// Routes an in-memory Block to the matching sender queue.
//
// @param block      Forwarded to SenderQueue::add_block(Block*, bool).
// @param sender_id  Index of the queue when merging; ignored (queue 0) otherwise.
// @param use_move   Forwarded to SenderQueue::add_block(Block*, bool).
//
// Unlike the two PBlock overloads, this one does not use SCOPED_ATTACH_TASK.
473
174k
void VDataStreamRecvr::add_block(Block* block, int sender_id, bool use_move) {
474
174k
    if (_query_context->low_memory_mode()) {
475
0
        set_low_memory_mode();
476
0
    }
477
174k
    int use_sender_id = _is_merging ? sender_id : 0;
478
174k
    _sender_queues[use_sender_id]->add_block(block, use_move);
479
174k
}
480
// Builds a description of this receiver: its identifiers and flags, followed by the
// debug_string() of every sender queue prefixed with the queue index.
//
// @return The formatted string. No separator is written between the receiver fields and
//         the per-queue entries.
481
27
std::string VDataStreamRecvr::debug_string() {
482
27
    fmt::memory_buffer debug_string_buffer;
483
27
    fmt::format_to(debug_string_buffer,
484
27
                   "fragment_instance_id: {}, _dest_node_id: {}, _is_merging: {}, _is_closed: {}",
485
27
                   print_id(_fragment_instance_id), _dest_node_id, _is_merging, _is_closed);
486
59
    for (size_t i = 0; i < _sender_queues.size(); i++) {
487
32
        fmt::format_to(debug_string_buffer, "No. {} queue: {}", i,
488
32
                       _sender_queues[i]->debug_string());
489
32
    }
490
27
    return fmt::to_string(debug_string_buffer);
491
27
}
492
// Returns the local-channel dependency for a sender.
//
// @param sender_id  Index used when merging; otherwise index 0 is used.
// @return A copy of the shared_ptr stored at that index (DCHECKed to be non-null).
493
2.02M
std::shared_ptr<Dependency> VDataStreamRecvr::get_local_channel_dependency(int sender_id) {
494
2.02M
    DCHECK(_sender_to_local_channel_dependency[_is_merging ? sender_id : 0] != nullptr);
495
2.02M
    return _sender_to_local_channel_dependency[_is_merging ? sender_id : 0];
496
2.02M
}
497
// Fetches the next block for the consumer.
//
// @param block  Output block. Cleared here in the non-merging case before being filled.
// @param eos    Output end-of-stream flag, written by the callee.
// @return The status of SenderQueue::get_batch (non-merging) or of _merger->get_next (merging).
//
// In the merging case _merger is dereferenced without a null check; within this file it is
// only created by create_merger() and reset by close().
498
664k
Status VDataStreamRecvr::get_next(Block* block, bool* eos) {
499
664k
    if (!_is_merging) {
500
556k
        block->clear();
501
556k
        return _sender_queues[0]->get_batch(block, eos);
502
556k
    } else {
503
108k
        return _merger->get_next(block, eos);
504
108k
    }
505
664k
}
506
// Handles the end of one sender.
//
// @param sender_id    Index of the queue when merging; ignored (queue 0) otherwise.
// @param be_number    Forwarded to SenderQueue::decrement_senders.
// @param exec_status  Final status of the sender. A non-OK status cancels every queue of
//                     this receiver through cancel_stream() and skips the decrement.
507
4.12M
void VDataStreamRecvr::remove_sender(int sender_id, int be_number, Status exec_status) {
508
4.12M
    if (!exec_status.ok()) {
509
0
        cancel_stream(exec_status);
510
0
        return;
511
0
    }
512
4.12M
    int use_sender_id = _is_merging ? sender_id : 0;
513
4.12M
    _sender_queues[use_sender_id]->decrement_senders(be_number);
514
4.12M
}
515
// Cancels every sender queue of this receiver with the same status.
//
// @param exec_status  Passed to SenderQueue::cancel() for each queue and written to the log.
//
// NOTE(review): the log line streams exec_status directly after the instance id with no
// separator text between the two values.
516
440k
void VDataStreamRecvr::cancel_stream(Status exec_status) {
517
18.4E
    VLOG_QUERY << "cancel_stream: fragment_instance_id=" << print_id(_fragment_instance_id)
518
18.4E
               << exec_status;
519
520
1.08M
    for (int i = 0; i < _sender_queues.size(); ++i) {
521
644k
        _sender_queues[i]->cancel(exec_status);
522
644k
    }
523
440k
}
524
// Accounts for `size` newly queued bytes on both the receiver-wide and the per-queue
// MemTracker, then blocks the local-channel dependency if this queue is at or above its limit.
//
// @param size  Number of bytes added; must be non-negative (DCHECK).
//
// Every call site in this file invokes it while holding _lock.
525
243k
void VDataStreamRecvr::SenderQueue::add_blocks_memory_usage(int64_t size) {
526
243k
    DCHECK(size >= 0);
527
243k
    _recvr->_mem_tracker->consume(size);
528
243k
    _queue_mem_tracker->consume(size);
529
243k
    if (_local_channel_dependency && exceeds_limit()) {
530
2.09k
        _local_channel_dependency->block();
531
2.09k
    }
532
243k
}
533
// Releases `size` bytes from both the receiver-wide and the per-queue MemTracker, then sets
// the local-channel dependency ready if this queue is back under its limit.
//
// @param size  Number of bytes removed; must be non-negative (DCHECK).
534
241k
void VDataStreamRecvr::SenderQueue::sub_blocks_memory_usage(int64_t size) {
535
241k
    DCHECK(size >= 0);
536
241k
    _recvr->_mem_tracker->release(size);
537
241k
    _queue_mem_tracker->release(size);
538
241k
    if (_local_channel_dependency && (!exceeds_limit())) {
539
241k
        _local_channel_dependency->set_ready();
540
241k
    }
541
241k
}
542
// Reports whether this queue's tracked bytes have reached the per-queue limit.
//
// @return The result of VDataStreamRecvr::queue_exceeds_limit() for the current consumption
//         of _queue_mem_tracker.
543
485k
bool VDataStreamRecvr::SenderQueue::exceeds_limit() {
544
485k
    const size_t queue_byte_size = _queue_mem_tracker->consumption();
545
485k
    return _recvr->queue_exceeds_limit(queue_byte_size);
546
485k
}
547
// Reports whether adding `block_byte_size` bytes would push the receiver-wide tracked memory
// strictly above config::exchg_node_buffer_size_bytes.
//
// @param block_byte_size  Size of the data about to be accounted for.
// @return true when consumption + block_byte_size is greater than the configured limit.
548
68.1k
bool VDataStreamRecvr::exceeds_limit(size_t block_byte_size) {
549
68.1k
    return _mem_tracker->consumption() + block_byte_size > config::exchg_node_buffer_size_bytes;
550
68.1k
}
551
// Reports whether a single queue's byte size has reached _sender_queue_mem_limit.
//
// @param queue_byte_size  Bytes currently tracked for the queue.
// @return true when queue_byte_size is greater than or equal to the limit. Note the inclusive
//         comparison, unlike the strict one in exceeds_limit(size_t).
552
485k
bool VDataStreamRecvr::queue_exceeds_limit(size_t queue_byte_size) const {
553
485k
    return queue_byte_size >= _sender_queue_mem_limit;
554
485k
}
555
// Closes the receiver. Repeated calls return immediately once _is_closed is set.
//
// Steps, in order: mark closed; set every local-channel dependency always-ready; close every
// sender queue; deregister from the stream manager (return value discarded) and null _mgr;
// release the merger.
// NOTE(review): _is_closed is checked and then set in two separate steps; its declared type
// is not visible here - confirm whether concurrent close() calls are possible.
556
878k
void VDataStreamRecvr::close() {
557
878k
    if (_is_closed) {
558
438k
        return;
559
438k
    }
560
439k
    _is_closed = true;
561
643k
    for (auto& it : _sender_to_local_channel_dependency) {
562
643k
        it->set_always_ready();
563
643k
    }
564
1.08M
    for (int i = 0; i < _sender_queues.size(); ++i) {
565
643k
        _sender_queues[i]->close();
566
643k
    }
567
    // Remove this receiver from the DataStreamMgr that created it.
568
    // TODO: log error msg
569
440k
    if (_mgr) {
570
440k
        static_cast<void>(_mgr->deregister_recvr(fragment_instance_id(), dest_node_id()));
571
440k
    }
572
439k
    _mgr = nullptr;
573
574
439k
    _merger.reset();
575
439k
}
576
// Calls set_always_ready() on every local-channel dependency of this receiver.
// NOTE(review): `auto dep` copies each shared_ptr per iteration; `const auto&`, as in the
// equivalent loop in close(), would avoid the reference-count updates.
577
429k
void VDataStreamRecvr::set_sink_dep_always_ready() const {
578
632k
    for (auto dep : _sender_to_local_channel_dependency) {
579
632k
        dep->set_always_ready();
580
632k
    }
581
429k
}
582
583
} // namespace doris