Coverage Report

Created: 2026-01-29 20:00

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/root/doris/be/src/vec/runtime/partitioner.h
Line
Count
Source
1
// Licensed to the Apache Software Foundation (ASF) under one
2
// or more contributor license agreements.  See the NOTICE file
3
// distributed with this work for additional information
4
// regarding copyright ownership.  The ASF licenses this file
5
// to you under the Apache License, Version 2.0 (the
6
// "License"); you may not use this file except in compliance
7
// with the License.  You may obtain a copy of the License at
8
//
9
//   http://www.apache.org/licenses/LICENSE-2.0
10
//
11
// Unless required by applicable law or agreed to in writing,
12
// software distributed under the License is distributed on an
13
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
// KIND, either express or implied.  See the License for the
15
// specific language governing permissions and limitations
16
// under the License.
17
18
#pragma once
19
20
#include <algorithm>
21
22
#include "vec/core/block.h"
23
#include "vec/exprs/vexpr.h"
24
#include "vec/exprs/vexpr_context.h"
25
26
namespace doris::vectorized {
27
#include "common/compile_check_begin.h"
28
29
class PartitionerBase {
30
public:
31
    using HashValType = uint32_t;
32
33
22
    PartitionerBase(HashValType partition_count) : _partition_count(partition_count) {}
34
22
    virtual ~PartitionerBase() = default;
35
36
    virtual Status init(const std::vector<TExpr>& texprs) = 0;
37
38
    virtual Status prepare(RuntimeState* state, const RowDescriptor& row_desc) = 0;
39
40
    virtual Status open(RuntimeState* state) = 0;
41
42
    virtual Status close(RuntimeState* state) = 0;
43
44
    virtual Status do_partitioning(RuntimeState* state, Block* block) const = 0;
45
46
    virtual const std::vector<HashValType>& get_channel_ids() const = 0;
47
48
    virtual Status clone(RuntimeState* state, std::unique_ptr<PartitionerBase>& partitioner) = 0;
49
50
    // use _partition_count as invalid sentinel value. since modulo operation result is [0, partition_count-1]
51
6
    HashValType partition_count() const { return _partition_count; }
52
    // use a individual function to highlight its special meaning
53
4
    HashValType invalid_sentinel() const { return partition_count(); }
54
55
protected:
56
    const HashValType _partition_count;
57
};
58
59
template <typename ChannelIds>
60
class Crc32HashPartitioner : public PartitionerBase {
61
public:
62
19
    Crc32HashPartitioner(int partition_count) : PartitionerBase(partition_count) {}
_ZN5doris10vectorized20Crc32HashPartitionerINS0_17ShuffleChannelIdsEEC2Ei
Line
Count
Source
62
5
    Crc32HashPartitioner(int partition_count) : PartitionerBase(partition_count) {}
_ZN5doris10vectorized20Crc32HashPartitionerINS0_24SpillPartitionChannelIdsEEC2Ei
Line
Count
Source
62
14
    Crc32HashPartitioner(int partition_count) : PartitionerBase(partition_count) {}
Unexecuted instantiation: _ZN5doris10vectorized20Crc32HashPartitionerINS0_15ShiftChannelIdsEEC2Ei
63
19
    ~Crc32HashPartitioner() override = default;
_ZN5doris10vectorized20Crc32HashPartitionerINS0_17ShuffleChannelIdsEED2Ev
Line
Count
Source
63
5
    ~Crc32HashPartitioner() override = default;
_ZN5doris10vectorized20Crc32HashPartitionerINS0_24SpillPartitionChannelIdsEED2Ev
Line
Count
Source
63
14
    ~Crc32HashPartitioner() override = default;
Unexecuted instantiation: _ZN5doris10vectorized20Crc32HashPartitionerINS0_15ShiftChannelIdsEED2Ev
64
65
11
    Status init(const std::vector<TExpr>& texprs) override {
66
11
        return VExpr::create_expr_trees(texprs, _partition_expr_ctxs);
67
11
    }
Unexecuted instantiation: _ZN5doris10vectorized20Crc32HashPartitionerINS0_15ShiftChannelIdsEE4initERKSt6vectorINS_5TExprESaIS5_EE
Unexecuted instantiation: _ZN5doris10vectorized20Crc32HashPartitionerINS0_17ShuffleChannelIdsEE4initERKSt6vectorINS_5TExprESaIS5_EE
_ZN5doris10vectorized20Crc32HashPartitionerINS0_24SpillPartitionChannelIdsEE4initERKSt6vectorINS_5TExprESaIS5_EE
Line
Count
Source
65
11
    Status init(const std::vector<TExpr>& texprs) override {
66
11
        return VExpr::create_expr_trees(texprs, _partition_expr_ctxs);
67
11
    }
68
69
9
    Status prepare(RuntimeState* state, const RowDescriptor& row_desc) override {
70
9
        return VExpr::prepare(_partition_expr_ctxs, state, row_desc);
71
9
    }
Unexecuted instantiation: _ZN5doris10vectorized20Crc32HashPartitionerINS0_15ShiftChannelIdsEE7prepareEPNS_12RuntimeStateERKNS_13RowDescriptorE
Unexecuted instantiation: _ZN5doris10vectorized20Crc32HashPartitionerINS0_17ShuffleChannelIdsEE7prepareEPNS_12RuntimeStateERKNS_13RowDescriptorE
_ZN5doris10vectorized20Crc32HashPartitionerINS0_24SpillPartitionChannelIdsEE7prepareEPNS_12RuntimeStateERKNS_13RowDescriptorE
Line
Count
Source
69
9
    Status prepare(RuntimeState* state, const RowDescriptor& row_desc) override {
70
9
        return VExpr::prepare(_partition_expr_ctxs, state, row_desc);
71
9
    }
72
73
4
    Status open(RuntimeState* state) override { return VExpr::open(_partition_expr_ctxs, state); }
Unexecuted instantiation: _ZN5doris10vectorized20Crc32HashPartitionerINS0_15ShiftChannelIdsEE4openEPNS_12RuntimeStateE
Unexecuted instantiation: _ZN5doris10vectorized20Crc32HashPartitionerINS0_17ShuffleChannelIdsEE4openEPNS_12RuntimeStateE
_ZN5doris10vectorized20Crc32HashPartitionerINS0_24SpillPartitionChannelIdsEE4openEPNS_12RuntimeStateE
Line
Count
Source
73
4
    Status open(RuntimeState* state) override { return VExpr::open(_partition_expr_ctxs, state); }
74
75
0
    Status close(RuntimeState* state) override { return Status::OK(); }
Unexecuted instantiation: _ZN5doris10vectorized20Crc32HashPartitionerINS0_15ShiftChannelIdsEE5closeEPNS_12RuntimeStateE
Unexecuted instantiation: _ZN5doris10vectorized20Crc32HashPartitionerINS0_17ShuffleChannelIdsEE5closeEPNS_12RuntimeStateE
Unexecuted instantiation: _ZN5doris10vectorized20Crc32HashPartitionerINS0_24SpillPartitionChannelIdsEE5closeEPNS_12RuntimeStateE
76
77
    Status do_partitioning(RuntimeState* state, Block* block) const override;
78
79
27
    const std::vector<HashValType>& get_channel_ids() const override { return _hash_vals; }
Unexecuted instantiation: _ZNK5doris10vectorized20Crc32HashPartitionerINS0_15ShiftChannelIdsEE15get_channel_idsEv
_ZNK5doris10vectorized20Crc32HashPartitionerINS0_17ShuffleChannelIdsEE15get_channel_idsEv
Line
Count
Source
79
21
    const std::vector<HashValType>& get_channel_ids() const override { return _hash_vals; }
_ZNK5doris10vectorized20Crc32HashPartitionerINS0_24SpillPartitionChannelIdsEE15get_channel_idsEv
Line
Count
Source
79
6
    const std::vector<HashValType>& get_channel_ids() const override { return _hash_vals; }
80
81
    Status clone(RuntimeState* state, std::unique_ptr<PartitionerBase>& partitioner) override;
82
83
protected:
84
27
    Status _get_partition_column_result(Block* block, std::vector<int>& result) const {
85
27
        int counter = 0;
86
27
        for (auto ctx : _partition_expr_ctxs) {
87
27
            RETURN_IF_ERROR(ctx->execute(block, &result[counter++]));
88
27
        }
89
27
        return Status::OK();
90
27
    }
_ZNK5doris10vectorized20Crc32HashPartitionerINS0_17ShuffleChannelIdsEE28_get_partition_column_resultEPNS0_5BlockERSt6vectorIiSaIiEE
Line
Count
Source
84
21
    Status _get_partition_column_result(Block* block, std::vector<int>& result) const {
85
21
        int counter = 0;
86
21
        for (auto ctx : _partition_expr_ctxs) {
87
21
            RETURN_IF_ERROR(ctx->execute(block, &result[counter++]));
88
21
        }
89
21
        return Status::OK();
90
21
    }
_ZNK5doris10vectorized20Crc32HashPartitionerINS0_24SpillPartitionChannelIdsEE28_get_partition_column_resultEPNS0_5BlockERSt6vectorIiSaIiEE
Line
Count
Source
84
6
    Status _get_partition_column_result(Block* block, std::vector<int>& result) const {
85
6
        int counter = 0;
86
6
        for (auto ctx : _partition_expr_ctxs) {
87
6
            RETURN_IF_ERROR(ctx->execute(block, &result[counter++]));
88
6
        }
89
6
        return Status::OK();
90
6
    }
Unexecuted instantiation: _ZNK5doris10vectorized20Crc32HashPartitionerINS0_15ShiftChannelIdsEE28_get_partition_column_resultEPNS0_5BlockERSt6vectorIiSaIiEE
91
92
3
    Status _clone_expr_ctxs(RuntimeState* state, VExprContextSPtrs& new_partition_expr_ctxs) const {
93
3
        new_partition_expr_ctxs.resize(_partition_expr_ctxs.size());
94
6
        for (size_t i = 0; i < _partition_expr_ctxs.size(); i++) {
95
3
            RETURN_IF_ERROR(_partition_expr_ctxs[i]->clone(state, new_partition_expr_ctxs[i]));
96
3
        }
97
3
        return Status::OK();
98
3
    }
Unexecuted instantiation: _ZNK5doris10vectorized20Crc32HashPartitionerINS0_17ShuffleChannelIdsEE16_clone_expr_ctxsEPNS_12RuntimeStateERSt6vectorISt10shared_ptrINS0_12VExprContextEESaIS9_EE
_ZNK5doris10vectorized20Crc32HashPartitionerINS0_24SpillPartitionChannelIdsEE16_clone_expr_ctxsEPNS_12RuntimeStateERSt6vectorISt10shared_ptrINS0_12VExprContextEESaIS9_EE
Line
Count
Source
92
3
    Status _clone_expr_ctxs(RuntimeState* state, VExprContextSPtrs& new_partition_expr_ctxs) const {
93
3
        new_partition_expr_ctxs.resize(_partition_expr_ctxs.size());
94
6
        for (size_t i = 0; i < _partition_expr_ctxs.size(); i++) {
95
3
            RETURN_IF_ERROR(_partition_expr_ctxs[i]->clone(state, new_partition_expr_ctxs[i]));
96
3
        }
97
3
        return Status::OK();
98
3
    }
Unexecuted instantiation: _ZNK5doris10vectorized20Crc32HashPartitionerINS0_15ShiftChannelIdsEE16_clone_expr_ctxsEPNS_12RuntimeStateERSt6vectorISt10shared_ptrINS0_12VExprContextEESaIS9_EE
99
100
    virtual void _do_hash(const ColumnPtr& column, HashValType* __restrict result, int idx) const;
101
27
    virtual void _initialize_hash_vals(size_t rows) const {
102
27
        _hash_vals.resize(rows);
103
27
        std::ranges::fill(_hash_vals, 0);
104
27
    }
Unexecuted instantiation: _ZNK5doris10vectorized20Crc32HashPartitionerINS0_15ShiftChannelIdsEE21_initialize_hash_valsEm
_ZNK5doris10vectorized20Crc32HashPartitionerINS0_17ShuffleChannelIdsEE21_initialize_hash_valsEm
Line
Count
Source
101
21
    virtual void _initialize_hash_vals(size_t rows) const {
102
21
        _hash_vals.resize(rows);
103
21
        std::ranges::fill(_hash_vals, 0);
104
21
    }
_ZNK5doris10vectorized20Crc32HashPartitionerINS0_24SpillPartitionChannelIdsEE21_initialize_hash_valsEm
Line
Count
Source
101
6
    virtual void _initialize_hash_vals(size_t rows) const {
102
6
        _hash_vals.resize(rows);
103
6
        std::ranges::fill(_hash_vals, 0);
104
6
    }
105
106
    VExprContextSPtrs _partition_expr_ctxs;
107
    mutable std::vector<HashValType> _hash_vals;
108
};
109
110
struct ShuffleChannelIds {
111
    using HashValType = PartitionerBase::HashValType;
112
210
    HashValType operator()(HashValType l, size_t r) { return l % r; }
113
};
114
115
struct SpillPartitionChannelIds {
116
    using HashValType = PartitionerBase::HashValType;
117
3.14M
    HashValType operator()(HashValType l, size_t r) { return ((l >> 16) | (l << 16)) % r; }
118
};
119
120
0
static inline PartitionerBase::HashValType crc32c_shuffle_mix(PartitionerBase::HashValType h) {
121
    // Step 1: fold high entropy into low bits
122
0
    h ^= h >> 16;
123
    // Step 2: odd multiplicative scramble (cheap avalanche)
124
0
    h *= 0xA5B35705U;
125
    // Step 3: final fold to break remaining linearity
126
0
    h ^= h >> 13;
127
0
    return h;
128
0
}
Unexecuted instantiation: wal_manager_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: multi_cast_data_streamer_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: vdata_stream_recvr_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: local_exchanger_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: agg_operator_group_by_limit_opt_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: agg_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: analytic_sink_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: assert_nums_rows_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: datagen_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: distinct_streaming_aggregation_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: empty_set_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: exchange_sink_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: exchange_source_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: hash_join_test_helper.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: hashjoin_build_sink_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: hashjoin_probe_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: join_test_helper.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: local_merge_sort_source_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: materialization_shared_state_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: partition_sort_sink_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: partitioned_aggregation_sink_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: partitioned_aggregation_source_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: partitioned_aggregation_test_helper.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: partitioned_hash_join_probe_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: partitioned_hash_join_sink_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: partitioned_hash_join_test_helper.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: query_cache_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: repeat_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: scan_normalize_predicate_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: set_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: sort_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: spill_sort_sink_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: spill_sort_source_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: spill_sort_test_helper.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: spillable_operator_test_helper.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: streaming_agg_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: table_function_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: union_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: pipeline_task_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: pipeline_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: exchange_writer_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: memory_reclamation_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: workload_sched_policy_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: runtime_filter_consumer_helper_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: runtime_filter_consumer_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: runtime_filter_merger_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: runtime_filter_mgr_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: runtime_filter_producer_helper_cross_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: runtime_filter_producer_helper_set_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: runtime_filter_producer_helper_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: runtime_filter_producer_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: scanner_context_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: profile_spec_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: exchange_sink_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: parquet_read_lines.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: orc_convert_to_orc_literal_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: orc_read_lines.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: scan_operator_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: vfile_scanner_exception_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: tablet_sink_hash_partitioner_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: vrow_distribution_test.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: exec_env_init.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: fragment_mgr.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: query_context.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: runtime_state.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: workload_group.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: workload_group_manager.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: query_task_controller.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: runtime_filter_producer_helper.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: rowid_fetcher.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: pipeline_task_action.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: vparquet_reader.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: file_scanner.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: olap_scanner.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: scanner.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: scanner_context.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: scanner_scheduler.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: vectorized_fn_call.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: vexpr.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: partitioner.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: vdata_stream_recvr.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: tablet_sink_hash_partitioner.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: vdata_stream_sender.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: dependency.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: aggregation_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: aggregation_source_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: analytic_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: analytic_source_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: assert_num_rows_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: cache_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: cache_source_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: datagen_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: distinct_streaming_aggregation_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: empty_set_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: exchange_sink_buffer.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: exchange_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: exchange_source_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: file_scan_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: hashjoin_build_sink.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: hashjoin_probe_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: full_outer_join_impl.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: inner_join_impl.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: left_anti_join_impl.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: left_outer_join_impl.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: left_semi_join_impl.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: null_aware_left_anti_join_impl.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: null_aware_left_semi_join_impl.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: right_anti_join_impl.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: right_outer_join_impl.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: right_semi_join_impl.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: join_build_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: join_probe_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: local_merge_sort_source_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: materialization_opertor.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: multi_cast_data_streamer.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: nested_loop_join_build_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: nested_loop_join_probe_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: olap_scan_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: parallel_scanner_builder.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: memory_scratch_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: hive_table_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: iceberg_table_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: blackhole_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: multi_cast_data_stream_sink.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: group_commit_block_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: dict_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: group_commit_scan_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: jdbc_scan_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: jdbc_scanner.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: es_scan_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: es_scanner.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: multi_cast_data_stream_source.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: meta_scan_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: vfile_result_writer.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: jdbc_table_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: partition_sort_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: partition_sort_source_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: partitioned_aggregation_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: partitioned_aggregation_source_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: partitioned_hash_join_probe_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: partitioned_hash_join_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: rec_cte_anchor_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: rec_cte_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: rec_cte_source_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: repeat_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: result_file_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: result_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: scan_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: schema_scan_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: set_probe_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: set_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: set_source_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: sort_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: sort_source_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: spill_sort_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: spill_sort_source_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: streaming_aggregation_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: table_function_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: union_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: union_source_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: local_exchange_sink_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: local_exchange_source_operator.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: local_exchanger.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: pipeline.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: pipeline_fragment_context.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: pipeline_task.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: exchange_writer.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: task_queue.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
Unexecuted instantiation: task_scheduler.cpp:_ZN5doris10vectorizedL18crc32c_shuffle_mixEj
129
130
// use high 16 bits as channel id to avoid conflict with crc32c hash table
131
// shuffle hash function same with crc32c hash table(eg join hash table) will lead bad performance
132
// hash table offten use low 16 bits as bucket index, so we shift 16 bits to high bits to avoid conflict
133
struct ShiftChannelIds {
134
    using HashValType = PartitionerBase::HashValType;
135
0
    HashValType operator()(HashValType l, size_t r) { return crc32c_shuffle_mix(l) % r; }
136
};
137
138
class Crc32CHashPartitioner : public Crc32HashPartitioner<ShiftChannelIds> {
139
public:
140
    Crc32CHashPartitioner(int partition_count)
141
0
            : Crc32HashPartitioner<ShiftChannelIds>(partition_count) {}
142
143
    Status clone(RuntimeState* state, std::unique_ptr<PartitionerBase>& partitioner) override;
144
145
private:
146
    void _do_hash(const ColumnPtr& column, HashValType* __restrict result, int idx) const override;
147
148
0
    void _initialize_hash_vals(size_t rows) const override {
149
0
        _hash_vals.resize(rows);
150
        // use golden ratio to initialize hash values to avoid collision with hash table's hash function
151
0
        constexpr HashValType CRC32C_SHUFFLE_SEED = 0x9E3779B9U;
152
0
        std::ranges::fill(_hash_vals, CRC32C_SHUFFLE_SEED);
153
0
    }
154
};
155
156
#include "common/compile_check_end.h"
157
} // namespace doris::vectorized