Coverage Report

Created: 2025-11-14 17:29

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/root/doris/be/src/util/counts.h
Line
Count
Source
1
// Licensed to the Apache Software Foundation (ASF) under one
2
// or more contributor license agreements.  See the NOTICE file
3
// distributed with this work for additional information
4
// regarding copyright ownership.  The ASF licenses this file
5
// to you under the Apache License, Version 2.0 (the
6
// "License"); you may not use this file except in compliance
7
// with the License.  You may obtain a copy of the License at
8
//
9
//   http://www.apache.org/licenses/LICENSE-2.0
10
//
11
// Unless required by applicable law or agreed to in writing,
12
// software distributed under the License is distributed on an
13
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
// KIND, either express or implied.  See the License for the
15
// specific language governing permissions and limitations
16
// under the License.
17
18
#pragma once
19
20
#include <pdqsort.h>
21
22
#include <algorithm>
23
#include <cmath>
24
#include <queue>
25
26
#include "udf/udf.h"
27
#include "vec/common/pod_array.h"
28
#include "vec/common/string_buffer.hpp"
29
#include "vec/io/io_helper.h"
30
31
namespace doris {
32
33
template <typename Ty>
34
class Counts {
35
public:
36
3.65k
    Counts() = default;
_ZN5doris6CountsIaEC2Ev
Line
Count
Source
36
43
    Counts() = default;
_ZN5doris6CountsIsEC2Ev
Line
Count
Source
36
213
    Counts() = default;
_ZN5doris6CountsIiEC2Ev
Line
Count
Source
36
2.23k
    Counts() = default;
_ZN5doris6CountsIlEC2Ev
Line
Count
Source
36
837
    Counts() = default;
_ZN5doris6CountsInEC2Ev
Line
Count
Source
36
39
    Counts() = default;
_ZN5doris6CountsIfEC2Ev
Line
Count
Source
36
9
    Counts() = default;
_ZN5doris6CountsIdEC2Ev
Line
Count
Source
36
284
    Counts() = default;
37
38
1.31k
    void merge(Counts* other) {
39
1.31k
        if (other != nullptr && !other->_nums.empty()) {
40
1.31k
            _sorted_nums_vec.emplace_back(std::move(other->_nums));
41
1.31k
        }
42
1.31k
    }
_ZN5doris6CountsIaE5mergeEPS1_
Line
Count
Source
38
3
    void merge(Counts* other) {
39
3
        if (other != nullptr && !other->_nums.empty()) {
40
3
            _sorted_nums_vec.emplace_back(std::move(other->_nums));
41
3
        }
42
3
    }
_ZN5doris6CountsIsE5mergeEPS1_
Line
Count
Source
38
15
    void merge(Counts* other) {
39
15
        if (other != nullptr && !other->_nums.empty()) {
40
15
            _sorted_nums_vec.emplace_back(std::move(other->_nums));
41
15
        }
42
15
    }
_ZN5doris6CountsIiE5mergeEPS1_
Line
Count
Source
38
835
    void merge(Counts* other) {
39
835
        if (other != nullptr && !other->_nums.empty()) {
40
835
            _sorted_nums_vec.emplace_back(std::move(other->_nums));
41
835
        }
42
835
    }
_ZN5doris6CountsIlE5mergeEPS1_
Line
Count
Source
38
351
    void merge(Counts* other) {
39
351
        if (other != nullptr && !other->_nums.empty()) {
40
351
            _sorted_nums_vec.emplace_back(std::move(other->_nums));
41
351
        }
42
351
    }
_ZN5doris6CountsInE5mergeEPS1_
Line
Count
Source
38
3
    void merge(Counts* other) {
39
3
        if (other != nullptr && !other->_nums.empty()) {
40
3
            _sorted_nums_vec.emplace_back(std::move(other->_nums));
41
3
        }
42
3
    }
_ZN5doris6CountsIfE5mergeEPS1_
Line
Count
Source
38
3
    void merge(Counts* other) {
39
3
        if (other != nullptr && !other->_nums.empty()) {
40
3
            _sorted_nums_vec.emplace_back(std::move(other->_nums));
41
3
        }
42
3
    }
_ZN5doris6CountsIdE5mergeEPS1_
Line
Count
Source
38
101
    void merge(Counts* other) {
39
101
        if (other != nullptr && !other->_nums.empty()) {
40
101
            _sorted_nums_vec.emplace_back(std::move(other->_nums));
41
101
        }
42
101
    }
43
44
    void increment(Ty key, uint32_t i) {
45
        auto old_size = _nums.size();
46
        _nums.resize(_nums.size() + i);
47
        for (uint32_t j = 0; j < i; ++j) {
48
            _nums[old_size + j] = key;
49
        }
50
    }
51
52
2.93k
    void increment(Ty key) { _nums.push_back(key); }
_ZN5doris6CountsIaE9incrementEa
Line
Count
Source
52
73
    void increment(Ty key) { _nums.push_back(key); }
_ZN5doris6CountsIsE9incrementEs
Line
Count
Source
52
552
    void increment(Ty key) { _nums.push_back(key); }
_ZN5doris6CountsIiE9incrementEi
Line
Count
Source
52
1.59k
    void increment(Ty key) { _nums.push_back(key); }
_ZN5doris6CountsIlE9incrementEl
Line
Count
Source
52
401
    void increment(Ty key) { _nums.push_back(key); }
_ZN5doris6CountsInE9incrementEn
Line
Count
Source
52
45
    void increment(Ty key) { _nums.push_back(key); }
_ZN5doris6CountsIfE9incrementEf
Line
Count
Source
52
9
    void increment(Ty key) { _nums.push_back(key); }
_ZN5doris6CountsIdE9incrementEd
Line
Count
Source
52
259
    void increment(Ty key) { _nums.push_back(key); }
53
54
5
    void increment_batch(const vectorized::PaddedPODArray<Ty>& keys) {
55
5
        _nums.insert(keys.begin(), keys.end());
56
5
    }
Unexecuted instantiation: _ZN5doris6CountsIaE15increment_batchERKNS_10vectorized8PODArrayIaLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEE
Unexecuted instantiation: _ZN5doris6CountsIsE15increment_batchERKNS_10vectorized8PODArrayIsLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEE
Unexecuted instantiation: _ZN5doris6CountsIiE15increment_batchERKNS_10vectorized8PODArrayIiLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEE
_ZN5doris6CountsIlE15increment_batchERKNS_10vectorized8PODArrayIlLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEE
Line
Count
Source
54
5
    void increment_batch(const vectorized::PaddedPODArray<Ty>& keys) {
55
5
        _nums.insert(keys.begin(), keys.end());
56
5
    }
Unexecuted instantiation: _ZN5doris6CountsInE15increment_batchERKNS_10vectorized8PODArrayInLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEE
Unexecuted instantiation: _ZN5doris6CountsIfE15increment_batchERKNS_10vectorized8PODArrayIfLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEE
Unexecuted instantiation: _ZN5doris6CountsIdE15increment_batchERKNS_10vectorized8PODArrayIdLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEE
57
58
1.71k
    void serialize(vectorized::BufferWritable& buf) {
59
1.71k
        if (!_nums.empty()) {
60
1.42k
            pdqsort(_nums.begin(), _nums.end());
61
1.42k
            size_t size = _nums.size();
62
1.42k
            buf.write_binary(size);
63
1.42k
            buf.write(reinterpret_cast<const char*>(_nums.data()), sizeof(Ty) * size);
64
1.42k
        } else {
65
            // convert _sorted_nums_vec to _nums and do seiralize again
66
288
            _convert_sorted_num_vec_to_nums();
67
288
            serialize(buf);
68
288
        }
69
1.71k
    }
_ZN5doris6CountsIaE9serializeERNS_10vectorized14BufferWritableE
Line
Count
Source
58
3
    void serialize(vectorized::BufferWritable& buf) {
59
3
        if (!_nums.empty()) {
60
3
            pdqsort(_nums.begin(), _nums.end());
61
3
            size_t size = _nums.size();
62
3
            buf.write_binary(size);
63
3
            buf.write(reinterpret_cast<const char*>(_nums.data()), sizeof(Ty) * size);
64
3
        } else {
65
            // convert _sorted_nums_vec to _nums and do seiralize again
66
0
            _convert_sorted_num_vec_to_nums();
67
0
            serialize(buf);
68
0
        }
69
3
    }
_ZN5doris6CountsIsE9serializeERNS_10vectorized14BufferWritableE
Line
Count
Source
58
15
    void serialize(vectorized::BufferWritable& buf) {
59
15
        if (!_nums.empty()) {
60
15
            pdqsort(_nums.begin(), _nums.end());
61
15
            size_t size = _nums.size();
62
15
            buf.write_binary(size);
63
15
            buf.write(reinterpret_cast<const char*>(_nums.data()), sizeof(Ty) * size);
64
15
        } else {
65
            // convert _sorted_nums_vec to _nums and do seiralize again
66
0
            _convert_sorted_num_vec_to_nums();
67
0
            serialize(buf);
68
0
        }
69
15
    }
_ZN5doris6CountsIiE9serializeERNS_10vectorized14BufferWritableE
Line
Count
Source
58
1.10k
    void serialize(vectorized::BufferWritable& buf) {
59
1.10k
        if (!_nums.empty()) {
60
952
            pdqsort(_nums.begin(), _nums.end());
61
952
            size_t size = _nums.size();
62
952
            buf.write_binary(size);
63
952
            buf.write(reinterpret_cast<const char*>(_nums.data()), sizeof(Ty) * size);
64
952
        } else {
65
            // convert _sorted_nums_vec to _nums and do seiralize again
66
156
            _convert_sorted_num_vec_to_nums();
67
156
            serialize(buf);
68
156
        }
69
1.10k
    }
_ZN5doris6CountsIlE9serializeERNS_10vectorized14BufferWritableE
Line
Count
Source
58
483
    void serialize(vectorized::BufferWritable& buf) {
59
483
        if (!_nums.empty()) {
60
351
            pdqsort(_nums.begin(), _nums.end());
61
351
            size_t size = _nums.size();
62
351
            buf.write_binary(size);
63
351
            buf.write(reinterpret_cast<const char*>(_nums.data()), sizeof(Ty) * size);
64
351
        } else {
65
            // convert _sorted_nums_vec to _nums and do seiralize again
66
132
            _convert_sorted_num_vec_to_nums();
67
132
            serialize(buf);
68
132
        }
69
483
    }
_ZN5doris6CountsInE9serializeERNS_10vectorized14BufferWritableE
Line
Count
Source
58
3
    void serialize(vectorized::BufferWritable& buf) {
59
3
        if (!_nums.empty()) {
60
3
            pdqsort(_nums.begin(), _nums.end());
61
3
            size_t size = _nums.size();
62
3
            buf.write_binary(size);
63
3
            buf.write(reinterpret_cast<const char*>(_nums.data()), sizeof(Ty) * size);
64
3
        } else {
65
            // convert _sorted_nums_vec to _nums and do seiralize again
66
0
            _convert_sorted_num_vec_to_nums();
67
0
            serialize(buf);
68
0
        }
69
3
    }
_ZN5doris6CountsIfE9serializeERNS_10vectorized14BufferWritableE
Line
Count
Source
58
3
    void serialize(vectorized::BufferWritable& buf) {
59
3
        if (!_nums.empty()) {
60
3
            pdqsort(_nums.begin(), _nums.end());
61
3
            size_t size = _nums.size();
62
3
            buf.write_binary(size);
63
3
            buf.write(reinterpret_cast<const char*>(_nums.data()), sizeof(Ty) * size);
64
3
        } else {
65
            // convert _sorted_nums_vec to _nums and do seiralize again
66
0
            _convert_sorted_num_vec_to_nums();
67
0
            serialize(buf);
68
0
        }
69
3
    }
_ZN5doris6CountsIdE9serializeERNS_10vectorized14BufferWritableE
Line
Count
Source
58
101
    void serialize(vectorized::BufferWritable& buf) {
59
101
        if (!_nums.empty()) {
60
101
            pdqsort(_nums.begin(), _nums.end());
61
101
            size_t size = _nums.size();
62
101
            buf.write_binary(size);
63
101
            buf.write(reinterpret_cast<const char*>(_nums.data()), sizeof(Ty) * size);
64
101
        } else {
65
            // convert _sorted_nums_vec to _nums and do seiralize again
66
0
            _convert_sorted_num_vec_to_nums();
67
0
            serialize(buf);
68
0
        }
69
101
    }
70
71
1.31k
    void unserialize(vectorized::BufferReadable& buf) {
72
1.31k
        size_t size;
73
1.31k
        buf.read_binary(size);
74
1.31k
        _nums.resize(size);
75
1.31k
        auto buff = buf.read(sizeof(Ty) * size);
76
1.31k
        memcpy(_nums.data(), buff.data, buff.size);
77
1.31k
    }
_ZN5doris6CountsIaE11unserializeERNS_10vectorized14BufferReadableE
Line
Count
Source
71
3
    void unserialize(vectorized::BufferReadable& buf) {
72
3
        size_t size;
73
3
        buf.read_binary(size);
74
3
        _nums.resize(size);
75
3
        auto buff = buf.read(sizeof(Ty) * size);
76
3
        memcpy(_nums.data(), buff.data, buff.size);
77
3
    }
_ZN5doris6CountsIsE11unserializeERNS_10vectorized14BufferReadableE
Line
Count
Source
71
15
    void unserialize(vectorized::BufferReadable& buf) {
72
15
        size_t size;
73
15
        buf.read_binary(size);
74
15
        _nums.resize(size);
75
15
        auto buff = buf.read(sizeof(Ty) * size);
76
15
        memcpy(_nums.data(), buff.data, buff.size);
77
15
    }
_ZN5doris6CountsIiE11unserializeERNS_10vectorized14BufferReadableE
Line
Count
Source
71
835
    void unserialize(vectorized::BufferReadable& buf) {
72
835
        size_t size;
73
835
        buf.read_binary(size);
74
835
        _nums.resize(size);
75
835
        auto buff = buf.read(sizeof(Ty) * size);
76
835
        memcpy(_nums.data(), buff.data, buff.size);
77
835
    }
_ZN5doris6CountsIlE11unserializeERNS_10vectorized14BufferReadableE
Line
Count
Source
71
351
    void unserialize(vectorized::BufferReadable& buf) {
72
351
        size_t size;
73
351
        buf.read_binary(size);
74
351
        _nums.resize(size);
75
351
        auto buff = buf.read(sizeof(Ty) * size);
76
351
        memcpy(_nums.data(), buff.data, buff.size);
77
351
    }
_ZN5doris6CountsInE11unserializeERNS_10vectorized14BufferReadableE
Line
Count
Source
71
3
    void unserialize(vectorized::BufferReadable& buf) {
72
3
        size_t size;
73
3
        buf.read_binary(size);
74
3
        _nums.resize(size);
75
3
        auto buff = buf.read(sizeof(Ty) * size);
76
3
        memcpy(_nums.data(), buff.data, buff.size);
77
3
    }
_ZN5doris6CountsIfE11unserializeERNS_10vectorized14BufferReadableE
Line
Count
Source
71
3
    void unserialize(vectorized::BufferReadable& buf) {
72
3
        size_t size;
73
3
        buf.read_binary(size);
74
3
        _nums.resize(size);
75
3
        auto buff = buf.read(sizeof(Ty) * size);
76
3
        memcpy(_nums.data(), buff.data, buff.size);
77
3
    }
_ZN5doris6CountsIdE11unserializeERNS_10vectorized14BufferReadableE
Line
Count
Source
71
101
    void unserialize(vectorized::BufferReadable& buf) {
72
101
        size_t size;
73
101
        buf.read_binary(size);
74
101
        _nums.resize(size);
75
101
        auto buff = buf.read(sizeof(Ty) * size);
76
101
        memcpy(_nums.data(), buff.data, buff.size);
77
101
    }
78
79
1.10k
    double terminate(double quantile) {
80
1.10k
        if (_sorted_nums_vec.size() <= 1) {
81
959
            if (_sorted_nums_vec.size() == 1) {
82
306
                _nums = std::move(_sorted_nums_vec[0]);
83
306
            }
84
85
959
            if (_nums.empty()) {
86
                // Although set null here, but the value is 0.0 and the call method just
87
                // get val in aggregate_function_percentile_approx.h
88
0
                return 0.0;
89
0
            }
90
91
959
            if (UNLIKELY(!std::is_sorted(_nums.begin(), _nums.end()))) {
92
180
                pdqsort(_nums.begin(), _nums.end());
93
180
            }
94
95
959
            if (quantile == 1 || _nums.size() == 1) {
96
473
                return _nums.back();
97
473
            }
98
99
486
            double u = (_nums.size() - 1) * quantile;
100
486
            auto index = static_cast<uint32_t>(u);
101
486
            return _nums[index] +
102
486
                   (u - static_cast<double>(index)) * (static_cast<double>(_nums[index + 1]) -
103
486
                                                       static_cast<double>(_nums[index]));
104
959
        } else {
105
146
            DCHECK(_nums.empty());
106
146
            size_t rows = 0;
107
419
            for (const auto& i : _sorted_nums_vec) {
108
419
                rows += i.size();
109
419
            }
110
146
            const bool reverse = quantile > 0.5 && rows > 2;
111
146
            double u = (rows - 1) * quantile;
112
146
            auto index = static_cast<uint32_t>(u);
113
            // if reverse, the step of target should start 0 like not reverse
114
            // so here rows need to minus index + 2
115
            // eg: rows = 10, index = 5
116
            // if not reverse, so the first number loc is 5, the second number loc is 6
117
            // if reverse, so the second number is 3, the first number is 4
118
            // 5 + 4 = 3 + 6 = 9 = rows - 1.
119
            // the rows must GE 2 beacuse `_sorted_nums_vec` size GE 2
120
146
            size_t target = reverse ? rows - index - 2 : index;
121
146
            if (quantile == 1) {
122
0
                target = 0;
123
0
            }
124
146
            auto [first_number, second_number] = _merge_sort_and_get_numbers(target, reverse);
125
146
            if (quantile == 1) {
126
0
                return second_number;
127
0
            }
128
146
            return first_number +
129
146
                   (u - static_cast<double>(index)) *
130
146
                           (static_cast<double>(second_number) - static_cast<double>(first_number));
131
146
        }
132
1.10k
    }
_ZN5doris6CountsIaE9terminateEd
Line
Count
Source
79
61
    double terminate(double quantile) {
80
61
        if (_sorted_nums_vec.size() <= 1) {
81
61
            if (_sorted_nums_vec.size() == 1) {
82
3
                _nums = std::move(_sorted_nums_vec[0]);
83
3
            }
84
85
61
            if (_nums.empty()) {
86
                // Although set null here, but the value is 0.0 and the call method just
87
                // get val in aggregate_function_percentile_approx.h
88
0
                return 0.0;
89
0
            }
90
91
61
            if (UNLIKELY(!std::is_sorted(_nums.begin(), _nums.end()))) {
92
24
                pdqsort(_nums.begin(), _nums.end());
93
24
            }
94
95
61
            if (quantile == 1 || _nums.size() == 1) {
96
34
                return _nums.back();
97
34
            }
98
99
27
            double u = (_nums.size() - 1) * quantile;
100
27
            auto index = static_cast<uint32_t>(u);
101
27
            return _nums[index] +
102
27
                   (u - static_cast<double>(index)) * (static_cast<double>(_nums[index + 1]) -
103
27
                                                       static_cast<double>(_nums[index]));
104
61
        } else {
105
0
            DCHECK(_nums.empty());
106
0
            size_t rows = 0;
107
0
            for (const auto& i : _sorted_nums_vec) {
108
0
                rows += i.size();
109
0
            }
110
0
            const bool reverse = quantile > 0.5 && rows > 2;
111
0
            double u = (rows - 1) * quantile;
112
0
            auto index = static_cast<uint32_t>(u);
113
            // if reverse, the step of target should start 0 like not reverse
114
            // so here rows need to minus index + 2
115
            // eg: rows = 10, index = 5
116
            // if not reverse, so the first number loc is 5, the second number loc is 6
117
            // if reverse, so the second number is 3, the first number is 4
118
            // 5 + 4 = 3 + 6 = 9 = rows - 1.
119
            // the rows must GE 2 beacuse `_sorted_nums_vec` size GE 2
120
0
            size_t target = reverse ? rows - index - 2 : index;
121
0
            if (quantile == 1) {
122
0
                target = 0;
123
0
            }
124
0
            auto [first_number, second_number] = _merge_sort_and_get_numbers(target, reverse);
125
0
            if (quantile == 1) {
126
0
                return second_number;
127
0
            }
128
0
            return first_number +
129
0
                   (u - static_cast<double>(index)) *
130
0
                           (static_cast<double>(second_number) - static_cast<double>(first_number));
131
0
        }
132
61
    }
_ZN5doris6CountsIsE9terminateEd
Line
Count
Source
79
300
    double terminate(double quantile) {
80
300
        if (_sorted_nums_vec.size() <= 1) {
81
297
            if (_sorted_nums_vec.size() == 1) {
82
3
                _nums = std::move(_sorted_nums_vec[0]);
83
3
            }
84
85
297
            if (_nums.empty()) {
86
                // Although set null here, but the value is 0.0 and the call method just
87
                // get val in aggregate_function_percentile_approx.h
88
0
                return 0.0;
89
0
            }
90
91
297
            if (UNLIKELY(!std::is_sorted(_nums.begin(), _nums.end()))) {
92
144
                pdqsort(_nums.begin(), _nums.end());
93
144
            }
94
95
297
            if (quantile == 1 || _nums.size() == 1) {
96
87
                return _nums.back();
97
87
            }
98
99
210
            double u = (_nums.size() - 1) * quantile;
100
210
            auto index = static_cast<uint32_t>(u);
101
210
            return _nums[index] +
102
210
                   (u - static_cast<double>(index)) * (static_cast<double>(_nums[index + 1]) -
103
210
                                                       static_cast<double>(_nums[index]));
104
297
        } else {
105
3
            DCHECK(_nums.empty());
106
3
            size_t rows = 0;
107
12
            for (const auto& i : _sorted_nums_vec) {
108
12
                rows += i.size();
109
12
            }
110
3
            const bool reverse = quantile > 0.5 && rows > 2;
111
3
            double u = (rows - 1) * quantile;
112
3
            auto index = static_cast<uint32_t>(u);
113
            // if reverse, the step of target should start 0 like not reverse
114
            // so here rows need to minus index + 2
115
            // eg: rows = 10, index = 5
116
            // if not reverse, so the first number loc is 5, the second number loc is 6
117
            // if reverse, so the second number is 3, the first number is 4
118
            // 5 + 4 = 3 + 6 = 9 = rows - 1.
119
            // the rows must GE 2 beacuse `_sorted_nums_vec` size GE 2
120
3
            size_t target = reverse ? rows - index - 2 : index;
121
3
            if (quantile == 1) {
122
0
                target = 0;
123
0
            }
124
3
            auto [first_number, second_number] = _merge_sort_and_get_numbers(target, reverse);
125
3
            if (quantile == 1) {
126
0
                return second_number;
127
0
            }
128
3
            return first_number +
129
3
                   (u - static_cast<double>(index)) *
130
3
                           (static_cast<double>(second_number) - static_cast<double>(first_number));
131
3
        }
132
300
    }
_ZN5doris6CountsIiE9terminateEd
Line
Count
Source
79
444
    double terminate(double quantile) {
80
444
        if (_sorted_nums_vec.size() <= 1) {
81
347
            if (_sorted_nums_vec.size() == 1) {
82
229
                _nums = std::move(_sorted_nums_vec[0]);
83
229
            }
84
85
347
            if (_nums.empty()) {
86
                // Although set null here, but the value is 0.0 and the call method just
87
                // get val in aggregate_function_percentile_approx.h
88
0
                return 0.0;
89
0
            }
90
91
347
            if (UNLIKELY(!std::is_sorted(_nums.begin(), _nums.end()))) {
92
11
                pdqsort(_nums.begin(), _nums.end());
93
11
            }
94
95
347
            if (quantile == 1 || _nums.size() == 1) {
96
239
                return _nums.back();
97
239
            }
98
99
108
            double u = (_nums.size() - 1) * quantile;
100
108
            auto index = static_cast<uint32_t>(u);
101
108
            return _nums[index] +
102
108
                   (u - static_cast<double>(index)) * (static_cast<double>(_nums[index + 1]) -
103
108
                                                       static_cast<double>(_nums[index]));
104
347
        } else {
105
97
            DCHECK(_nums.empty());
106
97
            size_t rows = 0;
107
267
            for (const auto& i : _sorted_nums_vec) {
108
267
                rows += i.size();
109
267
            }
110
97
            const bool reverse = quantile > 0.5 && rows > 2;
111
97
            double u = (rows - 1) * quantile;
112
97
            auto index = static_cast<uint32_t>(u);
113
            // if reverse, the step of target should start 0 like not reverse
114
            // so here rows need to minus index + 2
115
            // eg: rows = 10, index = 5
116
            // if not reverse, so the first number loc is 5, the second number loc is 6
117
            // if reverse, so the second number is 3, the first number is 4
118
            // 5 + 4 = 3 + 6 = 9 = rows - 1.
119
            // the rows must GE 2 beacuse `_sorted_nums_vec` size GE 2
120
97
            size_t target = reverse ? rows - index - 2 : index;
121
97
            if (quantile == 1) {
122
0
                target = 0;
123
0
            }
124
97
            auto [first_number, second_number] = _merge_sort_and_get_numbers(target, reverse);
125
97
            if (quantile == 1) {
126
0
                return second_number;
127
0
            }
128
97
            return first_number +
129
97
                   (u - static_cast<double>(index)) *
130
97
                           (static_cast<double>(second_number) - static_cast<double>(first_number));
131
97
        }
132
444
    }
_ZN5doris6CountsIlE9terminateEd
Line
Count
Source
79
128
    double terminate(double quantile) {
80
128
        if (_sorted_nums_vec.size() <= 1) {
81
106
            if (_sorted_nums_vec.size() == 1) {
82
36
                _nums = std::move(_sorted_nums_vec[0]);
83
36
            }
84
85
106
            if (_nums.empty()) {
86
                // Although set null here, but the value is 0.0 and the call method just
87
                // get val in aggregate_function_percentile_approx.h
88
0
                return 0.0;
89
0
            }
90
91
106
            if (UNLIKELY(!std::is_sorted(_nums.begin(), _nums.end()))) {
92
1
                pdqsort(_nums.begin(), _nums.end());
93
1
            }
94
95
106
            if (quantile == 1 || _nums.size() == 1) {
96
59
                return _nums.back();
97
59
            }
98
99
47
            double u = (_nums.size() - 1) * quantile;
100
47
            auto index = static_cast<uint32_t>(u);
101
47
            return _nums[index] +
102
47
                   (u - static_cast<double>(index)) * (static_cast<double>(_nums[index + 1]) -
103
47
                                                       static_cast<double>(_nums[index]));
104
106
        } else {
105
22
            DCHECK(_nums.empty());
106
22
            size_t rows = 0;
107
68
            for (const auto& i : _sorted_nums_vec) {
108
68
                rows += i.size();
109
68
            }
110
22
            const bool reverse = quantile > 0.5 && rows > 2;
111
22
            double u = (rows - 1) * quantile;
112
22
            auto index = static_cast<uint32_t>(u);
113
            // if reverse, the step of target should start 0 like not reverse
114
            // so here rows need to minus index + 2
115
            // eg: rows = 10, index = 5
116
            // if not reverse, so the first number loc is 5, the second number loc is 6
117
            // if reverse, so the second number is 3, the first number is 4
118
            // 5 + 4 = 3 + 6 = 9 = rows - 1.
119
            // the rows must GE 2 beacuse `_sorted_nums_vec` size GE 2
120
22
            size_t target = reverse ? rows - index - 2 : index;
121
22
            if (quantile == 1) {
122
0
                target = 0;
123
0
            }
124
22
            auto [first_number, second_number] = _merge_sort_and_get_numbers(target, reverse);
125
22
            if (quantile == 1) {
126
0
                return second_number;
127
0
            }
128
22
            return first_number +
129
22
                   (u - static_cast<double>(index)) *
130
22
                           (static_cast<double>(second_number) - static_cast<double>(first_number));
131
22
        }
132
128
    }
_ZN5doris6CountsInE9terminateEd
Line
Count
Source
79
33
    double terminate(double quantile) {
80
33
        if (_sorted_nums_vec.size() <= 1) {
81
33
            if (_sorted_nums_vec.size() == 1) {
82
3
                _nums = std::move(_sorted_nums_vec[0]);
83
3
            }
84
85
33
            if (_nums.empty()) {
86
                // Although set null here, but the value is 0.0 and the call method just
87
                // get val in aggregate_function_percentile_approx.h
88
0
                return 0.0;
89
0
            }
90
91
33
            if (UNLIKELY(!std::is_sorted(_nums.begin(), _nums.end()))) {
92
0
                pdqsort(_nums.begin(), _nums.end());
93
0
            }
94
95
33
            if (quantile == 1 || _nums.size() == 1) {
96
24
                return _nums.back();
97
24
            }
98
99
9
            double u = (_nums.size() - 1) * quantile;
100
9
            auto index = static_cast<uint32_t>(u);
101
9
            return _nums[index] +
102
9
                   (u - static_cast<double>(index)) * (static_cast<double>(_nums[index + 1]) -
103
9
                                                       static_cast<double>(_nums[index]));
104
33
        } else {
105
0
            DCHECK(_nums.empty());
106
0
            size_t rows = 0;
107
0
            for (const auto& i : _sorted_nums_vec) {
108
0
                rows += i.size();
109
0
            }
110
0
            const bool reverse = quantile > 0.5 && rows > 2;
111
0
            double u = (rows - 1) * quantile;
112
0
            auto index = static_cast<uint32_t>(u);
113
            // if reverse, the step of target should start 0 like not reverse
114
            // so here rows need to minus index + 2
115
            // eg: rows = 10, index = 5
116
            // if not reverse, so the first number loc is 5, the second number loc is 6
117
            // if reverse, so the second number is 3, the first number is 4
118
            // 5 + 4 = 3 + 6 = 9 = rows - 1.
119
            // the rows must GE 2 beacuse `_sorted_nums_vec` size GE 2
120
0
            size_t target = reverse ? rows - index - 2 : index;
121
0
            if (quantile == 1) {
122
0
                target = 0;
123
0
            }
124
0
            auto [first_number, second_number] = _merge_sort_and_get_numbers(target, reverse);
125
0
            if (quantile == 1) {
126
0
                return second_number;
127
0
            }
128
0
            return first_number +
129
0
                   (u - static_cast<double>(index)) *
130
0
                           (static_cast<double>(second_number) - static_cast<double>(first_number));
131
0
        }
132
33
    }
_ZN5doris6CountsIfE9terminateEd
Line
Count
Source
79
3
    double terminate(double quantile) {
80
3
        if (_sorted_nums_vec.size() <= 1) {
81
3
            if (_sorted_nums_vec.size() == 1) {
82
3
                _nums = std::move(_sorted_nums_vec[0]);
83
3
            }
84
85
3
            if (_nums.empty()) {
86
                // Although set null here, but the value is 0.0 and the call method just
87
                // get val in aggregate_function_percentile_approx.h
88
0
                return 0.0;
89
0
            }
90
91
3
            if (UNLIKELY(!std::is_sorted(_nums.begin(), _nums.end()))) {
92
0
                pdqsort(_nums.begin(), _nums.end());
93
0
            }
94
95
3
            if (quantile == 1 || _nums.size() == 1) {
96
0
                return _nums.back();
97
0
            }
98
99
3
            double u = (_nums.size() - 1) * quantile;
100
3
            auto index = static_cast<uint32_t>(u);
101
3
            return _nums[index] +
102
3
                   (u - static_cast<double>(index)) * (static_cast<double>(_nums[index + 1]) -
103
3
                                                       static_cast<double>(_nums[index]));
104
3
        } else {
105
0
            DCHECK(_nums.empty());
106
0
            size_t rows = 0;
107
0
            for (const auto& i : _sorted_nums_vec) {
108
0
                rows += i.size();
109
0
            }
110
0
            const bool reverse = quantile > 0.5 && rows > 2;
111
0
            double u = (rows - 1) * quantile;
112
0
            auto index = static_cast<uint32_t>(u);
113
            // if reverse, the step of target should start 0 like not reverse
114
            // so here rows need to minus index + 2
115
            // eg: rows = 10, index = 5
116
            // if not reverse, so the first number loc is 5, the second number loc is 6
117
            // if reverse, so the second number is 3, the first number is 4
118
            // 5 + 4 = 3 + 6 = 9 = rows - 1.
119
            // the rows must GE 2 beacuse `_sorted_nums_vec` size GE 2
120
0
            size_t target = reverse ? rows - index - 2 : index;
121
0
            if (quantile == 1) {
122
0
                target = 0;
123
0
            }
124
0
            auto [first_number, second_number] = _merge_sort_and_get_numbers(target, reverse);
125
0
            if (quantile == 1) {
126
0
                return second_number;
127
0
            }
128
0
            return first_number +
129
0
                   (u - static_cast<double>(index)) *
130
0
                           (static_cast<double>(second_number) - static_cast<double>(first_number));
131
0
        }
132
3
    }
_ZN5doris6CountsIdE9terminateEd
Line
Count
Source
79
136
    double terminate(double quantile) {
80
136
        if (_sorted_nums_vec.size() <= 1) {
81
112
            if (_sorted_nums_vec.size() == 1) {
82
29
                _nums = std::move(_sorted_nums_vec[0]);
83
29
            }
84
85
112
            if (_nums.empty()) {
86
                // Although set null here, but the value is 0.0 and the call method just
87
                // get val in aggregate_function_percentile_approx.h
88
0
                return 0.0;
89
0
            }
90
91
112
            if (UNLIKELY(!std::is_sorted(_nums.begin(), _nums.end()))) {
92
0
                pdqsort(_nums.begin(), _nums.end());
93
0
            }
94
95
112
            if (quantile == 1 || _nums.size() == 1) {
96
30
                return _nums.back();
97
30
            }
98
99
82
            double u = (_nums.size() - 1) * quantile;
100
82
            auto index = static_cast<uint32_t>(u);
101
82
            return _nums[index] +
102
82
                   (u - static_cast<double>(index)) * (static_cast<double>(_nums[index + 1]) -
103
82
                                                       static_cast<double>(_nums[index]));
104
112
        } else {
105
24
            DCHECK(_nums.empty());
106
24
            size_t rows = 0;
107
72
            for (const auto& i : _sorted_nums_vec) {
108
72
                rows += i.size();
109
72
            }
110
24
            const bool reverse = quantile > 0.5 && rows > 2;
111
24
            double u = (rows - 1) * quantile;
112
24
            auto index = static_cast<uint32_t>(u);
113
            // if reverse, the step of target should start 0 like not reverse
114
            // so here rows need to minus index + 2
115
            // eg: rows = 10, index = 5
116
            // if not reverse, so the first number loc is 5, the second number loc is 6
117
            // if reverse, so the second number is 3, the first number is 4
118
            // 5 + 4 = 3 + 6 = 9 = rows - 1.
119
            // the rows must GE 2 beacuse `_sorted_nums_vec` size GE 2
120
24
            size_t target = reverse ? rows - index - 2 : index;
121
24
            if (quantile == 1) {
122
0
                target = 0;
123
0
            }
124
24
            auto [first_number, second_number] = _merge_sort_and_get_numbers(target, reverse);
125
24
            if (quantile == 1) {
126
0
                return second_number;
127
0
            }
128
24
            return first_number +
129
24
                   (u - static_cast<double>(index)) *
130
24
                           (static_cast<double>(second_number) - static_cast<double>(first_number));
131
24
        }
132
136
    }
133
134
private:
135
    struct Node {
136
        Ty value;
137
        int array_index;
138
        int64_t element_index;
139
140
1.50k
        auto operator<=>(const Node& other) const { return value <=> other.value; }
Unexecuted instantiation: _ZNK5doris6CountsIaE4NodessERKS2_
_ZNK5doris6CountsIsE4NodessERKS2_
Line
Count
Source
140
68
        auto operator<=>(const Node& other) const { return value <=> other.value; }
_ZNK5doris6CountsIiE4NodessERKS2_
Line
Count
Source
140
926
        auto operator<=>(const Node& other) const { return value <=> other.value; }
_ZNK5doris6CountsIlE4NodessERKS2_
Line
Count
Source
140
417
        auto operator<=>(const Node& other) const { return value <=> other.value; }
Unexecuted instantiation: _ZNK5doris6CountsInE4NodessERKS2_
Unexecuted instantiation: _ZNK5doris6CountsIfE4NodessERKS2_
_ZNK5doris6CountsIdE4NodessERKS2_
Line
Count
Source
140
94
        auto operator<=>(const Node& other) const { return value <=> other.value; }
141
    };
142
143
288
    void _convert_sorted_num_vec_to_nums() {
144
288
        size_t rows = 0;
145
586
        for (const auto& i : _sorted_nums_vec) {
146
586
            rows += i.size();
147
586
        }
148
288
        _nums.resize(rows);
149
288
        size_t count = 0;
150
151
288
        std::priority_queue<Node, std::vector<Node>, std::greater<Node>> min_heap;
152
874
        for (int i = 0; i < _sorted_nums_vec.size(); ++i) {
153
586
            if (!_sorted_nums_vec[i].empty()) {
154
586
                min_heap.emplace(_sorted_nums_vec[i][0], i, 0);
155
586
            }
156
586
        }
157
158
1.02k
        while (!min_heap.empty()) {
159
737
            Node node = min_heap.top();
160
737
            min_heap.pop();
161
737
            _nums[count++] = node.value;
162
737
            if (++node.element_index < _sorted_nums_vec[node.array_index].size()) {
163
151
                node.value = _sorted_nums_vec[node.array_index][node.element_index];
164
151
                min_heap.push(node);
165
151
            }
166
737
        }
167
288
        _sorted_nums_vec.clear();
168
288
    }
Unexecuted instantiation: _ZN5doris6CountsIaE31_convert_sorted_num_vec_to_numsEv
Unexecuted instantiation: _ZN5doris6CountsIsE31_convert_sorted_num_vec_to_numsEv
_ZN5doris6CountsIiE31_convert_sorted_num_vec_to_numsEv
Line
Count
Source
143
156
    void _convert_sorted_num_vec_to_nums() {
144
156
        size_t rows = 0;
145
339
        for (const auto& i : _sorted_nums_vec) {
146
339
            rows += i.size();
147
339
        }
148
156
        _nums.resize(rows);
149
156
        size_t count = 0;
150
151
156
        std::priority_queue<Node, std::vector<Node>, std::greater<Node>> min_heap;
152
495
        for (int i = 0; i < _sorted_nums_vec.size(); ++i) {
153
339
            if (!_sorted_nums_vec[i].empty()) {
154
339
                min_heap.emplace(_sorted_nums_vec[i][0], i, 0);
155
339
            }
156
339
        }
157
158
531
        while (!min_heap.empty()) {
159
375
            Node node = min_heap.top();
160
375
            min_heap.pop();
161
375
            _nums[count++] = node.value;
162
375
            if (++node.element_index < _sorted_nums_vec[node.array_index].size()) {
163
36
                node.value = _sorted_nums_vec[node.array_index][node.element_index];
164
36
                min_heap.push(node);
165
36
            }
166
375
        }
167
156
        _sorted_nums_vec.clear();
168
156
    }
_ZN5doris6CountsIlE31_convert_sorted_num_vec_to_numsEv
Line
Count
Source
143
132
    void _convert_sorted_num_vec_to_nums() {
144
132
        size_t rows = 0;
145
247
        for (const auto& i : _sorted_nums_vec) {
146
247
            rows += i.size();
147
247
        }
148
132
        _nums.resize(rows);
149
132
        size_t count = 0;
150
151
132
        std::priority_queue<Node, std::vector<Node>, std::greater<Node>> min_heap;
152
379
        for (int i = 0; i < _sorted_nums_vec.size(); ++i) {
153
247
            if (!_sorted_nums_vec[i].empty()) {
154
247
                min_heap.emplace(_sorted_nums_vec[i][0], i, 0);
155
247
            }
156
247
        }
157
158
494
        while (!min_heap.empty()) {
159
362
            Node node = min_heap.top();
160
362
            min_heap.pop();
161
362
            _nums[count++] = node.value;
162
362
            if (++node.element_index < _sorted_nums_vec[node.array_index].size()) {
163
115
                node.value = _sorted_nums_vec[node.array_index][node.element_index];
164
115
                min_heap.push(node);
165
115
            }
166
362
        }
167
132
        _sorted_nums_vec.clear();
168
132
    }
Unexecuted instantiation: _ZN5doris6CountsInE31_convert_sorted_num_vec_to_numsEv
Unexecuted instantiation: _ZN5doris6CountsIfE31_convert_sorted_num_vec_to_numsEv
Unexecuted instantiation: _ZN5doris6CountsIdE31_convert_sorted_num_vec_to_numsEv
169
170
146
    std::pair<Ty, Ty> _merge_sort_and_get_numbers(int64_t target, bool reverse) {
171
146
        Ty first_number = 0, second_number = 0;
172
146
        size_t count = 0;
173
146
        if (reverse) {
174
28
            std::priority_queue<Node> max_heap;
175
120
            for (int i = 0; i < _sorted_nums_vec.size(); ++i) {
176
92
                if (!_sorted_nums_vec[i].empty()) {
177
92
                    max_heap.emplace(_sorted_nums_vec[i][_sorted_nums_vec[i].size() - 1], i,
178
92
                                     _sorted_nums_vec[i].size() - 1);
179
92
                }
180
92
            }
181
182
113
            while (!max_heap.empty()) {
183
113
                Node node = max_heap.top();
184
113
                max_heap.pop();
185
113
                if (count == target) {
186
28
                    second_number = node.value;
187
85
                } else if (count == target + 1) {
188
28
                    first_number = node.value;
189
28
                    break;
190
28
                }
191
85
                ++count;
192
85
                if (--node.element_index >= 0) {
193
68
                    node.value = _sorted_nums_vec[node.array_index][node.element_index];
194
68
                    max_heap.push(node);
195
68
                }
196
85
            }
197
198
118
        } else {
199
118
            std::priority_queue<Node, std::vector<Node>, std::greater<Node>> min_heap;
200
445
            for (int i = 0; i < _sorted_nums_vec.size(); ++i) {
201
327
                if (!_sorted_nums_vec[i].empty()) {
202
327
                    min_heap.emplace(_sorted_nums_vec[i][0], i, 0);
203
327
                }
204
327
            }
205
206
331
            while (!min_heap.empty()) {
207
331
                Node node = min_heap.top();
208
331
                min_heap.pop();
209
331
                if (count == target) {
210
118
                    first_number = node.value;
211
213
                } else if (count == target + 1) {
212
118
                    second_number = node.value;
213
118
                    break;
214
118
                }
215
213
                ++count;
216
213
                if (++node.element_index < _sorted_nums_vec[node.array_index].size()) {
217
127
                    node.value = _sorted_nums_vec[node.array_index][node.element_index];
218
127
                    min_heap.push(node);
219
127
                }
220
213
            }
221
118
        }
222
223
146
        return {first_number, second_number};
224
146
    }
Unexecuted instantiation: _ZN5doris6CountsIaE27_merge_sort_and_get_numbersElb
_ZN5doris6CountsIsE27_merge_sort_and_get_numbersElb
Line
Count
Source
170
3
    std::pair<Ty, Ty> _merge_sort_and_get_numbers(int64_t target, bool reverse) {
171
3
        Ty first_number = 0, second_number = 0;
172
3
        size_t count = 0;
173
3
        if (reverse) {
174
1
            std::priority_queue<Node> max_heap;
175
5
            for (int i = 0; i < _sorted_nums_vec.size(); ++i) {
176
4
                if (!_sorted_nums_vec[i].empty()) {
177
4
                    max_heap.emplace(_sorted_nums_vec[i][_sorted_nums_vec[i].size() - 1], i,
178
4
                                     _sorted_nums_vec[i].size() - 1);
179
4
                }
180
4
            }
181
182
6
            while (!max_heap.empty()) {
183
6
                Node node = max_heap.top();
184
6
                max_heap.pop();
185
6
                if (count == target) {
186
1
                    second_number = node.value;
187
5
                } else if (count == target + 1) {
188
1
                    first_number = node.value;
189
1
                    break;
190
1
                }
191
5
                ++count;
192
5
                if (--node.element_index >= 0) {
193
3
                    node.value = _sorted_nums_vec[node.array_index][node.element_index];
194
3
                    max_heap.push(node);
195
3
                }
196
5
            }
197
198
2
        } else {
199
2
            std::priority_queue<Node, std::vector<Node>, std::greater<Node>> min_heap;
200
10
            for (int i = 0; i < _sorted_nums_vec.size(); ++i) {
201
8
                if (!_sorted_nums_vec[i].empty()) {
202
8
                    min_heap.emplace(_sorted_nums_vec[i][0], i, 0);
203
8
                }
204
8
            }
205
206
13
            while (!min_heap.empty()) {
207
13
                Node node = min_heap.top();
208
13
                min_heap.pop();
209
13
                if (count == target) {
210
2
                    first_number = node.value;
211
11
                } else if (count == target + 1) {
212
2
                    second_number = node.value;
213
2
                    break;
214
2
                }
215
11
                ++count;
216
11
                if (++node.element_index < _sorted_nums_vec[node.array_index].size()) {
217
11
                    node.value = _sorted_nums_vec[node.array_index][node.element_index];
218
11
                    min_heap.push(node);
219
11
                }
220
11
            }
221
2
        }
222
223
3
        return {first_number, second_number};
224
3
    }
_ZN5doris6CountsIiE27_merge_sort_and_get_numbersElb
Line
Count
Source
170
97
    std::pair<Ty, Ty> _merge_sort_and_get_numbers(int64_t target, bool reverse) {
171
97
        Ty first_number = 0, second_number = 0;
172
97
        size_t count = 0;
173
97
        if (reverse) {
174
10
            std::priority_queue<Node> max_heap;
175
38
            for (int i = 0; i < _sorted_nums_vec.size(); ++i) {
176
28
                if (!_sorted_nums_vec[i].empty()) {
177
28
                    max_heap.emplace(_sorted_nums_vec[i][_sorted_nums_vec[i].size() - 1], i,
178
28
                                     _sorted_nums_vec[i].size() - 1);
179
28
                }
180
28
            }
181
182
39
            while (!max_heap.empty()) {
183
39
                Node node = max_heap.top();
184
39
                max_heap.pop();
185
39
                if (count == target) {
186
10
                    second_number = node.value;
187
29
                } else if (count == target + 1) {
188
10
                    first_number = node.value;
189
10
                    break;
190
10
                }
191
29
                ++count;
192
29
                if (--node.element_index >= 0) {
193
22
                    node.value = _sorted_nums_vec[node.array_index][node.element_index];
194
22
                    max_heap.push(node);
195
22
                }
196
29
            }
197
198
87
        } else {
199
87
            std::priority_queue<Node, std::vector<Node>, std::greater<Node>> min_heap;
200
326
            for (int i = 0; i < _sorted_nums_vec.size(); ++i) {
201
239
                if (!_sorted_nums_vec[i].empty()) {
202
239
                    min_heap.emplace(_sorted_nums_vec[i][0], i, 0);
203
239
                }
204
239
            }
205
206
244
            while (!min_heap.empty()) {
207
244
                Node node = min_heap.top();
208
244
                min_heap.pop();
209
244
                if (count == target) {
210
87
                    first_number = node.value;
211
157
                } else if (count == target + 1) {
212
87
                    second_number = node.value;
213
87
                    break;
214
87
                }
215
157
                ++count;
216
157
                if (++node.element_index < _sorted_nums_vec[node.array_index].size()) {
217
100
                    node.value = _sorted_nums_vec[node.array_index][node.element_index];
218
100
                    min_heap.push(node);
219
100
                }
220
157
            }
221
87
        }
222
223
97
        return {first_number, second_number};
224
97
    }
_ZN5doris6CountsIlE27_merge_sort_and_get_numbersElb
Line
Count
Source
170
22
    std::pair<Ty, Ty> _merge_sort_and_get_numbers(int64_t target, bool reverse) {
171
22
        Ty first_number = 0, second_number = 0;
172
22
        size_t count = 0;
173
22
        if (reverse) {
174
15
            std::priority_queue<Node> max_heap;
175
67
            for (int i = 0; i < _sorted_nums_vec.size(); ++i) {
176
52
                if (!_sorted_nums_vec[i].empty()) {
177
52
                    max_heap.emplace(_sorted_nums_vec[i][_sorted_nums_vec[i].size() - 1], i,
178
52
                                     _sorted_nums_vec[i].size() - 1);
179
52
                }
180
52
            }
181
182
63
            while (!max_heap.empty()) {
183
63
                Node node = max_heap.top();
184
63
                max_heap.pop();
185
63
                if (count == target) {
186
15
                    second_number = node.value;
187
48
                } else if (count == target + 1) {
188
15
                    first_number = node.value;
189
15
                    break;
190
15
                }
191
48
                ++count;
192
48
                if (--node.element_index >= 0) {
193
42
                    node.value = _sorted_nums_vec[node.array_index][node.element_index];
194
42
                    max_heap.push(node);
195
42
                }
196
48
            }
197
198
15
        } else {
199
7
            std::priority_queue<Node, std::vector<Node>, std::greater<Node>> min_heap;
200
23
            for (int i = 0; i < _sorted_nums_vec.size(); ++i) {
201
16
                if (!_sorted_nums_vec[i].empty()) {
202
16
                    min_heap.emplace(_sorted_nums_vec[i][0], i, 0);
203
16
                }
204
16
            }
205
206
22
            while (!min_heap.empty()) {
207
22
                Node node = min_heap.top();
208
22
                min_heap.pop();
209
22
                if (count == target) {
210
7
                    first_number = node.value;
211
15
                } else if (count == target + 1) {
212
7
                    second_number = node.value;
213
7
                    break;
214
7
                }
215
15
                ++count;
216
15
                if (++node.element_index < _sorted_nums_vec[node.array_index].size()) {
217
14
                    node.value = _sorted_nums_vec[node.array_index][node.element_index];
218
14
                    min_heap.push(node);
219
14
                }
220
15
            }
221
7
        }
222
223
22
        return {first_number, second_number};
224
22
    }
Unexecuted instantiation: _ZN5doris6CountsInE27_merge_sort_and_get_numbersElb
Unexecuted instantiation: _ZN5doris6CountsIfE27_merge_sort_and_get_numbersElb
_ZN5doris6CountsIdE27_merge_sort_and_get_numbersElb
Line
Count
Source
170
24
    std::pair<Ty, Ty> _merge_sort_and_get_numbers(int64_t target, bool reverse) {
171
24
        Ty first_number = 0, second_number = 0;
172
24
        size_t count = 0;
173
24
        if (reverse) {
174
2
            std::priority_queue<Node> max_heap;
175
10
            for (int i = 0; i < _sorted_nums_vec.size(); ++i) {
176
8
                if (!_sorted_nums_vec[i].empty()) {
177
8
                    max_heap.emplace(_sorted_nums_vec[i][_sorted_nums_vec[i].size() - 1], i,
178
8
                                     _sorted_nums_vec[i].size() - 1);
179
8
                }
180
8
            }
181
182
5
            while (!max_heap.empty()) {
183
5
                Node node = max_heap.top();
184
5
                max_heap.pop();
185
5
                if (count == target) {
186
2
                    second_number = node.value;
187
3
                } else if (count == target + 1) {
188
2
                    first_number = node.value;
189
2
                    break;
190
2
                }
191
3
                ++count;
192
3
                if (--node.element_index >= 0) {
193
1
                    node.value = _sorted_nums_vec[node.array_index][node.element_index];
194
1
                    max_heap.push(node);
195
1
                }
196
3
            }
197
198
22
        } else {
199
22
            std::priority_queue<Node, std::vector<Node>, std::greater<Node>> min_heap;
200
86
            for (int i = 0; i < _sorted_nums_vec.size(); ++i) {
201
64
                if (!_sorted_nums_vec[i].empty()) {
202
64
                    min_heap.emplace(_sorted_nums_vec[i][0], i, 0);
203
64
                }
204
64
            }
205
206
52
            while (!min_heap.empty()) {
207
52
                Node node = min_heap.top();
208
52
                min_heap.pop();
209
52
                if (count == target) {
210
22
                    first_number = node.value;
211
30
                } else if (count == target + 1) {
212
22
                    second_number = node.value;
213
22
                    break;
214
22
                }
215
30
                ++count;
216
30
                if (++node.element_index < _sorted_nums_vec[node.array_index].size()) {
217
2
                    node.value = _sorted_nums_vec[node.array_index][node.element_index];
218
2
                    min_heap.push(node);
219
2
                }
220
30
            }
221
22
        }
222
223
24
        return {first_number, second_number};
224
24
    }
225
226
    vectorized::PODArray<Ty> _nums;
227
    std::vector<vectorized::PODArray<Ty>> _sorted_nums_vec;
228
};
229
230
} // namespace doris