Coverage Report

Created: 2026-01-30 01:45

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/root/doris/be/src/runtime/runtime_predicate.cpp
Line
Count
Source
1
// Licensed to the Apache Software Foundation (ASF) under one
2
// or more contributor license agreements.  See the NOTICE file
3
// distributed with this work for additional information
4
// regarding copyright ownership.  The ASF licenses this file
5
// to you under the Apache License, Version 2.0 (the
6
// "License"); you may not use this file except in compliance
7
// with the License.  You may obtain a copy of the License at
8
//
9
//   http://www.apache.org/licenses/LICENSE-2.0
10
//
11
// Unless required by applicable law or agreed to in writing,
12
// software distributed under the License is distributed on an
13
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
// KIND, either express or implied.  See the License for the
15
// specific language governing permissions and limitations
16
// under the License.
17
18
#include "runtime/runtime_predicate.h"
19
20
#include <memory>
21
22
#include "common/compiler_util.h" // IWYU pragma: keep
23
#include "common/exception.h"
24
#include "common/status.h"
25
#include "olap/accept_null_predicate.h"
26
#include "olap/column_predicate.h"
27
#include "olap/predicate_creator.h"
28
#include "runtime/define_primitive_type.h"
29
30
namespace doris::vectorized {
31
32
// Builds a TopN runtime predicate from the thrift filter descriptor.
//
// Records one context per target node (keyed by node id, holding the target
// expression), derives the sort-key primitive type from the first target
// expression, and selects the comparison-predicate factory matching the sort
// direction.
//
// Throws Exception(INTERNAL_ERROR) when `_init` rejects the derived type.
RuntimePredicate::RuntimePredicate(const TTopnFilterDesc& desc)
        : _nulls_first(desc.null_first), _is_asc(desc.is_asc) {
    DCHECK(!desc.target_node_id_to_target_expr.empty());
    // Iterate by const reference: every entry carries a full thrift expression,
    // so iterating by value would copy it once more than needed.
    for (const auto& entry : desc.target_node_id_to_target_expr) {
        _contexts[entry.first].expr = entry.second;
    }

    // The key type is taken from the root node of the first target expression.
    const auto& root_node = desc.target_node_id_to_target_expr.begin()->second.nodes[0];
    _type = thrift_to_type(root_node.type.types[0].scalar_type.type);
    if (!_init(_type)) {
        std::stringstream ss;
        root_node.printTo(ss);
        throw Exception(ErrorCode::INTERNAL_ERROR, "meet invalid type, type={}, expr={}",
                        type_to_string(_type), ss.str());
    }

    // For ASC sort, create runtime predicate col_name <= max_top_value,
    // since values > max_top_value are larger than any value in the current topn values.
    // For DESC sort, create runtime predicate col_name >= min_top_value,
    // since values < min_top_value are smaller than any value in the current topn values.
    _pred_constructor = _is_asc ? create_comparison_predicate0<PredicateType::LE>
                                : create_comparison_predicate0<PredicateType::GE>;
}
57
58
// Binds one target node of this runtime predicate to a storage column.
//
// @param target_node_id        id of the target node being initialised
// @param slot_id_to_slot_desc  slot id -> slot descriptor lookup table
// @param column_id             column index for the predicate; a negative
//                              value makes this call a no-op
// @return Status::OK() on success (including the no-op case), or
//         InternalError when the target is a slot reference whose slot id has
//         no usable descriptor in `slot_id_to_slot_desc`.
//
// Takes the write lock on `_rwlock` for the duration of the update.
Status RuntimePredicate::init_target(
        int32_t target_node_id, phmap::flat_hash_map<int, SlotDescriptor*> slot_id_to_slot_desc,
        const int column_id) {
    if (column_id < 0) {
        return Status::OK();
    }
    std::unique_lock<std::shared_mutex> wlock(_rwlock);
    check_target_node_id(target_node_id);
    // order by abs(col1) limit x;
    // cannot be used as a min-max filter, so no predicate needs to be created,
    // but it can still be used in VTopNPred.execute_column
    if (target_is_slot(target_node_id)) {
        const auto slot_id = get_texpr(target_node_id).nodes[0].slot_ref.slot_id;
        // Use find() rather than operator[]: operator[] would silently insert a
        // null descriptor for an unknown slot id, which was then dereferenced.
        auto slot_it = slot_id_to_slot_desc.find(slot_id);
        if (slot_it == slot_id_to_slot_desc.end() || slot_it->second == nullptr) {
            return Status::InternalError(
                    "topn runtime predicate can not find slot descriptor, target_node_id={}, "
                    "slot_id={}",
                    target_node_id, slot_id);
        }
        SlotDescriptor* slot_desc = slot_it->second;

        auto& ctx = _contexts[target_node_id];
        ctx.col_name = slot_desc->col_name();
        ctx.col_data_type = slot_desc->type();
        ctx.predicate =
                SharedPredicate::create_shared(cast_set<uint32_t>(column_id), ctx.col_name);
    }
    _detected_target = true;
    return Status::OK();
}
81
82
0
// Exposes the value stored in `field` as a raw byte range.
//
// Fixed-width types are returned as a view over the value held by `field`
// (nothing is copied), so the result is only usable while that value is alive.
// String and varbinary payloads are copied into `_predicate_arena` and the
// returned range points at that copy.
//
// Throws Exception(INTERNAL_ERROR) for any primitive type not listed below.
StringRef RuntimePredicate::_get_string_ref(const Field& field, const PrimitiveType type) {
    // View over the in-place bytes of a fixed-width value.
    const auto raw_bytes = [](const auto& v) {
        return StringRef(reinterpret_cast<const char*>(&v), sizeof(v));
    };
    // Copy a variable-length payload into the predicate arena. The buffer is
    // fully overwritten by memcpy, so it does not need to be zeroed first.
    const auto arena_copy = [this](const auto& v) {
        const auto length = v.size();
        char* buffer = _predicate_arena.alloc(length);
        memcpy(buffer, v.data(), length);
        return StringRef(buffer, length);
    };

    switch (type) {
    case PrimitiveType::TYPE_BOOLEAN:
        return raw_bytes(field.get<TYPE_BOOLEAN>());
    case PrimitiveType::TYPE_TINYINT:
        return raw_bytes(field.get<TYPE_TINYINT>());
    case PrimitiveType::TYPE_SMALLINT:
        return raw_bytes(field.get<TYPE_SMALLINT>());
    case PrimitiveType::TYPE_INT:
        return raw_bytes(field.get<TYPE_INT>());
    case PrimitiveType::TYPE_BIGINT:
        return raw_bytes(field.get<TYPE_BIGINT>());
    case PrimitiveType::TYPE_LARGEINT:
        return raw_bytes(field.get<TYPE_LARGEINT>());
    case PrimitiveType::TYPE_CHAR:
    case PrimitiveType::TYPE_VARCHAR:
    case PrimitiveType::TYPE_STRING:
        return arena_copy(field.get<TYPE_STRING>());
    case PrimitiveType::TYPE_DATEV2:
        return raw_bytes(field.get<TYPE_DATEV2>());
    case PrimitiveType::TYPE_DATETIMEV2:
        return raw_bytes(field.get<TYPE_DATETIMEV2>());
    case PrimitiveType::TYPE_TIMESTAMPTZ:
        return raw_bytes(field.get<TYPE_TIMESTAMPTZ>());
    case PrimitiveType::TYPE_DATE:
        return raw_bytes(field.get<TYPE_DATE>());
    case PrimitiveType::TYPE_DATETIME:
        return raw_bytes(field.get<TYPE_DATETIME>());
    case PrimitiveType::TYPE_TIMEV2:
        return raw_bytes(field.get<TYPE_TIMEV2>());
    case PrimitiveType::TYPE_DECIMAL32:
        return raw_bytes(field.get<TYPE_DECIMAL32>());
    case PrimitiveType::TYPE_DECIMAL64:
        return raw_bytes(field.get<TYPE_DECIMAL64>());
    case PrimitiveType::TYPE_DECIMALV2:
        return raw_bytes(field.get<TYPE_DECIMALV2>());
    case PrimitiveType::TYPE_DECIMAL128I:
        return raw_bytes(field.get<TYPE_DECIMAL128I>());
    case PrimitiveType::TYPE_DECIMAL256:
        return raw_bytes(field.get<TYPE_DECIMAL256>());
    case PrimitiveType::TYPE_IPV4:
        return raw_bytes(field.get<TYPE_IPV4>());
    case PrimitiveType::TYPE_IPV6:
        return raw_bytes(field.get<TYPE_IPV6>());
    case doris::PrimitiveType::TYPE_VARBINARY:
        return arena_copy(field.get<TYPE_VARBINARY>());
    default:
        break;
    }

    throw Exception(ErrorCode::INTERNAL_ERROR, "meet invalid type, type={}", type_to_string(type));
}
187
188
0
// Reports whether `type` is one of the primitive type families accepted here:
// integer/boolean, decimal, string, date, time, IP or varbinary.
bool RuntimePredicate::_init(PrimitiveType type) {
    if (is_int_or_bool(type) || is_decimal(type)) {
        return true;
    }
    if (is_string_type(type) || is_date_type(type)) {
        return true;
    }
    if (is_time_type(type) || is_ip(type)) {
        return true;
    }
    return is_varbinary(type);
}
192
193
0
// Feeds a new candidate boundary value into the runtime predicate.
//
// Null values are ignored. Otherwise the stored extreme is replaced when it is
// still unset, or when `value` is smaller (ascending sort) / larger
// (descending sort) than the stored one. Whenever the extreme changes, a new
// comparison predicate is built for every target context that already owns a
// shared predicate and installed as that shared predicate's nested predicate.
//
// Takes the write lock on `_rwlock`. Always returns Status::OK().
Status RuntimePredicate::update(const Field& value) {
    std::unique_lock<std::shared_mutex> wlock(_rwlock);
    // skip null value
    if (value.is_null()) {
        return Status::OK();
    }

    bool updated = false;

    if (UNLIKELY(_orderby_extrem.is_null())) {
        _orderby_extrem = value;
        updated = true;
    } else if ((_is_asc && value < _orderby_extrem) || (!_is_asc && value > _orderby_extrem)) {
        _orderby_extrem = value;
        updated = true;
    }

    _has_value = true;

    if (!updated) {
        return Status::OK();
    }

    // Iterate by reference: copying an entry would duplicate the whole target
    // context for every target while the write lock is held.
    for (const auto& entry : _contexts) {
        const auto& ctx = entry.second;
        if (ctx.predicate == nullptr) {
            // 1. `init_target` did not create a predicate, e.g. `order by abs(col1) limit x;`
            // so no new `ColumnPredicate` is needed, but `_orderby_extrem` still has to be
            // updated for `VTopNPred.execute_column`.
            // 2. This `RuntimePredicate` can be associated with multiple scan nodes.
            // When the sort node is updated, some scan nodes may not have called `init_target` yet.
            // example:
            //SELECT subq1.pk AS pk1 FROM (
            //    ( SELECT t1.pk  FROM tb AS t1 )
            //    UNION ALL
            //    ( SELECT t1.pk  FROM tb AS t1  ORDER BY t1.pk ))
            //    subq1
            //WHERE subq1.pk <> (
            //    SELECT t1.pk  FROM tb AS t1  ORDER BY t1.pk LIMIT 1
            //) ORDER BY 1 LIMIT 1 ;
            continue;
        }
        auto str_ref = _get_string_ref(_orderby_extrem, _type);
        std::shared_ptr<ColumnPredicate> pred =
                _pred_constructor(ctx.predicate->column_id(), ctx.col_name, ctx.col_data_type,
                                  str_ref, false, _predicate_arena);

        // For NULLS FIRST, wrap the predicate in an AcceptNullPredicate so NULL rows pass:
        // ORDER BY ASC/DESC should return NULL first, but the comparison yields NULL for them
        // and NULL in a where predicate is treated as FALSE.
        if (_nulls_first) {
            pred = AcceptNullPredicate::create_shared(pred);
        }

        static_cast<SharedPredicate*>(ctx.predicate.get())->set_nested(pred);
    }
    return Status::OK();
}
252
253
} // namespace doris::vectorized