Coverage Report

Created: 2026-06-12 14:10

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
be/src/exprs/function/function_map.cpp
Line
Count
Source
1
// Licensed to the Apache Software Foundation (ASF) under one
2
// or more contributor license agreements.  See the NOTICE file
3
// distributed with this work for additional information
4
// regarding copyright ownership.  The ASF licenses this file
5
// to you under the Apache License, Version 2.0 (the
6
// "License"); you may not use this file except in compliance
7
// with the License.  You may obtain a copy of the License at
8
//
9
//   http://www.apache.org/licenses/LICENSE-2.0
10
//
11
// Unless required by applicable law or agreed to in writing,
12
// software distributed under the License is distributed on an
13
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
// KIND, either express or implied.  See the License for the
15
// specific language governing permissions and limitations
16
// under the License.
17
18
#include <glog/logging.h>
19
#include <stddef.h>
20
21
#include <algorithm>
22
#include <boost/iterator/iterator_facade.hpp>
23
#include <memory>
24
#include <ostream>
25
#include <string>
26
#include <string_view>
27
#include <tuple>
28
#include <utility>
29
30
#include "common/status.h"
31
#include "core/assert_cast.h"
32
#include "core/block/block.h"
33
#include "core/block/column_numbers.h"
34
#include "core/block/column_with_type_and_name.h"
35
#include "core/call_on_type_index.h"
36
#include "core/column/column.h"
37
#include "core/column/column_array.h"
38
#include "core/column/column_const.h"
39
#include "core/column/column_map.h"
40
#include "core/column/column_nullable.h"
41
#include "core/column/column_vector.h"
42
#include "core/data_type/data_type.h"
43
#include "core/data_type/data_type_array.h"
44
#include "core/data_type/data_type_map.h"
45
#include "core/data_type/data_type_nullable.h"
46
#include "core/data_type/data_type_number.h"
47
#include "core/data_type/data_type_string.h"
48
#include "core/data_type/data_type_struct.h"
49
#include "core/data_type/primitive_type.h"
50
#include "core/typeid_cast.h"
51
#include "core/types.h"
52
#include "exprs/aggregate/aggregate_function.h"
53
#include "exprs/function/array/function_array_index.h"
54
#include "exprs/function/function.h"
55
#include "exprs/function/simple_function_factory.h"
56
#include "util/simd/vstring_function.h"
57
58
namespace doris {
59
class FunctionContext;
60
} // namespace doris
61
62
namespace doris {
63
64
// construct a map
65
// map(key1, value2, key2, value2) -> {key1: value2, key2: value2}
66
class FunctionMap : public IFunction {
67
public:
68
    static constexpr auto name = "map";
69
2
    static FunctionPtr create() { return std::make_shared<FunctionMap>(); }
70
71
    /// Get function name.
72
0
    String get_name() const override { return name; }
73
74
1
    bool is_variadic() const override { return true; }
75
76
0
    bool use_default_implementation_for_nulls() const override { return false; }
77
78
0
    size_t get_number_of_arguments() const override { return 0; }
79
80
0
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
81
0
        DCHECK(arguments.size() % 2 == 0)
82
0
                << "function: " << get_name() << ", arguments should not be even number";
83
0
        return std::make_shared<DataTypeMap>(make_nullable(arguments[0]),
84
0
                                             make_nullable(arguments[1]));
85
0
    }
86
87
    Status execute_impl(FunctionContext* context, Block& block, const ColumnNumbers& arguments,
88
0
                        uint32_t result, size_t input_rows_count) const override {
89
0
        DCHECK(arguments.size() % 2 == 0)
90
0
                << "function: " << get_name() << ", arguments should not be even number";
91
92
0
        size_t num_element = arguments.size();
93
94
0
        auto result_col = block.get_by_position(result).type->create_column();
95
0
        auto* map_column = assert_cast<ColumnMap*>(result_col.get());
96
97
        // map keys column
98
0
        auto& result_col_map_keys_data = map_column->get_keys();
99
0
        result_col_map_keys_data.reserve(input_rows_count * num_element / 2);
100
        // map values column
101
0
        auto& result_col_map_vals_data = map_column->get_values();
102
0
        result_col_map_vals_data.reserve(input_rows_count * num_element / 2);
103
        // map offsets column
104
0
        auto& result_col_map_offsets = map_column->get_offsets();
105
0
        result_col_map_offsets.resize(input_rows_count);
106
107
0
        std::unique_ptr<bool[]> col_const = std::make_unique_for_overwrite<bool[]>(num_element);
108
0
        std::vector<ColumnPtr> arg(num_element);
109
0
        for (size_t i = 0; i < num_element; ++i) {
110
0
            auto& col = block.get_by_position(arguments[i]).column;
111
0
            std::tie(col, col_const[i]) = unpack_if_const(col);
112
0
            bool is_nullable = i % 2 == 0 ? result_col_map_keys_data.is_nullable()
113
0
                                          : result_col_map_vals_data.is_nullable();
114
            // convert to nullable column
115
0
            arg[i] = col;
116
0
            if (is_nullable && !col->is_nullable()) {
117
0
                arg[i] = ColumnNullable::create(col, ColumnUInt8::create(col->size(), 0));
118
0
            }
119
0
        }
120
121
        // insert value into map
122
0
        ColumnArray::Offset64 offset = 0;
123
0
        for (size_t row = 0; row < input_rows_count; ++row) {
124
0
            for (size_t i = 0; i < num_element; i += 2) {
125
0
                result_col_map_keys_data.insert_from(*arg[i], index_check_const(row, col_const[i]));
126
0
                result_col_map_vals_data.insert_from(*arg[i + 1],
127
0
                                                     index_check_const(row, col_const[i + 1]));
128
0
            }
129
0
            offset += num_element / 2;
130
0
            result_col_map_offsets[row] = offset;
131
0
        }
132
133
0
        RETURN_IF_ERROR(map_column->deduplicate_keys());
134
0
        block.replace_by_position(result, std::move(result_col));
135
0
        return Status::OK();
136
0
    }
137
};
138
139
template <bool is_key, bool OldVersion = false>
140
class FunctionMapContains : public IFunction {
141
public:
142
    static constexpr auto name = is_key ? "map_contains_key" : "map_contains_value";
143
4
    static FunctionPtr create() { return std::make_shared<FunctionMapContains>(); }
_ZN5doris19FunctionMapContainsILb1ELb0EE6createEv
Line
Count
Source
143
2
    static FunctionPtr create() { return std::make_shared<FunctionMapContains>(); }
_ZN5doris19FunctionMapContainsILb0ELb0EE6createEv
Line
Count
Source
143
2
    static FunctionPtr create() { return std::make_shared<FunctionMapContains>(); }
144
145
    /// Get function name.
146
2
    String get_name() const override { return name; }
_ZNK5doris19FunctionMapContainsILb1ELb0EE8get_nameB5cxx11Ev
Line
Count
Source
146
1
    String get_name() const override { return name; }
_ZNK5doris19FunctionMapContainsILb0ELb0EE8get_nameB5cxx11Ev
Line
Count
Source
146
1
    String get_name() const override { return name; }
147
148
2
    bool is_variadic() const override { return false; }
_ZNK5doris19FunctionMapContainsILb1ELb0EE11is_variadicEv
Line
Count
Source
148
1
    bool is_variadic() const override { return false; }
_ZNK5doris19FunctionMapContainsILb0ELb0EE11is_variadicEv
Line
Count
Source
148
1
    bool is_variadic() const override { return false; }
149
150
0
    size_t get_number_of_arguments() const override { return 2; }
Unexecuted instantiation: _ZNK5doris19FunctionMapContainsILb1ELb0EE23get_number_of_argumentsEv
Unexecuted instantiation: _ZNK5doris19FunctionMapContainsILb0ELb0EE23get_number_of_argumentsEv
151
152
0
    bool use_default_implementation_for_nulls() const override {
153
0
        return FunctionArrayIndex<ArrayContainsAction> {}.use_default_implementation_for_nulls();
154
0
    }
Unexecuted instantiation: _ZNK5doris19FunctionMapContainsILb1ELb0EE36use_default_implementation_for_nullsEv
Unexecuted instantiation: _ZNK5doris19FunctionMapContainsILb0ELb0EE36use_default_implementation_for_nullsEv
155
156
0
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
157
0
        DataTypePtr datatype = arguments[0];
158
0
        if (datatype->is_nullable()) {
159
0
            datatype = assert_cast<const DataTypeNullable*>(datatype.get())->get_nested_type();
160
0
        }
161
0
        DCHECK(datatype->get_primitive_type() == TYPE_MAP)
162
0
                << "first argument for function: " << name << " should be DataTypeMap";
163
164
        if constexpr (OldVersion) {
165
            return make_nullable(std::make_shared<DataTypeBool>());
166
0
        } else {
167
0
            if (arguments[0]->is_nullable()) {
168
0
                return make_nullable(std::make_shared<DataTypeBool>());
169
0
            } else {
170
0
                return std::make_shared<DataTypeBool>();
171
0
            }
172
0
        }
173
0
    }
Unexecuted instantiation: _ZNK5doris19FunctionMapContainsILb1ELb0EE20get_return_type_implERKSt6vectorISt10shared_ptrIKNS_9IDataTypeEESaIS6_EE
Unexecuted instantiation: _ZNK5doris19FunctionMapContainsILb0ELb0EE20get_return_type_implERKSt6vectorISt10shared_ptrIKNS_9IDataTypeEESaIS6_EE
174
175
    Status execute_impl(FunctionContext* context, Block& block, const ColumnNumbers& arguments,
176
0
                        uint32_t result, size_t input_rows_count) const override {
177
        // backup original argument 0
178
0
        auto orig_arg0 = block.get_by_position(arguments[0]);
179
0
        auto left_column =
180
0
                block.get_by_position(arguments[0]).column->convert_to_full_column_if_const();
181
0
        const ColumnMap* map_column = nullptr;
182
0
        ColumnPtr nullmap_column = nullptr;
183
0
        if (const auto* nullable_column = check_and_get_column<ColumnNullable>(left_column.get())) {
184
0
            map_column = check_and_get_column<ColumnMap>(nullable_column->get_nested_column());
185
0
            nullmap_column = nullable_column->get_null_map_column_ptr();
186
0
        } else {
187
0
            map_column = check_and_get_column<ColumnMap>(*left_column.get());
188
0
        }
189
0
        if (!map_column) {
190
0
            return Status::RuntimeError("unsupported types for function {}({})", get_name(),
191
0
                                        block.get_by_position(arguments[0]).type->get_name());
192
0
        }
193
194
0
        DataTypePtr datatype = block.get_by_position(arguments[0]).type;
195
0
        if (datatype->is_nullable()) {
196
0
            datatype = assert_cast<const DataTypeNullable*>(datatype.get())->get_nested_type();
197
0
        }
198
0
        const auto datatype_map = static_cast<const DataTypeMap*>(datatype.get());
199
0
        if constexpr (is_key) {
200
0
            const auto& array_column = map_column->get_keys_array_ptr();
201
0
            const auto datatype_array =
202
0
                    std::make_shared<DataTypeArray>(datatype_map->get_key_type());
203
0
            if (nullmap_column) {
204
0
                block.get_by_position(arguments[0]) = {
205
0
                        ColumnNullable::create(array_column, nullmap_column),
206
0
                        make_nullable(datatype_array),
207
0
                        block.get_by_position(arguments[0]).name + ".keys"};
208
0
            } else {
209
0
                block.get_by_position(arguments[0]) = {
210
0
                        array_column, datatype_array,
211
0
                        block.get_by_position(arguments[0]).name + ".keys"};
212
0
            }
213
0
        } else {
214
0
            const auto& array_column = map_column->get_values_array_ptr();
215
0
            const auto datatype_array =
216
0
                    std::make_shared<DataTypeArray>(datatype_map->get_value_type());
217
0
            if (nullmap_column) {
218
0
                block.get_by_position(arguments[0]) = {
219
0
                        ColumnNullable::create(array_column, nullmap_column),
220
0
                        make_nullable(datatype_array),
221
0
                        block.get_by_position(arguments[0]).name + ".values"};
222
0
            } else {
223
0
                block.get_by_position(arguments[0]) = {
224
0
                        array_column, datatype_array,
225
0
                        block.get_by_position(arguments[0]).name + ".values"};
226
0
            }
227
0
        }
228
229
0
        RETURN_IF_ERROR(FunctionArrayIndex<ArrayContainsAction> {}.execute_impl(
230
0
                context, block, arguments, result, input_rows_count));
231
232
        // restore original argument 0
233
0
        block.get_by_position(arguments[0]) = orig_arg0;
234
0
        return Status::OK();
235
0
    }
Unexecuted instantiation: _ZNK5doris19FunctionMapContainsILb1ELb0EE12execute_implEPNS_15FunctionContextERNS_5BlockERKSt6vectorIjSaIjEEjm
Unexecuted instantiation: _ZNK5doris19FunctionMapContainsILb0ELb0EE12execute_implEPNS_15FunctionContextERNS_5BlockERKSt6vectorIjSaIjEEjm
236
};
237
238
template <bool is_key>
239
class FunctionMapKeysOrValues : public IFunction {
240
public:
241
    static constexpr auto name = is_key ? "map_keys" : "map_values";
242
4
    static FunctionPtr create() { return std::make_shared<FunctionMapKeysOrValues>(); }
_ZN5doris23FunctionMapKeysOrValuesILb1EE6createEv
Line
Count
Source
242
2
    static FunctionPtr create() { return std::make_shared<FunctionMapKeysOrValues>(); }
_ZN5doris23FunctionMapKeysOrValuesILb0EE6createEv
Line
Count
Source
242
2
    static FunctionPtr create() { return std::make_shared<FunctionMapKeysOrValues>(); }
243
244
    /// Get function name.
245
2
    String get_name() const override { return name; }
_ZNK5doris23FunctionMapKeysOrValuesILb1EE8get_nameB5cxx11Ev
Line
Count
Source
245
1
    String get_name() const override { return name; }
_ZNK5doris23FunctionMapKeysOrValuesILb0EE8get_nameB5cxx11Ev
Line
Count
Source
245
1
    String get_name() const override { return name; }
246
247
2
    bool is_variadic() const override { return false; }
_ZNK5doris23FunctionMapKeysOrValuesILb1EE11is_variadicEv
Line
Count
Source
247
1
    bool is_variadic() const override { return false; }
_ZNK5doris23FunctionMapKeysOrValuesILb0EE11is_variadicEv
Line
Count
Source
247
1
    bool is_variadic() const override { return false; }
248
249
0
    size_t get_number_of_arguments() const override { return 1; }
Unexecuted instantiation: _ZNK5doris23FunctionMapKeysOrValuesILb1EE23get_number_of_argumentsEv
Unexecuted instantiation: _ZNK5doris23FunctionMapKeysOrValuesILb0EE23get_number_of_argumentsEv
250
251
0
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
252
0
        DataTypePtr datatype = arguments[0];
253
0
        if (datatype->is_nullable()) {
254
0
            datatype = assert_cast<const DataTypeNullable*>(datatype.get())->get_nested_type();
255
0
        }
256
0
        DCHECK(datatype->get_primitive_type() == TYPE_MAP)
257
0
                << "first argument for function: " << name << " should be DataTypeMap";
258
0
        const auto datatype_map = static_cast<const DataTypeMap*>(datatype.get());
259
0
        if (is_key) {
260
0
            return std::make_shared<DataTypeArray>(datatype_map->get_key_type());
261
0
        } else {
262
0
            return std::make_shared<DataTypeArray>(datatype_map->get_value_type());
263
0
        }
264
0
    }
Unexecuted instantiation: _ZNK5doris23FunctionMapKeysOrValuesILb1EE20get_return_type_implERKSt6vectorISt10shared_ptrIKNS_9IDataTypeEESaIS6_EE
Unexecuted instantiation: _ZNK5doris23FunctionMapKeysOrValuesILb0EE20get_return_type_implERKSt6vectorISt10shared_ptrIKNS_9IDataTypeEESaIS6_EE
265
266
    Status execute_impl(FunctionContext* context, Block& block, const ColumnNumbers& arguments,
267
0
                        uint32_t result, size_t input_rows_count) const override {
268
0
        auto left_column =
269
0
                block.get_by_position(arguments[0]).column->convert_to_full_column_if_const();
270
0
        const ColumnMap* map_column = nullptr;
271
0
        if (const auto* nullable_column = check_and_get_column<ColumnNullable>(left_column.get())) {
272
0
            map_column = check_and_get_column<ColumnMap>(nullable_column->get_nested_column());
273
0
        } else {
274
0
            map_column = check_and_get_column<ColumnMap>(*left_column.get());
275
0
        }
276
0
        if (!map_column) {
277
0
            return Status::RuntimeError("unsupported types for function {}({})", get_name(),
278
0
                                        block.get_by_position(arguments[0]).type->get_name());
279
0
        }
280
281
0
        if constexpr (is_key) {
282
0
            block.replace_by_position(result, map_column->get_keys_array_ptr());
283
0
        } else {
284
0
            block.replace_by_position(result, map_column->get_values_array_ptr());
285
0
        }
286
287
0
        return Status::OK();
288
0
    }
Unexecuted instantiation: _ZNK5doris23FunctionMapKeysOrValuesILb1EE12execute_implEPNS_15FunctionContextERNS_5BlockERKSt6vectorIjSaIjEEjm
Unexecuted instantiation: _ZNK5doris23FunctionMapKeysOrValuesILb0EE12execute_implEPNS_15FunctionContextERNS_5BlockERKSt6vectorIjSaIjEEjm
289
};
290
291
class FunctionMapEntries : public IFunction {
292
public:
293
    static constexpr auto name = "map_entries";
294
2
    static FunctionPtr create() { return std::make_shared<FunctionMapEntries>(); }
295
296
    /// Get function name.
297
1
    String get_name() const override { return name; }
298
299
1
    bool is_variadic() const override { return false; }
300
301
0
    size_t get_number_of_arguments() const override { return 1; }
302
303
0
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
304
0
        const auto* const datatype_map = assert_cast<const DataTypeMap*>(arguments[0].get());
305
306
        // Create struct type with named fields "key" and "value"
307
        // key and value are always nullable
308
0
        auto struct_type = std::make_shared<DataTypeStruct>(
309
0
                DataTypes {make_nullable(datatype_map->get_key_type()),
310
0
                           make_nullable(datatype_map->get_value_type())},
311
0
                Strings {"key", "value"});
312
313
        // Theoretically, the struct element will never be null,
314
        // but FE expects the array element to be nullable
315
0
        return std::make_shared<DataTypeArray>(make_nullable(struct_type));
316
0
    }
317
318
    Status execute_impl(FunctionContext* context, Block& block, const ColumnNumbers& arguments,
319
0
                        uint32_t result, size_t input_rows_count) const override {
320
0
        const auto* map_column =
321
0
                assert_cast<const ColumnMap*>(block.get_by_position(arguments[0]).column.get());
322
323
0
        auto struct_column = ColumnStruct::create(
324
0
                Columns {map_column->get_keys_ptr(), map_column->get_values_ptr()});
325
326
        // all struct elements are not null
327
0
        auto struct_null_map = ColumnUInt8::create(struct_column->size(), 0);
328
0
        auto nullable_struct_column =
329
0
                ColumnNullable::create(std::move(struct_column), std::move(struct_null_map));
330
331
0
        auto result_array_column = ColumnArray::create(std::move(nullable_struct_column),
332
0
                                                       map_column->get_offsets_ptr());
333
334
0
        block.replace_by_position(result, std::move(result_array_column));
335
336
0
        return Status::OK();
337
0
    }
338
};
339
340
class FunctionStrToMap : public IFunction {
341
public:
342
    static constexpr auto name = "str_to_map";
343
2
    static FunctionPtr create() { return std::make_shared<FunctionStrToMap>(); }
344
345
1
    String get_name() const override { return name; }
346
347
0
    size_t get_number_of_arguments() const override { return 3; }
348
349
0
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
350
0
        return std::make_shared<DataTypeMap>(make_nullable(std::make_shared<DataTypeString>()),
351
0
                                             make_nullable(std::make_shared<DataTypeString>()));
352
0
    }
353
354
    Status execute_impl(FunctionContext* context, Block& block, const ColumnNumbers& arguments,
355
0
                        uint32_t result, size_t input_rows_count) const override {
356
0
        DCHECK(arguments.size() == 3);
357
358
0
        bool cols_const[2];
359
0
        ColumnPtr cols[2];
360
0
        for (size_t i = 0; i < 2; ++i) {
361
0
            cols_const[i] = is_column_const(*block.get_by_position(arguments[i]).column);
362
0
        }
363
        // convert to full column if necessary
364
0
        default_preprocess_parameter_columns(cols, cols_const, {0, 1}, block, arguments);
365
0
        const auto& [col3, col3_const] =
366
0
                unpack_if_const(block.get_by_position(arguments[2]).column);
367
368
0
        const auto& str_column = assert_cast<const ColumnString*>(cols[0].get());
369
0
        const auto& pair_delim_column = assert_cast<const ColumnString*>(cols[1].get());
370
0
        const auto& kv_delim_column = assert_cast<const ColumnString*>(col3.get());
371
372
0
        ColumnPtr result_col;
373
0
        if (cols_const[0] && cols_const[1]) {
374
0
            result_col = execute_vector<true, false>(input_rows_count, *str_column,
375
0
                                                     *pair_delim_column, *kv_delim_column);
376
0
        } else if (col3_const) {
377
0
            result_col = execute_vector<false, true>(input_rows_count, *str_column,
378
0
                                                     *pair_delim_column, *kv_delim_column);
379
0
        } else {
380
0
            result_col = execute_vector<false, false>(input_rows_count, *str_column,
381
0
                                                      *pair_delim_column, *kv_delim_column);
382
0
        }
383
384
0
        block.replace_by_position(result, std::move(result_col));
385
386
0
        return Status::OK();
387
0
    }
388
389
private:
390
    template <bool is_str_and_pair_delim_const, bool is_kv_delim_const>
391
    static ColumnPtr execute_vector(const size_t input_rows_count, const ColumnString& str_col,
392
                                    const ColumnString& pair_delim_col,
393
0
                                    const ColumnString& kv_delim_col) {
394
        // map keys column
395
0
        auto result_col_map_keys_data =
396
0
                ColumnNullable::create(ColumnString::create(), ColumnUInt8::create());
397
0
        result_col_map_keys_data->reserve(input_rows_count);
398
        // map values column
399
0
        auto result_col_map_vals_data =
400
0
                ColumnNullable::create(ColumnString::create(), ColumnUInt8::create());
401
0
        result_col_map_vals_data->reserve(input_rows_count);
402
        // map offsets column
403
0
        auto result_col_map_offsets = ColumnOffset64::create();
404
0
        result_col_map_offsets->reserve(input_rows_count);
405
406
0
        std::vector<std::string_view> kvs;
407
0
        std::string_view kv_delim;
408
0
        if constexpr (is_str_and_pair_delim_const) {
409
0
            auto str = str_col.get_data_at(0).to_string_view();
410
0
            auto pair_delim = pair_delim_col.get_data_at(0).to_string_view();
411
0
            kvs = split_pair_by_delim(str, pair_delim);
412
0
        }
413
0
        if constexpr (is_kv_delim_const) {
414
0
            kv_delim = kv_delim_col.get_data_at(0).to_string_view();
415
0
        }
416
417
0
        for (size_t i = 0; i < input_rows_count; ++i) {
418
0
            if constexpr (!is_str_and_pair_delim_const) {
419
0
                auto str = str_col.get_data_at(i).to_string_view();
420
0
                auto pair_delim = pair_delim_col.get_data_at(i).to_string_view();
421
0
                kvs = split_pair_by_delim(str, pair_delim);
422
0
            }
423
0
            if constexpr (!is_kv_delim_const) {
424
0
                kv_delim = kv_delim_col.get_data_at(i).to_string_view();
425
0
            }
426
427
0
            for (const auto& kv : kvs) {
428
0
                auto kv_parts = split_kv_by_delim(kv, kv_delim);
429
0
                if (kv_parts.size() == 2) {
430
0
                    result_col_map_keys_data->insert_data(kv_parts[0].data(), kv_parts[0].size());
431
0
                    result_col_map_vals_data->insert_data(kv_parts[1].data(), kv_parts[1].size());
432
0
                } else {
433
0
                    result_col_map_keys_data->insert_data(kv.data(), kv.size());
434
0
                    result_col_map_vals_data->insert_default();
435
0
                }
436
0
            }
437
0
            result_col_map_offsets->insert_value(result_col_map_keys_data->size());
438
0
        }
439
440
0
        auto map_column = ColumnMap::create(std::move(result_col_map_keys_data),
441
0
                                            std::move(result_col_map_vals_data),
442
0
                                            std::move(result_col_map_offsets));
443
444
        // `deduplicate_keys` always return ok
445
0
        static_cast<void>(map_column->deduplicate_keys());
446
0
        return map_column;
447
0
    }
Unexecuted instantiation: _ZN5doris16FunctionStrToMap14execute_vectorILb1ELb0EEENS_3COWINS_7IColumnEE13immutable_ptrIS3_EEmRKNS_9ColumnStrIjEESA_SA_
Unexecuted instantiation: _ZN5doris16FunctionStrToMap14execute_vectorILb0ELb1EEENS_3COWINS_7IColumnEE13immutable_ptrIS3_EEmRKNS_9ColumnStrIjEESA_SA_
Unexecuted instantiation: _ZN5doris16FunctionStrToMap14execute_vectorILb0ELb0EEENS_3COWINS_7IColumnEE13immutable_ptrIS3_EEmRKNS_9ColumnStrIjEESA_SA_
448
449
    static std::vector<std::string_view> split_pair_by_delim(const std::string_view& str,
450
0
                                                             const std::string_view& delim) {
451
0
        if (str.empty()) {
452
0
            return {str};
453
0
        }
454
0
        if (delim.empty()) {
455
0
            std::vector<std::string_view> result;
456
0
            size_t offset = 0;
457
0
            while (offset < str.size()) {
458
0
                auto len = get_utf8_byte_length(str[offset]);
459
0
                result.push_back(str.substr(offset, len));
460
0
                offset += len;
461
0
            }
462
0
            return result;
463
0
        }
464
0
        std::vector<std::string_view> result;
465
0
        size_t offset = 0;
466
0
        while (offset < str.size()) {
467
0
            auto pos = str.find(delim, offset);
468
0
            if (pos == std::string::npos) {
469
0
                result.push_back(str.substr(offset));
470
0
                break;
471
0
            }
472
0
            result.push_back(str.substr(offset, pos - offset));
473
0
            offset = pos + delim.size();
474
0
        }
475
0
        return result;
476
0
    }
477
478
    static std::vector<std::string_view> split_kv_by_delim(const std::string_view& str,
479
0
                                                           const std::string_view& delim) {
480
0
        if (str.empty()) {
481
0
            return {str};
482
0
        }
483
0
        if (delim.empty()) {
484
0
            auto len = get_utf8_byte_length(str[0]);
485
0
            return {str.substr(0, len), str.substr(len)};
486
0
        }
487
0
        auto pos = str.find(delim);
488
0
        if (pos == std::string::npos) {
489
0
            return {str};
490
0
        } else {
491
0
            return {str.substr(0, pos), str.substr(pos + delim.size())};
492
0
        }
493
0
    }
494
};
495
496
class FunctionMapContainsEntry : public IFunction {
497
public:
498
    static constexpr auto name = "map_contains_entry";
499
2
    static FunctionPtr create() { return std::make_shared<FunctionMapContainsEntry>(); }
500
501
1
    String get_name() const override { return name; }
502
0
    size_t get_number_of_arguments() const override { return 3; }
503
0
    bool use_default_implementation_for_nulls() const override { return false; }
504
505
0
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
506
0
        DataTypePtr datatype = arguments[0];
507
0
        if (datatype->is_nullable()) {
508
0
            datatype = assert_cast<const DataTypeNullable*>(datatype.get())->get_nested_type();
509
0
        }
510
0
        DCHECK_EQ(datatype->get_primitive_type(), PrimitiveType::TYPE_MAP)
511
0
                << "first argument for function: " << name << " should be DataTypeMap";
512
513
0
        if (arguments[0]->is_nullable()) {
514
0
            return make_nullable(std::make_shared<DataTypeBool>());
515
0
        } else {
516
0
            return std::make_shared<DataTypeBool>();
517
0
        }
518
0
    }
519
520
    Status execute_impl(FunctionContext* context, Block& block, const ColumnNumbers& arguments,
521
0
                        uint32_t result, size_t input_rows_count) const override {
522
0
        return _execute_type_check_and_dispatch(block, arguments, result);
523
0
    }
524
525
private:
526
    // assume result_matches is initialized to all 1s
527
    template <typename ColumnType>
528
    void _execute_column_comparison(const IColumn& map_entry_column, const UInt8* map_entry_nullmap,
529
                                    const IColumn& search_column, const UInt8* search_nullmap,
530
                                    const ColumnArray::Offsets64& map_offsets,
531
                                    const UInt8* map_row_nullmap, bool search_is_const,
532
0
                                    ColumnUInt8& result_matches) const {
533
0
        auto& result_data = result_matches.get_data();
534
0
        for (size_t row = 0; row < map_offsets.size(); ++row) {
535
0
            if (map_row_nullmap && map_row_nullmap[row]) {
536
0
                continue;
537
0
            }
538
0
            size_t map_start = row == 0 ? 0 : map_offsets[row - 1];
539
0
            size_t map_end = map_offsets[row];
540
            // const column always uses index 0
541
0
            size_t search_idx = search_is_const ? 0 : row;
542
0
            for (size_t i = map_start; i < map_end; ++i) {
543
0
                result_data[i] &=
544
0
                        compare_values<ColumnType>(map_entry_column, i, map_entry_nullmap,
545
0
                                                   search_column, search_idx, search_nullmap)
546
0
                                ? 1
547
0
                                : 0;
548
0
            }
549
0
        }
550
0
    }
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_12ColumnVectorILNS_13PrimitiveTypeE2EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRS4_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_12ColumnVectorILNS_13PrimitiveTypeE3EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS2_ILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_12ColumnVectorILNS_13PrimitiveTypeE4EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS2_ILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_12ColumnVectorILNS_13PrimitiveTypeE5EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS2_ILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_12ColumnVectorILNS_13PrimitiveTypeE6EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS2_ILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_12ColumnVectorILNS_13PrimitiveTypeE7EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS2_ILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_12ColumnVectorILNS_13PrimitiveTypeE8EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS2_ILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_12ColumnVectorILNS_13PrimitiveTypeE9EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS2_ILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_13ColumnDecimalILNS_13PrimitiveTypeE28EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS_12ColumnVectorILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_13ColumnDecimalILNS_13PrimitiveTypeE29EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS_12ColumnVectorILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_13ColumnDecimalILNS_13PrimitiveTypeE20EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS_12ColumnVectorILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_13ColumnDecimalILNS_13PrimitiveTypeE30EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS_12ColumnVectorILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_13ColumnDecimalILNS_13PrimitiveTypeE35EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS_12ColumnVectorILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_12ColumnVectorILNS_13PrimitiveTypeE11EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS2_ILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_12ColumnVectorILNS_13PrimitiveTypeE25EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS2_ILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_12ColumnVectorILNS_13PrimitiveTypeE26EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS2_ILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_12ColumnVectorILNS_13PrimitiveTypeE12EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS2_ILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_12ColumnVectorILNS_13PrimitiveTypeE27EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS2_ILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_12ColumnVectorILNS_13PrimitiveTypeE42EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS2_ILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_12ColumnVectorILNS_13PrimitiveTypeE36EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS2_ILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_12ColumnVectorILNS_13PrimitiveTypeE37EEEEEvRKNS_7IColumnEPKhS7_S9_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES9_bRNS2_ILS3_2EEE
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry26_execute_column_comparisonINS_9ColumnStrIjEEEEvRKNS_7IColumnEPKhS6_S8_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES8_bRNS_12ColumnVectorILNS_13PrimitiveTypeE2EEE
551
552
    // dispatch column comparison by type, map_entry_column is the column of map's key or value, search_column is the column of search key or value
553
    void _dispatch_column_comparison(PrimitiveType type, const IColumn& map_entry_column,
554
                                     const UInt8* map_entry_nullmap, const IColumn& search_column,
555
                                     const UInt8* search_nullmap,
556
                                     const ColumnArray::Offsets64& map_offsets,
557
                                     const UInt8* map_row_nullmap, bool search_is_const,
558
0
                                     ColumnUInt8& result_matches) const {
559
0
        auto call = [&](const auto& type) -> bool {
560
0
            using DispatchType = std::decay_t<decltype(type)>;
561
562
0
            _execute_column_comparison<typename DispatchType::ColumnType>(
563
0
                    map_entry_column, map_entry_nullmap, search_column, search_nullmap, map_offsets,
564
0
                    map_row_nullmap, search_is_const, result_matches);
565
566
0
            return true;
567
0
        };
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_2EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_3EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_4EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_5EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_6EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_7EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_8EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_9EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_28EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_29EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_20EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_30EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_35EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_11EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_25EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_26EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_12EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_27EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_42EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_36EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_37EEEEEbSJ_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry27_dispatch_column_comparisonENS_13PrimitiveTypeERKNS_7IColumnEPKhS4_S6_RKNS_8PODArrayImLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEES6_bRNS_12ColumnVectorILS1_2EEEENKUlRKT_E_clINS_16DispatchDataTypeILS1_23EEEEEbSJ_
568
569
0
        if (!dispatch_switch_all(type, call)) {
570
0
            throw doris::Exception(ErrorCode::INTERNAL_ERROR, "not support type {}",
571
0
                                   type_to_string(type));
572
0
        }
573
0
    }
574
575
    // main loop function
576
    ColumnPtr _execute_all_rows(const ColumnMap* map_column, const ColumnPtr& map_row_nullmap_col,
577
                                const IColumn& key_column, const UInt8* key_nullmap,
578
                                const IColumn& value_column, const UInt8* value_nullmap,
579
                                PrimitiveType key_type, PrimitiveType value_type, bool key_is_const,
580
0
                                bool value_is_const) const {
581
0
        const auto& map_offsets = map_column->get_offsets();
582
583
        // remove the nullable wrapper of map's key and value
584
0
        const auto& map_keys_nullable =
585
0
                reinterpret_cast<const ColumnNullable&>(map_column->get_keys());
586
0
        const IColumn* map_keys_column = &map_keys_nullable.get_nested_column();
587
0
        const auto& map_keys_nullmap = map_keys_nullable.get_null_map_column().get_data().data();
588
589
0
        const auto& map_values_nullable =
590
0
                reinterpret_cast<const ColumnNullable&>(map_column->get_values());
591
0
        const IColumn* map_values_column = &map_values_nullable.get_nested_column();
592
0
        const auto& map_values_nullmap =
593
0
                map_values_nullable.get_null_map_column().get_data().data();
594
595
0
        auto result_column = ColumnUInt8::create(map_offsets.size(), 0);
596
0
        auto& result_data = result_column->get_data();
597
598
0
        const UInt8* map_row_nullmap = nullptr;
599
0
        if (map_row_nullmap_col) {
600
0
            map_row_nullmap =
601
0
                    assert_cast<const ColumnUInt8&>(*map_row_nullmap_col).get_data().data();
602
0
        }
603
604
0
        auto matches = ColumnUInt8::create(map_keys_column->size(), 1);
605
606
        // matches &= key_compare
607
0
        _dispatch_column_comparison(key_type, *map_keys_column, map_keys_nullmap, key_column,
608
0
                                    key_nullmap, map_offsets, map_row_nullmap, key_is_const,
609
0
                                    *matches);
610
611
        // matches &= value_compare
612
0
        _dispatch_column_comparison(value_type, *map_values_column, map_values_nullmap,
613
0
                                    value_column, value_nullmap, map_offsets, map_row_nullmap,
614
0
                                    value_is_const, *matches);
615
616
        // aggregate results by map boundaries
617
0
        auto& matches_data = matches->get_data();
618
0
        for (size_t row = 0; row < map_offsets.size(); ++row) {
619
0
            if (map_row_nullmap && map_row_nullmap[row]) {
620
                // result is null for this row
621
0
                continue;
622
0
            }
623
624
0
            size_t map_start = row == 0 ? 0 : map_offsets[row - 1];
625
0
            size_t map_end = map_offsets[row];
626
627
0
            bool found = false;
628
0
            for (size_t i = map_start; i < map_end && !found; ++i) {
629
0
                if (matches_data[i]) {
630
0
                    found = true;
631
0
                    break;
632
0
                }
633
0
            }
634
0
            result_data[row] = found;
635
0
        }
636
637
0
        if (map_row_nullmap_col) {
638
0
            return ColumnNullable::create(std::move(result_column), map_row_nullmap_col);
639
0
        }
640
0
        return result_column;
641
0
    }
642
643
    // type comparability check and dispatch
644
    Status _execute_type_check_and_dispatch(Block& block, const ColumnNumbers& arguments,
645
0
                                            uint32_t result) const {
646
        // get type information
647
0
        auto map_type = remove_nullable(block.get_by_position(arguments[0]).type);
648
0
        const auto* map_datatype = assert_cast<const DataTypeMap*>(map_type.get());
649
0
        auto map_key_type = remove_nullable(map_datatype->get_key_type());
650
0
        auto map_value_type = remove_nullable(map_datatype->get_value_type());
651
0
        auto search_key_type = remove_nullable(block.get_by_position(arguments[1]).type);
652
0
        auto search_value_type = remove_nullable(block.get_by_position(arguments[2]).type);
653
654
0
        PrimitiveType key_primitive_type = map_key_type->get_primitive_type();
655
0
        PrimitiveType value_primitive_type = map_value_type->get_primitive_type();
656
657
        // FE should ensure the column types are the same,
658
        // but primitive type may be different (eg. TYPE_STRING and TYPE_VARCHAR both use ColumnString)
659
660
        // check whether this function supports equality comparison for the types
661
0
        if (!is_equality_comparison_supported(key_primitive_type) ||
662
0
            !is_equality_comparison_supported(value_primitive_type)) {
663
0
            return Status::RuntimeError(
664
0
                    "Trying to do equality comparison on unsupported types for function {}. "
665
0
                    "Map key type: {}, search key type: {}. "
666
0
                    "Map value type: {}, search value type: {}. "
667
0
                    "Key primitive type: {}, value primitive type: {}.",
668
0
                    get_name(), map_key_type->get_name(), search_key_type->get_name(),
669
0
                    map_value_type->get_name(), search_value_type->get_name(),
670
0
                    type_to_string(key_primitive_type), type_to_string(value_primitive_type));
671
0
        }
672
673
        // type check passed, extract columns and execute
674
        // extract map column
675
0
        auto map_column_ptr =
676
0
                block.get_by_position(arguments[0]).column->convert_to_full_column_if_const();
677
0
        const ColumnMap* map_column = nullptr;
678
0
        ColumnPtr map_row_nullmap_col = nullptr;
679
0
        if (const auto* nullable_column =
680
0
                    check_and_get_column<ColumnNullable>(map_column_ptr.get())) {
681
0
            map_column = check_and_get_column<ColumnMap>(nullable_column->get_nested_column());
682
0
            map_row_nullmap_col = nullable_column->get_null_map_column_ptr();
683
0
        } else {
684
0
            map_column = check_and_get_column<ColumnMap>(*map_column_ptr.get());
685
0
        }
686
0
        if (!map_column) {
687
0
            return Status::RuntimeError("unsupported types for function {}({})", get_name(),
688
0
                                        block.get_by_position(arguments[0]).type->get_name());
689
0
        }
690
691
        // extract (search) key and value columns
692
0
        const auto& [key_column_ptr, key_is_const] =
693
0
                unpack_if_const(block.get_by_position(arguments[1]).column);
694
0
        const auto& [value_column_ptr, value_is_const] =
695
0
                unpack_if_const(block.get_by_position(arguments[2]).column);
696
697
0
        const IColumn* key_column = nullptr;
698
0
        const IColumn* value_column = nullptr;
699
0
        const UInt8* key_nullmap = nullptr;
700
0
        const UInt8* value_nullmap = nullptr;
701
702
0
        if (const auto* nullable_column =
703
0
                    check_and_get_column<ColumnNullable>(key_column_ptr.get())) {
704
0
            key_column = &nullable_column->get_nested_column();
705
0
            key_nullmap = nullable_column->get_null_map_column().get_data().data();
706
0
        } else {
707
0
            key_column = key_column_ptr.get();
708
0
        }
709
710
0
        if (const auto* nullable_column =
711
0
                    check_and_get_column<ColumnNullable>(value_column_ptr.get())) {
712
0
            value_column = &nullable_column->get_nested_column();
713
0
            value_nullmap = nullable_column->get_null_map_column().get_data().data();
714
0
        } else {
715
0
            value_column = value_column_ptr.get();
716
0
        }
717
718
0
        ColumnPtr return_column =
719
0
                _execute_all_rows(map_column, map_row_nullmap_col, *key_column, key_nullmap,
720
0
                                  *value_column, value_nullmap, key_primitive_type,
721
0
                                  value_primitive_type, key_is_const, value_is_const);
722
723
0
        if (return_column) {
724
0
            block.replace_by_position(result, std::move(return_column));
725
0
            return Status::OK();
726
0
        }
727
728
0
        return Status::RuntimeError(
729
0
                "execute failed or unsupported types for function {}({}, {}, {})", get_name(),
730
0
                block.get_by_position(arguments[0]).type->get_name(),
731
0
                block.get_by_position(arguments[1]).type->get_name(),
732
0
                block.get_by_position(arguments[2]).type->get_name());
733
0
    }
734
735
    // generic type-specialized comparison function
736
    template <typename ColumnType>
737
    bool compare_values(const IColumn& left_col, size_t left_idx, const UInt8* left_nullmap,
738
                        const IColumn& right_col, size_t right_idx,
739
0
                        const UInt8* right_nullmap) const {
740
        // handle null values
741
0
        bool left_is_null = left_nullmap && left_nullmap[left_idx];
742
0
        bool right_is_null = right_nullmap && right_nullmap[right_idx];
743
744
0
        if (left_is_null && right_is_null) {
745
0
            return true;
746
0
        }
747
0
        if (left_is_null || right_is_null) {
748
0
            return false;
749
0
        }
750
751
        // use compare_at from typed column
752
0
        const auto& typed_left_col = assert_cast<const ColumnType&>(left_col);
753
0
        const auto& typed_right_col = assert_cast<const ColumnType&>(right_col);
754
0
        return typed_left_col.compare_at(left_idx, right_idx, typed_right_col,
755
0
                                         /*nan_direction_hint=*/1) == 0;
756
0
    }
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_12ColumnVectorILNS_13PrimitiveTypeE2EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_12ColumnVectorILNS_13PrimitiveTypeE3EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_12ColumnVectorILNS_13PrimitiveTypeE4EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_12ColumnVectorILNS_13PrimitiveTypeE5EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_12ColumnVectorILNS_13PrimitiveTypeE6EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_12ColumnVectorILNS_13PrimitiveTypeE7EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_12ColumnVectorILNS_13PrimitiveTypeE8EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_12ColumnVectorILNS_13PrimitiveTypeE9EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_13ColumnDecimalILNS_13PrimitiveTypeE28EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_13ColumnDecimalILNS_13PrimitiveTypeE29EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_13ColumnDecimalILNS_13PrimitiveTypeE20EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_13ColumnDecimalILNS_13PrimitiveTypeE30EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_13ColumnDecimalILNS_13PrimitiveTypeE35EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_12ColumnVectorILNS_13PrimitiveTypeE11EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_12ColumnVectorILNS_13PrimitiveTypeE25EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_12ColumnVectorILNS_13PrimitiveTypeE26EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_12ColumnVectorILNS_13PrimitiveTypeE12EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_12ColumnVectorILNS_13PrimitiveTypeE27EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_12ColumnVectorILNS_13PrimitiveTypeE42EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_12ColumnVectorILNS_13PrimitiveTypeE36EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_12ColumnVectorILNS_13PrimitiveTypeE37EEEEEbRKNS_7IColumnEmPKhS7_mS9_
Unexecuted instantiation: _ZNK5doris24FunctionMapContainsEntry14compare_valuesINS_9ColumnStrIjEEEEbRKNS_7IColumnEmPKhS6_mS8_
757
758
    // whether this function supports equality comparison for the given primitive type.
759
    // Uses dispatch_switch_all as the single source of truth so any type supported
760
    // by the dispatch layer is automatically accepted here.
761
0
    bool is_equality_comparison_supported(PrimitiveType type) const {
762
0
        return dispatch_switch_all(type, [](const auto&) { return true; });
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_2EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_3EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_4EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_5EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_6EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_7EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_8EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_9EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_28EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_29EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_20EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_30EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_35EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_11EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_25EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_26EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_12EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_27EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_42EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_36EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_37EEEEEDaS4_
Unexecuted instantiation: _ZZNK5doris24FunctionMapContainsEntry32is_equality_comparison_supportedENS_13PrimitiveTypeEENKUlRKT_E_clINS_16DispatchDataTypeILS1_23EEEEEDaS4_
763
0
    }
764
};
765
766
class FunctionDeduplicateMap : public IFunction {
767
public:
768
    static constexpr auto name = "deduplicate_map";
769
3
    static FunctionPtr create() { return std::make_shared<FunctionDeduplicateMap>(); }
770
771
1
    String get_name() const override { return name; }
772
1
    size_t get_number_of_arguments() const override { return 1; }
773
2
    bool use_default_implementation_for_nulls() const override { return true; }
774
775
1
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
776
1
        return arguments[0];
777
1
    }
778
779
    Status execute_impl(FunctionContext* context, Block& block, const ColumnNumbers& arguments,
780
1
                        uint32_t result, size_t input_rows_count) const override {
781
1
        DCHECK_EQ(arguments.size(), 1);
782
1
        auto col_ptr = block.get_by_position(arguments[0]).column->clone_resized(input_rows_count);
783
1
        auto& col_map = assert_cast<ColumnMap&>(*col_ptr);
784
1
        RETURN_IF_ERROR(col_map.deduplicate_keys());
785
1
        block.replace_by_position(result, std::move(col_ptr));
786
1
        return Status::OK();
787
1
    }
788
789
private:
790
};
791
792
1
void register_function_map(SimpleFunctionFactory& factory) {
793
1
    factory.register_function<FunctionMap>();
794
1
    factory.register_function<FunctionMapContains<true>>();
795
1
    factory.register_function<FunctionMapContains<false>>();
796
1
    factory.register_function<FunctionMapKeysOrValues<true>>();
797
1
    factory.register_function<FunctionMapKeysOrValues<false>>();
798
1
    factory.register_function<FunctionMapEntries>();
799
1
    factory.register_function<FunctionStrToMap>();
800
1
    factory.register_function<FunctionMapContainsEntry>();
801
1
    factory.register_function<FunctionDeduplicateMap>();
802
1
}
803
804
} // namespace doris