Coverage Report

Created: 2026-03-16 04:30

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
be/src/exprs/function/function_conv.cpp
Line
Count
Source
1
// Licensed to the Apache Software Foundation (ASF) under one
2
// or more contributor license agreements.  See the NOTICE file
3
// distributed with this work for additional information
4
// regarding copyright ownership.  The ASF licenses this file
5
// to you under the Apache License, Version 2.0 (the
6
// "License"); you may not use this file except in compliance
7
// with the License.  You may obtain a copy of the License at
8
//
9
//   http://www.apache.org/licenses/LICENSE-2.0
10
//
11
// Unless required by applicable law or agreed to in writing,
12
// software distributed under the License is distributed on an
13
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
// KIND, either express or implied.  See the License for the
15
// specific language governing permissions and limitations
16
// under the License.
17
18
#include <stdint.h>
19
#include <stdlib.h>
20
21
#include <boost/iterator/iterator_facade.hpp>
22
// IWYU pragma: no_include <bits/std_abs.h>
23
#include <algorithm>
24
#include <cmath> // IWYU pragma: keep
25
#include <memory>
26
#include <utility>
27
28
#include "common/status.h"
29
#include "core/assert_cast.h"
30
#include "core/block/block.h"
31
#include "core/block/column_numbers.h"
32
#include "core/block/column_with_type_and_name.h"
33
#include "core/column/column.h"
34
#include "core/column/column_const.h"
35
#include "core/column/column_nullable.h"
36
#include "core/column/column_string.h"
37
#include "core/column/column_vector.h"
38
#include "core/data_type/data_type.h"
39
#include "core/data_type/data_type_nullable.h"
40
#include "core/data_type/data_type_number.h"
41
#include "core/data_type/data_type_string.h"
42
#include "core/string_ref.h"
43
#include "core/types.h"
44
#include "exprs/aggregate/aggregate_function.h"
45
#include "exprs/function/function.h"
46
#include "exprs/function/simple_function_factory.h"
47
#include "exprs/math_functions.h"
48
#include "util/string_parser.hpp"
49
50
namespace doris {
51
#include "common/compile_check_begin.h"
52
class FunctionContext;
53
} // namespace doris
54
55
namespace doris {
56
57
template <typename Impl>
58
class FunctionConv : public IFunction {
59
public:
60
    static constexpr auto name = "conv";
61
2
    String get_name() const override { return name; }
_ZNK5doris12FunctionConvINS_13ConvInt64ImplEE8get_nameB5cxx11Ev
Line
Count
Source
61
1
    String get_name() const override { return name; }
_ZNK5doris12FunctionConvINS_14ConvStringImplEE8get_nameB5cxx11Ev
Line
Count
Source
61
1
    String get_name() const override { return name; }
62
9
    static FunctionPtr create() { return std::make_shared<FunctionConv<Impl>>(); }
_ZN5doris12FunctionConvINS_13ConvInt64ImplEE6createEv
Line
Count
Source
62
5
    static FunctionPtr create() { return std::make_shared<FunctionConv<Impl>>(); }
_ZN5doris12FunctionConvINS_14ConvStringImplEE6createEv
Line
Count
Source
62
4
    static FunctionPtr create() { return std::make_shared<FunctionConv<Impl>>(); }
63
64
5
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
65
5
        return make_nullable(std::make_shared<DataTypeString>());
66
5
    }
_ZNK5doris12FunctionConvINS_13ConvInt64ImplEE20get_return_type_implERKSt6vectorISt10shared_ptrIKNS_9IDataTypeEESaIS7_EE
Line
Count
Source
64
3
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
65
3
        return make_nullable(std::make_shared<DataTypeString>());
66
3
    }
_ZNK5doris12FunctionConvINS_14ConvStringImplEE20get_return_type_implERKSt6vectorISt10shared_ptrIKNS_9IDataTypeEESaIS7_EE
Line
Count
Source
64
2
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
65
2
        return make_nullable(std::make_shared<DataTypeString>());
66
2
    }
67
7
    DataTypes get_variadic_argument_types_impl() const override {
68
7
        return {std::make_shared<typename Impl::DataType>(), std::make_shared<DataTypeInt8>(),
69
7
                std::make_shared<DataTypeInt8>()};
70
7
    }
_ZNK5doris12FunctionConvINS_13ConvInt64ImplEE32get_variadic_argument_types_implEv
Line
Count
Source
67
4
    DataTypes get_variadic_argument_types_impl() const override {
68
4
        return {std::make_shared<typename Impl::DataType>(), std::make_shared<DataTypeInt8>(),
69
4
                std::make_shared<DataTypeInt8>()};
70
4
    }
_ZNK5doris12FunctionConvINS_14ConvStringImplEE32get_variadic_argument_types_implEv
Line
Count
Source
67
3
    DataTypes get_variadic_argument_types_impl() const override {
68
3
        return {std::make_shared<typename Impl::DataType>(), std::make_shared<DataTypeInt8>(),
69
3
                std::make_shared<DataTypeInt8>()};
70
3
    }
71
5
    size_t get_number_of_arguments() const override {
72
5
        return get_variadic_argument_types_impl().size();
73
5
    }
_ZNK5doris12FunctionConvINS_13ConvInt64ImplEE23get_number_of_argumentsEv
Line
Count
Source
71
3
    size_t get_number_of_arguments() const override {
72
3
        return get_variadic_argument_types_impl().size();
73
3
    }
_ZNK5doris12FunctionConvINS_14ConvStringImplEE23get_number_of_argumentsEv
Line
Count
Source
71
2
    size_t get_number_of_arguments() const override {
72
2
        return get_variadic_argument_types_impl().size();
73
2
    }
74
75
    Status execute_impl(FunctionContext* context, Block& block, const ColumnNumbers& arguments,
76
3
                        uint32_t result, size_t input_rows_count) const override {
77
3
        auto result_column = ColumnString::create();
78
3
        auto result_null_map_column = ColumnUInt8::create(input_rows_count, 0);
79
80
3
        bool col_const[3];
81
3
        ColumnPtr argument_columns[3];
82
12
        for (int i = 0; i < 3; ++i) {
83
9
            col_const[i] = is_column_const(*block.get_by_position(arguments[i]).column);
84
9
        }
85
3
        argument_columns[0] = col_const[0] ? static_cast<const ColumnConst&>(
86
0
                                                     *block.get_by_position(arguments[0]).column)
87
0
                                                     .convert_to_full_column()
88
3
                                           : block.get_by_position(arguments[0]).column;
89
90
3
        default_preprocess_parameter_columns(argument_columns, col_const, {1, 2}, block, arguments);
91
92
3
        if (col_const[1] && col_const[2]) {
93
0
            execute_scalar_args(
94
0
                    context,
95
0
                    assert_cast<const typename Impl::DataType::ColumnType*>(
96
0
                            argument_columns[0].get()),
97
0
                    assert_cast<const ColumnInt8*>(argument_columns[1].get())->get_element(0),
98
0
                    assert_cast<const ColumnInt8*>(argument_columns[2].get())->get_element(0),
99
0
                    assert_cast<ColumnString*>(result_column.get()),
100
0
                    assert_cast<ColumnUInt8*>(result_null_map_column.get())->get_data(),
101
0
                    input_rows_count);
102
3
        } else {
103
3
            execute_straight(context,
104
3
                             assert_cast<const typename Impl::DataType::ColumnType*>(
105
3
                                     argument_columns[0].get()),
106
3
                             assert_cast<const ColumnInt8*>(argument_columns[1].get()),
107
3
                             assert_cast<const ColumnInt8*>(argument_columns[2].get()),
108
3
                             assert_cast<ColumnString*>(result_column.get()),
109
3
                             assert_cast<ColumnUInt8*>(result_null_map_column.get())->get_data(),
110
3
                             input_rows_count);
111
3
        }
112
113
3
        block.get_by_position(result).column =
114
3
                ColumnNullable::create(std::move(result_column), std::move(result_null_map_column));
115
3
        return Status::OK();
116
3
    }
_ZNK5doris12FunctionConvINS_13ConvInt64ImplEE12execute_implEPNS_15FunctionContextERNS_5BlockERKSt6vectorIjSaIjEEjm
Line
Count
Source
76
2
                        uint32_t result, size_t input_rows_count) const override {
77
2
        auto result_column = ColumnString::create();
78
2
        auto result_null_map_column = ColumnUInt8::create(input_rows_count, 0);
79
80
2
        bool col_const[3];
81
2
        ColumnPtr argument_columns[3];
82
8
        for (int i = 0; i < 3; ++i) {
83
6
            col_const[i] = is_column_const(*block.get_by_position(arguments[i]).column);
84
6
        }
85
2
        argument_columns[0] = col_const[0] ? static_cast<const ColumnConst&>(
86
0
                                                     *block.get_by_position(arguments[0]).column)
87
0
                                                     .convert_to_full_column()
88
2
                                           : block.get_by_position(arguments[0]).column;
89
90
2
        default_preprocess_parameter_columns(argument_columns, col_const, {1, 2}, block, arguments);
91
92
2
        if (col_const[1] && col_const[2]) {
93
0
            execute_scalar_args(
94
0
                    context,
95
0
                    assert_cast<const typename Impl::DataType::ColumnType*>(
96
0
                            argument_columns[0].get()),
97
0
                    assert_cast<const ColumnInt8*>(argument_columns[1].get())->get_element(0),
98
0
                    assert_cast<const ColumnInt8*>(argument_columns[2].get())->get_element(0),
99
0
                    assert_cast<ColumnString*>(result_column.get()),
100
0
                    assert_cast<ColumnUInt8*>(result_null_map_column.get())->get_data(),
101
0
                    input_rows_count);
102
2
        } else {
103
2
            execute_straight(context,
104
2
                             assert_cast<const typename Impl::DataType::ColumnType*>(
105
2
                                     argument_columns[0].get()),
106
2
                             assert_cast<const ColumnInt8*>(argument_columns[1].get()),
107
2
                             assert_cast<const ColumnInt8*>(argument_columns[2].get()),
108
2
                             assert_cast<ColumnString*>(result_column.get()),
109
2
                             assert_cast<ColumnUInt8*>(result_null_map_column.get())->get_data(),
110
2
                             input_rows_count);
111
2
        }
112
113
2
        block.get_by_position(result).column =
114
2
                ColumnNullable::create(std::move(result_column), std::move(result_null_map_column));
115
2
        return Status::OK();
116
2
    }
_ZNK5doris12FunctionConvINS_14ConvStringImplEE12execute_implEPNS_15FunctionContextERNS_5BlockERKSt6vectorIjSaIjEEjm
Line
Count
Source
76
1
                        uint32_t result, size_t input_rows_count) const override {
77
1
        auto result_column = ColumnString::create();
78
1
        auto result_null_map_column = ColumnUInt8::create(input_rows_count, 0);
79
80
1
        bool col_const[3];
81
1
        ColumnPtr argument_columns[3];
82
4
        for (int i = 0; i < 3; ++i) {
83
3
            col_const[i] = is_column_const(*block.get_by_position(arguments[i]).column);
84
3
        }
85
1
        argument_columns[0] = col_const[0] ? static_cast<const ColumnConst&>(
86
0
                                                     *block.get_by_position(arguments[0]).column)
87
0
                                                     .convert_to_full_column()
88
1
                                           : block.get_by_position(arguments[0]).column;
89
90
1
        default_preprocess_parameter_columns(argument_columns, col_const, {1, 2}, block, arguments);
91
92
1
        if (col_const[1] && col_const[2]) {
93
0
            execute_scalar_args(
94
0
                    context,
95
0
                    assert_cast<const typename Impl::DataType::ColumnType*>(
96
0
                            argument_columns[0].get()),
97
0
                    assert_cast<const ColumnInt8*>(argument_columns[1].get())->get_element(0),
98
0
                    assert_cast<const ColumnInt8*>(argument_columns[2].get())->get_element(0),
99
0
                    assert_cast<ColumnString*>(result_column.get()),
100
0
                    assert_cast<ColumnUInt8*>(result_null_map_column.get())->get_data(),
101
0
                    input_rows_count);
102
1
        } else {
103
1
            execute_straight(context,
104
1
                             assert_cast<const typename Impl::DataType::ColumnType*>(
105
1
                                     argument_columns[0].get()),
106
1
                             assert_cast<const ColumnInt8*>(argument_columns[1].get()),
107
1
                             assert_cast<const ColumnInt8*>(argument_columns[2].get()),
108
1
                             assert_cast<ColumnString*>(result_column.get()),
109
1
                             assert_cast<ColumnUInt8*>(result_null_map_column.get())->get_data(),
110
1
                             input_rows_count);
111
1
        }
112
113
1
        block.get_by_position(result).column =
114
1
                ColumnNullable::create(std::move(result_column), std::move(result_null_map_column));
115
1
        return Status::OK();
116
1
    }
117
118
private:
119
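    // Returns true when either base is out of bounds, i.e. its absolute value is
    // below MathFunctions::MIN_BASE or above MathFunctions::MAX_BASE.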
120
3
    static bool _check_oob(const Int8 src_base, const Int8 dst_base) {
121
3
        return std::abs(src_base) < MathFunctions::MIN_BASE ||
122
3
               std::abs(src_base) > MathFunctions::MAX_BASE ||
123
3
               std::abs(dst_base) < MathFunctions::MIN_BASE ||
124
3
               std::abs(dst_base) > MathFunctions::MAX_BASE;
125
3
    }
_ZN5doris12FunctionConvINS_13ConvInt64ImplEE10_check_oobEaa
Line
Count
Source
120
2
    static bool _check_oob(const Int8 src_base, const Int8 dst_base) {
121
2
        return std::abs(src_base) < MathFunctions::MIN_BASE ||
122
2
               std::abs(src_base) > MathFunctions::MAX_BASE ||
123
2
               std::abs(dst_base) < MathFunctions::MIN_BASE ||
124
2
               std::abs(dst_base) > MathFunctions::MAX_BASE;
125
2
    }
_ZN5doris12FunctionConvINS_14ConvStringImplEE10_check_oobEaa
Line
Count
Source
120
1
    static bool _check_oob(const Int8 src_base, const Int8 dst_base) {
121
1
        return std::abs(src_base) < MathFunctions::MIN_BASE ||
122
1
               std::abs(src_base) > MathFunctions::MAX_BASE ||
123
1
               std::abs(dst_base) < MathFunctions::MIN_BASE ||
124
1
               std::abs(dst_base) > MathFunctions::MAX_BASE;
125
1
    }
126
    static void execute_straight(FunctionContext* context,
127
                                 const typename Impl::DataType::ColumnType* data_column,
128
                                 const ColumnInt8* src_base_column,
129
                                 const ColumnInt8* dst_base_column, ColumnString* result_column,
130
3
                                 NullMap& result_null_map, size_t input_rows_count) {
131
6
        for (size_t i = 0; i < input_rows_count; i++) {
132
3
            Int8 src_base = src_base_column->get_element(i);
133
3
            Int8 dst_base = dst_base_column->get_element(i);
134
3
            if (_check_oob(src_base, dst_base)) {
135
0
                result_null_map[i] = true;
136
0
                result_column->insert_default();
137
3
            } else {
138
3
                Impl::calculate_cell(context, data_column, src_base, dst_base, result_column,
139
3
                                     result_null_map, i);
140
3
            }
141
3
        }
142
3
    }
_ZN5doris12FunctionConvINS_13ConvInt64ImplEE16execute_straightEPNS_15FunctionContextEPKNS_12ColumnVectorILNS_13PrimitiveTypeE6EEEPKNS5_ILS6_3EEESC_PNS_9ColumnStrIjEERNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEm
Line
Count
Source
130
2
                                 NullMap& result_null_map, size_t input_rows_count) {
131
4
        for (size_t i = 0; i < input_rows_count; i++) {
132
2
            Int8 src_base = src_base_column->get_element(i);
133
2
            Int8 dst_base = dst_base_column->get_element(i);
134
2
            if (_check_oob(src_base, dst_base)) {
135
0
                result_null_map[i] = true;
136
0
                result_column->insert_default();
137
2
            } else {
138
2
                Impl::calculate_cell(context, data_column, src_base, dst_base, result_column,
139
2
                                     result_null_map, i);
140
2
            }
141
2
        }
142
2
    }
_ZN5doris12FunctionConvINS_14ConvStringImplEE16execute_straightEPNS_15FunctionContextEPKNS_9ColumnStrIjEEPKNS_12ColumnVectorILNS_13PrimitiveTypeE3EEESD_PS6_RNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEm
Line
Count
Source
130
1
                                 NullMap& result_null_map, size_t input_rows_count) {
131
2
        for (size_t i = 0; i < input_rows_count; i++) {
132
1
            Int8 src_base = src_base_column->get_element(i);
133
1
            Int8 dst_base = dst_base_column->get_element(i);
134
1
            if (_check_oob(src_base, dst_base)) {
135
0
                result_null_map[i] = true;
136
0
                result_column->insert_default();
137
1
            } else {
138
1
                Impl::calculate_cell(context, data_column, src_base, dst_base, result_column,
139
1
                                     result_null_map, i);
140
1
            }
141
1
        }
142
1
    }
143
    static void execute_scalar_args(FunctionContext* context,
144
                                    const typename Impl::DataType::ColumnType* data_column,
145
                                    const Int8 src_base, const Int8 dst_base,
146
                                    ColumnString* result_column, NullMap& result_null_map,
147
0
                                    size_t input_rows_count) {
148
0
        if (_check_oob(src_base, dst_base)) {
149
0
            result_null_map.assign(input_rows_count, UInt8 {true});
150
0
            result_column->insert_many_defaults(input_rows_count);
151
0
            return;
152
0
        }
153
0
        for (size_t i = 0; i < input_rows_count; i++) {
154
0
            Impl::calculate_cell(context, data_column, src_base, dst_base, result_column,
155
0
                                 result_null_map, i);
156
0
        }
157
0
    }
Unexecuted instantiation: _ZN5doris12FunctionConvINS_13ConvInt64ImplEE19execute_scalar_argsEPNS_15FunctionContextEPKNS_12ColumnVectorILNS_13PrimitiveTypeE6EEEaaPNS_9ColumnStrIjEERNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEm
Unexecuted instantiation: _ZN5doris12FunctionConvINS_14ConvStringImplEE19execute_scalar_argsEPNS_15FunctionContextEPKNS_9ColumnStrIjEEaaPS6_RNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEm
158
};
159
160
struct ConvInt64Impl {
161
    using DataType = DataTypeInt64;
162
163
    static void calculate_cell(FunctionContext* context, const DataType::ColumnType* data_column,
164
                               const Int8 src_base, const Int8 dst_base,
165
                               ColumnString* result_column, NullMap& result_null_map,
166
2
                               size_t index) {
167
2
        Int64 num = data_column->get_element(index);
168
2
        if (src_base < 0 && num >= 0) {
169
0
            result_null_map[index] = true;
170
0
            result_column->insert_default();
171
0
            return;
172
0
        }
173
174
2
        int64_t decimal_num = num;
175
2
        if (src_base != 10) {
176
0
            if (!MathFunctions::decimal_in_base_to_decimal(num, src_base, &decimal_num)) {
177
0
                MathFunctions::handle_parse_result(dst_base, &decimal_num,
178
0
                                                   StringParser::PARSE_OVERFLOW);
179
0
            }
180
0
        }
181
2
        StringRef str = MathFunctions::decimal_to_base(context, decimal_num, dst_base);
182
2
        result_column->insert_data(reinterpret_cast<const char*>(str.data), str.size);
183
2
    }
184
};
185
186
struct ConvStringImpl {
187
    using DataType = DataTypeString;
188
189
    static void calculate_cell(FunctionContext* context, const DataType::ColumnType* data_column,
190
                               const Int8 src_base, const Int8 dst_base,
191
                               ColumnString* result_column, NullMap& result_null_map,
192
1
                               size_t index) {
193
1
        StringRef str = data_column->get_data_at(index);
194
1
        auto new_size = str.size;
195
        // e.g. select conv('1.464868', 10, 2); the result should be 1.
196
        // But StringParser::string_to_int would report PARSE_FAILURE and return 0,
197
        // so the part after the decimal point is cut off first, so that '1.464868' is parsed as the number 1.
198
1
        if (auto pos = str.to_string_view().find_first_of('.'); pos != std::string::npos) {
199
0
            new_size = pos;
200
0
        }
201
1
        StringParser::ParseResult parse_res;
202
        // select conv('ffffffffffffff', 24, 2);
203
        // Parsing 'ffffffffffffff' as int64_t would overflow and yield the max value, std::numeric_limits<int64_t>::max(),
204
        // so parse it as uint64_t instead; the result is still stored in an int64_t, which decimal_to_base can handle.
205
        // If the value overflows uint64_t as well, the max value of uint64_t is returned.
206
1
        int64_t decimal_num =
207
1
                StringParser::string_to_int<uint64_t>(str.data, new_size, src_base, &parse_res);
208
1
        if (src_base < 0 && decimal_num >= 0) {
209
0
            result_null_map[index] = true;
210
0
            result_column->insert_default();
211
0
            return;
212
0
        }
213
214
1
        if (!MathFunctions::handle_parse_result(dst_base, &decimal_num, parse_res)) {
215
0
            result_column->insert_data("0", 1);
216
1
        } else {
217
1
            StringRef str_base = MathFunctions::decimal_to_base(context, decimal_num, dst_base);
218
1
            result_column->insert_data(reinterpret_cast<const char*>(str_base.data), str_base.size);
219
1
        }
220
1
    }
221
};
222
223
1
void register_function_conv(SimpleFunctionFactory& factory) {
224
1
    factory.register_function<FunctionConv<ConvInt64Impl>>();
225
1
    factory.register_function<FunctionConv<ConvStringImpl>>();
226
1
}
227
228
} // namespace doris