Coverage Report

Created: 2026-04-14 10:14

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
be/src/exprs/function/function_conv.cpp
Line
Count
Source
1
// Licensed to the Apache Software Foundation (ASF) under one
2
// or more contributor license agreements.  See the NOTICE file
3
// distributed with this work for additional information
4
// regarding copyright ownership.  The ASF licenses this file
5
// to you under the Apache License, Version 2.0 (the
6
// "License"); you may not use this file except in compliance
7
// with the License.  You may obtain a copy of the License at
8
//
9
//   http://www.apache.org/licenses/LICENSE-2.0
10
//
11
// Unless required by applicable law or agreed to in writing,
12
// software distributed under the License is distributed on an
13
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
// KIND, either express or implied.  See the License for the
15
// specific language governing permissions and limitations
16
// under the License.
17
18
#include <stdint.h>
19
#include <stdlib.h>
20
21
#include <boost/iterator/iterator_facade.hpp>
22
// IWYU pragma: no_include <bits/std_abs.h>
23
#include <algorithm>
24
#include <cmath> // IWYU pragma: keep
25
#include <memory>
26
#include <utility>
27
28
#include "common/status.h"
29
#include "core/assert_cast.h"
30
#include "core/block/block.h"
31
#include "core/block/column_numbers.h"
32
#include "core/block/column_with_type_and_name.h"
33
#include "core/column/column.h"
34
#include "core/column/column_const.h"
35
#include "core/column/column_nullable.h"
36
#include "core/column/column_string.h"
37
#include "core/column/column_vector.h"
38
#include "core/data_type/data_type.h"
39
#include "core/data_type/data_type_nullable.h"
40
#include "core/data_type/data_type_number.h"
41
#include "core/data_type/data_type_string.h"
42
#include "core/string_ref.h"
43
#include "core/types.h"
44
#include "exprs/aggregate/aggregate_function.h"
45
#include "exprs/function/function.h"
46
#include "exprs/function/simple_function_factory.h"
47
#include "exprs/math_functions.h"
48
#include "util/string_parser.hpp"
49
50
namespace doris {
51
class FunctionContext;
52
} // namespace doris
53
54
namespace doris {
55
56
template <typename Impl>
57
class FunctionConv : public IFunction {
58
public:
59
    static constexpr auto name = "conv";
60
2
    String get_name() const override { return name; }
_ZNK5doris12FunctionConvINS_13ConvInt64ImplEE8get_nameB5cxx11Ev
Line
Count
Source
60
1
    String get_name() const override { return name; }
_ZNK5doris12FunctionConvINS_14ConvStringImplEE8get_nameB5cxx11Ev
Line
Count
Source
60
1
    String get_name() const override { return name; }
61
78
    static FunctionPtr create() { return std::make_shared<FunctionConv<Impl>>(); }
_ZN5doris12FunctionConvINS_13ConvInt64ImplEE6createEv
Line
Count
Source
61
40
    static FunctionPtr create() { return std::make_shared<FunctionConv<Impl>>(); }
_ZN5doris12FunctionConvINS_14ConvStringImplEE6createEv
Line
Count
Source
61
38
    static FunctionPtr create() { return std::make_shared<FunctionConv<Impl>>(); }
62
63
60
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
64
60
        return make_nullable(std::make_shared<DataTypeString>());
65
60
    }
_ZNK5doris12FunctionConvINS_13ConvInt64ImplEE20get_return_type_implERKSt6vectorISt10shared_ptrIKNS_9IDataTypeEESaIS7_EE
Line
Count
Source
63
31
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
64
31
        return make_nullable(std::make_shared<DataTypeString>());
65
31
    }
_ZNK5doris12FunctionConvINS_14ConvStringImplEE20get_return_type_implERKSt6vectorISt10shared_ptrIKNS_9IDataTypeEESaIS7_EE
Line
Count
Source
63
29
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
64
29
        return make_nullable(std::make_shared<DataTypeString>());
65
29
    }
66
76
    DataTypes get_variadic_argument_types_impl() const override {
67
76
        return {std::make_shared<typename Impl::DataType>(), std::make_shared<DataTypeInt8>(),
68
76
                std::make_shared<DataTypeInt8>()};
69
76
    }
_ZNK5doris12FunctionConvINS_13ConvInt64ImplEE32get_variadic_argument_types_implEv
Line
Count
Source
66
39
    DataTypes get_variadic_argument_types_impl() const override {
67
39
        return {std::make_shared<typename Impl::DataType>(), std::make_shared<DataTypeInt8>(),
68
39
                std::make_shared<DataTypeInt8>()};
69
39
    }
_ZNK5doris12FunctionConvINS_14ConvStringImplEE32get_variadic_argument_types_implEv
Line
Count
Source
66
37
    DataTypes get_variadic_argument_types_impl() const override {
67
37
        return {std::make_shared<typename Impl::DataType>(), std::make_shared<DataTypeInt8>(),
68
37
                std::make_shared<DataTypeInt8>()};
69
37
    }
70
60
    size_t get_number_of_arguments() const override {
71
60
        return get_variadic_argument_types_impl().size();
72
60
    }
_ZNK5doris12FunctionConvINS_13ConvInt64ImplEE23get_number_of_argumentsEv
Line
Count
Source
70
31
    size_t get_number_of_arguments() const override {
71
31
        return get_variadic_argument_types_impl().size();
72
31
    }
_ZNK5doris12FunctionConvINS_14ConvStringImplEE23get_number_of_argumentsEv
Line
Count
Source
70
29
    size_t get_number_of_arguments() const override {
71
29
        return get_variadic_argument_types_impl().size();
72
29
    }
73
74
    Status execute_impl(FunctionContext* context, Block& block, const ColumnNumbers& arguments,
75
61
                        uint32_t result, size_t input_rows_count) const override {
76
61
        auto result_column = ColumnString::create();
77
61
        auto result_null_map_column = ColumnUInt8::create(input_rows_count, 0);
78
79
61
        bool col_const[3];
80
61
        ColumnPtr argument_columns[3];
81
244
        for (int i = 0; i < 3; ++i) {
82
183
            col_const[i] = is_column_const(*block.get_by_position(arguments[i]).column);
83
183
        }
84
61
        argument_columns[0] = col_const[0] ? static_cast<const ColumnConst&>(
85
0
                                                     *block.get_by_position(arguments[0]).column)
86
0
                                                     .convert_to_full_column()
87
61
                                           : block.get_by_position(arguments[0]).column;
88
89
61
        default_preprocess_parameter_columns(argument_columns, col_const, {1, 2}, block, arguments);
90
91
61
        if (col_const[1] && col_const[2]) {
92
2
            execute_scalar_args(
93
2
                    context,
94
2
                    assert_cast<const typename Impl::DataType::ColumnType*>(
95
2
                            argument_columns[0].get()),
96
2
                    assert_cast<const ColumnInt8*>(argument_columns[1].get())->get_element(0),
97
2
                    assert_cast<const ColumnInt8*>(argument_columns[2].get())->get_element(0),
98
2
                    assert_cast<ColumnString*>(result_column.get()),
99
2
                    assert_cast<ColumnUInt8*>(result_null_map_column.get())->get_data(),
100
2
                    input_rows_count);
101
59
        } else {
102
59
            execute_straight(context,
103
59
                             assert_cast<const typename Impl::DataType::ColumnType*>(
104
59
                                     argument_columns[0].get()),
105
59
                             assert_cast<const ColumnInt8*>(argument_columns[1].get()),
106
59
                             assert_cast<const ColumnInt8*>(argument_columns[2].get()),
107
59
                             assert_cast<ColumnString*>(result_column.get()),
108
59
                             assert_cast<ColumnUInt8*>(result_null_map_column.get())->get_data(),
109
59
                             input_rows_count);
110
59
        }
111
112
61
        block.get_by_position(result).column =
113
61
                ColumnNullable::create(std::move(result_column), std::move(result_null_map_column));
114
61
        return Status::OK();
115
61
    }
_ZNK5doris12FunctionConvINS_13ConvInt64ImplEE12execute_implEPNS_15FunctionContextERNS_5BlockERKSt6vectorIjSaIjEEjm
Line
Count
Source
75
22
                        uint32_t result, size_t input_rows_count) const override {
76
22
        auto result_column = ColumnString::create();
77
22
        auto result_null_map_column = ColumnUInt8::create(input_rows_count, 0);
78
79
22
        bool col_const[3];
80
22
        ColumnPtr argument_columns[3];
81
88
        for (int i = 0; i < 3; ++i) {
82
66
            col_const[i] = is_column_const(*block.get_by_position(arguments[i]).column);
83
66
        }
84
22
        argument_columns[0] = col_const[0] ? static_cast<const ColumnConst&>(
85
0
                                                     *block.get_by_position(arguments[0]).column)
86
0
                                                     .convert_to_full_column()
87
22
                                           : block.get_by_position(arguments[0]).column;
88
89
22
        default_preprocess_parameter_columns(argument_columns, col_const, {1, 2}, block, arguments);
90
91
22
        if (col_const[1] && col_const[2]) {
92
0
            execute_scalar_args(
93
0
                    context,
94
0
                    assert_cast<const typename Impl::DataType::ColumnType*>(
95
0
                            argument_columns[0].get()),
96
0
                    assert_cast<const ColumnInt8*>(argument_columns[1].get())->get_element(0),
97
0
                    assert_cast<const ColumnInt8*>(argument_columns[2].get())->get_element(0),
98
0
                    assert_cast<ColumnString*>(result_column.get()),
99
0
                    assert_cast<ColumnUInt8*>(result_null_map_column.get())->get_data(),
100
0
                    input_rows_count);
101
22
        } else {
102
22
            execute_straight(context,
103
22
                             assert_cast<const typename Impl::DataType::ColumnType*>(
104
22
                                     argument_columns[0].get()),
105
22
                             assert_cast<const ColumnInt8*>(argument_columns[1].get()),
106
22
                             assert_cast<const ColumnInt8*>(argument_columns[2].get()),
107
22
                             assert_cast<ColumnString*>(result_column.get()),
108
22
                             assert_cast<ColumnUInt8*>(result_null_map_column.get())->get_data(),
109
22
                             input_rows_count);
110
22
        }
111
112
22
        block.get_by_position(result).column =
113
22
                ColumnNullable::create(std::move(result_column), std::move(result_null_map_column));
114
22
        return Status::OK();
115
22
    }
_ZNK5doris12FunctionConvINS_14ConvStringImplEE12execute_implEPNS_15FunctionContextERNS_5BlockERKSt6vectorIjSaIjEEjm
Line
Count
Source
75
39
                        uint32_t result, size_t input_rows_count) const override {
76
39
        auto result_column = ColumnString::create();
77
39
        auto result_null_map_column = ColumnUInt8::create(input_rows_count, 0);
78
79
39
        bool col_const[3];
80
39
        ColumnPtr argument_columns[3];
81
156
        for (int i = 0; i < 3; ++i) {
82
117
            col_const[i] = is_column_const(*block.get_by_position(arguments[i]).column);
83
117
        }
84
39
        argument_columns[0] = col_const[0] ? static_cast<const ColumnConst&>(
85
0
                                                     *block.get_by_position(arguments[0]).column)
86
0
                                                     .convert_to_full_column()
87
39
                                           : block.get_by_position(arguments[0]).column;
88
89
39
        default_preprocess_parameter_columns(argument_columns, col_const, {1, 2}, block, arguments);
90
91
39
        if (col_const[1] && col_const[2]) {
92
2
            execute_scalar_args(
93
2
                    context,
94
2
                    assert_cast<const typename Impl::DataType::ColumnType*>(
95
2
                            argument_columns[0].get()),
96
2
                    assert_cast<const ColumnInt8*>(argument_columns[1].get())->get_element(0),
97
2
                    assert_cast<const ColumnInt8*>(argument_columns[2].get())->get_element(0),
98
2
                    assert_cast<ColumnString*>(result_column.get()),
99
2
                    assert_cast<ColumnUInt8*>(result_null_map_column.get())->get_data(),
100
2
                    input_rows_count);
101
37
        } else {
102
37
            execute_straight(context,
103
37
                             assert_cast<const typename Impl::DataType::ColumnType*>(
104
37
                                     argument_columns[0].get()),
105
37
                             assert_cast<const ColumnInt8*>(argument_columns[1].get()),
106
37
                             assert_cast<const ColumnInt8*>(argument_columns[2].get()),
107
37
                             assert_cast<ColumnString*>(result_column.get()),
108
37
                             assert_cast<ColumnUInt8*>(result_null_map_column.get())->get_data(),
109
37
                             input_rows_count);
110
37
        }
111
112
39
        block.get_by_position(result).column =
113
39
                ColumnNullable::create(std::move(result_column), std::move(result_null_map_column));
114
39
        return Status::OK();
115
39
    }
116
117
private:
118
    // check out of bound.
119
112
    static bool _check_oob(const Int8 src_base, const Int8 dst_base) {
120
112
        return std::abs(src_base) < MathFunctions::MIN_BASE ||
121
112
               std::abs(src_base) > MathFunctions::MAX_BASE ||
122
112
               std::abs(dst_base) < MathFunctions::MIN_BASE ||
123
112
               std::abs(dst_base) > MathFunctions::MAX_BASE;
124
112
    }
_ZN5doris12FunctionConvINS_13ConvInt64ImplEE10_check_oobEaa
Line
Count
Source
119
39
    static bool _check_oob(const Int8 src_base, const Int8 dst_base) {
120
39
        return std::abs(src_base) < MathFunctions::MIN_BASE ||
121
39
               std::abs(src_base) > MathFunctions::MAX_BASE ||
122
39
               std::abs(dst_base) < MathFunctions::MIN_BASE ||
123
39
               std::abs(dst_base) > MathFunctions::MAX_BASE;
124
39
    }
_ZN5doris12FunctionConvINS_14ConvStringImplEE10_check_oobEaa
Line
Count
Source
119
73
    static bool _check_oob(const Int8 src_base, const Int8 dst_base) {
120
73
        return std::abs(src_base) < MathFunctions::MIN_BASE ||
121
73
               std::abs(src_base) > MathFunctions::MAX_BASE ||
122
73
               std::abs(dst_base) < MathFunctions::MIN_BASE ||
123
73
               std::abs(dst_base) > MathFunctions::MAX_BASE;
124
73
    }
125
    static void execute_straight(FunctionContext* context,
126
                                 const typename Impl::DataType::ColumnType* data_column,
127
                                 const ColumnInt8* src_base_column,
128
                                 const ColumnInt8* dst_base_column, ColumnString* result_column,
129
59
                                 NullMap& result_null_map, size_t input_rows_count) {
130
169
        for (size_t i = 0; i < input_rows_count; i++) {
131
110
            Int8 src_base = src_base_column->get_element(i);
132
110
            Int8 dst_base = dst_base_column->get_element(i);
133
110
            if (_check_oob(src_base, dst_base)) {
134
9
                result_null_map[i] = true;
135
9
                result_column->insert_default();
136
101
            } else {
137
101
                Impl::calculate_cell(context, data_column, src_base, dst_base, result_column,
138
101
                                     result_null_map, i);
139
101
            }
140
110
        }
141
59
    }
_ZN5doris12FunctionConvINS_13ConvInt64ImplEE16execute_straightEPNS_15FunctionContextEPKNS_12ColumnVectorILNS_13PrimitiveTypeE6EEEPKNS5_ILS6_3EEESC_PNS_9ColumnStrIjEERNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEm
Line
Count
Source
129
22
                                 NullMap& result_null_map, size_t input_rows_count) {
130
61
        for (size_t i = 0; i < input_rows_count; i++) {
131
39
            Int8 src_base = src_base_column->get_element(i);
132
39
            Int8 dst_base = dst_base_column->get_element(i);
133
39
            if (_check_oob(src_base, dst_base)) {
134
3
                result_null_map[i] = true;
135
3
                result_column->insert_default();
136
36
            } else {
137
36
                Impl::calculate_cell(context, data_column, src_base, dst_base, result_column,
138
36
                                     result_null_map, i);
139
36
            }
140
39
        }
141
22
    }
_ZN5doris12FunctionConvINS_14ConvStringImplEE16execute_straightEPNS_15FunctionContextEPKNS_9ColumnStrIjEEPKNS_12ColumnVectorILNS_13PrimitiveTypeE3EEESD_PS6_RNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEm
Line
Count
Source
129
37
                                 NullMap& result_null_map, size_t input_rows_count) {
130
108
        for (size_t i = 0; i < input_rows_count; i++) {
131
71
            Int8 src_base = src_base_column->get_element(i);
132
71
            Int8 dst_base = dst_base_column->get_element(i);
133
71
            if (_check_oob(src_base, dst_base)) {
134
6
                result_null_map[i] = true;
135
6
                result_column->insert_default();
136
65
            } else {
137
65
                Impl::calculate_cell(context, data_column, src_base, dst_base, result_column,
138
65
                                     result_null_map, i);
139
65
            }
140
71
        }
141
37
    }
142
    static void execute_scalar_args(FunctionContext* context,
143
                                    const typename Impl::DataType::ColumnType* data_column,
144
                                    const Int8 src_base, const Int8 dst_base,
145
                                    ColumnString* result_column, NullMap& result_null_map,
146
2
                                    size_t input_rows_count) {
147
2
        if (_check_oob(src_base, dst_base)) {
148
0
            result_null_map.assign(input_rows_count, UInt8 {true});
149
0
            result_column->insert_many_defaults(input_rows_count);
150
0
            return;
151
0
        }
152
10
        for (size_t i = 0; i < input_rows_count; i++) {
153
8
            Impl::calculate_cell(context, data_column, src_base, dst_base, result_column,
154
8
                                 result_null_map, i);
155
8
        }
156
2
    }
Unexecuted instantiation: _ZN5doris12FunctionConvINS_13ConvInt64ImplEE19execute_scalar_argsEPNS_15FunctionContextEPKNS_12ColumnVectorILNS_13PrimitiveTypeE6EEEaaPNS_9ColumnStrIjEERNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEm
_ZN5doris12FunctionConvINS_14ConvStringImplEE19execute_scalar_argsEPNS_15FunctionContextEPKNS_9ColumnStrIjEEaaPS6_RNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEm
Line
Count
Source
146
2
                                    size_t input_rows_count) {
147
2
        if (_check_oob(src_base, dst_base)) {
148
0
            result_null_map.assign(input_rows_count, UInt8 {true});
149
0
            result_column->insert_many_defaults(input_rows_count);
150
0
            return;
151
0
        }
152
10
        for (size_t i = 0; i < input_rows_count; i++) {
153
8
            Impl::calculate_cell(context, data_column, src_base, dst_base, result_column,
154
8
                                 result_null_map, i);
155
8
        }
156
2
    }
157
};
158
159
struct ConvInt64Impl {
160
    using DataType = DataTypeInt64;
161
162
    static void calculate_cell(FunctionContext* context, const DataType::ColumnType* data_column,
163
                               const Int8 src_base, const Int8 dst_base,
164
                               ColumnString* result_column, NullMap& result_null_map,
165
36
                               size_t index) {
166
36
        Int64 num = data_column->get_element(index);
167
36
        if (src_base < 0 && num >= 0) {
168
0
            result_null_map[index] = true;
169
0
            result_column->insert_default();
170
0
            return;
171
0
        }
172
173
36
        int64_t decimal_num = num;
174
36
        if (src_base != 10) {
175
22
            if (!MathFunctions::decimal_in_base_to_decimal(num, src_base, &decimal_num)) {
176
0
                MathFunctions::handle_parse_result(dst_base, &decimal_num,
177
0
                                                   StringParser::PARSE_OVERFLOW);
178
0
            }
179
22
        }
180
36
        StringRef str = MathFunctions::decimal_to_base(context, decimal_num, dst_base);
181
36
        result_column->insert_data(reinterpret_cast<const char*>(str.data), str.size);
182
36
    }
183
};
184
185
struct ConvStringImpl {
186
    using DataType = DataTypeString;
187
188
    static void calculate_cell(FunctionContext* context, const DataType::ColumnType* data_column,
189
                               const Int8 src_base, const Int8 dst_base,
190
                               ColumnString* result_column, NullMap& result_null_map,
191
73
                               size_t index) {
192
73
        StringRef str = data_column->get_data_at(index);
193
73
        auto new_size = str.size;
194
        // eg: select conv('1.464868',10,2); the result should be return 1.
195
        // But StringParser::string_to_int will PARSE_FAILURE and return 0,
196
        // so should handle the point part of number firstly if need convert '1.464868' to number 1
197
73
        if (auto pos = str.to_string_view().find_first_of('.'); pos != std::string::npos) {
198
3
            new_size = pos;
199
3
        }
200
73
        StringParser::ParseResult parse_res;
201
        // select conv('ffffffffffffff', 24, 2);
202
        // if 'ffffffffffffff' parse as int64_t will be overflow, will be get max value: std::numeric_limits<int64_t>::max()
203
        // so change it parse as uint64_t, and return value could still use int64_t, in function decimal_to_base could handle it.
204
        // But if the value is still overflow in uint64_t, will get max value of uint64_t
205
73
        int64_t decimal_num =
206
73
                StringParser::string_to_int<uint64_t>(str.data, new_size, src_base, &parse_res);
207
73
        if (src_base < 0 && decimal_num >= 0) {
208
0
            result_null_map[index] = true;
209
0
            result_column->insert_default();
210
0
            return;
211
0
        }
212
213
73
        if (!MathFunctions::handle_parse_result(dst_base, &decimal_num, parse_res)) {
214
2
            result_column->insert_data("0", 1);
215
71
        } else {
216
71
            StringRef str_base = MathFunctions::decimal_to_base(context, decimal_num, dst_base);
217
71
            result_column->insert_data(reinterpret_cast<const char*>(str_base.data), str_base.size);
218
71
        }
219
73
    }
220
};
221
222
8
void register_function_conv(SimpleFunctionFactory& factory) {
223
8
    factory.register_function<FunctionConv<ConvInt64Impl>>();
224
8
    factory.register_function<FunctionConv<ConvStringImpl>>();
225
8
}
226
227
} // namespace doris