Coverage Report

Created: 2026-05-13 03:56

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
be/src/exprs/function/function_conv.cpp
Line
Count
Source
1
// Licensed to the Apache Software Foundation (ASF) under one
2
// or more contributor license agreements.  See the NOTICE file
3
// distributed with this work for additional information
4
// regarding copyright ownership.  The ASF licenses this file
5
// to you under the Apache License, Version 2.0 (the
6
// "License"); you may not use this file except in compliance
7
// with the License.  You may obtain a copy of the License at
8
//
9
//   http://www.apache.org/licenses/LICENSE-2.0
10
//
11
// Unless required by applicable law or agreed to in writing,
12
// software distributed under the License is distributed on an
13
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
// KIND, either express or implied.  See the License for the
15
// specific language governing permissions and limitations
16
// under the License.
17
18
#include <stdint.h>
19
#include <stdlib.h>
20
21
#include <boost/iterator/iterator_facade.hpp>
22
// IWYU pragma: no_include <bits/std_abs.h>
23
#include <algorithm>
24
#include <cmath> // IWYU pragma: keep
25
#include <memory>
26
#include <utility>
27
28
#include "common/status.h"
29
#include "core/assert_cast.h"
30
#include "core/block/block.h"
31
#include "core/block/column_numbers.h"
32
#include "core/block/column_with_type_and_name.h"
33
#include "core/column/column.h"
34
#include "core/column/column_const.h"
35
#include "core/column/column_nullable.h"
36
#include "core/column/column_string.h"
37
#include "core/column/column_vector.h"
38
#include "core/data_type/data_type.h"
39
#include "core/data_type/data_type_nullable.h"
40
#include "core/data_type/data_type_number.h"
41
#include "core/data_type/data_type_string.h"
42
#include "core/string_ref.h"
43
#include "core/types.h"
44
#include "exprs/aggregate/aggregate_function.h"
45
#include "exprs/function/function.h"
46
#include "exprs/function/simple_function_factory.h"
47
#include "exprs/math_functions.h"
48
#include "util/string_parser.hpp"
49
50
namespace doris {
51
class FunctionContext;
52
} // namespace doris
53
54
namespace doris {
55
56
template <typename Impl>
57
class FunctionConv : public IFunction {
58
public:
59
    static constexpr auto name = "conv";
60
2
    String get_name() const override { return name; }
_ZNK5doris12FunctionConvINS_13ConvInt64ImplEE8get_nameB5cxx11Ev
Line
Count
Source
60
1
    String get_name() const override { return name; }
_ZNK5doris12FunctionConvINS_14ConvStringImplEE8get_nameB5cxx11Ev
Line
Count
Source
60
1
    String get_name() const override { return name; }
61
9
    static FunctionPtr create() { return std::make_shared<FunctionConv<Impl>>(); }
_ZN5doris12FunctionConvINS_13ConvInt64ImplEE6createEv
Line
Count
Source
61
5
    static FunctionPtr create() { return std::make_shared<FunctionConv<Impl>>(); }
_ZN5doris12FunctionConvINS_14ConvStringImplEE6createEv
Line
Count
Source
61
4
    static FunctionPtr create() { return std::make_shared<FunctionConv<Impl>>(); }
62
63
5
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
64
5
        return make_nullable(std::make_shared<DataTypeString>());
65
5
    }
_ZNK5doris12FunctionConvINS_13ConvInt64ImplEE20get_return_type_implERKSt6vectorISt10shared_ptrIKNS_9IDataTypeEESaIS7_EE
Line
Count
Source
63
3
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
64
3
        return make_nullable(std::make_shared<DataTypeString>());
65
3
    }
_ZNK5doris12FunctionConvINS_14ConvStringImplEE20get_return_type_implERKSt6vectorISt10shared_ptrIKNS_9IDataTypeEESaIS7_EE
Line
Count
Source
63
2
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
64
2
        return make_nullable(std::make_shared<DataTypeString>());
65
2
    }
66
7
    DataTypes get_variadic_argument_types_impl() const override {
67
7
        return {std::make_shared<typename Impl::DataType>(), std::make_shared<DataTypeInt8>(),
68
7
                std::make_shared<DataTypeInt8>()};
69
7
    }
_ZNK5doris12FunctionConvINS_13ConvInt64ImplEE32get_variadic_argument_types_implEv
Line
Count
Source
66
4
    DataTypes get_variadic_argument_types_impl() const override {
67
4
        return {std::make_shared<typename Impl::DataType>(), std::make_shared<DataTypeInt8>(),
68
4
                std::make_shared<DataTypeInt8>()};
69
4
    }
_ZNK5doris12FunctionConvINS_14ConvStringImplEE32get_variadic_argument_types_implEv
Line
Count
Source
66
3
    DataTypes get_variadic_argument_types_impl() const override {
67
3
        return {std::make_shared<typename Impl::DataType>(), std::make_shared<DataTypeInt8>(),
68
3
                std::make_shared<DataTypeInt8>()};
69
3
    }
70
5
    size_t get_number_of_arguments() const override {
71
5
        return get_variadic_argument_types_impl().size();
72
5
    }
_ZNK5doris12FunctionConvINS_13ConvInt64ImplEE23get_number_of_argumentsEv
Line
Count
Source
70
3
    size_t get_number_of_arguments() const override {
71
3
        return get_variadic_argument_types_impl().size();
72
3
    }
_ZNK5doris12FunctionConvINS_14ConvStringImplEE23get_number_of_argumentsEv
Line
Count
Source
70
2
    size_t get_number_of_arguments() const override {
71
2
        return get_variadic_argument_types_impl().size();
72
2
    }
73
74
    Status execute_impl(FunctionContext* context, Block& block, const ColumnNumbers& arguments,
75
3
                        uint32_t result, size_t input_rows_count) const override {
76
3
        auto result_column = ColumnString::create();
77
3
        auto result_null_map_column = ColumnUInt8::create(input_rows_count, 0);
78
79
3
        bool col_const[3];
80
3
        ColumnPtr argument_columns[3];
81
12
        for (int i = 0; i < 3; ++i) {
82
9
            col_const[i] = is_column_const(*block.get_by_position(arguments[i]).column);
83
9
        }
84
3
        argument_columns[0] = col_const[0] ? static_cast<const ColumnConst&>(
85
0
                                                     *block.get_by_position(arguments[0]).column)
86
0
                                                     .convert_to_full_column()
87
3
                                           : block.get_by_position(arguments[0]).column;
88
89
3
        default_preprocess_parameter_columns(argument_columns, col_const, {1, 2}, block, arguments);
90
91
3
        if (col_const[1] && col_const[2]) {
92
0
            execute_scalar_args(
93
0
                    context,
94
0
                    assert_cast<const typename Impl::DataType::ColumnType*>(
95
0
                            argument_columns[0].get()),
96
0
                    assert_cast<const ColumnInt8*>(argument_columns[1].get())->get_element(0),
97
0
                    assert_cast<const ColumnInt8*>(argument_columns[2].get())->get_element(0),
98
0
                    result_column.get(), result_null_map_column->get_data(), input_rows_count);
99
3
        } else {
100
3
            execute_straight(context,
101
3
                             assert_cast<const typename Impl::DataType::ColumnType*>(
102
3
                                     argument_columns[0].get()),
103
3
                             assert_cast<const ColumnInt8*>(argument_columns[1].get()),
104
3
                             assert_cast<const ColumnInt8*>(argument_columns[2].get()),
105
3
                             result_column.get(), result_null_map_column->get_data(),
106
3
                             input_rows_count);
107
3
        }
108
109
3
        block.get_by_position(result).column =
110
3
                ColumnNullable::create(std::move(result_column), std::move(result_null_map_column));
111
3
        return Status::OK();
112
3
    }
_ZNK5doris12FunctionConvINS_13ConvInt64ImplEE12execute_implEPNS_15FunctionContextERNS_5BlockERKSt6vectorIjSaIjEEjm
Line
Count
Source
75
2
                        uint32_t result, size_t input_rows_count) const override {
76
2
        auto result_column = ColumnString::create();
77
2
        auto result_null_map_column = ColumnUInt8::create(input_rows_count, 0);
78
79
2
        bool col_const[3];
80
2
        ColumnPtr argument_columns[3];
81
8
        for (int i = 0; i < 3; ++i) {
82
6
            col_const[i] = is_column_const(*block.get_by_position(arguments[i]).column);
83
6
        }
84
2
        argument_columns[0] = col_const[0] ? static_cast<const ColumnConst&>(
85
0
                                                     *block.get_by_position(arguments[0]).column)
86
0
                                                     .convert_to_full_column()
87
2
                                           : block.get_by_position(arguments[0]).column;
88
89
2
        default_preprocess_parameter_columns(argument_columns, col_const, {1, 2}, block, arguments);
90
91
2
        if (col_const[1] && col_const[2]) {
92
0
            execute_scalar_args(
93
0
                    context,
94
0
                    assert_cast<const typename Impl::DataType::ColumnType*>(
95
0
                            argument_columns[0].get()),
96
0
                    assert_cast<const ColumnInt8*>(argument_columns[1].get())->get_element(0),
97
0
                    assert_cast<const ColumnInt8*>(argument_columns[2].get())->get_element(0),
98
0
                    result_column.get(), result_null_map_column->get_data(), input_rows_count);
99
2
        } else {
100
2
            execute_straight(context,
101
2
                             assert_cast<const typename Impl::DataType::ColumnType*>(
102
2
                                     argument_columns[0].get()),
103
2
                             assert_cast<const ColumnInt8*>(argument_columns[1].get()),
104
2
                             assert_cast<const ColumnInt8*>(argument_columns[2].get()),
105
2
                             result_column.get(), result_null_map_column->get_data(),
106
2
                             input_rows_count);
107
2
        }
108
109
2
        block.get_by_position(result).column =
110
2
                ColumnNullable::create(std::move(result_column), std::move(result_null_map_column));
111
2
        return Status::OK();
112
2
    }
_ZNK5doris12FunctionConvINS_14ConvStringImplEE12execute_implEPNS_15FunctionContextERNS_5BlockERKSt6vectorIjSaIjEEjm
Line
Count
Source
75
1
                        uint32_t result, size_t input_rows_count) const override {
76
1
        auto result_column = ColumnString::create();
77
1
        auto result_null_map_column = ColumnUInt8::create(input_rows_count, 0);
78
79
1
        bool col_const[3];
80
1
        ColumnPtr argument_columns[3];
81
4
        for (int i = 0; i < 3; ++i) {
82
3
            col_const[i] = is_column_const(*block.get_by_position(arguments[i]).column);
83
3
        }
84
1
        argument_columns[0] = col_const[0] ? static_cast<const ColumnConst&>(
85
0
                                                     *block.get_by_position(arguments[0]).column)
86
0
                                                     .convert_to_full_column()
87
1
                                           : block.get_by_position(arguments[0]).column;
88
89
1
        default_preprocess_parameter_columns(argument_columns, col_const, {1, 2}, block, arguments);
90
91
1
        if (col_const[1] && col_const[2]) {
92
0
            execute_scalar_args(
93
0
                    context,
94
0
                    assert_cast<const typename Impl::DataType::ColumnType*>(
95
0
                            argument_columns[0].get()),
96
0
                    assert_cast<const ColumnInt8*>(argument_columns[1].get())->get_element(0),
97
0
                    assert_cast<const ColumnInt8*>(argument_columns[2].get())->get_element(0),
98
0
                    result_column.get(), result_null_map_column->get_data(), input_rows_count);
99
1
        } else {
100
1
            execute_straight(context,
101
1
                             assert_cast<const typename Impl::DataType::ColumnType*>(
102
1
                                     argument_columns[0].get()),
103
1
                             assert_cast<const ColumnInt8*>(argument_columns[1].get()),
104
1
                             assert_cast<const ColumnInt8*>(argument_columns[2].get()),
105
1
                             result_column.get(), result_null_map_column->get_data(),
106
1
                             input_rows_count);
107
1
        }
108
109
1
        block.get_by_position(result).column =
110
1
                ColumnNullable::create(std::move(result_column), std::move(result_null_map_column));
111
1
        return Status::OK();
112
1
    }
113
114
private:
115
    // Returns true when the absolute value of either base lies outside [MIN_BASE, MAX_BASE].
116
3
    static bool _check_oob(const Int8 src_base, const Int8 dst_base) {
117
3
        return std::abs(src_base) < MathFunctions::MIN_BASE ||
118
3
               std::abs(src_base) > MathFunctions::MAX_BASE ||
119
3
               std::abs(dst_base) < MathFunctions::MIN_BASE ||
120
3
               std::abs(dst_base) > MathFunctions::MAX_BASE;
121
3
    }
_ZN5doris12FunctionConvINS_13ConvInt64ImplEE10_check_oobEaa
Line
Count
Source
116
2
    static bool _check_oob(const Int8 src_base, const Int8 dst_base) {
117
2
        return std::abs(src_base) < MathFunctions::MIN_BASE ||
118
2
               std::abs(src_base) > MathFunctions::MAX_BASE ||
119
2
               std::abs(dst_base) < MathFunctions::MIN_BASE ||
120
2
               std::abs(dst_base) > MathFunctions::MAX_BASE;
121
2
    }
_ZN5doris12FunctionConvINS_14ConvStringImplEE10_check_oobEaa
Line
Count
Source
116
1
    static bool _check_oob(const Int8 src_base, const Int8 dst_base) {
117
1
        return std::abs(src_base) < MathFunctions::MIN_BASE ||
118
1
               std::abs(src_base) > MathFunctions::MAX_BASE ||
119
1
               std::abs(dst_base) < MathFunctions::MIN_BASE ||
120
1
               std::abs(dst_base) > MathFunctions::MAX_BASE;
121
1
    }
122
    static void execute_straight(FunctionContext* context,
123
                                 const typename Impl::DataType::ColumnType* data_column,
124
                                 const ColumnInt8* src_base_column,
125
                                 const ColumnInt8* dst_base_column, ColumnString* result_column,
126
3
                                 NullMap& result_null_map, size_t input_rows_count) {
127
6
        for (size_t i = 0; i < input_rows_count; i++) {
128
3
            Int8 src_base = src_base_column->get_element(i);
129
3
            Int8 dst_base = dst_base_column->get_element(i);
130
3
            if (_check_oob(src_base, dst_base)) {
131
0
                result_null_map[i] = true;
132
0
                result_column->insert_default();
133
3
            } else {
134
3
                Impl::calculate_cell(context, data_column, src_base, dst_base, result_column,
135
3
                                     result_null_map, i);
136
3
            }
137
3
        }
138
3
    }
_ZN5doris12FunctionConvINS_13ConvInt64ImplEE16execute_straightEPNS_15FunctionContextEPKNS_12ColumnVectorILNS_13PrimitiveTypeE6EEEPKNS5_ILS6_3EEESC_PNS_9ColumnStrIjEERNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEm
Line
Count
Source
126
2
                                 NullMap& result_null_map, size_t input_rows_count) {
127
4
        for (size_t i = 0; i < input_rows_count; i++) {
128
2
            Int8 src_base = src_base_column->get_element(i);
129
2
            Int8 dst_base = dst_base_column->get_element(i);
130
2
            if (_check_oob(src_base, dst_base)) {
131
0
                result_null_map[i] = true;
132
0
                result_column->insert_default();
133
2
            } else {
134
2
                Impl::calculate_cell(context, data_column, src_base, dst_base, result_column,
135
2
                                     result_null_map, i);
136
2
            }
137
2
        }
138
2
    }
_ZN5doris12FunctionConvINS_14ConvStringImplEE16execute_straightEPNS_15FunctionContextEPKNS_9ColumnStrIjEEPKNS_12ColumnVectorILNS_13PrimitiveTypeE3EEESD_PS6_RNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEm
Line
Count
Source
126
1
                                 NullMap& result_null_map, size_t input_rows_count) {
127
2
        for (size_t i = 0; i < input_rows_count; i++) {
128
1
            Int8 src_base = src_base_column->get_element(i);
129
1
            Int8 dst_base = dst_base_column->get_element(i);
130
1
            if (_check_oob(src_base, dst_base)) {
131
0
                result_null_map[i] = true;
132
0
                result_column->insert_default();
133
1
            } else {
134
1
                Impl::calculate_cell(context, data_column, src_base, dst_base, result_column,
135
1
                                     result_null_map, i);
136
1
            }
137
1
        }
138
1
    }
139
    static void execute_scalar_args(FunctionContext* context,
140
                                    const typename Impl::DataType::ColumnType* data_column,
141
                                    const Int8 src_base, const Int8 dst_base,
142
                                    ColumnString* result_column, NullMap& result_null_map,
143
0
                                    size_t input_rows_count) {
144
0
        if (_check_oob(src_base, dst_base)) {
145
0
            result_null_map.assign(input_rows_count, UInt8 {true});
146
0
            result_column->insert_many_defaults(input_rows_count);
147
0
            return;
148
0
        }
149
0
        for (size_t i = 0; i < input_rows_count; i++) {
150
0
            Impl::calculate_cell(context, data_column, src_base, dst_base, result_column,
151
0
                                 result_null_map, i);
152
0
        }
153
0
    }
Unexecuted instantiation: _ZN5doris12FunctionConvINS_13ConvInt64ImplEE19execute_scalar_argsEPNS_15FunctionContextEPKNS_12ColumnVectorILNS_13PrimitiveTypeE6EEEaaPNS_9ColumnStrIjEERNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEm
Unexecuted instantiation: _ZN5doris12FunctionConvINS_14ConvStringImplEE19execute_scalar_argsEPNS_15FunctionContextEPKNS_9ColumnStrIjEEaaPS6_RNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEm
154
};
155
156
struct ConvInt64Impl {
157
    using DataType = DataTypeInt64;
158
159
    static void calculate_cell(FunctionContext* context, const DataType::ColumnType* data_column,
160
                               const Int8 src_base, const Int8 dst_base,
161
                               ColumnString* result_column, NullMap& result_null_map,
162
2
                               size_t index) {
163
2
        Int64 num = data_column->get_element(index);
164
2
        if (src_base < 0 && num >= 0) {
165
0
            result_null_map[index] = true;
166
0
            result_column->insert_default();
167
0
            return;
168
0
        }
169
170
2
        int64_t decimal_num = num;
171
2
        if (src_base != 10) {
172
0
            if (!MathFunctions::decimal_in_base_to_decimal(num, src_base, &decimal_num)) {
173
0
                MathFunctions::handle_parse_result(dst_base, &decimal_num,
174
0
                                                   StringParser::PARSE_OVERFLOW);
175
0
            }
176
0
        }
177
2
        StringRef str = MathFunctions::decimal_to_base(context, decimal_num, dst_base);
178
2
        result_column->insert_data(reinterpret_cast<const char*>(str.data), str.size);
179
2
    }
180
};
181
182
struct ConvStringImpl {
183
    using DataType = DataTypeString;
184
185
    static void calculate_cell(FunctionContext* context, const DataType::ColumnType* data_column,
186
                               const Int8 src_base, const Int8 dst_base,
187
                               ColumnString* result_column, NullMap& result_null_map,
188
1
                               size_t index) {
189
1
        StringRef str = data_column->get_data_at(index);
190
1
        auto new_size = str.size;
191
        // e.g. select conv('1.464868', 10, 2); the result should be 1.
192
        // But StringParser::string_to_int would report PARSE_FAILURE and return 0,
193
        // so cut the input at the decimal point first, so that '1.464868' is parsed as the number 1.
194
1
        if (auto pos = str.to_string_view().find_first_of('.'); pos != std::string::npos) {
195
0
            new_size = pos;
196
0
        }
197
1
        StringParser::ParseResult parse_res;
198
        // select conv('ffffffffffffff', 24, 2);
199
        // Parsing 'ffffffffffffff' as int64_t would overflow and yield std::numeric_limits<int64_t>::max(),
200
        // so parse it as uint64_t instead; the result can still be held in an int64_t, since decimal_to_base can handle it.
201
        // But if the value still overflows uint64_t, the result is the maximum uint64_t value.
202
1
        int64_t decimal_num =
203
1
                StringParser::string_to_int<uint64_t>(str.data, new_size, src_base, &parse_res);
204
1
        if (src_base < 0 && decimal_num >= 0) {
205
0
            result_null_map[index] = true;
206
0
            result_column->insert_default();
207
0
            return;
208
0
        }
209
210
1
        if (!MathFunctions::handle_parse_result(dst_base, &decimal_num, parse_res)) {
211
0
            result_column->insert_data("0", 1);
212
1
        } else {
213
1
            StringRef str_base = MathFunctions::decimal_to_base(context, decimal_num, dst_base);
214
1
            result_column->insert_data(reinterpret_cast<const char*>(str_base.data), str_base.size);
215
1
        }
216
1
    }
217
};
218
219
1
void register_function_conv(SimpleFunctionFactory& factory) {
220
1
    factory.register_function<FunctionConv<ConvInt64Impl>>();
221
1
    factory.register_function<FunctionConv<ConvStringImpl>>();
222
1
}
223
224
} // namespace doris