Coverage Report

Created: 2026-04-22 18:58

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
be/src/exprs/vcast_expr.cpp
Line
Count
Source
1
// Licensed to the Apache Software Foundation (ASF) under one
2
// or more contributor license agreements.  See the NOTICE file
3
// distributed with this work for additional information
4
// regarding copyright ownership.  The ASF licenses this file
5
// to you under the Apache License, Version 2.0 (the
6
// "License"); you may not use this file except in compliance
7
// with the License.  You may obtain a copy of the License at
8
//
9
//   http://www.apache.org/licenses/LICENSE-2.0
10
//
11
// Unless required by applicable law or agreed to in writing,
12
// software distributed under the License is distributed on an
13
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
// KIND, either express or implied.  See the License for the
15
// specific language governing permissions and limitations
16
// under the License.
17
18
#include "exprs/vcast_expr.h"
19
20
#include <fmt/format.h>
21
#include <gen_cpp/Types_types.h>
22
#include <glog/logging.h>
23
24
#include <cstddef>
25
#include <memory>
26
#include <ostream>
27
28
#include "common/exception.h"
29
#include "common/status.h"
30
#include "core/assert_cast.h"
31
#include "core/block/block.h"
32
#include "core/block/column_with_type_and_name.h"
33
#include "core/block/columns_with_type_and_name.h"
34
#include "core/column/column.h"
35
#include "core/column/column_nullable.h"
36
#include "core/data_type/data_type_nullable.h"
37
#include "exprs/function/simple_function_factory.h"
38
#include "exprs/vexpr.h"
39
#include "exprs/vexpr_context.h"
40
#include "runtime/runtime_state.h"
41
42
namespace doris {
43
class RowDescriptor;
44
class RuntimeState;
45
} // namespace doris
46
47
namespace doris {
48
49
doris::Status VCastExpr::prepare(doris::RuntimeState* state, const doris::RowDescriptor& desc,
50
2
                                 VExprContext* context) {
51
2
    RETURN_IF_ERROR_OR_PREPARED(VExpr::prepare(state, desc, context));
52
53
2
    DCHECK_EQ(_children.size(), 1);
54
2
    auto child = _children[0];
55
2
    const auto& child_name = child->expr_name();
56
57
    // create a const string column
58
2
    _target_data_type = _data_type;
59
    // TODO(xy): support return struct type name
60
2
    _target_data_type_name = _target_data_type->get_name();
61
    // Using typeindex to indicate the datatype, not using type name because
62
    // type name is not stable, but type index is stable and immutable
63
2
    _cast_param_data_type = _target_data_type;
64
65
2
    ColumnsWithTypeAndName argument_template;
66
2
    argument_template.reserve(2);
67
2
    argument_template.emplace_back(nullptr, child->data_type(), child_name);
68
2
    argument_template.emplace_back(nullptr, _cast_param_data_type, _target_data_type_name);
69
2
    _function = SimpleFunctionFactory::instance().get_function(function_name, argument_template,
70
2
                                                               _data_type, {});
71
72
2
    if (_function == nullptr) {
73
0
        return Status::NotSupported("Cast from {} to {} is not implemented",
74
0
                                    child->data_type()->get_name(), _target_data_type_name);
75
0
    }
76
2
    VExpr::register_function_context(state, context);
77
2
    _expr_name = fmt::format("({} {}({}) TO {})", cast_name(), child_name,
78
2
                             child->data_type()->get_name(), _target_data_type_name);
79
2
    _prepare_finished = true;
80
2
    return Status::OK();
81
2
}
82
83
0
const DataTypePtr& VCastExpr::get_target_type() const {
84
0
    return _target_data_type;
85
0
}
86
87
doris::Status VCastExpr::open(doris::RuntimeState* state, VExprContext* context,
88
0
                              FunctionContext::FunctionStateScope scope) {
89
0
    DCHECK(_prepare_finished);
90
0
    for (auto& i : _children) {
91
0
        RETURN_IF_ERROR(i->open(state, context, scope));
92
0
    }
93
0
    RETURN_IF_ERROR(VExpr::init_function_context(state, context, scope, _function));
94
0
    if (scope == FunctionContext::FRAGMENT_LOCAL) {
95
0
        RETURN_IF_ERROR(VExpr::get_const_col(context, nullptr));
96
0
    }
97
0
    _open_finished = true;
98
0
    return Status::OK();
99
0
}
100
101
0
void VCastExpr::close(VExprContext* context, FunctionContext::FunctionStateScope scope) {
102
0
    VExpr::close_function_context(context, scope, _function);
103
0
    VExpr::close(context, scope);
104
0
}
105
106
Status VCastExpr::execute_column_impl(VExprContext* context, const Block* block,
107
                                      const Selector* selector, size_t count,
108
0
                                      ColumnPtr& result_column) const {
109
0
    DCHECK(_open_finished || block == nullptr) << _open_finished << _expr_name;
110
0
    if (is_const_and_have_executed()) { // const have executed in open function
111
0
        result_column = get_result_from_const(count);
112
0
        return Status::OK();
113
0
    }
114
    // for each child call execute
115
116
0
    ColumnPtr from_column;
117
0
    RETURN_IF_ERROR(_children[0]->execute_column(context, block, selector, count, from_column));
118
119
0
    Block temp_block;
120
0
    temp_block.insert({from_column, _children[0]->execute_type(block), _children[0]->expr_name()});
121
0
    temp_block.insert({nullptr, _data_type, _expr_name});
122
0
    RETURN_IF_ERROR(_function->execute(context->fn_context(_fn_context_index), temp_block, {0}, 1,
123
0
                                       temp_block.rows()));
124
125
0
    result_column = temp_block.get_by_position(1).column;
126
0
    DCHECK_EQ(result_column->size(), count);
127
0
    return Status::OK();
128
0
}
129
130
7
bool cast_error_code(Status& st) {
131
    //There may be more error codes that need to be captured by try cast in the future.
132
7
    if (st.is<ErrorCode::INVALID_ARGUMENT>()) {
133
5
        return true;
134
5
    } else {
135
2
        return false;
136
2
    }
137
7
}
138
139
13
DataTypePtr TryCastExpr::original_cast_return_type() const {
140
13
    if (_original_cast_return_is_nullable) {
141
7
        return _data_type;
142
7
    } else {
143
6
        return remove_nullable(_data_type);
144
6
    }
145
13
}
146
147
Status TryCastExpr::execute_column_impl(VExprContext* context, const Block* block,
148
                                        const Selector* selector, size_t count,
149
6
                                        ColumnPtr& result_column) const {
150
6
    DCHECK(_open_finished || block == nullptr) << _open_finished << _expr_name;
151
6
    if (is_const_and_have_executed()) { // const have executed in open function
152
0
        result_column = get_result_from_const(count);
153
0
        return Status::OK();
154
0
    }
155
156
    // For try_cast, try to execute it in batches first.
157
158
    // execute child first
159
160
6
    ColumnPtr from_column;
161
6
    RETURN_IF_ERROR(_children[0]->execute_column(context, block, selector, count, from_column));
162
6
    auto from_type = _children[0]->execute_type(block);
163
164
    // prepare block
165
166
6
    Block temp_block;
167
6
    temp_block.insert({from_column, from_type, _children[0]->expr_name()});
168
6
    temp_block.insert({nullptr, original_cast_return_type(), _expr_name});
169
170
    // batch execute
171
6
    auto batch_exec_status = _function->execute(context->fn_context(_fn_context_index), temp_block,
172
6
                                                {0}, 1, temp_block.rows());
173
    // If batch is executed successfully,
174
    // it means that there is no error and it will be returned directly.
175
6
    if (batch_exec_status.ok()) {
176
2
        result_column = temp_block.get_by_position(1).column;
177
2
        result_column = make_nullable(result_column);
178
2
        return batch_exec_status;
179
2
    }
180
181
    // If there is an error that cannot be handled by try cast, it will be returned directly.
182
4
    if (!cast_error_code(batch_exec_status)) {
183
1
        return batch_exec_status;
184
1
    }
185
186
    // If there is an error that can be handled by try cast,
187
    // it will be converted into line execution.
188
3
    ColumnWithTypeAndName input_info {from_column, from_type, _children[0]->expr_name()};
189
    // distinguish whether the return value of the original cast is nullable
190
3
    if (_original_cast_return_is_nullable) {
191
2
        RETURN_IF_ERROR(single_row_execute<true>(context, input_info, result_column));
192
2
    } else {
193
1
        RETURN_IF_ERROR(single_row_execute<false>(context, input_info, result_column));
194
1
    }
195
    // wrap nullable
196
2
    result_column = make_nullable(result_column);
197
2
    DCHECK_EQ(result_column->size(), count);
198
199
2
    return Status::OK();
200
3
}
201
202
template <bool original_cast_reutrn_is_nullable>
203
Status TryCastExpr::single_row_execute(VExprContext* context,
204
                                       const ColumnWithTypeAndName& input_info,
205
3
                                       ColumnPtr& return_column) const {
206
3
    auto input_column = input_info.column;
207
3
    const auto& input_type = input_info.type;
208
3
    const auto& input_name = input_info.name;
209
3
    auto result_column = _data_type->create_column();
210
211
3
    ColumnNullable& result_null_column = assert_cast<ColumnNullable&>(*result_column);
212
213
3
    IColumn& result_nested_column = result_null_column.get_nested_column();
214
3
    auto& result_null_map_data = result_null_column.get_null_map_data();
215
216
4
    auto insert_from_single_row = [&](const IColumn& single_exec_column, size_t row) {
217
4
        DCHECK_EQ(single_exec_column.size(), 1);
218
4
        if constexpr (original_cast_reutrn_is_nullable) {
219
2
            result_null_column.insert_from(single_exec_column, 0);
220
2
        } else {
221
2
            DCHECK(!single_exec_column.is_nullable());
222
2
            result_nested_column.insert_from(single_exec_column, 0);
223
2
            result_null_map_data.push_back(0);
224
2
        }
225
4
    };
_ZZNK5doris11TryCastExpr18single_row_executeILb1EEENS_6StatusEPNS_12VExprContextERKNS_21ColumnWithTypeAndNameERNS_3COWINS_7IColumnEE13immutable_ptrIS9_EEENKUlRKS9_mE_clESF_m
Line
Count
Source
216
2
    auto insert_from_single_row = [&](const IColumn& single_exec_column, size_t row) {
217
2
        DCHECK_EQ(single_exec_column.size(), 1);
218
2
        if constexpr (original_cast_reutrn_is_nullable) {
219
2
            result_null_column.insert_from(single_exec_column, 0);
220
        } else {
221
            DCHECK(!single_exec_column.is_nullable());
222
            result_nested_column.insert_from(single_exec_column, 0);
223
            result_null_map_data.push_back(0);
224
        }
225
2
    };
_ZZNK5doris11TryCastExpr18single_row_executeILb0EEENS_6StatusEPNS_12VExprContextERKNS_21ColumnWithTypeAndNameERNS_3COWINS_7IColumnEE13immutable_ptrIS9_EEENKUlRKS9_mE_clESF_m
Line
Count
Source
216
2
    auto insert_from_single_row = [&](const IColumn& single_exec_column, size_t row) {
217
2
        DCHECK_EQ(single_exec_column.size(), 1);
218
        if constexpr (original_cast_reutrn_is_nullable) {
219
            result_null_column.insert_from(single_exec_column, 0);
220
2
        } else {
221
            DCHECK(!single_exec_column.is_nullable());
222
2
            result_nested_column.insert_from(single_exec_column, 0);
223
2
            result_null_map_data.push_back(0);
224
2
        }
225
2
    };
226
227
3
    auto insert_null = [&](size_t row) { result_null_column.insert_default(); };
_ZZNK5doris11TryCastExpr18single_row_executeILb1EEENS_6StatusEPNS_12VExprContextERKNS_21ColumnWithTypeAndNameERNS_3COWINS_7IColumnEE13immutable_ptrIS9_EEENKUlmE_clEm
Line
Count
Source
227
1
    auto insert_null = [&](size_t row) { result_null_column.insert_default(); };
_ZZNK5doris11TryCastExpr18single_row_executeILb0EEENS_6StatusEPNS_12VExprContextERKNS_21ColumnWithTypeAndNameERNS_3COWINS_7IColumnEE13immutable_ptrIS9_EEENKUlmE_clEm
Line
Count
Source
227
1
    auto insert_null = [&](size_t row) { result_null_column.insert_default(); };
228
229
3
    const auto size = input_column->size();
230
9
    for (size_t row = 0; row < size; ++row) {
231
7
        Block single_row_block;
232
7
        single_row_block.insert({input_column->cut(row, 1), input_type, input_name});
233
7
        single_row_block.insert({nullptr, original_cast_return_type(), _expr_name});
234
235
7
        auto single_exec_status = _function->execute(context->fn_context(_fn_context_index),
236
7
                                                     single_row_block, {0}, 1, 1);
237
7
        if (single_exec_status.ok()) {
238
4
            insert_from_single_row(*single_row_block.get_by_position(1).column, row);
239
4
        } else {
240
3
            if (!cast_error_code(single_exec_status)) {
241
1
                return single_exec_status;
242
1
            }
243
2
            insert_null(row);
244
2
        }
245
7
    }
246
2
    return_column = std::move(result_column);
247
2
    return Status::OK();
248
3
}
_ZNK5doris11TryCastExpr18single_row_executeILb1EEENS_6StatusEPNS_12VExprContextERKNS_21ColumnWithTypeAndNameERNS_3COWINS_7IColumnEE13immutable_ptrIS9_EE
Line
Count
Source
205
2
                                       ColumnPtr& return_column) const {
206
2
    auto input_column = input_info.column;
207
2
    const auto& input_type = input_info.type;
208
2
    const auto& input_name = input_info.name;
209
2
    auto result_column = _data_type->create_column();
210
211
2
    ColumnNullable& result_null_column = assert_cast<ColumnNullable&>(*result_column);
212
213
2
    IColumn& result_nested_column = result_null_column.get_nested_column();
214
2
    auto& result_null_map_data = result_null_column.get_null_map_data();
215
216
2
    auto insert_from_single_row = [&](const IColumn& single_exec_column, size_t row) {
217
2
        DCHECK_EQ(single_exec_column.size(), 1);
218
2
        if constexpr (original_cast_reutrn_is_nullable) {
219
2
            result_null_column.insert_from(single_exec_column, 0);
220
2
        } else {
221
2
            DCHECK(!single_exec_column.is_nullable());
222
2
            result_nested_column.insert_from(single_exec_column, 0);
223
2
            result_null_map_data.push_back(0);
224
2
        }
225
2
    };
226
227
2
    auto insert_null = [&](size_t row) { result_null_column.insert_default(); };
228
229
2
    const auto size = input_column->size();
230
5
    for (size_t row = 0; row < size; ++row) {
231
4
        Block single_row_block;
232
4
        single_row_block.insert({input_column->cut(row, 1), input_type, input_name});
233
4
        single_row_block.insert({nullptr, original_cast_return_type(), _expr_name});
234
235
4
        auto single_exec_status = _function->execute(context->fn_context(_fn_context_index),
236
4
                                                     single_row_block, {0}, 1, 1);
237
4
        if (single_exec_status.ok()) {
238
2
            insert_from_single_row(*single_row_block.get_by_position(1).column, row);
239
2
        } else {
240
2
            if (!cast_error_code(single_exec_status)) {
241
1
                return single_exec_status;
242
1
            }
243
1
            insert_null(row);
244
1
        }
245
4
    }
246
1
    return_column = std::move(result_column);
247
1
    return Status::OK();
248
2
}
_ZNK5doris11TryCastExpr18single_row_executeILb0EEENS_6StatusEPNS_12VExprContextERKNS_21ColumnWithTypeAndNameERNS_3COWINS_7IColumnEE13immutable_ptrIS9_EE
Line
Count
Source
205
1
                                       ColumnPtr& return_column) const {
206
1
    auto input_column = input_info.column;
207
1
    const auto& input_type = input_info.type;
208
1
    const auto& input_name = input_info.name;
209
1
    auto result_column = _data_type->create_column();
210
211
1
    ColumnNullable& result_null_column = assert_cast<ColumnNullable&>(*result_column);
212
213
1
    IColumn& result_nested_column = result_null_column.get_nested_column();
214
1
    auto& result_null_map_data = result_null_column.get_null_map_data();
215
216
1
    auto insert_from_single_row = [&](const IColumn& single_exec_column, size_t row) {
217
1
        DCHECK_EQ(single_exec_column.size(), 1);
218
1
        if constexpr (original_cast_reutrn_is_nullable) {
219
1
            result_null_column.insert_from(single_exec_column, 0);
220
1
        } else {
221
1
            DCHECK(!single_exec_column.is_nullable());
222
1
            result_nested_column.insert_from(single_exec_column, 0);
223
1
            result_null_map_data.push_back(0);
224
1
        }
225
1
    };
226
227
1
    auto insert_null = [&](size_t row) { result_null_column.insert_default(); };
228
229
1
    const auto size = input_column->size();
230
4
    for (size_t row = 0; row < size; ++row) {
231
3
        Block single_row_block;
232
3
        single_row_block.insert({input_column->cut(row, 1), input_type, input_name});
233
3
        single_row_block.insert({nullptr, original_cast_return_type(), _expr_name});
234
235
3
        auto single_exec_status = _function->execute(context->fn_context(_fn_context_index),
236
3
                                                     single_row_block, {0}, 1, 1);
237
3
        if (single_exec_status.ok()) {
238
2
            insert_from_single_row(*single_row_block.get_by_position(1).column, row);
239
2
        } else {
240
1
            if (!cast_error_code(single_exec_status)) {
241
0
                return single_exec_status;
242
0
            }
243
1
            insert_null(row);
244
1
        }
245
3
    }
246
1
    return_column = std::move(result_column);
247
1
    return Status::OK();
248
1
}
249
250
7
const std::string& VCastExpr::expr_name() const {
251
7
    return _expr_name;
252
7
}
253
254
0
std::string VCastExpr::debug_string() const {
255
0
    std::stringstream out;
256
0
    out << cast_name() << " Expr(CAST " << get_child(0)->data_type()->get_name() << " to "
257
0
        << _target_data_type->get_name() << "){";
258
0
    bool first = true;
259
0
    for (const auto& input_expr : children()) {
260
0
        if (first) {
261
0
            first = false;
262
0
        } else {
263
0
            out << ",";
264
0
        }
265
0
        out << input_expr->debug_string();
266
0
    }
267
0
    out << "}";
268
0
    return out.str();
269
0
}
270
271
} // namespace doris