Coverage Report

Created: 2026-03-11 10:17

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/root/doris/be/src/exprs/vcast_expr.cpp
Line
Count
Source
1
// Licensed to the Apache Software Foundation (ASF) under one
2
// or more contributor license agreements.  See the NOTICE file
3
// distributed with this work for additional information
4
// regarding copyright ownership.  The ASF licenses this file
5
// to you under the Apache License, Version 2.0 (the
6
// "License"); you may not use this file except in compliance
7
// with the License.  You may obtain a copy of the License at
8
//
9
//   http://www.apache.org/licenses/LICENSE-2.0
10
//
11
// Unless required by applicable law or agreed to in writing,
12
// software distributed under the License is distributed on an
13
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
// KIND, either express or implied.  See the License for the
15
// specific language governing permissions and limitations
16
// under the License.
17
18
#include "exprs/vcast_expr.h"
19
20
#include <fmt/format.h>
21
#include <gen_cpp/Types_types.h>
22
#include <glog/logging.h>
23
24
#include <cstddef>
25
#include <memory>
26
#include <ostream>
27
28
#include "common/exception.h"
29
#include "common/status.h"
30
#include "core/assert_cast.h"
31
#include "core/block/block.h"
32
#include "core/block/column_with_type_and_name.h"
33
#include "core/block/columns_with_type_and_name.h"
34
#include "core/column/column.h"
35
#include "core/column/column_nullable.h"
36
#include "core/data_type/data_type_nullable.h"
37
#include "exprs/function/simple_function_factory.h"
38
#include "exprs/vexpr.h"
39
#include "exprs/vexpr_context.h"
40
#include "runtime/runtime_state.h"
41
42
namespace doris {
43
class RowDescriptor;
44
class RuntimeState;
45
} // namespace doris
46
47
namespace doris {
48
#include "common/compile_check_begin.h"
49
50
doris::Status VCastExpr::prepare(doris::RuntimeState* state, const doris::RowDescriptor& desc,
51
2
                                 VExprContext* context) {
52
2
    RETURN_IF_ERROR_OR_PREPARED(VExpr::prepare(state, desc, context));
53
54
2
    DCHECK_EQ(_children.size(), 1);
55
2
    auto child = _children[0];
56
2
    const auto& child_name = child->expr_name();
57
58
    // create a const string column
59
2
    _target_data_type = _data_type;
60
    // TODO(xy): support return struct type name
61
2
    _target_data_type_name = _target_data_type->get_name();
62
    // Using typeindex to indicate the datatype, not using type name because
63
    // type name is not stable, but type index is stable and immutable
64
2
    _cast_param_data_type = _target_data_type;
65
66
2
    ColumnsWithTypeAndName argument_template;
67
2
    argument_template.reserve(2);
68
2
    argument_template.emplace_back(nullptr, child->data_type(), child_name);
69
2
    argument_template.emplace_back(nullptr, _cast_param_data_type, _target_data_type_name);
70
2
    _function = SimpleFunctionFactory::instance().get_function(function_name, argument_template,
71
2
                                                               _data_type, {});
72
73
2
    if (_function == nullptr) {
74
0
        return Status::NotSupported("Cast from {} to {} is not implemented",
75
0
                                    child->data_type()->get_name(), _target_data_type_name);
76
0
    }
77
2
    VExpr::register_function_context(state, context);
78
2
    _expr_name = fmt::format("({} {}({}) TO {})", cast_name(), child_name,
79
2
                             child->data_type()->get_name(), _target_data_type_name);
80
2
    _prepare_finished = true;
81
2
    return Status::OK();
82
2
}
83
84
0
const DataTypePtr& VCastExpr::get_target_type() const {
85
0
    return _target_data_type;
86
0
}
87
88
doris::Status VCastExpr::open(doris::RuntimeState* state, VExprContext* context,
89
0
                              FunctionContext::FunctionStateScope scope) {
90
0
    DCHECK(_prepare_finished);
91
0
    for (auto& i : _children) {
92
0
        RETURN_IF_ERROR(i->open(state, context, scope));
93
0
    }
94
0
    RETURN_IF_ERROR(VExpr::init_function_context(state, context, scope, _function));
95
0
    if (scope == FunctionContext::FRAGMENT_LOCAL) {
96
0
        RETURN_IF_ERROR(VExpr::get_const_col(context, nullptr));
97
0
    }
98
0
    _open_finished = true;
99
0
    return Status::OK();
100
0
}
101
102
0
void VCastExpr::close(VExprContext* context, FunctionContext::FunctionStateScope scope) {
103
0
    VExpr::close_function_context(context, scope, _function);
104
0
    VExpr::close(context, scope);
105
0
}
106
107
Status VCastExpr::execute_column(VExprContext* context, const Block* block, Selector* selector,
108
0
                                 size_t count, ColumnPtr& result_column) const {
109
0
    DCHECK(_open_finished || block == nullptr) << _open_finished << _expr_name;
110
0
    if (is_const_and_have_executed()) { // const have executed in open function
111
0
        result_column = get_result_from_const(count);
112
0
        return Status::OK();
113
0
    }
114
    // for each child call execute
115
116
0
    ColumnPtr from_column;
117
0
    RETURN_IF_ERROR(_children[0]->execute_column(context, block, selector, count, from_column));
118
119
0
    Block temp_block;
120
0
    temp_block.insert({from_column, _children[0]->execute_type(block), _children[0]->expr_name()});
121
0
    temp_block.insert({nullptr, _data_type, _expr_name});
122
0
    RETURN_IF_ERROR(_function->execute(context->fn_context(_fn_context_index), temp_block, {0}, 1,
123
0
                                       temp_block.rows()));
124
125
0
    result_column = temp_block.get_by_position(1).column;
126
0
    DCHECK_EQ(result_column->size(), count);
127
0
    return Status::OK();
128
0
}
129
130
7
bool cast_error_code(Status& st) {
131
    //There may be more error codes that need to be captured by try cast in the future.
132
7
    if (st.is<ErrorCode::INVALID_ARGUMENT>()) {
133
5
        return true;
134
5
    } else {
135
2
        return false;
136
2
    }
137
7
}
138
139
13
DataTypePtr TryCastExpr::original_cast_return_type() const {
140
13
    if (_original_cast_return_is_nullable) {
141
7
        return _data_type;
142
7
    } else {
143
6
        return remove_nullable(_data_type);
144
6
    }
145
13
}
146
147
Status TryCastExpr::execute_column(VExprContext* context, const Block* block, Selector* selector,
148
6
                                   size_t count, ColumnPtr& result_column) const {
149
6
    DCHECK(_open_finished || block == nullptr) << _open_finished << _expr_name;
150
6
    if (is_const_and_have_executed()) { // const have executed in open function
151
0
        result_column = get_result_from_const(count);
152
0
        return Status::OK();
153
0
    }
154
155
    // For try_cast, try to execute it in batches first.
156
157
    // execute child first
158
159
6
    ColumnPtr from_column;
160
6
    RETURN_IF_ERROR(_children[0]->execute_column(context, block, selector, count, from_column));
161
6
    auto from_type = _children[0]->execute_type(block);
162
163
    // prepare block
164
165
6
    Block temp_block;
166
6
    temp_block.insert({from_column, from_type, _children[0]->expr_name()});
167
6
    temp_block.insert({nullptr, original_cast_return_type(), _expr_name});
168
169
    // batch execute
170
6
    auto batch_exec_status = _function->execute(context->fn_context(_fn_context_index), temp_block,
171
6
                                                {0}, 1, temp_block.rows());
172
    // If batch is executed successfully,
173
    // it means that there is no error and it will be returned directly.
174
6
    if (batch_exec_status.ok()) {
175
2
        result_column = temp_block.get_by_position(1).column;
176
2
        result_column = make_nullable(result_column);
177
2
        return batch_exec_status;
178
2
    }
179
180
    // If there is an error that cannot be handled by try cast, it will be returned directly.
181
4
    if (!cast_error_code(batch_exec_status)) {
182
1
        return batch_exec_status;
183
1
    }
184
185
    // If there is an error that can be handled by try cast,
186
    // it will be converted into line execution.
187
3
    ColumnWithTypeAndName input_info {from_column, from_type, _children[0]->expr_name()};
188
    // distinguish whether the return value of the original cast is nullable
189
3
    if (_original_cast_return_is_nullable) {
190
2
        RETURN_IF_ERROR(single_row_execute<true>(context, input_info, result_column));
191
2
    } else {
192
1
        RETURN_IF_ERROR(single_row_execute<false>(context, input_info, result_column));
193
1
    }
194
    // wrap nullable
195
2
    result_column = make_nullable(result_column);
196
2
    DCHECK_EQ(result_column->size(), count);
197
198
2
    return Status::OK();
199
3
}
200
201
template <bool original_cast_reutrn_is_nullable>
202
Status TryCastExpr::single_row_execute(VExprContext* context,
203
                                       const ColumnWithTypeAndName& input_info,
204
3
                                       ColumnPtr& return_column) const {
205
3
    auto input_column = input_info.column;
206
3
    const auto& input_type = input_info.type;
207
3
    const auto& input_name = input_info.name;
208
3
    auto result_column = _data_type->create_column();
209
210
3
    ColumnNullable& result_null_column = assert_cast<ColumnNullable&>(*result_column);
211
212
3
    IColumn& result_nested_column = result_null_column.get_nested_column();
213
3
    auto& result_null_map_data = result_null_column.get_null_map_data();
214
215
4
    auto insert_from_single_row = [&](const IColumn& single_exec_column, size_t row) {
216
4
        DCHECK_EQ(single_exec_column.size(), 1);
217
4
        if constexpr (original_cast_reutrn_is_nullable) {
218
2
            result_null_column.insert_from(single_exec_column, 0);
219
2
        } else {
220
2
            DCHECK(!single_exec_column.is_nullable());
221
2
            result_nested_column.insert_from(single_exec_column, 0);
222
2
            result_null_map_data.push_back(0);
223
2
        }
224
4
    };
_ZZNK5doris11TryCastExpr18single_row_executeILb1EEENS_6StatusEPNS_12VExprContextERKNS_21ColumnWithTypeAndNameERNS_3COWINS_7IColumnEE13immutable_ptrIS9_EEENKUlRKS9_mE_clESF_m
Line
Count
Source
215
2
    auto insert_from_single_row = [&](const IColumn& single_exec_column, size_t row) {
216
2
        DCHECK_EQ(single_exec_column.size(), 1);
217
2
        if constexpr (original_cast_reutrn_is_nullable) {
218
2
            result_null_column.insert_from(single_exec_column, 0);
219
        } else {
220
            DCHECK(!single_exec_column.is_nullable());
221
            result_nested_column.insert_from(single_exec_column, 0);
222
            result_null_map_data.push_back(0);
223
        }
224
2
    };
_ZZNK5doris11TryCastExpr18single_row_executeILb0EEENS_6StatusEPNS_12VExprContextERKNS_21ColumnWithTypeAndNameERNS_3COWINS_7IColumnEE13immutable_ptrIS9_EEENKUlRKS9_mE_clESF_m
Line
Count
Source
215
2
    auto insert_from_single_row = [&](const IColumn& single_exec_column, size_t row) {
216
2
        DCHECK_EQ(single_exec_column.size(), 1);
217
        if constexpr (original_cast_reutrn_is_nullable) {
218
            result_null_column.insert_from(single_exec_column, 0);
219
2
        } else {
220
            DCHECK(!single_exec_column.is_nullable());
221
2
            result_nested_column.insert_from(single_exec_column, 0);
222
2
            result_null_map_data.push_back(0);
223
2
        }
224
2
    };
225
226
3
    auto insert_null = [&](size_t row) { result_null_column.insert_default(); };
_ZZNK5doris11TryCastExpr18single_row_executeILb1EEENS_6StatusEPNS_12VExprContextERKNS_21ColumnWithTypeAndNameERNS_3COWINS_7IColumnEE13immutable_ptrIS9_EEENKUlmE_clEm
Line
Count
Source
226
1
    auto insert_null = [&](size_t row) { result_null_column.insert_default(); };
_ZZNK5doris11TryCastExpr18single_row_executeILb0EEENS_6StatusEPNS_12VExprContextERKNS_21ColumnWithTypeAndNameERNS_3COWINS_7IColumnEE13immutable_ptrIS9_EEENKUlmE_clEm
Line
Count
Source
226
1
    auto insert_null = [&](size_t row) { result_null_column.insert_default(); };
227
228
3
    const auto size = input_column->size();
229
9
    for (size_t row = 0; row < size; ++row) {
230
7
        Block single_row_block;
231
7
        single_row_block.insert({input_column->cut(row, 1), input_type, input_name});
232
7
        single_row_block.insert({nullptr, original_cast_return_type(), _expr_name});
233
234
7
        auto single_exec_status = _function->execute(context->fn_context(_fn_context_index),
235
7
                                                     single_row_block, {0}, 1, 1);
236
7
        if (single_exec_status.ok()) {
237
4
            insert_from_single_row(*single_row_block.get_by_position(1).column, row);
238
4
        } else {
239
3
            if (!cast_error_code(single_exec_status)) {
240
1
                return single_exec_status;
241
1
            }
242
2
            insert_null(row);
243
2
        }
244
7
    }
245
2
    return_column = std::move(result_column);
246
2
    return Status::OK();
247
3
}
_ZNK5doris11TryCastExpr18single_row_executeILb1EEENS_6StatusEPNS_12VExprContextERKNS_21ColumnWithTypeAndNameERNS_3COWINS_7IColumnEE13immutable_ptrIS9_EE
Line
Count
Source
204
2
                                       ColumnPtr& return_column) const {
205
2
    auto input_column = input_info.column;
206
2
    const auto& input_type = input_info.type;
207
2
    const auto& input_name = input_info.name;
208
2
    auto result_column = _data_type->create_column();
209
210
2
    ColumnNullable& result_null_column = assert_cast<ColumnNullable&>(*result_column);
211
212
2
    IColumn& result_nested_column = result_null_column.get_nested_column();
213
2
    auto& result_null_map_data = result_null_column.get_null_map_data();
214
215
2
    auto insert_from_single_row = [&](const IColumn& single_exec_column, size_t row) {
216
2
        DCHECK_EQ(single_exec_column.size(), 1);
217
2
        if constexpr (original_cast_reutrn_is_nullable) {
218
2
            result_null_column.insert_from(single_exec_column, 0);
219
2
        } else {
220
2
            DCHECK(!single_exec_column.is_nullable());
221
2
            result_nested_column.insert_from(single_exec_column, 0);
222
2
            result_null_map_data.push_back(0);
223
2
        }
224
2
    };
225
226
2
    auto insert_null = [&](size_t row) { result_null_column.insert_default(); };
227
228
2
    const auto size = input_column->size();
229
5
    for (size_t row = 0; row < size; ++row) {
230
4
        Block single_row_block;
231
4
        single_row_block.insert({input_column->cut(row, 1), input_type, input_name});
232
4
        single_row_block.insert({nullptr, original_cast_return_type(), _expr_name});
233
234
4
        auto single_exec_status = _function->execute(context->fn_context(_fn_context_index),
235
4
                                                     single_row_block, {0}, 1, 1);
236
4
        if (single_exec_status.ok()) {
237
2
            insert_from_single_row(*single_row_block.get_by_position(1).column, row);
238
2
        } else {
239
2
            if (!cast_error_code(single_exec_status)) {
240
1
                return single_exec_status;
241
1
            }
242
1
            insert_null(row);
243
1
        }
244
4
    }
245
1
    return_column = std::move(result_column);
246
1
    return Status::OK();
247
2
}
_ZNK5doris11TryCastExpr18single_row_executeILb0EEENS_6StatusEPNS_12VExprContextERKNS_21ColumnWithTypeAndNameERNS_3COWINS_7IColumnEE13immutable_ptrIS9_EE
Line
Count
Source
204
1
                                       ColumnPtr& return_column) const {
205
1
    auto input_column = input_info.column;
206
1
    const auto& input_type = input_info.type;
207
1
    const auto& input_name = input_info.name;
208
1
    auto result_column = _data_type->create_column();
209
210
1
    ColumnNullable& result_null_column = assert_cast<ColumnNullable&>(*result_column);
211
212
1
    IColumn& result_nested_column = result_null_column.get_nested_column();
213
1
    auto& result_null_map_data = result_null_column.get_null_map_data();
214
215
1
    auto insert_from_single_row = [&](const IColumn& single_exec_column, size_t row) {
216
1
        DCHECK_EQ(single_exec_column.size(), 1);
217
1
        if constexpr (original_cast_reutrn_is_nullable) {
218
1
            result_null_column.insert_from(single_exec_column, 0);
219
1
        } else {
220
1
            DCHECK(!single_exec_column.is_nullable());
221
1
            result_nested_column.insert_from(single_exec_column, 0);
222
1
            result_null_map_data.push_back(0);
223
1
        }
224
1
    };
225
226
1
    auto insert_null = [&](size_t row) { result_null_column.insert_default(); };
227
228
1
    const auto size = input_column->size();
229
4
    for (size_t row = 0; row < size; ++row) {
230
3
        Block single_row_block;
231
3
        single_row_block.insert({input_column->cut(row, 1), input_type, input_name});
232
3
        single_row_block.insert({nullptr, original_cast_return_type(), _expr_name});
233
234
3
        auto single_exec_status = _function->execute(context->fn_context(_fn_context_index),
235
3
                                                     single_row_block, {0}, 1, 1);
236
3
        if (single_exec_status.ok()) {
237
2
            insert_from_single_row(*single_row_block.get_by_position(1).column, row);
238
2
        } else {
239
1
            if (!cast_error_code(single_exec_status)) {
240
0
                return single_exec_status;
241
0
            }
242
1
            insert_null(row);
243
1
        }
244
3
    }
245
1
    return_column = std::move(result_column);
246
1
    return Status::OK();
247
1
}
248
249
7
const std::string& VCastExpr::expr_name() const {
250
7
    return _expr_name;
251
7
}
252
253
0
std::string VCastExpr::debug_string() const {
254
0
    std::stringstream out;
255
0
    out << cast_name() << " Expr(CAST " << get_child(0)->data_type()->get_name() << " to "
256
0
        << _target_data_type->get_name() << "){";
257
0
    bool first = true;
258
0
    for (const auto& input_expr : children()) {
259
0
        if (first) {
260
0
            first = false;
261
0
        } else {
262
0
            out << ",";
263
0
        }
264
0
        out << input_expr->debug_string();
265
0
    }
266
0
    out << "}";
267
0
    return out.str();
268
0
}
269
270
#include "common/compile_check_end.h"
271
} // namespace doris