be/src/exprs/vbloom_predicate.cpp
Line | Count | Source |
1 | | // Licensed to the Apache Software Foundation (ASF) under one |
2 | | // or more contributor license agreements. See the NOTICE file |
3 | | // distributed with this work for additional information |
4 | | // regarding copyright ownership. The ASF licenses this file |
5 | | // to you under the Apache License, Version 2.0 (the |
6 | | // "License"); you may not use this file except in compliance |
7 | | // with the License. You may obtain a copy of the License at |
8 | | // |
9 | | // http://www.apache.org/licenses/LICENSE-2.0 |
10 | | // |
11 | | // Unless required by applicable law or agreed to in writing, |
12 | | // software distributed under the License is distributed on an |
13 | | // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
14 | | // KIND, either express or implied. See the License for the |
15 | | // specific language governing permissions and limitations |
16 | | // under the License. |
17 | | |
18 | | #include "exprs/vbloom_predicate.h" |
19 | | |
20 | | #include <cstddef> |
21 | | #include <utility> |
22 | | |
23 | | #include "common/status.h" |
24 | | #include "core/block/block.h" |
25 | | #include "core/block/column_numbers.h" |
26 | | #include "core/block/column_with_type_and_name.h" |
27 | | #include "core/column/column.h" |
28 | | #include "core/column/column_nullable.h" |
29 | | #include "core/column/column_vector.h" |
30 | | #include "core/data_type/data_type.h" |
31 | | #include "core/data_type/data_type_nullable.h" |
32 | | #include "core/types.h" |
33 | | #include "exprs/bloom_filter_func.h" |
34 | | #include "runtime/runtime_state.h" |
35 | | |
36 | | namespace doris { |
37 | | class RowDescriptor; |
38 | | class TExprNode; |
39 | | |
40 | | } // namespace doris |
41 | | |
42 | | namespace doris { |
43 | | |
44 | | class VExprContext; |
45 | | |
46 | 1 | VBloomPredicate::VBloomPredicate(const TExprNode& node) : VExpr(node), _filter(nullptr) {} |
47 | | |
48 | | Status VBloomPredicate::prepare(RuntimeState* state, const RowDescriptor& desc, |
49 | 0 | VExprContext* context) { |
50 | 0 | RETURN_IF_ERROR_OR_PREPARED(VExpr::prepare(state, desc, context)); |
51 | |
|
52 | 0 | if (_children.size() != 1) { |
53 | 0 | return Status::InternalError("Invalid argument for VBloomPredicate."); |
54 | 0 | } |
55 | | |
56 | 0 | _prepare_finished = true; |
57 | 0 | return Status::OK(); |
58 | 0 | } |
59 | | |
60 | | Status VBloomPredicate::open(RuntimeState* state, VExprContext* context, |
61 | 0 | FunctionContext::FunctionStateScope scope) { |
62 | 0 | DCHECK(_prepare_finished); |
63 | 0 | RETURN_IF_ERROR(VExpr::open(state, context, scope)); |
64 | 0 | _open_finished = true; |
65 | 0 | return Status::OK(); |
66 | 0 | } |
67 | | |
68 | 0 | void VBloomPredicate::close(VExprContext* context, FunctionContext::FunctionStateScope scope) { |
69 | 0 | VExpr::close(context, scope); |
70 | 0 | } |
71 | | |
72 | | Status VBloomPredicate::_do_execute(VExprContext* context, const Block* block, |
73 | | const uint8_t* __restrict filter, Selector* selector, |
74 | 0 | size_t count, ColumnPtr& result_column) const { |
75 | 0 | DCHECK(_open_finished || block == nullptr); |
76 | 0 | DCHECK(!(filter != nullptr && selector != nullptr)) |
77 | 0 | << "filter and selector can not be both set"; |
78 | 0 | DCHECK_EQ(_children.size(), 1); |
79 | |
|
80 | 0 | ColumnPtr argument_column; |
81 | 0 | RETURN_IF_ERROR(_children[0]->execute_column(context, block, selector, count, argument_column)); |
82 | 0 | argument_column = argument_column->convert_to_full_column_if_const(); |
83 | |
|
84 | 0 | size_t sz = argument_column->size(); |
85 | 0 | auto res_data_column = ColumnUInt8::create(sz); |
86 | |
|
87 | 0 | res_data_column->resize(sz); |
88 | 0 | auto* ptr = ((ColumnUInt8*)res_data_column.get())->get_data().data(); |
89 | |
|
90 | 0 | _filter->find_fixed_len(argument_column, ptr, filter); |
91 | |
|
92 | 0 | result_column = std::move(res_data_column); |
93 | 0 | DCHECK_EQ(result_column->size(), count); |
94 | 0 | return Status::OK(); |
95 | 0 | } |
96 | | |
97 | | Status VBloomPredicate::execute_column(VExprContext* context, const Block* block, |
98 | | Selector* selector, size_t count, |
99 | 0 | ColumnPtr& result_column) const { |
100 | 0 | return _do_execute(context, block, nullptr, selector, count, result_column); |
101 | 0 | } |
102 | | |
103 | | Status VBloomPredicate::execute_runtime_filter(VExprContext* context, const Block* block, |
104 | | const uint8_t* __restrict filter, size_t count, |
105 | | ColumnPtr& result_column, |
106 | 0 | ColumnPtr* arg_column) const { |
107 | 0 | return _do_execute(context, block, filter, nullptr, count, result_column); |
108 | 0 | } |
109 | 0 | const std::string& VBloomPredicate::expr_name() const { |
110 | 0 | return EXPR_NAME; |
111 | 0 | } |
112 | | |
113 | 1 | void VBloomPredicate::set_filter(std::shared_ptr<BloomFilterFuncBase> filter) { |
114 | 1 | _filter = filter; |
115 | 1 | } |
116 | | |
117 | 0 | uint64_t VBloomPredicate::get_digest(uint64_t seed) const { |
118 | 0 | seed = _children[0]->get_digest(seed); |
119 | 0 | if (seed) { |
120 | 0 | char* data; |
121 | 0 | int len; |
122 | 0 | _filter->get_data(&data, &len); |
123 | 0 | return HashUtil::hash64(data, len, seed); |
124 | 0 | } |
125 | 0 | return 0; |
126 | 0 | } |
127 | | |
128 | | } // namespace doris |