be/src/exprs/function/in.h
Line | Count | Source |
1 | | // Licensed to the Apache Software Foundation (ASF) under one |
2 | | // or more contributor license agreements. See the NOTICE file |
3 | | // distributed with this work for additional information |
4 | | // regarding copyright ownership. The ASF licenses this file |
5 | | // to you under the Apache License, Version 2.0 (the |
6 | | // "License"); you may not use this file except in compliance |
7 | | // with the License. You may obtain a copy of the License at |
8 | | // |
9 | | // http://www.apache.org/licenses/LICENSE-2.0 |
10 | | // |
11 | | // Unless required by applicable law or agreed to in writing, |
12 | | // software distributed under the License is distributed on an |
13 | | // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
14 | | // KIND, either express or implied. See the License for the |
15 | | // specific language governing permissions and limitations |
16 | | // under the License. |
17 | | // This file is copied from |
18 | | |
19 | | #pragma once |
20 | | |
21 | | #include <glog/logging.h> |
22 | | |
23 | | #include <boost/iterator/iterator_facade.hpp> |
24 | | #include <cstddef> |
25 | | #include <memory> |
26 | | #include <utility> |
27 | | #include <vector> |
28 | | |
29 | | #include "common/status.h" |
30 | | #include "core/block/block.h" |
31 | | #include "core/block/column_numbers.h" |
32 | | #include "core/block/column_with_type_and_name.h" |
33 | | #include "core/column/column.h" |
34 | | #include "core/column/column_const.h" |
35 | | #include "core/column/column_nullable.h" |
36 | | #include "core/column/column_vector.h" |
37 | | #include "core/data_type/data_type.h" |
38 | | #include "core/data_type/data_type_nullable.h" |
39 | | #include "core/data_type/data_type_number.h" |
40 | | #include "core/data_type/define_primitive_type.h" |
41 | | #include "core/string_ref.h" |
42 | | #include "core/types.h" |
43 | | #include "exprs/aggregate/aggregate_function.h" |
44 | | #include "exprs/create_predicate_function.h" |
45 | | #include "exprs/function/function.h" |
46 | | #include "exprs/function_context.h" |
47 | | #include "exprs/hybrid_set.h" |
48 | | #include "storage/index/index_reader_helper.h" |
49 | | |
50 | | namespace doris { |
51 | | |
52 | | template <typename T> |
53 | | class ColumnStr; |
54 | | using ColumnString = ColumnStr<UInt32>; |
55 | | |
56 | | struct InState { |
57 | | bool use_set = true; |
58 | | std::shared_ptr<HybridSetBase> hybrid_set; |
59 | | }; |
60 | | |
61 | | template <bool negative> |
62 | | class FunctionIn : public IFunction { |
63 | | public: |
64 | | static constexpr auto name = negative ? "not_in" : "in"; |
65 | | |
66 | 1.86k | static FunctionPtr create() { return std::make_shared<FunctionIn>(); }_ZN5doris10FunctionInILb0EE6createEv Line | Count | Source | 66 | 1.65k | static FunctionPtr create() { return std::make_shared<FunctionIn>(); } |
_ZN5doris10FunctionInILb1EE6createEv Line | Count | Source | 66 | 206 | static FunctionPtr create() { return std::make_shared<FunctionIn>(); } |
|
67 | | |
68 | 0 | String get_name() const override { return name; }Unexecuted instantiation: _ZNK5doris10FunctionInILb0EE8get_nameB5cxx11Ev Unexecuted instantiation: _ZNK5doris10FunctionInILb1EE8get_nameB5cxx11Ev |
69 | | |
70 | 1.84k | bool is_variadic() const override { return true; }_ZNK5doris10FunctionInILb0EE11is_variadicEv Line | Count | Source | 70 | 1.64k | bool is_variadic() const override { return true; } |
_ZNK5doris10FunctionInILb1EE11is_variadicEv Line | Count | Source | 70 | 198 | bool is_variadic() const override { return true; } |
|
71 | | |
72 | 0 | size_t get_number_of_arguments() const override { return 0; }Unexecuted instantiation: _ZNK5doris10FunctionInILb0EE23get_number_of_argumentsEv Unexecuted instantiation: _ZNK5doris10FunctionInILb1EE23get_number_of_argumentsEv |
73 | | |
74 | 1.84k | DataTypePtr get_return_type_impl(const DataTypes& args) const override { |
75 | 3.20k | for (const auto& arg : args) { |
76 | 3.20k | if (arg->is_nullable()) { |
77 | 1.33k | return make_nullable(std::make_shared<DataTypeUInt8>()); |
78 | 1.33k | } |
79 | 3.20k | } |
80 | 508 | return std::make_shared<DataTypeUInt8>(); |
81 | 1.84k | } _ZNK5doris10FunctionInILb0EE20get_return_type_implERKSt6vectorISt10shared_ptrIKNS_9IDataTypeEESaIS6_EE Line | Count | Source | 74 | 1.64k | DataTypePtr get_return_type_impl(const DataTypes& args) const override { | 75 | 2.90k | for (const auto& arg : args) { | 76 | 2.90k | if (arg->is_nullable()) { | 77 | 1.17k | return make_nullable(std::make_shared<DataTypeUInt8>()); | 78 | 1.17k | } | 79 | 2.90k | } | 80 | 470 | return std::make_shared<DataTypeUInt8>(); | 81 | 1.64k | } |
_ZNK5doris10FunctionInILb1EE20get_return_type_implERKSt6vectorISt10shared_ptrIKNS_9IDataTypeEESaIS6_EE Line | Count | Source | 74 | 197 | DataTypePtr get_return_type_impl(const DataTypes& args) const override { | 75 | 306 | for (const auto& arg : args) { | 76 | 306 | if (arg->is_nullable()) { | 77 | 159 | return make_nullable(std::make_shared<DataTypeUInt8>()); | 78 | 159 | } | 79 | 306 | } | 80 | 38 | return std::make_shared<DataTypeUInt8>(); | 81 | 197 | } |
|
82 | | |
83 | 15.8k | bool use_default_implementation_for_nulls() const override { return false; }_ZNK5doris10FunctionInILb0EE36use_default_implementation_for_nullsEv Line | Count | Source | 83 | 14.8k | bool use_default_implementation_for_nulls() const override { return false; } |
_ZNK5doris10FunctionInILb1EE36use_default_implementation_for_nullsEv Line | Count | Source | 83 | 1.05k | bool use_default_implementation_for_nulls() const override { return false; } |
|
84 | | |
85 | | // size of [ in ( 1 , 2 , 3 , null) ] is 3 |
86 | 1.83k | size_t get_size_with_out_null(FunctionContext* context) { |
87 | 1.83k | if ((context->get_num_args() - 1) > FIXED_CONTAINER_MAX_SIZE) { |
88 | 14 | return context->get_num_args() - 1; |
89 | 14 | } |
90 | 1.82k | size_t sz = 0; |
91 | 6.12k | for (int i = 1; i < context->get_num_args(); ++i) { |
92 | 4.30k | const auto& const_column_ptr = context->get_constant_col(i); |
93 | 4.30k | if (const_column_ptr != nullptr) { |
94 | 4.30k | auto const_data = const_column_ptr->column_ptr->get_data_at(0); |
95 | 4.30k | if (const_data.data != nullptr) { |
96 | 4.22k | sz++; |
97 | 4.22k | } |
98 | 4.30k | } |
99 | 4.30k | } |
100 | 1.82k | return sz; |
101 | 1.83k | } _ZN5doris10FunctionInILb0EE22get_size_with_out_nullEPNS_15FunctionContextE Line | Count | Source | 86 | 1.64k | size_t get_size_with_out_null(FunctionContext* context) { | 87 | 1.64k | if ((context->get_num_args() - 1) > FIXED_CONTAINER_MAX_SIZE) { | 88 | 14 | return context->get_num_args() - 1; | 89 | 14 | } | 90 | 1.63k | size_t sz = 0; | 91 | 5.44k | for (int i = 1; i < context->get_num_args(); ++i) { | 92 | 3.81k | const auto& const_column_ptr = context->get_constant_col(i); | 93 | 3.81k | if (const_column_ptr != nullptr) { | 94 | 3.81k | auto const_data = const_column_ptr->column_ptr->get_data_at(0); | 95 | 3.81k | if (const_data.data != nullptr) { | 96 | 3.76k | sz++; | 97 | 3.76k | } | 98 | 3.81k | } | 99 | 3.81k | } | 100 | 1.63k | return sz; | 101 | 1.64k | } |
_ZN5doris10FunctionInILb1EE22get_size_with_out_nullEPNS_15FunctionContextE Line | Count | Source | 86 | 195 | size_t get_size_with_out_null(FunctionContext* context) { | 87 | 195 | if ((context->get_num_args() - 1) > FIXED_CONTAINER_MAX_SIZE) { | 88 | 0 | return context->get_num_args() - 1; | 89 | 0 | } | 90 | 195 | size_t sz = 0; | 91 | 681 | for (int i = 1; i < context->get_num_args(); ++i) { | 92 | 486 | const auto& const_column_ptr = context->get_constant_col(i); | 93 | 486 | if (const_column_ptr != nullptr) { | 94 | 486 | auto const_data = const_column_ptr->column_ptr->get_data_at(0); | 95 | 486 | if (const_data.data != nullptr) { | 96 | 461 | sz++; | 97 | 461 | } | 98 | 486 | } | 99 | 486 | } | 100 | 195 | return sz; | 101 | 195 | } |
|
102 | | |
103 | 15.1k | Status open(FunctionContext* context, FunctionContext::FunctionStateScope scope) override { |
104 | 15.1k | if (scope == FunctionContext::THREAD_LOCAL) { |
105 | 13.3k | return Status::OK(); |
106 | 13.3k | } |
107 | 1.83k | std::shared_ptr<InState> state = std::make_shared<InState>(); |
108 | 1.83k | context->set_function_state(scope, state); |
109 | 1.83k | DCHECK(context->get_num_args() >= 1); |
110 | 1.83k | if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_NULL) { |
111 | 0 | state->hybrid_set.reset(create_set(TYPE_BOOLEAN, 0, true)); |
112 | 1.83k | } else if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_CHAR || |
113 | 1.83k | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_VARCHAR || |
114 | 1.83k | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_STRING) { |
115 | | // the StringValue's memory is held by FunctionContext, so we can use StringValueSet here directly |
116 | 485 | state->hybrid_set.reset(create_string_value_set(get_size_with_out_null(context))); |
117 | 1.35k | } else { |
118 | 1.35k | state->hybrid_set.reset(create_set(context->get_arg_type(0)->get_primitive_type(), |
119 | 1.35k | get_size_with_out_null(context), true)); |
120 | 1.35k | } |
121 | | |
122 | 6.36k | for (int i = 1; i < context->get_num_args(); ++i) { |
123 | 4.52k | const auto& const_column_ptr = context->get_constant_col(i); |
124 | 4.52k | if (const_column_ptr != nullptr) { |
125 | 4.52k | auto const_data = const_column_ptr->column_ptr->get_data_at(0); |
126 | 4.52k | state->hybrid_set->insert((void*)const_data.data, const_data.size); |
127 | 4.52k | } else { |
128 | 1 | state->use_set = false; |
129 | 1 | state->hybrid_set.reset(); |
130 | 1 | break; |
131 | 1 | } |
132 | 4.52k | } |
133 | 1.83k | return Status::OK(); |
134 | 15.1k | } _ZN5doris10FunctionInILb0EE4openEPNS_15FunctionContextENS2_18FunctionStateScopeE Line | Count | Source | 103 | 12.9k | Status open(FunctionContext* context, FunctionContext::FunctionStateScope scope) override { | 104 | 12.9k | if (scope == FunctionContext::THREAD_LOCAL) { | 105 | 11.2k | return Status::OK(); | 106 | 11.2k | } | 107 | 1.64k | std::shared_ptr<InState> state = std::make_shared<InState>(); | 108 | 1.64k | context->set_function_state(scope, state); | 109 | 1.64k | DCHECK(context->get_num_args() >= 1); | 110 | 1.64k | if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_NULL) { | 111 | 0 | state->hybrid_set.reset(create_set(TYPE_BOOLEAN, 0, true)); | 112 | 1.64k | } else if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_CHAR || | 113 | 1.64k | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_VARCHAR || | 114 | 1.64k | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_STRING) { | 115 | | // the StringValue's memory is held by FunctionContext, so we can use StringValueSet here directly | 116 | 390 | state->hybrid_set.reset(create_string_value_set(get_size_with_out_null(context))); | 117 | 1.25k | } else { | 118 | 1.25k | state->hybrid_set.reset(create_set(context->get_arg_type(0)->get_primitive_type(), | 119 | 1.25k | get_size_with_out_null(context), true)); | 120 | 1.25k | } | 121 | | | 122 | 5.68k | for (int i = 1; i < context->get_num_args(); ++i) { | 123 | 4.03k | const auto& const_column_ptr = context->get_constant_col(i); | 124 | 4.03k | if (const_column_ptr != nullptr) { | 125 | 4.03k | auto const_data = const_column_ptr->column_ptr->get_data_at(0); | 126 | 4.03k | state->hybrid_set->insert((void*)const_data.data, const_data.size); | 127 | 4.03k | } else { | 128 | 1 | state->use_set = false; | 129 | 1 | state->hybrid_set.reset(); | 130 | 1 | break; | 131 | 1 | } | 132 | 4.03k | } | 133 | 1.64k | return Status::OK(); | 134 | 12.9k | } |
_ZN5doris10FunctionInILb1EE4openEPNS_15FunctionContextENS2_18FunctionStateScopeE Line | Count | Source | 103 | 2.25k | Status open(FunctionContext* context, FunctionContext::FunctionStateScope scope) override { | 104 | 2.25k | if (scope == FunctionContext::THREAD_LOCAL) { | 105 | 2.06k | return Status::OK(); | 106 | 2.06k | } | 107 | 194 | std::shared_ptr<InState> state = std::make_shared<InState>(); | 108 | 194 | context->set_function_state(scope, state); | 109 | 194 | DCHECK(context->get_num_args() >= 1); | 110 | 194 | if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_NULL) { | 111 | 0 | state->hybrid_set.reset(create_set(TYPE_BOOLEAN, 0, true)); | 112 | 194 | } else if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_CHAR || | 113 | 194 | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_VARCHAR || | 114 | 194 | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_STRING) { | 115 | | // the StringValue's memory is held by FunctionContext, so we can use StringValueSet here directly | 116 | 95 | state->hybrid_set.reset(create_string_value_set(get_size_with_out_null(context))); | 117 | 99 | } else { | 118 | 99 | state->hybrid_set.reset(create_set(context->get_arg_type(0)->get_primitive_type(), | 119 | 99 | get_size_with_out_null(context), true)); | 120 | 99 | } | 121 | | | 122 | 680 | for (int i = 1; i < context->get_num_args(); ++i) { | 123 | 486 | const auto& const_column_ptr = context->get_constant_col(i); | 124 | 486 | if (const_column_ptr != nullptr) { | 125 | 486 | auto const_data = const_column_ptr->column_ptr->get_data_at(0); | 126 | 486 | state->hybrid_set->insert((void*)const_data.data, const_data.size); | 127 | 486 | } else { | 128 | 0 | state->use_set = false; | 129 | 0 | state->hybrid_set.reset(); | 130 | 0 | break; | 131 | 0 | } | 132 | 486 | } | 133 | 194 | return Status::OK(); | 134 | 2.25k | } |
|
135 | | |
136 | | Status evaluate_inverted_index( |
137 | | const ColumnsWithTypeAndName& arguments, |
138 | | const std::vector<IndexFieldNameAndTypePair>& data_type_with_names, |
139 | | std::vector<segment_v2::IndexIterator*> iterators, uint32_t num_rows, |
140 | | const InvertedIndexAnalyzerCtx* analyzer_ctx, |
141 | 715 | segment_v2::InvertedIndexResultBitmap& bitmap_result) const override { |
142 | 715 | DCHECK(data_type_with_names.size() == 1); |
143 | 715 | DCHECK(iterators.size() == 1); |
144 | 715 | auto* iter = iterators[0]; |
145 | 715 | auto data_type_with_name = data_type_with_names[0]; |
146 | 715 | std::shared_ptr<roaring::Roaring> roaring = std::make_shared<roaring::Roaring>(); |
147 | 715 | std::shared_ptr<roaring::Roaring> null_bitmap = std::make_shared<roaring::Roaring>(); |
148 | | |
149 | 715 | if (iter == nullptr) { |
150 | 0 | return Status::OK(); |
151 | 0 | } |
152 | 715 | if (!segment_v2::IndexReaderHelper::has_string_or_bkd_index(iter)) { |
153 | | //NOT support in list when parser is FULLTEXT for expr inverted index evaluate. |
154 | 140 | return Status::OK(); |
155 | 140 | } |
156 | 576 | if (iter->has_null()) { |
157 | 576 | segment_v2::InvertedIndexQueryCacheHandle null_bitmap_cache_handle; |
158 | 576 | RETURN_IF_ERROR(iter->read_null_bitmap(&null_bitmap_cache_handle)); |
159 | 576 | null_bitmap = null_bitmap_cache_handle.get_bitmap(); |
160 | 576 | } |
161 | 715 | for (const auto& arg : arguments) { |
162 | 715 | Field param_value; |
163 | 715 | arg.column->get(0, param_value); |
164 | 715 | auto param_type = arg.type->get_primitive_type(); |
165 | 715 | if (param_value.is_null()) { |
166 | | // predicate like column NOT IN (NULL, '') should not push down to index. |
167 | 506 | if (negative) { |
168 | 503 | return Status::OK(); |
169 | 503 | } |
170 | 3 | *roaring |= *null_bitmap; |
171 | 3 | continue; |
172 | 506 | } |
173 | 209 | std::unique_ptr<InvertedIndexQueryParamFactory> query_param = nullptr; |
174 | 209 | RETURN_IF_ERROR(InvertedIndexQueryParamFactory::create_query_value( |
175 | 209 | param_type, ¶m_value, query_param)); |
176 | 209 | InvertedIndexQueryType query_type = InvertedIndexQueryType::EQUAL_QUERY; |
177 | 209 | segment_v2::InvertedIndexParam param; |
178 | 209 | param.column_name = data_type_with_name.first; |
179 | 209 | param.column_type = data_type_with_name.second; |
180 | 209 | param.query_value = query_param->get_value(); |
181 | 209 | param.query_type = query_type; |
182 | 209 | param.num_rows = num_rows; |
183 | 209 | param.roaring = std::make_shared<roaring::Roaring>(); |
184 | 209 | param.analyzer_ctx = analyzer_ctx; |
185 | 209 | RETURN_IF_ERROR(iter->read_from_index(segment_v2::IndexParam {¶m})); |
186 | 202 | *roaring |= *param.roaring; |
187 | 202 | } |
188 | 65 | segment_v2::InvertedIndexResultBitmap result(roaring, null_bitmap); |
189 | 65 | bitmap_result = result; |
190 | 65 | bitmap_result.mask_out_null(); |
191 | 65 | if constexpr (negative) { |
192 | 32 | roaring::Roaring full_result; |
193 | 32 | full_result.addRange(0, num_rows); |
194 | 32 | bitmap_result.op_not(&full_result); |
195 | 32 | } |
196 | 65 | return Status::OK(); |
197 | 575 | } _ZNK5doris10FunctionInILb0EE23evaluate_inverted_indexERKSt6vectorINS_21ColumnWithTypeAndNameESaIS3_EERKS2_ISt4pairINSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEEESt10shared_ptrIKNS_9IDataTypeEEESaISJ_EES2_IPNS_10segment_v213IndexIteratorESaISQ_EEjPKNS_24InvertedIndexAnalyzerCtxERNSO_25InvertedIndexResultBitmapE Line | Count | Source | 141 | 97 | segment_v2::InvertedIndexResultBitmap& bitmap_result) const override { | 142 | 97 | DCHECK(data_type_with_names.size() == 1); | 143 | 97 | DCHECK(iterators.size() == 1); | 144 | 97 | auto* iter = iterators[0]; | 145 | 97 | auto data_type_with_name = data_type_with_names[0]; | 146 | 97 | std::shared_ptr<roaring::Roaring> roaring = std::make_shared<roaring::Roaring>(); | 147 | 97 | std::shared_ptr<roaring::Roaring> null_bitmap = std::make_shared<roaring::Roaring>(); | 148 | | | 149 | 97 | if (iter == nullptr) { | 150 | 0 | return Status::OK(); | 151 | 0 | } | 152 | 97 | if (!segment_v2::IndexReaderHelper::has_string_or_bkd_index(iter)) { | 153 | | //NOT support in list when parser is FULLTEXT for expr inverted index evaluate. | 154 | 64 | return Status::OK(); | 155 | 64 | } | 156 | 33 | if (iter->has_null()) { | 157 | 33 | segment_v2::InvertedIndexQueryCacheHandle null_bitmap_cache_handle; | 158 | 33 | RETURN_IF_ERROR(iter->read_null_bitmap(&null_bitmap_cache_handle)); | 159 | 33 | null_bitmap = null_bitmap_cache_handle.get_bitmap(); | 160 | 33 | } | 161 | 65 | for (const auto& arg : arguments) { | 162 | 65 | Field param_value; | 163 | 65 | arg.column->get(0, param_value); | 164 | 65 | auto param_type = arg.type->get_primitive_type(); | 165 | 65 | if (param_value.is_null()) { | 166 | | // predicate like column NOT IN (NULL, '') should not push down to index. | 167 | 3 | if (negative) { | 168 | 0 | return Status::OK(); | 169 | 0 | } | 170 | 3 | *roaring |= *null_bitmap; | 171 | 3 | continue; | 172 | 3 | } | 173 | 62 | std::unique_ptr<InvertedIndexQueryParamFactory> query_param = nullptr; | 174 | 62 | RETURN_IF_ERROR(InvertedIndexQueryParamFactory::create_query_value( | 175 | 62 | param_type, ¶m_value, query_param)); | 176 | 62 | InvertedIndexQueryType query_type = InvertedIndexQueryType::EQUAL_QUERY; | 177 | 62 | segment_v2::InvertedIndexParam param; | 178 | 62 | param.column_name = data_type_with_name.first; | 179 | 62 | param.column_type = data_type_with_name.second; | 180 | 62 | param.query_value = query_param->get_value(); | 181 | 62 | param.query_type = query_type; | 182 | 62 | param.num_rows = num_rows; | 183 | 62 | param.roaring = std::make_shared<roaring::Roaring>(); | 184 | 62 | param.analyzer_ctx = analyzer_ctx; | 185 | 62 | RETURN_IF_ERROR(iter->read_from_index(segment_v2::IndexParam {¶m})); | 186 | 62 | *roaring |= *param.roaring; | 187 | 62 | } | 188 | 33 | segment_v2::InvertedIndexResultBitmap result(roaring, null_bitmap); | 189 | 33 | bitmap_result = result; | 190 | 33 | bitmap_result.mask_out_null(); | 191 | | if constexpr (negative) { | 192 | | roaring::Roaring full_result; | 193 | | full_result.addRange(0, num_rows); | 194 | | bitmap_result.op_not(&full_result); | 195 | | } | 196 | 33 | return Status::OK(); | 197 | 33 | } |
_ZNK5doris10FunctionInILb1EE23evaluate_inverted_indexERKSt6vectorINS_21ColumnWithTypeAndNameESaIS3_EERKS2_ISt4pairINSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEEESt10shared_ptrIKNS_9IDataTypeEEESaISJ_EES2_IPNS_10segment_v213IndexIteratorESaISQ_EEjPKNS_24InvertedIndexAnalyzerCtxERNSO_25InvertedIndexResultBitmapE Line | Count | Source | 141 | 618 | segment_v2::InvertedIndexResultBitmap& bitmap_result) const override { | 142 | 618 | DCHECK(data_type_with_names.size() == 1); | 143 | 618 | DCHECK(iterators.size() == 1); | 144 | 618 | auto* iter = iterators[0]; | 145 | 618 | auto data_type_with_name = data_type_with_names[0]; | 146 | 618 | std::shared_ptr<roaring::Roaring> roaring = std::make_shared<roaring::Roaring>(); | 147 | 618 | std::shared_ptr<roaring::Roaring> null_bitmap = std::make_shared<roaring::Roaring>(); | 148 | | | 149 | 618 | if (iter == nullptr) { | 150 | 0 | return Status::OK(); | 151 | 0 | } | 152 | 618 | if (!segment_v2::IndexReaderHelper::has_string_or_bkd_index(iter)) { | 153 | | //NOT support in list when parser is FULLTEXT for expr inverted index evaluate. | 154 | 76 | return Status::OK(); | 155 | 76 | } | 156 | 543 | if (iter->has_null()) { | 157 | 543 | segment_v2::InvertedIndexQueryCacheHandle null_bitmap_cache_handle; | 158 | 543 | RETURN_IF_ERROR(iter->read_null_bitmap(&null_bitmap_cache_handle)); | 159 | 543 | null_bitmap = null_bitmap_cache_handle.get_bitmap(); | 160 | 543 | } | 161 | 650 | for (const auto& arg : arguments) { | 162 | 650 | Field param_value; | 163 | 650 | arg.column->get(0, param_value); | 164 | 650 | auto param_type = arg.type->get_primitive_type(); | 165 | 650 | if (param_value.is_null()) { | 166 | | // predicate like column NOT IN (NULL, '') should not push down to index. | 167 | 503 | if (negative) { | 168 | 503 | return Status::OK(); | 169 | 503 | } | 170 | 0 | *roaring |= *null_bitmap; | 171 | 0 | continue; | 172 | 503 | } | 173 | 147 | std::unique_ptr<InvertedIndexQueryParamFactory> query_param = nullptr; | 174 | 147 | RETURN_IF_ERROR(InvertedIndexQueryParamFactory::create_query_value( | 175 | 147 | param_type, ¶m_value, query_param)); | 176 | 147 | InvertedIndexQueryType query_type = InvertedIndexQueryType::EQUAL_QUERY; | 177 | 147 | segment_v2::InvertedIndexParam param; | 178 | 147 | param.column_name = data_type_with_name.first; | 179 | 147 | param.column_type = data_type_with_name.second; | 180 | 147 | param.query_value = query_param->get_value(); | 181 | 147 | param.query_type = query_type; | 182 | 147 | param.num_rows = num_rows; | 183 | 147 | param.roaring = std::make_shared<roaring::Roaring>(); | 184 | 147 | param.analyzer_ctx = analyzer_ctx; | 185 | 147 | RETURN_IF_ERROR(iter->read_from_index(segment_v2::IndexParam {¶m})); | 186 | 140 | *roaring |= *param.roaring; | 187 | 140 | } | 188 | 32 | segment_v2::InvertedIndexResultBitmap result(roaring, null_bitmap); | 189 | 32 | bitmap_result = result; | 190 | 32 | bitmap_result.mask_out_null(); | 191 | 32 | if constexpr (negative) { | 192 | 32 | roaring::Roaring full_result; | 193 | 32 | full_result.addRange(0, num_rows); | 194 | 32 | bitmap_result.op_not(&full_result); | 195 | 32 | } | 196 | 32 | return Status::OK(); | 197 | 542 | } |
|
198 | | |
199 | | Status execute_impl(FunctionContext* context, Block& block, const ColumnNumbers& arguments, |
200 | 14.0k | uint32_t result, size_t input_rows_count) const override { |
201 | 14.0k | auto* in_state = reinterpret_cast<InState*>( |
202 | 14.0k | context->get_function_state(FunctionContext::FRAGMENT_LOCAL)); |
203 | 14.0k | if (!in_state) { |
204 | 0 | return Status::RuntimeError("funciton context for function '{}' must have Set;", |
205 | 0 | get_name()); |
206 | 0 | } |
207 | 14.0k | auto res = ColumnUInt8::create(); |
208 | 14.0k | ColumnUInt8::Container& vec_res = res->get_data(); |
209 | 14.0k | vec_res.resize(input_rows_count); |
210 | | |
211 | 14.0k | ColumnUInt8::MutablePtr col_null_map_to; |
212 | 14.0k | col_null_map_to = ColumnUInt8::create(input_rows_count, false); |
213 | 14.0k | auto& vec_null_map_to = col_null_map_to->get_data(); |
214 | | |
215 | 14.0k | const ColumnWithTypeAndName& left_arg = block.get_by_position(arguments[0]); |
216 | 14.0k | const auto& [materialized_column, col_const] = unpack_if_const(left_arg.column); |
217 | | |
218 | 14.0k | if (in_state->use_set) { |
219 | 14.0k | if (materialized_column->is_nullable()) { |
220 | 13.5k | const auto* null_col_ptr = |
221 | 13.5k | check_and_get_column<ColumnNullable>(materialized_column.get()); |
222 | 13.5k | const auto& null_map = |
223 | 13.5k | assert_cast<const ColumnUInt8&>(null_col_ptr->get_null_map_column()) |
224 | 13.5k | .get_data(); |
225 | 13.5k | const auto* nested_col_ptr = null_col_ptr->get_nested_column_ptr().get(); |
226 | | |
227 | 13.5k | if (nested_col_ptr->is_column_string()) { |
228 | 2.92k | const auto* column_string_ptr = |
229 | 2.92k | assert_cast<const ColumnString*>(nested_col_ptr); |
230 | 2.92k | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, |
231 | 2.92k | column_string_ptr); |
232 | 10.5k | } else { |
233 | | //TODO: support other column type |
234 | 10.5k | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, |
235 | 10.5k | nested_col_ptr); |
236 | 10.5k | } |
237 | | |
238 | 13.5k | if (!in_state->hybrid_set->contain_null()) { |
239 | 5.04M | for (size_t i = 0; i < input_rows_count; ++i) { |
240 | 5.03M | vec_null_map_to[i] = null_map[i]; |
241 | 5.03M | } |
242 | 12.7k | } else { |
243 | 40.6k | for (size_t i = 0; i < input_rows_count; ++i) { |
244 | 39.9k | vec_null_map_to[i] = null_map[i] || negative == vec_res[i]; |
245 | 39.9k | } |
246 | 712 | } |
247 | | |
248 | 13.5k | } else { // non-nullable |
249 | 537 | if (is_string_type(left_arg.type->get_primitive_type())) { |
250 | 268 | const auto* column_string_ptr = |
251 | 268 | assert_cast<const ColumnString*>(materialized_column.get()); |
252 | 268 | search_hash_set(in_state, input_rows_count, vec_res, column_string_ptr); |
253 | 269 | } else { |
254 | 269 | search_hash_set(in_state, input_rows_count, vec_res, materialized_column.get()); |
255 | 269 | } |
256 | | |
257 | 537 | if (in_state->hybrid_set->contain_null()) { |
258 | 79 | for (size_t i = 0; i < input_rows_count; ++i) { |
259 | 50 | vec_null_map_to[i] = negative == vec_res[i]; |
260 | 50 | } |
261 | 29 | } |
262 | 537 | } |
263 | 18.4E | } else { //!in_state->use_set |
264 | 18.4E | std::vector<ColumnPtr> set_columns; |
265 | 18.4E | for (int i = 1; i < arguments.size(); ++i) { |
266 | 2 | set_columns.emplace_back(block.get_by_position(arguments[i]).column); |
267 | 2 | } |
268 | 18.4E | if (col_const) { |
269 | 0 | impl_without_set<true>(context, set_columns, input_rows_count, vec_res, |
270 | 0 | vec_null_map_to, materialized_column); |
271 | 18.4E | } else { |
272 | 18.4E | impl_without_set<false>(context, set_columns, input_rows_count, vec_res, |
273 | 18.4E | vec_null_map_to, materialized_column); |
274 | 18.4E | } |
275 | 18.4E | } |
276 | | |
277 | 14.0k | if (block.get_by_position(result).type->is_nullable()) { |
278 | 13.5k | block.replace_by_position( |
279 | 13.5k | result, ColumnNullable::create(std::move(res), std::move(col_null_map_to))); |
280 | 13.5k | } else { |
281 | 505 | block.replace_by_position(result, std::move(res)); |
282 | 505 | } |
283 | | |
284 | 14.0k | return Status::OK(); |
285 | 14.0k | } _ZNK5doris10FunctionInILb0EE12execute_implEPNS_15FunctionContextERNS_5BlockERKSt6vectorIjSaIjEEjm Line | Count | Source | 200 | 13.1k | uint32_t result, size_t input_rows_count) const override { | 201 | 13.1k | auto* in_state = reinterpret_cast<InState*>( | 202 | 13.1k | context->get_function_state(FunctionContext::FRAGMENT_LOCAL)); | 203 | 13.1k | if (!in_state) { | 204 | 0 | return Status::RuntimeError("funciton context for function '{}' must have Set;", | 205 | 0 | get_name()); | 206 | 0 | } | 207 | 13.1k | auto res = ColumnUInt8::create(); | 208 | 13.1k | ColumnUInt8::Container& vec_res = res->get_data(); | 209 | 13.1k | vec_res.resize(input_rows_count); | 210 | | | 211 | 13.1k | ColumnUInt8::MutablePtr col_null_map_to; | 212 | 13.1k | col_null_map_to = ColumnUInt8::create(input_rows_count, false); | 213 | 13.1k | auto& vec_null_map_to = col_null_map_to->get_data(); | 214 | | | 215 | 13.1k | const ColumnWithTypeAndName& left_arg = block.get_by_position(arguments[0]); | 216 | 13.1k | const auto& [materialized_column, col_const] = unpack_if_const(left_arg.column); | 217 | | | 218 | 13.1k | if (in_state->use_set) { | 219 | 13.1k | if (materialized_column->is_nullable()) { | 220 | 12.6k | const auto* null_col_ptr = | 221 | 12.6k | check_and_get_column<ColumnNullable>(materialized_column.get()); | 222 | 12.6k | const auto& null_map = | 223 | 12.6k | assert_cast<const ColumnUInt8&>(null_col_ptr->get_null_map_column()) | 224 | 12.6k | .get_data(); | 225 | 12.6k | const auto* nested_col_ptr = null_col_ptr->get_nested_column_ptr().get(); | 226 | | | 227 | 12.6k | if (nested_col_ptr->is_column_string()) { | 228 | 2.23k | const auto* column_string_ptr = | 229 | 2.23k | assert_cast<const ColumnString*>(nested_col_ptr); | 230 | 2.23k | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, | 231 | 2.23k | column_string_ptr); | 232 | 10.4k | } else { | 233 | | //TODO: support other column type | 234 | 10.4k | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, | 235 | 10.4k | nested_col_ptr); | 236 | 10.4k | } | 237 | | | 238 | 12.6k | if (!in_state->hybrid_set->contain_null()) { | 239 | 5.01M | for (size_t i = 0; i < input_rows_count; ++i) { | 240 | 4.99M | vec_null_map_to[i] = null_map[i]; | 241 | 4.99M | } | 242 | 12.4k | } else { | 243 | 28.8k | for (size_t i = 0; i < input_rows_count; ++i) { | 244 | 28.6k | vec_null_map_to[i] = null_map[i] || negative == vec_res[i]; | 245 | 28.6k | } | 246 | 207 | } | 247 | | | 248 | 12.6k | } else { // non-nullable | 249 | 504 | if (is_string_type(left_arg.type->get_primitive_type())) { | 250 | 268 | const auto* column_string_ptr = | 251 | 268 | assert_cast<const ColumnString*>(materialized_column.get()); | 252 | 268 | search_hash_set(in_state, input_rows_count, vec_res, column_string_ptr); | 253 | 268 | } else { | 254 | 236 | search_hash_set(in_state, input_rows_count, vec_res, materialized_column.get()); | 255 | 236 | } | 256 | | | 257 | 504 | if (in_state->hybrid_set->contain_null()) { | 258 | 0 | for (size_t i = 0; i < input_rows_count; ++i) { | 259 | 0 | vec_null_map_to[i] = negative == vec_res[i]; | 260 | 0 | } | 261 | 0 | } | 262 | 504 | } | 263 | 18.4E | } else { //!in_state->use_set | 264 | 18.4E | std::vector<ColumnPtr> set_columns; | 265 | 18.4E | for (int i = 1; i < arguments.size(); ++i) { | 266 | 2 | set_columns.emplace_back(block.get_by_position(arguments[i]).column); | 267 | 2 | } | 268 | 18.4E | if (col_const) { | 269 | 0 | impl_without_set<true>(context, set_columns, input_rows_count, vec_res, | 270 | 0 | vec_null_map_to, materialized_column); | 271 | 18.4E | } else { | 272 | 18.4E | impl_without_set<false>(context, set_columns, input_rows_count, vec_res, | 273 | 18.4E | vec_null_map_to, materialized_column); | 274 | 18.4E | } | 275 | 18.4E | } | 276 | | | 277 | 13.1k | if (block.get_by_position(result).type->is_nullable()) { | 278 | 12.6k | block.replace_by_position( | 279 | 12.6k | result, ColumnNullable::create(std::move(res), std::move(col_null_map_to))); | 280 | 12.6k | } else { | 281 | 501 | block.replace_by_position(result, std::move(res)); | 282 | 501 | } | 283 | | | 284 | 13.1k | return Status::OK(); | 285 | 13.1k | } |
_ZNK5doris10FunctionInILb1EE12execute_implEPNS_15FunctionContextERNS_5BlockERKSt6vectorIjSaIjEEjm Line | Count | Source | 200 | 857 | uint32_t result, size_t input_rows_count) const override { | 201 | 857 | auto* in_state = reinterpret_cast<InState*>( | 202 | 857 | context->get_function_state(FunctionContext::FRAGMENT_LOCAL)); | 203 | 857 | if (!in_state) { | 204 | 0 | return Status::RuntimeError("funciton context for function '{}' must have Set;", | 205 | 0 | get_name()); | 206 | 0 | } | 207 | 857 | auto res = ColumnUInt8::create(); | 208 | 857 | ColumnUInt8::Container& vec_res = res->get_data(); | 209 | 857 | vec_res.resize(input_rows_count); | 210 | | | 211 | 857 | ColumnUInt8::MutablePtr col_null_map_to; | 212 | 857 | col_null_map_to = ColumnUInt8::create(input_rows_count, false); | 213 | 857 | auto& vec_null_map_to = col_null_map_to->get_data(); | 214 | | | 215 | 857 | const ColumnWithTypeAndName& left_arg = block.get_by_position(arguments[0]); | 216 | 857 | const auto& [materialized_column, col_const] = unpack_if_const(left_arg.column); | 217 | | | 218 | 857 | if (in_state->use_set) { | 219 | 857 | if (materialized_column->is_nullable()) { | 220 | 824 | const auto* null_col_ptr = | 221 | 824 | check_and_get_column<ColumnNullable>(materialized_column.get()); | 222 | 824 | const auto& null_map = | 223 | 824 | assert_cast<const ColumnUInt8&>(null_col_ptr->get_null_map_column()) | 224 | 824 | .get_data(); | 225 | 824 | const auto* nested_col_ptr = null_col_ptr->get_nested_column_ptr().get(); | 226 | | | 227 | 824 | if (nested_col_ptr->is_column_string()) { | 228 | 691 | const auto* column_string_ptr = | 229 | 691 | assert_cast<const ColumnString*>(nested_col_ptr); | 230 | 691 | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, | 231 | 691 | column_string_ptr); | 232 | 691 | } else { | 233 | | //TODO: support other column type | 234 | 133 | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, | 235 | 133 | nested_col_ptr); | 236 | 133 | } | 237 | | | 238 | 824 | if (!in_state->hybrid_set->contain_null()) { | 239 | 37.6k | for (size_t i = 0; i < input_rows_count; ++i) { | 240 | 37.3k | vec_null_map_to[i] = null_map[i]; | 241 | 37.3k | } | 242 | 505 | } else { | 243 | 11.7k | for (size_t i = 0; i < input_rows_count; ++i) { | 244 | 11.2k | vec_null_map_to[i] = null_map[i] || negative == vec_res[i]; | 245 | 11.2k | } | 246 | 505 | } | 247 | | | 248 | 824 | } else { // non-nullable | 249 | 33 | if (is_string_type(left_arg.type->get_primitive_type())) { | 250 | 0 | const auto* column_string_ptr = | 251 | 0 | assert_cast<const ColumnString*>(materialized_column.get()); | 252 | 0 | search_hash_set(in_state, input_rows_count, vec_res, column_string_ptr); | 253 | 33 | } else { | 254 | 33 | search_hash_set(in_state, input_rows_count, vec_res, materialized_column.get()); | 255 | 33 | } | 256 | | | 257 | 33 | if (in_state->hybrid_set->contain_null()) { | 258 | 79 | for (size_t i = 0; i < input_rows_count; ++i) { | 259 | 50 | vec_null_map_to[i] = negative == vec_res[i]; | 260 | 50 | } | 261 | 29 | } | 262 | 33 | } | 263 | 857 | } else { //!in_state->use_set | 264 | 0 | std::vector<ColumnPtr> set_columns; | 265 | 0 | for (int i = 1; i < arguments.size(); ++i) { | 266 | 0 | set_columns.emplace_back(block.get_by_position(arguments[i]).column); | 267 | 0 | } | 268 | 0 | if (col_const) { | 269 | 0 | impl_without_set<true>(context, set_columns, input_rows_count, vec_res, | 270 | 0 | vec_null_map_to, materialized_column); | 271 | 0 | } else { | 272 | 0 | impl_without_set<false>(context, set_columns, input_rows_count, vec_res, | 273 | 0 | vec_null_map_to, materialized_column); | 274 | 0 | } | 275 | 0 | } | 276 | | | 277 | 857 | if (block.get_by_position(result).type->is_nullable()) { | 278 | 853 | block.replace_by_position( | 279 | 853 | result, ColumnNullable::create(std::move(res), std::move(col_null_map_to))); | 280 | 853 | } else { | 281 | 4 | block.replace_by_position(result, std::move(res)); | 282 | 4 | } | 283 | | | 284 | 857 | return Status::OK(); | 285 | 857 | } |
|
286 | | |
287 | | private: |
288 | | template <typename T> |
289 | | static void search_hash_set_check_null(InState* in_state, size_t input_rows_count, |
290 | | ColumnUInt8::Container& vec_res, |
291 | 13.5k | const ColumnUInt8::Container& null_map, T* col_ptr) { |
292 | 13.5k | if constexpr (!negative) { |
293 | 12.6k | in_state->hybrid_set->find_batch_nullable(*col_ptr, input_rows_count, null_map, |
294 | 12.6k | vec_res); |
295 | 12.6k | } else { |
296 | 824 | in_state->hybrid_set->find_batch_nullable_negative(*col_ptr, input_rows_count, null_map, |
297 | 824 | vec_res); |
298 | 824 | } |
299 | 13.5k | } _ZN5doris10FunctionInILb0EE26search_hash_set_check_nullIKNS_9ColumnStrIjEEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEERKSC_PT_ Line | Count | Source | 291 | 2.23k | const ColumnUInt8::Container& null_map, T* col_ptr) { | 292 | 2.23k | if constexpr (!negative) { | 293 | 2.23k | in_state->hybrid_set->find_batch_nullable(*col_ptr, input_rows_count, null_map, | 294 | 2.23k | vec_res); | 295 | | } else { | 296 | | in_state->hybrid_set->find_batch_nullable_negative(*col_ptr, input_rows_count, null_map, | 297 | | vec_res); | 298 | | } | 299 | 2.23k | } |
_ZN5doris10FunctionInILb0EE26search_hash_set_check_nullIKNS_7IColumnEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEERKSB_PT_ Line | Count | Source | 291 | 10.4k | const ColumnUInt8::Container& null_map, T* col_ptr) { | 292 | 10.4k | if constexpr (!negative) { | 293 | 10.4k | in_state->hybrid_set->find_batch_nullable(*col_ptr, input_rows_count, null_map, | 294 | 10.4k | vec_res); | 295 | | } else { | 296 | | in_state->hybrid_set->find_batch_nullable_negative(*col_ptr, input_rows_count, null_map, | 297 | | vec_res); | 298 | | } | 299 | 10.4k | } |
_ZN5doris10FunctionInILb1EE26search_hash_set_check_nullIKNS_9ColumnStrIjEEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEERKSC_PT_ Line | Count | Source | 291 | 691 | const ColumnUInt8::Container& null_map, T* col_ptr) { | 292 | | if constexpr (!negative) { | 293 | | in_state->hybrid_set->find_batch_nullable(*col_ptr, input_rows_count, null_map, | 294 | | vec_res); | 295 | 691 | } else { | 296 | 691 | in_state->hybrid_set->find_batch_nullable_negative(*col_ptr, input_rows_count, null_map, | 297 | 691 | vec_res); | 298 | 691 | } | 299 | 691 | } |
_ZN5doris10FunctionInILb1EE26search_hash_set_check_nullIKNS_7IColumnEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEERKSB_PT_ Line | Count | Source | 291 | 133 | const ColumnUInt8::Container& null_map, T* col_ptr) { | 292 | | if constexpr (!negative) { | 293 | | in_state->hybrid_set->find_batch_nullable(*col_ptr, input_rows_count, null_map, | 294 | | vec_res); | 295 | 133 | } else { | 296 | 133 | in_state->hybrid_set->find_batch_nullable_negative(*col_ptr, input_rows_count, null_map, | 297 | 133 | vec_res); | 298 | 133 | } | 299 | 133 | } |
|
300 | | |
301 | | template <typename T> |
302 | | static void search_hash_set(InState* in_state, size_t input_rows_count, |
303 | 537 | ColumnUInt8::Container& vec_res, T* col_ptr) { |
304 | 537 | if constexpr (!negative) { |
305 | 504 | in_state->hybrid_set->find_batch(*col_ptr, input_rows_count, vec_res); |
306 | 504 | } else { |
307 | 33 | in_state->hybrid_set->find_batch_negative(*col_ptr, input_rows_count, vec_res); |
308 | 33 | } |
309 | 537 | } _ZN5doris10FunctionInILb0EE15search_hash_setIKNS_9ColumnStrIjEEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEPT_ Line | Count | Source | 303 | 268 | ColumnUInt8::Container& vec_res, T* col_ptr) { | 304 | 268 | if constexpr (!negative) { | 305 | 268 | in_state->hybrid_set->find_batch(*col_ptr, input_rows_count, vec_res); | 306 | | } else { | 307 | | in_state->hybrid_set->find_batch_negative(*col_ptr, input_rows_count, vec_res); | 308 | | } | 309 | 268 | } |
_ZN5doris10FunctionInILb0EE15search_hash_setIKNS_7IColumnEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEPT_ Line | Count | Source | 303 | 236 | ColumnUInt8::Container& vec_res, T* col_ptr) { | 304 | 236 | if constexpr (!negative) { | 305 | 236 | in_state->hybrid_set->find_batch(*col_ptr, input_rows_count, vec_res); | 306 | | } else { | 307 | | in_state->hybrid_set->find_batch_negative(*col_ptr, input_rows_count, vec_res); | 308 | | } | 309 | 236 | } |
Unexecuted instantiation: _ZN5doris10FunctionInILb1EE15search_hash_setIKNS_9ColumnStrIjEEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEPT_ _ZN5doris10FunctionInILb1EE15search_hash_setIKNS_7IColumnEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEPT_ Line | Count | Source | 303 | 33 | ColumnUInt8::Container& vec_res, T* col_ptr) { | 304 | | if constexpr (!negative) { | 305 | | in_state->hybrid_set->find_batch(*col_ptr, input_rows_count, vec_res); | 306 | 33 | } else { | 307 | 33 | in_state->hybrid_set->find_batch_negative(*col_ptr, input_rows_count, vec_res); | 308 | 33 | } | 309 | 33 | } |
|
310 | | |
311 | | template <bool Const> |
312 | | static void impl_without_set(FunctionContext* context, |
313 | | const std::vector<ColumnPtr>& set_columns, size_t input_rows_count, |
314 | | ColumnUInt8::Container& vec_res, |
315 | | ColumnUInt8::Container& vec_null_map_to, |
316 | 1 | const ColumnPtr& materialized_column) { |
317 | 2 | for (size_t i = 0; i < input_rows_count; ++i) { |
318 | 1 | const auto& ref_data = materialized_column->get_data_at(index_check_const(i, Const)); |
319 | 1 | if (ref_data.data == nullptr) { |
320 | 0 | vec_null_map_to[i] = true; |
321 | 0 | continue; |
322 | 0 | } |
323 | | |
324 | 1 | std::vector<StringRef> set_datas; |
325 | | // To comply with the SQL standard, IN() returns NULL not only if the expression on the left hand side is NULL, |
326 | | // but also if no match is found in the list and one of the expressions in the list is NULL. |
327 | 1 | bool null_in_set = false; |
328 | | |
329 | 2 | for (const auto& set_column : set_columns) { |
330 | 2 | auto set_data = set_column->get_data_at(i); |
331 | 2 | if (set_data.data == nullptr) { |
332 | 0 | null_in_set = true; |
333 | 2 | } else { |
334 | 2 | set_datas.push_back(set_data); |
335 | 2 | } |
336 | 2 | } |
337 | 1 | std::unique_ptr<HybridSetBase> hybrid_set(create_set( |
338 | 1 | context->get_arg_type(0)->get_primitive_type(), set_datas.size(), true)); |
339 | 2 | for (auto& set_data : set_datas) { |
340 | 2 | hybrid_set->insert((void*)(set_data.data), set_data.size); |
341 | 2 | } |
342 | | |
343 | 1 | vec_res[i] = negative ^ hybrid_set->find((void*)ref_data.data, ref_data.size); |
344 | 1 | if (null_in_set) { |
345 | 0 | vec_null_map_to[i] = negative == vec_res[i]; |
346 | 1 | } else { |
347 | 1 | vec_null_map_to[i] = false; |
348 | 1 | } |
349 | 1 | } |
350 | 1 | } Unexecuted instantiation: _ZN5doris10FunctionInILb0EE16impl_without_setILb1EEEvPNS_15FunctionContextERKSt6vectorINS_3COWINS_7IColumnEE13immutable_ptrIS7_EESaISA_EEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEESK_RKSA_ _ZN5doris10FunctionInILb0EE16impl_without_setILb0EEEvPNS_15FunctionContextERKSt6vectorINS_3COWINS_7IColumnEE13immutable_ptrIS7_EESaISA_EEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEESK_RKSA_ Line | Count | Source | 316 | 1 | const ColumnPtr& materialized_column) { | 317 | 2 | for (size_t i = 0; i < input_rows_count; ++i) { | 318 | 1 | const auto& ref_data = materialized_column->get_data_at(index_check_const(i, Const)); | 319 | 1 | if (ref_data.data == nullptr) { | 320 | 0 | vec_null_map_to[i] = true; | 321 | 0 | continue; | 322 | 0 | } | 323 | | | 324 | 1 | std::vector<StringRef> set_datas; | 325 | | // To comply with the SQL standard, IN() returns NULL not only if the expression on the left hand side is NULL, | 326 | | // but also if no match is found in the list and one of the expressions in the list is NULL. | 327 | 1 | bool null_in_set = false; | 328 | | | 329 | 2 | for (const auto& set_column : set_columns) { | 330 | 2 | auto set_data = set_column->get_data_at(i); | 331 | 2 | if (set_data.data == nullptr) { | 332 | 0 | null_in_set = true; | 333 | 2 | } else { | 334 | 2 | set_datas.push_back(set_data); | 335 | 2 | } | 336 | 2 | } | 337 | 1 | std::unique_ptr<HybridSetBase> hybrid_set(create_set( | 338 | 1 | context->get_arg_type(0)->get_primitive_type(), set_datas.size(), true)); | 339 | 2 | for (auto& set_data : set_datas) { | 340 | 2 | hybrid_set->insert((void*)(set_data.data), set_data.size); | 341 | 2 | } | 342 | | | 343 | 1 | vec_res[i] = negative ^ hybrid_set->find((void*)ref_data.data, ref_data.size); | 344 | 1 | if (null_in_set) { | 345 | 0 | vec_null_map_to[i] = negative == vec_res[i]; | 346 | 1 | } else { | 347 | 1 | vec_null_map_to[i] = false; | 348 | 1 | } | 349 | 1 | } | 350 | 1 | } |
Unexecuted instantiation: _ZN5doris10FunctionInILb1EE16impl_without_setILb1EEEvPNS_15FunctionContextERKSt6vectorINS_3COWINS_7IColumnEE13immutable_ptrIS7_EESaISA_EEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEESK_RKSA_ Unexecuted instantiation: _ZN5doris10FunctionInILb1EE16impl_without_setILb0EEEvPNS_15FunctionContextERKSt6vectorINS_3COWINS_7IColumnEE13immutable_ptrIS7_EESaISA_EEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEESK_RKSA_ |
351 | | }; |
352 | | |
353 | | } // namespace doris |