be/src/exprs/function/in.h
Line | Count | Source |
1 | | // Licensed to the Apache Software Foundation (ASF) under one |
2 | | // or more contributor license agreements. See the NOTICE file |
3 | | // distributed with this work for additional information |
4 | | // regarding copyright ownership. The ASF licenses this file |
5 | | // to you under the Apache License, Version 2.0 (the |
6 | | // "License"); you may not use this file except in compliance |
7 | | // with the License. You may obtain a copy of the License at |
8 | | // |
9 | | // http://www.apache.org/licenses/LICENSE-2.0 |
10 | | // |
11 | | // Unless required by applicable law or agreed to in writing, |
12 | | // software distributed under the License is distributed on an |
13 | | // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
14 | | // KIND, either express or implied. See the License for the |
15 | | // specific language governing permissions and limitations |
16 | | // under the License. |
17 | | // This file is copied from |
18 | | |
19 | | #pragma once |
20 | | |
21 | | #include <glog/logging.h> |
22 | | |
23 | | #include <boost/iterator/iterator_facade.hpp> |
24 | | #include <cstddef> |
25 | | #include <memory> |
26 | | #include <utility> |
27 | | #include <vector> |
28 | | |
29 | | #include "common/status.h" |
30 | | #include "core/block/block.h" |
31 | | #include "core/block/column_numbers.h" |
32 | | #include "core/block/column_with_type_and_name.h" |
33 | | #include "core/column/column.h" |
34 | | #include "core/column/column_const.h" |
35 | | #include "core/column/column_nullable.h" |
36 | | #include "core/column/column_vector.h" |
37 | | #include "core/data_type/data_type.h" |
38 | | #include "core/data_type/data_type_nullable.h" |
39 | | #include "core/data_type/data_type_number.h" |
40 | | #include "core/data_type/define_primitive_type.h" |
41 | | #include "core/string_ref.h" |
42 | | #include "core/types.h" |
43 | | #include "exprs/aggregate/aggregate_function.h" |
44 | | #include "exprs/create_predicate_function.h" |
45 | | #include "exprs/function/function.h" |
46 | | #include "exprs/function_context.h" |
47 | | #include "exprs/hybrid_set.h" |
48 | | #include "storage/index/index_reader_helper.h" |
49 | | |
50 | | namespace doris { |
51 | | |
52 | | template <typename T> |
53 | | class ColumnStr; |
54 | | using ColumnString = ColumnStr<UInt32>; |
55 | | |
56 | | struct InState { |
57 | | bool use_set = true; |
58 | | std::shared_ptr<HybridSetBase> hybrid_set; |
59 | | }; |
60 | | |
61 | | template <bool negative> |
62 | | class FunctionIn : public IFunction { |
63 | | public: |
64 | | static constexpr auto name = negative ? "not_in" : "in"; |
65 | | |
66 | 1.30k | static FunctionPtr create() { return std::make_shared<FunctionIn>(); }_ZN5doris10FunctionInILb0EE6createEv Line | Count | Source | 66 | 1.11k | static FunctionPtr create() { return std::make_shared<FunctionIn>(); } |
_ZN5doris10FunctionInILb1EE6createEv Line | Count | Source | 66 | 192 | static FunctionPtr create() { return std::make_shared<FunctionIn>(); } |
|
67 | | |
68 | 0 | String get_name() const override { return name; }Unexecuted instantiation: _ZNK5doris10FunctionInILb0EE8get_nameB5cxx11Ev Unexecuted instantiation: _ZNK5doris10FunctionInILb1EE8get_nameB5cxx11Ev |
69 | | |
70 | 1.28k | bool is_variadic() const override { return true; }_ZNK5doris10FunctionInILb0EE11is_variadicEv Line | Count | Source | 70 | 1.10k | bool is_variadic() const override { return true; } |
_ZNK5doris10FunctionInILb1EE11is_variadicEv Line | Count | Source | 70 | 184 | bool is_variadic() const override { return true; } |
|
71 | | |
72 | 0 | size_t get_number_of_arguments() const override { return 0; }Unexecuted instantiation: _ZNK5doris10FunctionInILb0EE23get_number_of_argumentsEv Unexecuted instantiation: _ZNK5doris10FunctionInILb1EE23get_number_of_argumentsEv |
73 | | |
74 | 1.28k | DataTypePtr get_return_type_impl(const DataTypes& args) const override { |
75 | 2.61k | for (const auto& arg : args) { |
76 | 2.61k | if (arg->is_nullable()) { |
77 | 769 | return make_nullable(std::make_shared<DataTypeUInt8>()); |
78 | 769 | } |
79 | 2.61k | } |
80 | 518 | return std::make_shared<DataTypeUInt8>(); |
81 | 1.28k | } _ZNK5doris10FunctionInILb0EE20get_return_type_implERKSt6vectorISt10shared_ptrIKNS_9IDataTypeEESaIS6_EE Line | Count | Source | 74 | 1.10k | DataTypePtr get_return_type_impl(const DataTypes& args) const override { | 75 | 2.32k | for (const auto& arg : args) { | 76 | 2.32k | if (arg->is_nullable()) { | 77 | 624 | return make_nullable(std::make_shared<DataTypeUInt8>()); | 78 | 624 | } | 79 | 2.32k | } | 80 | 480 | return std::make_shared<DataTypeUInt8>(); | 81 | 1.10k | } |
_ZNK5doris10FunctionInILb1EE20get_return_type_implERKSt6vectorISt10shared_ptrIKNS_9IDataTypeEESaIS6_EE Line | Count | Source | 74 | 183 | DataTypePtr get_return_type_impl(const DataTypes& args) const override { | 75 | 292 | for (const auto& arg : args) { | 76 | 292 | if (arg->is_nullable()) { | 77 | 145 | return make_nullable(std::make_shared<DataTypeUInt8>()); | 78 | 145 | } | 79 | 292 | } | 80 | 38 | return std::make_shared<DataTypeUInt8>(); | 81 | 183 | } |
|
82 | | |
83 | 5.10k | bool use_default_implementation_for_nulls() const override { return false; }_ZNK5doris10FunctionInILb0EE36use_default_implementation_for_nullsEv Line | Count | Source | 83 | 4.05k | bool use_default_implementation_for_nulls() const override { return false; } |
_ZNK5doris10FunctionInILb1EE36use_default_implementation_for_nullsEv Line | Count | Source | 83 | 1.04k | bool use_default_implementation_for_nulls() const override { return false; } |
|
84 | | |
85 | | // size of [ in ( 1 , 2 , 3 , null) ] is 3 |
86 | 1.28k | size_t get_size_with_out_null(FunctionContext* context) { |
87 | 1.28k | if ((context->get_num_args() - 1) > FIXED_CONTAINER_MAX_SIZE) { |
88 | 12 | return context->get_num_args() - 1; |
89 | 12 | } |
90 | 1.27k | size_t sz = 0; |
91 | 4.27k | for (int i = 1; i < context->get_num_args(); ++i) { |
92 | 3.00k | const auto& const_column_ptr = context->get_constant_col(i); |
93 | 3.00k | if (const_column_ptr != nullptr) { |
94 | 3.00k | auto const_data = const_column_ptr->column_ptr->get_data_at(0); |
95 | 3.00k | if (const_data.data != nullptr) { |
96 | 2.95k | sz++; |
97 | 2.95k | } |
98 | 3.00k | } |
99 | 3.00k | } |
100 | 1.27k | return sz; |
101 | 1.28k | } _ZN5doris10FunctionInILb0EE22get_size_with_out_nullEPNS_15FunctionContextE Line | Count | Source | 86 | 1.10k | size_t get_size_with_out_null(FunctionContext* context) { | 87 | 1.10k | if ((context->get_num_args() - 1) > FIXED_CONTAINER_MAX_SIZE) { | 88 | 12 | return context->get_num_args() - 1; | 89 | 12 | } | 90 | 1.08k | size_t sz = 0; | 91 | 3.63k | for (int i = 1; i < context->get_num_args(); ++i) { | 92 | 2.55k | const auto& const_column_ptr = context->get_constant_col(i); | 93 | 2.55k | if (const_column_ptr != nullptr) { | 94 | 2.54k | auto const_data = const_column_ptr->column_ptr->get_data_at(0); | 95 | 2.54k | if (const_data.data != nullptr) { | 96 | 2.52k | sz++; | 97 | 2.52k | } | 98 | 2.54k | } | 99 | 2.55k | } | 100 | 1.08k | return sz; | 101 | 1.10k | } |
_ZN5doris10FunctionInILb1EE22get_size_with_out_nullEPNS_15FunctionContextE Line | Count | Source | 86 | 181 | size_t get_size_with_out_null(FunctionContext* context) { | 87 | 181 | if ((context->get_num_args() - 1) > FIXED_CONTAINER_MAX_SIZE) { | 88 | 0 | return context->get_num_args() - 1; | 89 | 0 | } | 90 | 181 | size_t sz = 0; | 91 | 635 | for (int i = 1; i < context->get_num_args(); ++i) { | 92 | 454 | const auto& const_column_ptr = context->get_constant_col(i); | 93 | 454 | if (const_column_ptr != nullptr) { | 94 | 454 | auto const_data = const_column_ptr->column_ptr->get_data_at(0); | 95 | 454 | if (const_data.data != nullptr) { | 96 | 429 | sz++; | 97 | 429 | } | 98 | 454 | } | 99 | 454 | } | 100 | 181 | return sz; | 101 | 181 | } |
|
102 | | |
103 | 11.7k | Status open(FunctionContext* context, FunctionContext::FunctionStateScope scope) override { |
104 | 11.7k | if (scope == FunctionContext::THREAD_LOCAL) { |
105 | 10.4k | return Status::OK(); |
106 | 10.4k | } |
107 | 1.28k | std::shared_ptr<InState> state = std::make_shared<InState>(); |
108 | 1.28k | context->set_function_state(scope, state); |
109 | 1.28k | DCHECK(context->get_num_args() >= 1); |
110 | 1.28k | if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_NULL) { |
111 | 0 | state->hybrid_set.reset(create_set(TYPE_BOOLEAN, 0, true)); |
112 | 1.28k | } else if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_CHAR || |
113 | 1.28k | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_VARCHAR || |
114 | 1.28k | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_STRING) { |
115 | | // the StringValue's memory is held by FunctionContext, so we can use StringValueSet here directly |
116 | 329 | state->hybrid_set.reset(create_string_value_set(get_size_with_out_null(context))); |
117 | 951 | } else { |
118 | 951 | state->hybrid_set.reset(create_set(context->get_arg_type(0)->get_primitive_type(), |
119 | 951 | get_size_with_out_null(context), true)); |
120 | 951 | } |
121 | | |
122 | 4.44k | for (int i = 1; i < context->get_num_args(); ++i) { |
123 | 3.16k | const auto& const_column_ptr = context->get_constant_col(i); |
124 | 3.16k | if (const_column_ptr != nullptr) { |
125 | 3.16k | auto const_data = const_column_ptr->column_ptr->get_data_at(0); |
126 | 3.16k | state->hybrid_set->insert((void*)const_data.data, const_data.size); |
127 | 3.16k | } else { |
128 | 1 | state->use_set = false; |
129 | 1 | state->hybrid_set.reset(); |
130 | 1 | break; |
131 | 1 | } |
132 | 3.16k | } |
133 | 1.28k | return Status::OK(); |
134 | 11.7k | } _ZN5doris10FunctionInILb0EE4openEPNS_15FunctionContextENS2_18FunctionStateScopeE Line | Count | Source | 103 | 9.14k | Status open(FunctionContext* context, FunctionContext::FunctionStateScope scope) override { | 104 | 9.14k | if (scope == FunctionContext::THREAD_LOCAL) { | 105 | 8.05k | return Status::OK(); | 106 | 8.05k | } | 107 | 1.09k | std::shared_ptr<InState> state = std::make_shared<InState>(); | 108 | 1.09k | context->set_function_state(scope, state); | 109 | 1.09k | DCHECK(context->get_num_args() >= 1); | 110 | 1.09k | if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_NULL) { | 111 | 0 | state->hybrid_set.reset(create_set(TYPE_BOOLEAN, 0, true)); | 112 | 1.09k | } else if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_CHAR || | 113 | 1.09k | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_VARCHAR || | 114 | 1.09k | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_STRING) { | 115 | | // the StringValue's memory is held by FunctionContext, so we can use StringValueSet here directly | 116 | 242 | state->hybrid_set.reset(create_string_value_set(get_size_with_out_null(context))); | 117 | 857 | } else { | 118 | 857 | state->hybrid_set.reset(create_set(context->get_arg_type(0)->get_primitive_type(), | 119 | 857 | get_size_with_out_null(context), true)); | 120 | 857 | } | 121 | | | 122 | 3.80k | for (int i = 1; i < context->get_num_args(); ++i) { | 123 | 2.70k | const auto& const_column_ptr = context->get_constant_col(i); | 124 | 2.70k | if (const_column_ptr != nullptr) { | 125 | 2.70k | auto const_data = const_column_ptr->column_ptr->get_data_at(0); | 126 | 2.70k | state->hybrid_set->insert((void*)const_data.data, const_data.size); | 127 | 2.70k | } else { | 128 | 1 | state->use_set = false; | 129 | 1 | state->hybrid_set.reset(); | 130 | 1 | break; | 131 | 1 | } | 132 | 2.70k | } | 133 | 1.09k | return Status::OK(); | 134 | 9.14k | } |
_ZN5doris10FunctionInILb1EE4openEPNS_15FunctionContextENS2_18FunctionStateScopeE Line | Count | Source | 103 | 2.56k | Status open(FunctionContext* context, FunctionContext::FunctionStateScope scope) override { | 104 | 2.56k | if (scope == FunctionContext::THREAD_LOCAL) { | 105 | 2.38k | return Status::OK(); | 106 | 2.38k | } | 107 | 181 | std::shared_ptr<InState> state = std::make_shared<InState>(); | 108 | 181 | context->set_function_state(scope, state); | 109 | 181 | DCHECK(context->get_num_args() >= 1); | 110 | 181 | if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_NULL) { | 111 | 0 | state->hybrid_set.reset(create_set(TYPE_BOOLEAN, 0, true)); | 112 | 181 | } else if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_CHAR || | 113 | 181 | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_VARCHAR || | 114 | 181 | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_STRING) { | 115 | | // the StringValue's memory is held by FunctionContext, so we can use StringValueSet here directly | 116 | 87 | state->hybrid_set.reset(create_string_value_set(get_size_with_out_null(context))); | 117 | 94 | } else { | 118 | 94 | state->hybrid_set.reset(create_set(context->get_arg_type(0)->get_primitive_type(), | 119 | 94 | get_size_with_out_null(context), true)); | 120 | 94 | } | 121 | | | 122 | 635 | for (int i = 1; i < context->get_num_args(); ++i) { | 123 | 454 | const auto& const_column_ptr = context->get_constant_col(i); | 124 | 454 | if (const_column_ptr != nullptr) { | 125 | 454 | auto const_data = const_column_ptr->column_ptr->get_data_at(0); | 126 | 454 | state->hybrid_set->insert((void*)const_data.data, const_data.size); | 127 | 454 | } else { | 128 | 0 | state->use_set = false; | 129 | 0 | state->hybrid_set.reset(); | 130 | 0 | break; | 131 | 0 | } | 132 | 454 | } | 133 | 181 | return Status::OK(); | 134 | 2.56k | } |
|
135 | | |
136 | | Status evaluate_inverted_index( |
137 | | const ColumnsWithTypeAndName& arguments, |
138 | | const std::vector<IndexFieldNameAndTypePair>& data_type_with_names, |
139 | | std::vector<segment_v2::IndexIterator*> iterators, uint32_t num_rows, |
140 | | const InvertedIndexAnalyzerCtx* analyzer_ctx, |
141 | 716 | segment_v2::InvertedIndexResultBitmap& bitmap_result) const override { |
142 | 716 | DCHECK(data_type_with_names.size() == 1); |
143 | 716 | DCHECK(iterators.size() == 1); |
144 | 716 | auto* iter = iterators[0]; |
145 | 716 | auto data_type_with_name = data_type_with_names[0]; |
146 | 716 | std::shared_ptr<roaring::Roaring> roaring = std::make_shared<roaring::Roaring>(); |
147 | 716 | std::shared_ptr<roaring::Roaring> null_bitmap = std::make_shared<roaring::Roaring>(); |
148 | | |
149 | 716 | if (iter == nullptr) { |
150 | 0 | return Status::OK(); |
151 | 0 | } |
152 | 716 | if (!segment_v2::IndexReaderHelper::has_string_or_bkd_index(iter)) { |
153 | | //NOT support in list when parser is FULLTEXT for expr inverted index evaluate. |
154 | 140 | return Status::OK(); |
155 | 140 | } |
156 | 576 | if (iter->has_null()) { |
157 | 576 | segment_v2::InvertedIndexQueryCacheHandle null_bitmap_cache_handle; |
158 | 576 | RETURN_IF_ERROR(iter->read_null_bitmap(&null_bitmap_cache_handle)); |
159 | 576 | null_bitmap = null_bitmap_cache_handle.get_bitmap(); |
160 | 576 | } |
161 | 718 | for (const auto& arg : arguments) { |
162 | 718 | Field param_value; |
163 | 718 | arg.column->get(0, param_value); |
164 | 718 | auto param_type = arg.type->get_primitive_type(); |
165 | 718 | if (param_value.is_null()) { |
166 | | // predicate like column NOT IN (NULL, '') should not push down to index. |
167 | 506 | if (negative) { |
168 | 503 | return Status::OK(); |
169 | 503 | } |
170 | 3 | *roaring |= *null_bitmap; |
171 | 3 | continue; |
172 | 506 | } |
173 | 212 | std::unique_ptr<InvertedIndexQueryParamFactory> query_param = nullptr; |
174 | 212 | RETURN_IF_ERROR(InvertedIndexQueryParamFactory::create_query_value( |
175 | 212 | param_type, ¶m_value, query_param)); |
176 | 212 | InvertedIndexQueryType query_type = InvertedIndexQueryType::EQUAL_QUERY; |
177 | 212 | segment_v2::InvertedIndexParam param; |
178 | 212 | param.column_name = data_type_with_name.first; |
179 | 212 | param.column_type = data_type_with_name.second; |
180 | 212 | param.query_value = query_param->get_value(); |
181 | 212 | param.query_type = query_type; |
182 | 212 | param.num_rows = num_rows; |
183 | 212 | param.roaring = std::make_shared<roaring::Roaring>(); |
184 | 212 | param.analyzer_ctx = analyzer_ctx; |
185 | 212 | RETURN_IF_ERROR(iter->read_from_index(segment_v2::IndexParam {¶m})); |
186 | 205 | *roaring |= *param.roaring; |
187 | 205 | } |
188 | 66 | segment_v2::InvertedIndexResultBitmap result(roaring, null_bitmap); |
189 | 66 | bitmap_result = result; |
190 | 66 | bitmap_result.mask_out_null(); |
191 | 66 | if constexpr (negative) { |
192 | 33 | roaring::Roaring full_result; |
193 | 33 | full_result.addRange(0, num_rows); |
194 | 33 | bitmap_result.op_not(&full_result); |
195 | 33 | } |
196 | 66 | return Status::OK(); |
197 | 576 | } _ZNK5doris10FunctionInILb0EE23evaluate_inverted_indexERKSt6vectorINS_21ColumnWithTypeAndNameESaIS3_EERKS2_ISt4pairINSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEEESt10shared_ptrIKNS_9IDataTypeEEESaISJ_EES2_IPNS_10segment_v213IndexIteratorESaISQ_EEjPKNS_24InvertedIndexAnalyzerCtxERNSO_25InvertedIndexResultBitmapE Line | Count | Source | 141 | 97 | segment_v2::InvertedIndexResultBitmap& bitmap_result) const override { | 142 | 97 | DCHECK(data_type_with_names.size() == 1); | 143 | 97 | DCHECK(iterators.size() == 1); | 144 | 97 | auto* iter = iterators[0]; | 145 | 97 | auto data_type_with_name = data_type_with_names[0]; | 146 | 97 | std::shared_ptr<roaring::Roaring> roaring = std::make_shared<roaring::Roaring>(); | 147 | 97 | std::shared_ptr<roaring::Roaring> null_bitmap = std::make_shared<roaring::Roaring>(); | 148 | | | 149 | 97 | if (iter == nullptr) { | 150 | 0 | return Status::OK(); | 151 | 0 | } | 152 | 97 | if (!segment_v2::IndexReaderHelper::has_string_or_bkd_index(iter)) { | 153 | | //NOT support in list when parser is FULLTEXT for expr inverted index evaluate. | 154 | 64 | return Status::OK(); | 155 | 64 | } | 156 | 33 | if (iter->has_null()) { | 157 | 33 | segment_v2::InvertedIndexQueryCacheHandle null_bitmap_cache_handle; | 158 | 33 | RETURN_IF_ERROR(iter->read_null_bitmap(&null_bitmap_cache_handle)); | 159 | 33 | null_bitmap = null_bitmap_cache_handle.get_bitmap(); | 160 | 33 | } | 161 | 66 | for (const auto& arg : arguments) { | 162 | 66 | Field param_value; | 163 | 66 | arg.column->get(0, param_value); | 164 | 66 | auto param_type = arg.type->get_primitive_type(); | 165 | 66 | if (param_value.is_null()) { | 166 | | // predicate like column NOT IN (NULL, '') should not push down to index. | 167 | 3 | if (negative) { | 168 | 0 | return Status::OK(); | 169 | 0 | } | 170 | 3 | *roaring |= *null_bitmap; | 171 | 3 | continue; | 172 | 3 | } | 173 | 63 | std::unique_ptr<InvertedIndexQueryParamFactory> query_param = nullptr; | 174 | 63 | RETURN_IF_ERROR(InvertedIndexQueryParamFactory::create_query_value( | 175 | 63 | param_type, ¶m_value, query_param)); | 176 | 63 | InvertedIndexQueryType query_type = InvertedIndexQueryType::EQUAL_QUERY; | 177 | 63 | segment_v2::InvertedIndexParam param; | 178 | 63 | param.column_name = data_type_with_name.first; | 179 | 63 | param.column_type = data_type_with_name.second; | 180 | 63 | param.query_value = query_param->get_value(); | 181 | 63 | param.query_type = query_type; | 182 | 63 | param.num_rows = num_rows; | 183 | 63 | param.roaring = std::make_shared<roaring::Roaring>(); | 184 | 63 | param.analyzer_ctx = analyzer_ctx; | 185 | 63 | RETURN_IF_ERROR(iter->read_from_index(segment_v2::IndexParam {¶m})); | 186 | 63 | *roaring |= *param.roaring; | 187 | 63 | } | 188 | 33 | segment_v2::InvertedIndexResultBitmap result(roaring, null_bitmap); | 189 | 33 | bitmap_result = result; | 190 | 33 | bitmap_result.mask_out_null(); | 191 | | if constexpr (negative) { | 192 | | roaring::Roaring full_result; | 193 | | full_result.addRange(0, num_rows); | 194 | | bitmap_result.op_not(&full_result); | 195 | | } | 196 | 33 | return Status::OK(); | 197 | 33 | } |
_ZNK5doris10FunctionInILb1EE23evaluate_inverted_indexERKSt6vectorINS_21ColumnWithTypeAndNameESaIS3_EERKS2_ISt4pairINSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEEESt10shared_ptrIKNS_9IDataTypeEEESaISJ_EES2_IPNS_10segment_v213IndexIteratorESaISQ_EEjPKNS_24InvertedIndexAnalyzerCtxERNSO_25InvertedIndexResultBitmapE Line | Count | Source | 141 | 619 | segment_v2::InvertedIndexResultBitmap& bitmap_result) const override { | 142 | 619 | DCHECK(data_type_with_names.size() == 1); | 143 | 619 | DCHECK(iterators.size() == 1); | 144 | 619 | auto* iter = iterators[0]; | 145 | 619 | auto data_type_with_name = data_type_with_names[0]; | 146 | 619 | std::shared_ptr<roaring::Roaring> roaring = std::make_shared<roaring::Roaring>(); | 147 | 619 | std::shared_ptr<roaring::Roaring> null_bitmap = std::make_shared<roaring::Roaring>(); | 148 | | | 149 | 619 | if (iter == nullptr) { | 150 | 0 | return Status::OK(); | 151 | 0 | } | 152 | 619 | if (!segment_v2::IndexReaderHelper::has_string_or_bkd_index(iter)) { | 153 | | //NOT support in list when parser is FULLTEXT for expr inverted index evaluate. | 154 | 76 | return Status::OK(); | 155 | 76 | } | 156 | 543 | if (iter->has_null()) { | 157 | 543 | segment_v2::InvertedIndexQueryCacheHandle null_bitmap_cache_handle; | 158 | 543 | RETURN_IF_ERROR(iter->read_null_bitmap(&null_bitmap_cache_handle)); | 159 | 543 | null_bitmap = null_bitmap_cache_handle.get_bitmap(); | 160 | 543 | } | 161 | 652 | for (const auto& arg : arguments) { | 162 | 652 | Field param_value; | 163 | 652 | arg.column->get(0, param_value); | 164 | 652 | auto param_type = arg.type->get_primitive_type(); | 165 | 652 | if (param_value.is_null()) { | 166 | | // predicate like column NOT IN (NULL, '') should not push down to index. | 167 | 503 | if (negative) { | 168 | 503 | return Status::OK(); | 169 | 503 | } | 170 | 0 | *roaring |= *null_bitmap; | 171 | 0 | continue; | 172 | 503 | } | 173 | 149 | std::unique_ptr<InvertedIndexQueryParamFactory> query_param = nullptr; | 174 | 149 | RETURN_IF_ERROR(InvertedIndexQueryParamFactory::create_query_value( | 175 | 149 | param_type, ¶m_value, query_param)); | 176 | 149 | InvertedIndexQueryType query_type = InvertedIndexQueryType::EQUAL_QUERY; | 177 | 149 | segment_v2::InvertedIndexParam param; | 178 | 149 | param.column_name = data_type_with_name.first; | 179 | 149 | param.column_type = data_type_with_name.second; | 180 | 149 | param.query_value = query_param->get_value(); | 181 | 149 | param.query_type = query_type; | 182 | 149 | param.num_rows = num_rows; | 183 | 149 | param.roaring = std::make_shared<roaring::Roaring>(); | 184 | 149 | param.analyzer_ctx = analyzer_ctx; | 185 | 149 | RETURN_IF_ERROR(iter->read_from_index(segment_v2::IndexParam {¶m})); | 186 | 142 | *roaring |= *param.roaring; | 187 | 142 | } | 188 | 33 | segment_v2::InvertedIndexResultBitmap result(roaring, null_bitmap); | 189 | 33 | bitmap_result = result; | 190 | 33 | bitmap_result.mask_out_null(); | 191 | 33 | if constexpr (negative) { | 192 | 33 | roaring::Roaring full_result; | 193 | 33 | full_result.addRange(0, num_rows); | 194 | 33 | bitmap_result.op_not(&full_result); | 195 | 33 | } | 196 | 33 | return Status::OK(); | 197 | 543 | } |
|
198 | | |
199 | | Status execute_impl(FunctionContext* context, Block& block, const ColumnNumbers& arguments, |
200 | 3.81k | uint32_t result, size_t input_rows_count) const override { |
201 | 3.81k | auto* in_state = reinterpret_cast<InState*>( |
202 | 3.81k | context->get_function_state(FunctionContext::FRAGMENT_LOCAL)); |
203 | 3.81k | if (!in_state) { |
204 | 0 | return Status::RuntimeError("funciton context for function '{}' must have Set;", |
205 | 0 | get_name()); |
206 | 0 | } |
207 | 3.81k | auto res = ColumnUInt8::create(); |
208 | 3.81k | ColumnUInt8::Container& vec_res = res->get_data(); |
209 | 3.81k | vec_res.resize(input_rows_count); |
210 | | |
211 | 3.81k | ColumnUInt8::MutablePtr col_null_map_to; |
212 | 3.81k | col_null_map_to = ColumnUInt8::create(input_rows_count, false); |
213 | 3.81k | auto& vec_null_map_to = col_null_map_to->get_data(); |
214 | | |
215 | 3.81k | const ColumnWithTypeAndName& left_arg = block.get_by_position(arguments[0]); |
216 | 3.81k | const auto& [materialized_column, col_const] = unpack_if_const(left_arg.column); |
217 | | |
218 | 3.81k | if (in_state->use_set) { |
219 | 3.81k | if (materialized_column->is_nullable()) { |
220 | 3.17k | const auto* null_col_ptr = |
221 | 3.17k | check_and_get_column<ColumnNullable>(materialized_column.get()); |
222 | 3.17k | const auto& null_map = |
223 | 3.17k | assert_cast<const ColumnUInt8&>(null_col_ptr->get_null_map_column()) |
224 | 3.17k | .get_data(); |
225 | 3.17k | const auto* nested_col_ptr = null_col_ptr->get_nested_column_ptr().get(); |
226 | | |
227 | 3.17k | if (nested_col_ptr->is_column_string()) { |
228 | 2.53k | const auto* column_string_ptr = |
229 | 2.53k | assert_cast<const ColumnString*>(nested_col_ptr); |
230 | 2.53k | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, |
231 | 2.53k | column_string_ptr); |
232 | 2.53k | } else { |
233 | | //TODO: support other column type |
234 | 642 | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, |
235 | 642 | nested_col_ptr); |
236 | 642 | } |
237 | | |
238 | 3.17k | if (!in_state->hybrid_set->contain_null()) { |
239 | 246k | for (size_t i = 0; i < input_rows_count; ++i) { |
240 | 243k | vec_null_map_to[i] = null_map[i]; |
241 | 243k | } |
242 | 2.62k | } else { |
243 | 11.9k | for (size_t i = 0; i < input_rows_count; ++i) { |
244 | 11.3k | vec_null_map_to[i] = null_map[i] || negative == vec_res[i]; |
245 | 11.3k | } |
246 | 552 | } |
247 | | |
248 | 3.17k | } else { // non-nullable |
249 | 639 | if (is_string_type(left_arg.type->get_primitive_type())) { |
250 | 357 | const auto* column_string_ptr = |
251 | 357 | assert_cast<const ColumnString*>(materialized_column.get()); |
252 | 357 | search_hash_set(in_state, input_rows_count, vec_res, column_string_ptr); |
253 | 357 | } else { |
254 | 282 | search_hash_set(in_state, input_rows_count, vec_res, materialized_column.get()); |
255 | 282 | } |
256 | | |
257 | 639 | if (in_state->hybrid_set->contain_null()) { |
258 | 79 | for (size_t i = 0; i < input_rows_count; ++i) { |
259 | 50 | vec_null_map_to[i] = negative == vec_res[i]; |
260 | 50 | } |
261 | 29 | } |
262 | 639 | } |
263 | 3.81k | } else { //!in_state->use_set |
264 | 0 | std::vector<ColumnPtr> set_columns; |
265 | 2 | for (int i = 1; i < arguments.size(); ++i) { |
266 | 2 | set_columns.emplace_back(block.get_by_position(arguments[i]).column); |
267 | 2 | } |
268 | 0 | if (col_const) { |
269 | 0 | impl_without_set<true>(context, set_columns, input_rows_count, vec_res, |
270 | 0 | vec_null_map_to, materialized_column); |
271 | 0 | } else { |
272 | 0 | impl_without_set<false>(context, set_columns, input_rows_count, vec_res, |
273 | 0 | vec_null_map_to, materialized_column); |
274 | 0 | } |
275 | 0 | } |
276 | | |
277 | 3.81k | if (block.get_by_position(result).type->is_nullable()) { |
278 | 3.20k | block.replace_by_position( |
279 | 3.20k | result, ColumnNullable::create(std::move(res), std::move(col_null_map_to))); |
280 | 3.20k | } else { |
281 | 609 | block.replace_by_position(result, std::move(res)); |
282 | 609 | } |
283 | | |
284 | 3.81k | return Status::OK(); |
285 | 3.81k | } _ZNK5doris10FunctionInILb0EE12execute_implEPNS_15FunctionContextERNS_5BlockERKSt6vectorIjSaIjEEjm Line | Count | Source | 200 | 2.94k | uint32_t result, size_t input_rows_count) const override { | 201 | 2.94k | auto* in_state = reinterpret_cast<InState*>( | 202 | 2.94k | context->get_function_state(FunctionContext::FRAGMENT_LOCAL)); | 203 | 2.94k | if (!in_state) { | 204 | 0 | return Status::RuntimeError("funciton context for function '{}' must have Set;", | 205 | 0 | get_name()); | 206 | 0 | } | 207 | 2.94k | auto res = ColumnUInt8::create(); | 208 | 2.94k | ColumnUInt8::Container& vec_res = res->get_data(); | 209 | 2.94k | vec_res.resize(input_rows_count); | 210 | | | 211 | 2.94k | ColumnUInt8::MutablePtr col_null_map_to; | 212 | 2.94k | col_null_map_to = ColumnUInt8::create(input_rows_count, false); | 213 | 2.94k | auto& vec_null_map_to = col_null_map_to->get_data(); | 214 | | | 215 | 2.94k | const ColumnWithTypeAndName& left_arg = block.get_by_position(arguments[0]); | 216 | 2.94k | const auto& [materialized_column, col_const] = unpack_if_const(left_arg.column); | 217 | | | 218 | 2.94k | if (in_state->use_set) { | 219 | 2.94k | if (materialized_column->is_nullable()) { | 220 | 2.34k | const auto* null_col_ptr = | 221 | 2.34k | check_and_get_column<ColumnNullable>(materialized_column.get()); | 222 | 2.34k | const auto& null_map = | 223 | 2.34k | assert_cast<const ColumnUInt8&>(null_col_ptr->get_null_map_column()) | 224 | 2.34k | .get_data(); | 225 | 2.34k | const auto* nested_col_ptr = null_col_ptr->get_nested_column_ptr().get(); | 226 | | | 227 | 2.34k | if (nested_col_ptr->is_column_string()) { | 228 | 1.82k | const auto* column_string_ptr = | 229 | 1.82k | assert_cast<const ColumnString*>(nested_col_ptr); | 230 | 1.82k | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, | 231 | 1.82k | column_string_ptr); | 232 | 1.82k | } else { | 233 | | //TODO: support other column type | 234 | 515 | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, | 235 | 515 | nested_col_ptr); | 236 | 515 | } | 237 | | | 238 | 2.34k | if (!in_state->hybrid_set->contain_null()) { | 239 | 241k | for (size_t i = 0; i < input_rows_count; ++i) { | 240 | 238k | vec_null_map_to[i] = null_map[i]; | 241 | 238k | } | 242 | 2.29k | } else { | 243 | 142 | for (size_t i = 0; i < input_rows_count; ++i) { | 244 | 95 | vec_null_map_to[i] = null_map[i] || negative == vec_res[i]; | 245 | 95 | } | 246 | 47 | } | 247 | | | 248 | 2.34k | } else { // non-nullable | 249 | 606 | if (is_string_type(left_arg.type->get_primitive_type())) { | 250 | 357 | const auto* column_string_ptr = | 251 | 357 | assert_cast<const ColumnString*>(materialized_column.get()); | 252 | 357 | search_hash_set(in_state, input_rows_count, vec_res, column_string_ptr); | 253 | 357 | } else { | 254 | 249 | search_hash_set(in_state, input_rows_count, vec_res, materialized_column.get()); | 255 | 249 | } | 256 | | | 257 | 606 | if (in_state->hybrid_set->contain_null()) { | 258 | 0 | for (size_t i = 0; i < input_rows_count; ++i) { | 259 | 0 | vec_null_map_to[i] = negative == vec_res[i]; | 260 | 0 | } | 261 | 0 | } | 262 | 606 | } | 263 | 2.94k | } else { //!in_state->use_set | 264 | 0 | std::vector<ColumnPtr> set_columns; | 265 | 2 | for (int i = 1; i < arguments.size(); ++i) { | 266 | 2 | set_columns.emplace_back(block.get_by_position(arguments[i]).column); | 267 | 2 | } | 268 | 0 | if (col_const) { | 269 | 0 | impl_without_set<true>(context, set_columns, input_rows_count, vec_res, | 270 | 0 | vec_null_map_to, materialized_column); | 271 | 0 | } else { | 272 | 0 | impl_without_set<false>(context, set_columns, input_rows_count, vec_res, | 273 | 0 | vec_null_map_to, materialized_column); | 274 | 0 | } | 275 | 0 | } | 276 | | | 277 | 2.94k | if (block.get_by_position(result).type->is_nullable()) { | 278 | 2.34k | block.replace_by_position( | 279 | 2.34k | result, ColumnNullable::create(std::move(res), std::move(col_null_map_to))); | 280 | 2.34k | } else { | 281 | 605 | block.replace_by_position(result, std::move(res)); | 282 | 605 | } | 283 | | | 284 | 2.94k | return Status::OK(); | 285 | 2.94k | } |
_ZNK5doris10FunctionInILb1EE12execute_implEPNS_15FunctionContextERNS_5BlockERKSt6vectorIjSaIjEEjm Line | Count | Source | 200 | 866 | uint32_t result, size_t input_rows_count) const override { | 201 | 866 | auto* in_state = reinterpret_cast<InState*>( | 202 | 866 | context->get_function_state(FunctionContext::FRAGMENT_LOCAL)); | 203 | 866 | if (!in_state) { | 204 | 0 | return Status::RuntimeError("funciton context for function '{}' must have Set;", | 205 | 0 | get_name()); | 206 | 0 | } | 207 | 866 | auto res = ColumnUInt8::create(); | 208 | 866 | ColumnUInt8::Container& vec_res = res->get_data(); | 209 | 866 | vec_res.resize(input_rows_count); | 210 | | | 211 | 866 | ColumnUInt8::MutablePtr col_null_map_to; | 212 | 866 | col_null_map_to = ColumnUInt8::create(input_rows_count, false); | 213 | 866 | auto& vec_null_map_to = col_null_map_to->get_data(); | 214 | | | 215 | 866 | const ColumnWithTypeAndName& left_arg = block.get_by_position(arguments[0]); | 216 | 866 | const auto& [materialized_column, col_const] = unpack_if_const(left_arg.column); | 217 | | | 218 | 866 | if (in_state->use_set) { | 219 | 866 | if (materialized_column->is_nullable()) { | 220 | 833 | const auto* null_col_ptr = | 221 | 833 | check_and_get_column<ColumnNullable>(materialized_column.get()); | 222 | 833 | const auto& null_map = | 223 | 833 | assert_cast<const ColumnUInt8&>(null_col_ptr->get_null_map_column()) | 224 | 833 | .get_data(); | 225 | 833 | const auto* nested_col_ptr = null_col_ptr->get_nested_column_ptr().get(); | 226 | | | 227 | 833 | if (nested_col_ptr->is_column_string()) { | 228 | 706 | const auto* column_string_ptr = | 229 | 706 | assert_cast<const ColumnString*>(nested_col_ptr); | 230 | 706 | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, | 231 | 706 | column_string_ptr); | 232 | 706 | } else { | 233 | | //TODO: support other column type | 234 | 127 | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, | 235 | 127 | nested_col_ptr); | 236 | 127 | } | 237 | | | 238 | 833 | if (!in_state->hybrid_set->contain_null()) { | 239 | 4.98k | for (size_t i = 0; i < input_rows_count; ++i) { | 240 | 4.66k | vec_null_map_to[i] = null_map[i]; | 241 | 4.66k | } | 242 | 505 | } else { | 243 | 11.7k | for (size_t i = 0; i < input_rows_count; ++i) { | 244 | 11.2k | vec_null_map_to[i] = null_map[i] || negative == vec_res[i]; | 245 | 11.2k | } | 246 | 505 | } | 247 | | | 248 | 833 | } else { // non-nullable | 249 | 33 | if (is_string_type(left_arg.type->get_primitive_type())) { | 250 | 0 | const auto* column_string_ptr = | 251 | 0 | assert_cast<const ColumnString*>(materialized_column.get()); | 252 | 0 | search_hash_set(in_state, input_rows_count, vec_res, column_string_ptr); | 253 | 33 | } else { | 254 | 33 | search_hash_set(in_state, input_rows_count, vec_res, materialized_column.get()); | 255 | 33 | } | 256 | | | 257 | 33 | if (in_state->hybrid_set->contain_null()) { | 258 | 79 | for (size_t i = 0; i < input_rows_count; ++i) { | 259 | 50 | vec_null_map_to[i] = negative == vec_res[i]; | 260 | 50 | } | 261 | 29 | } | 262 | 33 | } | 263 | 866 | } else { //!in_state->use_set | 264 | 0 | std::vector<ColumnPtr> set_columns; | 265 | 0 | for (int i = 1; i < arguments.size(); ++i) { | 266 | 0 | set_columns.emplace_back(block.get_by_position(arguments[i]).column); | 267 | 0 | } | 268 | 0 | if (col_const) { | 269 | 0 | impl_without_set<true>(context, set_columns, input_rows_count, vec_res, | 270 | 0 | vec_null_map_to, materialized_column); | 271 | 0 | } else { | 272 | 0 | impl_without_set<false>(context, set_columns, input_rows_count, vec_res, | 273 | 0 | vec_null_map_to, materialized_column); | 274 | 0 | } | 275 | 0 | } | 276 | | | 277 | 866 | if (block.get_by_position(result).type->is_nullable()) { | 278 | 862 | block.replace_by_position( | 279 | 862 | result, ColumnNullable::create(std::move(res), std::move(col_null_map_to))); | 280 | 862 | } else { | 281 | 4 | block.replace_by_position(result, std::move(res)); | 282 | 4 | } | 283 | | | 284 | 866 | return Status::OK(); | 285 | 866 | } |
|
286 | | |
287 | | private: |
288 | | template <typename T> |
289 | | static void search_hash_set_check_null(InState* in_state, size_t input_rows_count, |
290 | | ColumnUInt8::Container& vec_res, |
291 | 3.17k | const ColumnUInt8::Container& null_map, T* col_ptr) { |
292 | 3.17k | if constexpr (!negative) { |
293 | 2.34k | in_state->hybrid_set->find_batch_nullable(*col_ptr, input_rows_count, null_map, |
294 | 2.34k | vec_res); |
295 | 2.34k | } else { |
296 | 833 | in_state->hybrid_set->find_batch_nullable_negative(*col_ptr, input_rows_count, null_map, |
297 | 833 | vec_res); |
298 | 833 | } |
299 | 3.17k | } _ZN5doris10FunctionInILb0EE26search_hash_set_check_nullIKNS_9ColumnStrIjEEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEERKSC_PT_ Line | Count | Source | 291 | 1.82k | const ColumnUInt8::Container& null_map, T* col_ptr) { | 292 | 1.82k | if constexpr (!negative) { | 293 | 1.82k | in_state->hybrid_set->find_batch_nullable(*col_ptr, input_rows_count, null_map, | 294 | 1.82k | vec_res); | 295 | | } else { | 296 | | in_state->hybrid_set->find_batch_nullable_negative(*col_ptr, input_rows_count, null_map, | 297 | | vec_res); | 298 | | } | 299 | 1.82k | } |
_ZN5doris10FunctionInILb0EE26search_hash_set_check_nullIKNS_7IColumnEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEERKSB_PT_ Line | Count | Source | 291 | 515 | const ColumnUInt8::Container& null_map, T* col_ptr) { | 292 | 515 | if constexpr (!negative) { | 293 | 515 | in_state->hybrid_set->find_batch_nullable(*col_ptr, input_rows_count, null_map, | 294 | 515 | vec_res); | 295 | | } else { | 296 | | in_state->hybrid_set->find_batch_nullable_negative(*col_ptr, input_rows_count, null_map, | 297 | | vec_res); | 298 | | } | 299 | 515 | } |
_ZN5doris10FunctionInILb1EE26search_hash_set_check_nullIKNS_9ColumnStrIjEEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEERKSC_PT_ Line | Count | Source | 291 | 706 | const ColumnUInt8::Container& null_map, T* col_ptr) { | 292 | | if constexpr (!negative) { | 293 | | in_state->hybrid_set->find_batch_nullable(*col_ptr, input_rows_count, null_map, | 294 | | vec_res); | 295 | 706 | } else { | 296 | 706 | in_state->hybrid_set->find_batch_nullable_negative(*col_ptr, input_rows_count, null_map, | 297 | 706 | vec_res); | 298 | 706 | } | 299 | 706 | } |
_ZN5doris10FunctionInILb1EE26search_hash_set_check_nullIKNS_7IColumnEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEERKSB_PT_ Line | Count | Source | 291 | 127 | const ColumnUInt8::Container& null_map, T* col_ptr) { | 292 | | if constexpr (!negative) { | 293 | | in_state->hybrid_set->find_batch_nullable(*col_ptr, input_rows_count, null_map, | 294 | | vec_res); | 295 | 127 | } else { | 296 | 127 | in_state->hybrid_set->find_batch_nullable_negative(*col_ptr, input_rows_count, null_map, | 297 | 127 | vec_res); | 298 | 127 | } | 299 | 127 | } |
|
300 | | |
301 | | template <typename T> |
302 | | static void search_hash_set(InState* in_state, size_t input_rows_count, |
303 | 639 | ColumnUInt8::Container& vec_res, T* col_ptr) { |
304 | 639 | if constexpr (!negative) { |
305 | 606 | in_state->hybrid_set->find_batch(*col_ptr, input_rows_count, vec_res); |
306 | 606 | } else { |
307 | 33 | in_state->hybrid_set->find_batch_negative(*col_ptr, input_rows_count, vec_res); |
308 | 33 | } |
309 | 639 | } _ZN5doris10FunctionInILb0EE15search_hash_setIKNS_9ColumnStrIjEEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEEPT_ Line | Count | Source | 303 | 357 | ColumnUInt8::Container& vec_res, T* col_ptr) { | 304 | 357 | if constexpr (!negative) { | 305 | 357 | in_state->hybrid_set->find_batch(*col_ptr, input_rows_count, vec_res); | 306 | | } else { | 307 | | in_state->hybrid_set->find_batch_negative(*col_ptr, input_rows_count, vec_res); | 308 | | } | 309 | 357 | } |
_ZN5doris10FunctionInILb0EE15search_hash_setIKNS_7IColumnEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEEPT_ Line | Count | Source | 303 | 249 | ColumnUInt8::Container& vec_res, T* col_ptr) { | 304 | 249 | if constexpr (!negative) { | 305 | 249 | in_state->hybrid_set->find_batch(*col_ptr, input_rows_count, vec_res); | 306 | | } else { | 307 | | in_state->hybrid_set->find_batch_negative(*col_ptr, input_rows_count, vec_res); | 308 | | } | 309 | 249 | } |
Unexecuted instantiation: _ZN5doris10FunctionInILb1EE15search_hash_setIKNS_9ColumnStrIjEEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEEPT_ _ZN5doris10FunctionInILb1EE15search_hash_setIKNS_7IColumnEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEEPT_ Line | Count | Source | 303 | 33 | ColumnUInt8::Container& vec_res, T* col_ptr) { | 304 | | if constexpr (!negative) { | 305 | | in_state->hybrid_set->find_batch(*col_ptr, input_rows_count, vec_res); | 306 | 33 | } else { | 307 | 33 | in_state->hybrid_set->find_batch_negative(*col_ptr, input_rows_count, vec_res); | 308 | 33 | } | 309 | 33 | } |
|
310 | | |
311 | | template <bool Const> |
312 | | static void impl_without_set(FunctionContext* context, |
313 | | const std::vector<ColumnPtr>& set_columns, size_t input_rows_count, |
314 | | ColumnUInt8::Container& vec_res, |
315 | | ColumnUInt8::Container& vec_null_map_to, |
316 | 1 | const ColumnPtr& materialized_column) { |
317 | 2 | for (size_t i = 0; i < input_rows_count; ++i) { |
318 | 1 | const auto& ref_data = materialized_column->get_data_at(index_check_const(i, Const)); |
319 | 1 | if (ref_data.data == nullptr) { |
320 | 0 | vec_null_map_to[i] = true; |
321 | 0 | continue; |
322 | 0 | } |
323 | | |
324 | 1 | std::vector<StringRef> set_datas; |
325 | | // To comply with the SQL standard, IN() returns NULL not only if the expression on the left hand side is NULL, |
326 | | // but also if no match is found in the list and one of the expressions in the list is NULL. |
327 | 1 | bool null_in_set = false; |
328 | | |
329 | 2 | for (const auto& set_column : set_columns) { |
330 | 2 | auto set_data = set_column->get_data_at(i); |
331 | 2 | if (set_data.data == nullptr) { |
332 | 0 | null_in_set = true; |
333 | 2 | } else { |
334 | 2 | set_datas.push_back(set_data); |
335 | 2 | } |
336 | 2 | } |
337 | 1 | std::unique_ptr<HybridSetBase> hybrid_set(create_set( |
338 | 1 | context->get_arg_type(0)->get_primitive_type(), set_datas.size(), true)); |
339 | 2 | for (auto& set_data : set_datas) { |
340 | 2 | hybrid_set->insert((void*)(set_data.data), set_data.size); |
341 | 2 | } |
342 | | |
343 | 1 | vec_res[i] = negative ^ hybrid_set->find((void*)ref_data.data, ref_data.size); |
344 | 1 | if (null_in_set) { |
345 | 0 | vec_null_map_to[i] = negative == vec_res[i]; |
346 | 1 | } else { |
347 | 1 | vec_null_map_to[i] = false; |
348 | 1 | } |
349 | 1 | } |
350 | 1 | } Unexecuted instantiation: _ZN5doris10FunctionInILb0EE16impl_without_setILb1EEEvPNS_15FunctionContextERKSt6vectorINS_3COWINS_7IColumnEE13immutable_ptrIS7_EESaISA_EEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEESK_RKSA_ _ZN5doris10FunctionInILb0EE16impl_without_setILb0EEEvPNS_15FunctionContextERKSt6vectorINS_3COWINS_7IColumnEE13immutable_ptrIS7_EESaISA_EEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEESK_RKSA_ Line | Count | Source | 316 | 1 | const ColumnPtr& materialized_column) { | 317 | 2 | for (size_t i = 0; i < input_rows_count; ++i) { | 318 | 1 | const auto& ref_data = materialized_column->get_data_at(index_check_const(i, Const)); | 319 | 1 | if (ref_data.data == nullptr) { | 320 | 0 | vec_null_map_to[i] = true; | 321 | 0 | continue; | 322 | 0 | } | 323 | | | 324 | 1 | std::vector<StringRef> set_datas; | 325 | | // To comply with the SQL standard, IN() returns NULL not only if the expression on the left hand side is NULL, | 326 | | // but also if no match is found in the list and one of the expressions in the list is NULL. | 327 | 1 | bool null_in_set = false; | 328 | | | 329 | 2 | for (const auto& set_column : set_columns) { | 330 | 2 | auto set_data = set_column->get_data_at(i); | 331 | 2 | if (set_data.data == nullptr) { | 332 | 0 | null_in_set = true; | 333 | 2 | } else { | 334 | 2 | set_datas.push_back(set_data); | 335 | 2 | } | 336 | 2 | } | 337 | 1 | std::unique_ptr<HybridSetBase> hybrid_set(create_set( | 338 | 1 | context->get_arg_type(0)->get_primitive_type(), set_datas.size(), true)); | 339 | 2 | for (auto& set_data : set_datas) { | 340 | 2 | hybrid_set->insert((void*)(set_data.data), set_data.size); | 341 | 2 | } | 342 | | | 343 | 1 | vec_res[i] = negative ^ hybrid_set->find((void*)ref_data.data, ref_data.size); | 344 | 1 | if (null_in_set) { | 345 | 0 | vec_null_map_to[i] = negative == vec_res[i]; | 346 | 1 | } else { | 347 | 1 | vec_null_map_to[i] = false; | 348 | 1 | } | 349 | 1 | } | 350 | 1 | } |
Unexecuted instantiation: _ZN5doris10FunctionInILb1EE16impl_without_setILb1EEEvPNS_15FunctionContextERKSt6vectorINS_3COWINS_7IColumnEE13immutable_ptrIS7_EESaISA_EEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEESK_RKSA_ Unexecuted instantiation: _ZN5doris10FunctionInILb1EE16impl_without_setILb0EEEvPNS_15FunctionContextERKSt6vectorINS_3COWINS_7IColumnEE13immutable_ptrIS7_EESaISA_EEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb0EEELm16ELm15EEESK_RKSA_ |
351 | | }; |
352 | | |
353 | | } // namespace doris |