be/src/exprs/function/in.h
Line | Count | Source |
1 | | // Licensed to the Apache Software Foundation (ASF) under one |
2 | | // or more contributor license agreements. See the NOTICE file |
3 | | // distributed with this work for additional information |
4 | | // regarding copyright ownership. The ASF licenses this file |
5 | | // to you under the Apache License, Version 2.0 (the |
6 | | // "License"); you may not use this file except in compliance |
7 | | // with the License. You may obtain a copy of the License at |
8 | | // |
9 | | // http://www.apache.org/licenses/LICENSE-2.0 |
10 | | // |
11 | | // Unless required by applicable law or agreed to in writing, |
12 | | // software distributed under the License is distributed on an |
13 | | // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
14 | | // KIND, either express or implied. See the License for the |
15 | | // specific language governing permissions and limitations |
16 | | // under the License. |
17 | | // This file is copied from |
18 | | |
19 | | #pragma once |
20 | | |
21 | | #include <glog/logging.h> |
22 | | |
23 | | #include <boost/iterator/iterator_facade.hpp> |
24 | | #include <cstddef> |
25 | | #include <memory> |
26 | | #include <utility> |
27 | | #include <vector> |
28 | | |
29 | | #include "common/status.h" |
30 | | #include "core/block/block.h" |
31 | | #include "core/block/column_numbers.h" |
32 | | #include "core/block/column_with_type_and_name.h" |
33 | | #include "core/column/column.h" |
34 | | #include "core/column/column_const.h" |
35 | | #include "core/column/column_nullable.h" |
36 | | #include "core/column/column_vector.h" |
37 | | #include "core/data_type/data_type.h" |
38 | | #include "core/data_type/data_type_nullable.h" |
39 | | #include "core/data_type/data_type_number.h" |
40 | | #include "core/data_type/define_primitive_type.h" |
41 | | #include "core/string_ref.h" |
42 | | #include "core/types.h" |
43 | | #include "exprs/aggregate/aggregate_function.h" |
44 | | #include "exprs/create_predicate_function.h" |
45 | | #include "exprs/function/function.h" |
46 | | #include "exprs/function_context.h" |
47 | | #include "exprs/hybrid_set.h" |
48 | | #include "storage/index/index_reader_helper.h" |
49 | | |
50 | | namespace doris { |
51 | | |
52 | | template <typename T> |
53 | | class ColumnStr; |
54 | | using ColumnString = ColumnStr<UInt32>; |
55 | | |
56 | | struct InState { |
57 | | bool use_set = true; |
58 | | std::shared_ptr<HybridSetBase> hybrid_set; |
59 | | }; |
60 | | |
61 | | template <bool negative> |
62 | | class FunctionIn : public IFunction { |
63 | | public: |
64 | | static constexpr auto name = negative ? "not_in" : "in"; |
65 | | |
66 | 1.94k | static FunctionPtr create() { return std::make_shared<FunctionIn>(); }_ZN5doris10FunctionInILb0EE6createEv Line | Count | Source | 66 | 1.74k | static FunctionPtr create() { return std::make_shared<FunctionIn>(); } |
_ZN5doris10FunctionInILb1EE6createEv Line | Count | Source | 66 | 192 | static FunctionPtr create() { return std::make_shared<FunctionIn>(); } |
|
67 | | |
68 | 0 | String get_name() const override { return name; }Unexecuted instantiation: _ZNK5doris10FunctionInILb0EE8get_nameB5cxx11Ev Unexecuted instantiation: _ZNK5doris10FunctionInILb1EE8get_nameB5cxx11Ev |
69 | | |
70 | 1.92k | bool is_variadic() const override { return true; }_ZNK5doris10FunctionInILb0EE11is_variadicEv Line | Count | Source | 70 | 1.74k | bool is_variadic() const override { return true; } |
_ZNK5doris10FunctionInILb1EE11is_variadicEv Line | Count | Source | 70 | 184 | bool is_variadic() const override { return true; } |
|
71 | | |
72 | 0 | size_t get_number_of_arguments() const override { return 0; }Unexecuted instantiation: _ZNK5doris10FunctionInILb0EE23get_number_of_argumentsEv Unexecuted instantiation: _ZNK5doris10FunctionInILb1EE23get_number_of_argumentsEv |
73 | | |
74 | 1.92k | DataTypePtr get_return_type_impl(const DataTypes& args) const override { |
75 | 3.31k | for (const auto& arg : args) { |
76 | 3.31k | if (arg->is_nullable()) { |
77 | 1.39k | return make_nullable(std::make_shared<DataTypeUInt8>()); |
78 | 1.39k | } |
79 | 3.31k | } |
80 | 524 | return std::make_shared<DataTypeUInt8>(); |
81 | 1.92k | } _ZNK5doris10FunctionInILb0EE20get_return_type_implERKSt6vectorISt10shared_ptrIKNS_9IDataTypeEESaIS6_EE Line | Count | Source | 74 | 1.73k | DataTypePtr get_return_type_impl(const DataTypes& args) const override { | 75 | 3.02k | for (const auto& arg : args) { | 76 | 3.02k | if (arg->is_nullable()) { | 77 | 1.25k | return make_nullable(std::make_shared<DataTypeUInt8>()); | 78 | 1.25k | } | 79 | 3.02k | } | 80 | 486 | return std::make_shared<DataTypeUInt8>(); | 81 | 1.73k | } |
_ZNK5doris10FunctionInILb1EE20get_return_type_implERKSt6vectorISt10shared_ptrIKNS_9IDataTypeEESaIS6_EE Line | Count | Source | 74 | 183 | DataTypePtr get_return_type_impl(const DataTypes& args) const override { | 75 | 290 | for (const auto& arg : args) { | 76 | 290 | if (arg->is_nullable()) { | 77 | 145 | return make_nullable(std::make_shared<DataTypeUInt8>()); | 78 | 145 | } | 79 | 290 | } | 80 | 38 | return std::make_shared<DataTypeUInt8>(); | 81 | 183 | } |
|
82 | | |
83 | 20.1k | bool use_default_implementation_for_nulls() const override { return false; }_ZNK5doris10FunctionInILb0EE36use_default_implementation_for_nullsEv Line | Count | Source | 83 | 19.1k | bool use_default_implementation_for_nulls() const override { return false; } |
_ZNK5doris10FunctionInILb1EE36use_default_implementation_for_nullsEv Line | Count | Source | 83 | 989 | bool use_default_implementation_for_nulls() const override { return false; } |
|
84 | | |
85 | | // size of [ in ( 1 , 2 , 3 , null) ] is 3 |
86 | 1.91k | size_t get_size_with_out_null(FunctionContext* context) { |
87 | 1.91k | if ((context->get_num_args() - 1) > FIXED_CONTAINER_MAX_SIZE) { |
88 | 14 | return context->get_num_args() - 1; |
89 | 14 | } |
90 | 1.90k | size_t sz = 0; |
91 | 6.36k | for (int i = 1; i < context->get_num_args(); ++i) { |
92 | 4.45k | const auto& const_column_ptr = context->get_constant_col(i); |
93 | 4.45k | if (const_column_ptr != nullptr) { |
94 | 4.45k | auto const_data = const_column_ptr->column_ptr->get_data_at(0); |
95 | 4.45k | if (const_data.data != nullptr) { |
96 | 4.40k | sz++; |
97 | 4.40k | } |
98 | 4.45k | } |
99 | 4.45k | } |
100 | 1.90k | return sz; |
101 | 1.91k | } _ZN5doris10FunctionInILb0EE22get_size_with_out_nullEPNS_15FunctionContextE Line | Count | Source | 86 | 1.73k | size_t get_size_with_out_null(FunctionContext* context) { | 87 | 1.73k | if ((context->get_num_args() - 1) > FIXED_CONTAINER_MAX_SIZE) { | 88 | 14 | return context->get_num_args() - 1; | 89 | 14 | } | 90 | 1.72k | size_t sz = 0; | 91 | 5.73k | for (int i = 1; i < context->get_num_args(); ++i) { | 92 | 4.00k | const auto& const_column_ptr = context->get_constant_col(i); | 93 | 4.00k | if (const_column_ptr != nullptr) { | 94 | 4.00k | auto const_data = const_column_ptr->column_ptr->get_data_at(0); | 95 | 4.00k | if (const_data.data != nullptr) { | 96 | 3.97k | sz++; | 97 | 3.97k | } | 98 | 4.00k | } | 99 | 4.00k | } | 100 | 1.72k | return sz; | 101 | 1.73k | } |
_ZN5doris10FunctionInILb1EE22get_size_with_out_nullEPNS_15FunctionContextE Line | Count | Source | 86 | 181 | size_t get_size_with_out_null(FunctionContext* context) { | 87 | 181 | if ((context->get_num_args() - 1) > FIXED_CONTAINER_MAX_SIZE) { | 88 | 0 | return context->get_num_args() - 1; | 89 | 0 | } | 90 | 181 | size_t sz = 0; | 91 | 631 | for (int i = 1; i < context->get_num_args(); ++i) { | 92 | 450 | const auto& const_column_ptr = context->get_constant_col(i); | 93 | 450 | if (const_column_ptr != nullptr) { | 94 | 450 | auto const_data = const_column_ptr->column_ptr->get_data_at(0); | 95 | 450 | if (const_data.data != nullptr) { | 96 | 429 | sz++; | 97 | 429 | } | 98 | 450 | } | 99 | 450 | } | 100 | 181 | return sz; | 101 | 181 | } |
|
102 | | |
103 | 14.3k | Status open(FunctionContext* context, FunctionContext::FunctionStateScope scope) override { |
104 | 14.3k | if (scope == FunctionContext::THREAD_LOCAL) { |
105 | 12.4k | return Status::OK(); |
106 | 12.4k | } |
107 | 1.91k | std::shared_ptr<InState> state = std::make_shared<InState>(); |
108 | 1.91k | context->set_function_state(scope, state); |
109 | 1.91k | DCHECK(context->get_num_args() >= 1); |
110 | 1.91k | if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_NULL) { |
111 | 0 | state->hybrid_set.reset(create_set(TYPE_BOOLEAN, 0, true)); |
112 | 1.91k | } else if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_CHAR || |
113 | 1.91k | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_VARCHAR || |
114 | 1.91k | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_STRING) { |
115 | | // the StringValue's memory is held by FunctionContext, so we can use StringValueSet here directly |
116 | 515 | state->hybrid_set.reset(create_string_value_set(get_size_with_out_null(context), true)); |
117 | 1.40k | } else { |
118 | 1.40k | state->hybrid_set.reset(create_set(context->get_arg_type(0)->get_primitive_type(), |
119 | 1.40k | get_size_with_out_null(context), true)); |
120 | 1.40k | } |
121 | | |
122 | 6.59k | for (int i = 1; i < context->get_num_args(); ++i) { |
123 | 4.67k | const auto& const_column_ptr = context->get_constant_col(i); |
124 | 4.67k | if (const_column_ptr != nullptr) { |
125 | 4.67k | auto const_data = const_column_ptr->column_ptr->get_data_at(0); |
126 | 4.67k | state->hybrid_set->insert((void*)const_data.data, const_data.size); |
127 | 4.67k | } else { |
128 | 1 | state->use_set = false; |
129 | 1 | state->hybrid_set.reset(); |
130 | 1 | break; |
131 | 1 | } |
132 | 4.67k | } |
133 | 1.91k | return Status::OK(); |
134 | 14.3k | } _ZN5doris10FunctionInILb0EE4openEPNS_15FunctionContextENS2_18FunctionStateScopeE Line | Count | Source | 103 | 11.7k | Status open(FunctionContext* context, FunctionContext::FunctionStateScope scope) override { | 104 | 11.7k | if (scope == FunctionContext::THREAD_LOCAL) { | 105 | 10.0k | return Status::OK(); | 106 | 10.0k | } | 107 | 1.73k | std::shared_ptr<InState> state = std::make_shared<InState>(); | 108 | 1.73k | context->set_function_state(scope, state); | 109 | 1.73k | DCHECK(context->get_num_args() >= 1); | 110 | 1.73k | if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_NULL) { | 111 | 0 | state->hybrid_set.reset(create_set(TYPE_BOOLEAN, 0, true)); | 112 | 1.73k | } else if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_CHAR || | 113 | 1.73k | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_VARCHAR || | 114 | 1.73k | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_STRING) { | 115 | | // the StringValue's memory is held by FunctionContext, so we can use StringValueSet here directly | 116 | 428 | state->hybrid_set.reset(create_string_value_set(get_size_with_out_null(context), true)); | 117 | 1.30k | } else { | 118 | 1.30k | state->hybrid_set.reset(create_set(context->get_arg_type(0)->get_primitive_type(), | 119 | 1.30k | get_size_with_out_null(context), true)); | 120 | 1.30k | } | 121 | | | 122 | 5.95k | for (int i = 1; i < context->get_num_args(); ++i) { | 123 | 4.22k | const auto& const_column_ptr = context->get_constant_col(i); | 124 | 4.22k | if (const_column_ptr != nullptr) { | 125 | 4.22k | auto const_data = const_column_ptr->column_ptr->get_data_at(0); | 126 | 4.22k | state->hybrid_set->insert((void*)const_data.data, const_data.size); | 127 | 4.22k | } else { | 128 | 1 | state->use_set = false; | 129 | 1 | state->hybrid_set.reset(); | 130 | 1 | break; | 131 | 1 | } | 132 | 4.22k | } | 133 | 1.73k | return Status::OK(); | 134 | 11.7k | } |
_ZN5doris10FunctionInILb1EE4openEPNS_15FunctionContextENS2_18FunctionStateScopeE Line | Count | Source | 103 | 2.56k | Status open(FunctionContext* context, FunctionContext::FunctionStateScope scope) override { | 104 | 2.56k | if (scope == FunctionContext::THREAD_LOCAL) { | 105 | 2.38k | return Status::OK(); | 106 | 2.38k | } | 107 | 183 | std::shared_ptr<InState> state = std::make_shared<InState>(); | 108 | 183 | context->set_function_state(scope, state); | 109 | 183 | DCHECK(context->get_num_args() >= 1); | 110 | 183 | if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_NULL) { | 111 | 0 | state->hybrid_set.reset(create_set(TYPE_BOOLEAN, 0, true)); | 112 | 183 | } else if (context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_CHAR || | 113 | 183 | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_VARCHAR || | 114 | 183 | context->get_arg_type(0)->get_primitive_type() == PrimitiveType::TYPE_STRING) { | 115 | | // the StringValue's memory is held by FunctionContext, so we can use StringValueSet here directly | 116 | 87 | state->hybrid_set.reset(create_string_value_set(get_size_with_out_null(context), true)); | 117 | 96 | } else { | 118 | 96 | state->hybrid_set.reset(create_set(context->get_arg_type(0)->get_primitive_type(), | 119 | 96 | get_size_with_out_null(context), true)); | 120 | 96 | } | 121 | | | 122 | 633 | for (int i = 1; i < context->get_num_args(); ++i) { | 123 | 450 | const auto& const_column_ptr = context->get_constant_col(i); | 124 | 450 | if (const_column_ptr != nullptr) { | 125 | 450 | auto const_data = const_column_ptr->column_ptr->get_data_at(0); | 126 | 450 | state->hybrid_set->insert((void*)const_data.data, const_data.size); | 127 | 450 | } else { | 128 | 0 | state->use_set = false; | 129 | 0 | state->hybrid_set.reset(); | 130 | 0 | break; | 131 | 0 | } | 132 | 450 | } | 133 | 183 | return Status::OK(); | 134 | 2.56k | } |
|
135 | | |
136 | | Status evaluate_inverted_index( |
137 | | const ColumnsWithTypeAndName& arguments, |
138 | | const std::vector<IndexFieldNameAndTypePair>& data_type_with_names, |
139 | | std::vector<segment_v2::IndexIterator*> iterators, uint32_t num_rows, |
140 | | const InvertedIndexAnalyzerCtx* analyzer_ctx, |
141 | 712 | segment_v2::InvertedIndexResultBitmap& bitmap_result) const override { |
142 | 712 | DCHECK(data_type_with_names.size() == 1); |
143 | 712 | DCHECK(iterators.size() == 1); |
144 | 712 | auto* iter = iterators[0]; |
145 | 712 | auto data_type_with_name = data_type_with_names[0]; |
146 | 712 | std::shared_ptr<roaring::Roaring> roaring = std::make_shared<roaring::Roaring>(); |
147 | 712 | std::shared_ptr<roaring::Roaring> null_bitmap = std::make_shared<roaring::Roaring>(); |
148 | | |
149 | 712 | if (iter == nullptr) { |
150 | 0 | return Status::OK(); |
151 | 0 | } |
152 | 712 | if (!segment_v2::IndexReaderHelper::has_string_or_bkd_index(iter)) { |
153 | | //NOT support in list when parser is FULLTEXT for expr inverted index evaluate. |
154 | 140 | return Status::OK(); |
155 | 140 | } |
156 | 575 | if (iter->has_null()) { |
157 | 575 | segment_v2::InvertedIndexQueryCacheHandle null_bitmap_cache_handle; |
158 | 575 | RETURN_IF_ERROR(iter->read_null_bitmap(&null_bitmap_cache_handle)); |
159 | 575 | null_bitmap = null_bitmap_cache_handle.get_bitmap(); |
160 | 575 | } |
161 | 718 | for (const auto& arg : arguments) { |
162 | 718 | Field param_value; |
163 | 718 | arg.column->get(0, param_value); |
164 | 718 | auto param_type = arg.type->get_primitive_type(); |
165 | 718 | if (param_value.is_null()) { |
166 | | // predicate like column NOT IN (NULL, '') should not push down to index. |
167 | 508 | if (negative) { |
168 | 505 | return Status::OK(); |
169 | 505 | } |
170 | 3 | *roaring |= *null_bitmap; |
171 | 3 | continue; |
172 | 508 | } |
173 | 210 | std::unique_ptr<InvertedIndexQueryParamFactory> query_param = nullptr; |
174 | 210 | RETURN_IF_ERROR(InvertedIndexQueryParamFactory::create_query_value( |
175 | 210 | param_type, ¶m_value, query_param)); |
176 | 210 | InvertedIndexQueryType query_type = InvertedIndexQueryType::EQUAL_QUERY; |
177 | 210 | segment_v2::InvertedIndexParam param; |
178 | 210 | param.column_name = data_type_with_name.first; |
179 | 210 | param.column_type = data_type_with_name.second; |
180 | 210 | param.query_value = query_param->get_value(); |
181 | 210 | param.query_type = query_type; |
182 | 210 | param.num_rows = num_rows; |
183 | 210 | param.roaring = std::make_shared<roaring::Roaring>(); |
184 | 210 | param.analyzer_ctx = analyzer_ctx; |
185 | 210 | RETURN_IF_ERROR(iter->read_from_index(segment_v2::IndexParam {¶m})); |
186 | 203 | *roaring |= *param.roaring; |
187 | 203 | } |
188 | 60 | segment_v2::InvertedIndexResultBitmap result(roaring, null_bitmap); |
189 | 60 | bitmap_result = result; |
190 | 60 | bitmap_result.mask_out_null(); |
191 | 60 | if constexpr (negative) { |
192 | 29 | roaring::Roaring full_result; |
193 | 29 | full_result.addRange(0, num_rows); |
194 | 29 | bitmap_result.op_not(&full_result); |
195 | 29 | } |
196 | 60 | return Status::OK(); |
197 | 572 | } _ZNK5doris10FunctionInILb0EE23evaluate_inverted_indexERKSt6vectorINS_21ColumnWithTypeAndNameESaIS3_EERKS2_ISt4pairINSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEEESt10shared_ptrIKNS_9IDataTypeEEESaISJ_EES2_IPNS_10segment_v213IndexIteratorESaISQ_EEjPKNS_24InvertedIndexAnalyzerCtxERNSO_25InvertedIndexResultBitmapE Line | Count | Source | 141 | 95 | segment_v2::InvertedIndexResultBitmap& bitmap_result) const override { | 142 | 95 | DCHECK(data_type_with_names.size() == 1); | 143 | 95 | DCHECK(iterators.size() == 1); | 144 | 95 | auto* iter = iterators[0]; | 145 | 95 | auto data_type_with_name = data_type_with_names[0]; | 146 | 95 | std::shared_ptr<roaring::Roaring> roaring = std::make_shared<roaring::Roaring>(); | 147 | 95 | std::shared_ptr<roaring::Roaring> null_bitmap = std::make_shared<roaring::Roaring>(); | 148 | | | 149 | 95 | if (iter == nullptr) { | 150 | 0 | return Status::OK(); | 151 | 0 | } | 152 | 95 | if (!segment_v2::IndexReaderHelper::has_string_or_bkd_index(iter)) { | 153 | | //NOT support in list when parser is FULLTEXT for expr inverted index evaluate. | 154 | 64 | return Status::OK(); | 155 | 64 | } | 156 | 33 | if (iter->has_null()) { | 157 | 33 | segment_v2::InvertedIndexQueryCacheHandle null_bitmap_cache_handle; | 158 | 33 | RETURN_IF_ERROR(iter->read_null_bitmap(&null_bitmap_cache_handle)); | 159 | 33 | null_bitmap = null_bitmap_cache_handle.get_bitmap(); | 160 | 33 | } | 161 | 66 | for (const auto& arg : arguments) { | 162 | 66 | Field param_value; | 163 | 66 | arg.column->get(0, param_value); | 164 | 66 | auto param_type = arg.type->get_primitive_type(); | 165 | 66 | if (param_value.is_null()) { | 166 | | // predicate like column NOT IN (NULL, '') should not push down to index. | 167 | 3 | if (negative) { | 168 | 0 | return Status::OK(); | 169 | 0 | } | 170 | 3 | *roaring |= *null_bitmap; | 171 | 3 | continue; | 172 | 3 | } | 173 | 63 | std::unique_ptr<InvertedIndexQueryParamFactory> query_param = nullptr; | 174 | 63 | RETURN_IF_ERROR(InvertedIndexQueryParamFactory::create_query_value( | 175 | 63 | param_type, ¶m_value, query_param)); | 176 | 63 | InvertedIndexQueryType query_type = InvertedIndexQueryType::EQUAL_QUERY; | 177 | 63 | segment_v2::InvertedIndexParam param; | 178 | 63 | param.column_name = data_type_with_name.first; | 179 | 63 | param.column_type = data_type_with_name.second; | 180 | 63 | param.query_value = query_param->get_value(); | 181 | 63 | param.query_type = query_type; | 182 | 63 | param.num_rows = num_rows; | 183 | 63 | param.roaring = std::make_shared<roaring::Roaring>(); | 184 | 63 | param.analyzer_ctx = analyzer_ctx; | 185 | 63 | RETURN_IF_ERROR(iter->read_from_index(segment_v2::IndexParam {¶m})); | 186 | 63 | *roaring |= *param.roaring; | 187 | 63 | } | 188 | 31 | segment_v2::InvertedIndexResultBitmap result(roaring, null_bitmap); | 189 | 31 | bitmap_result = result; | 190 | 31 | bitmap_result.mask_out_null(); | 191 | | if constexpr (negative) { | 192 | | roaring::Roaring full_result; | 193 | | full_result.addRange(0, num_rows); | 194 | | bitmap_result.op_not(&full_result); | 195 | | } | 196 | 31 | return Status::OK(); | 197 | 31 | } |
_ZNK5doris10FunctionInILb1EE23evaluate_inverted_indexERKSt6vectorINS_21ColumnWithTypeAndNameESaIS3_EERKS2_ISt4pairINSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEEESt10shared_ptrIKNS_9IDataTypeEEESaISJ_EES2_IPNS_10segment_v213IndexIteratorESaISQ_EEjPKNS_24InvertedIndexAnalyzerCtxERNSO_25InvertedIndexResultBitmapE Line | Count | Source | 141 | 617 | segment_v2::InvertedIndexResultBitmap& bitmap_result) const override { | 142 | 617 | DCHECK(data_type_with_names.size() == 1); | 143 | 617 | DCHECK(iterators.size() == 1); | 144 | 617 | auto* iter = iterators[0]; | 145 | 617 | auto data_type_with_name = data_type_with_names[0]; | 146 | 617 | std::shared_ptr<roaring::Roaring> roaring = std::make_shared<roaring::Roaring>(); | 147 | 617 | std::shared_ptr<roaring::Roaring> null_bitmap = std::make_shared<roaring::Roaring>(); | 148 | | | 149 | 617 | if (iter == nullptr) { | 150 | 0 | return Status::OK(); | 151 | 0 | } | 152 | 617 | if (!segment_v2::IndexReaderHelper::has_string_or_bkd_index(iter)) { | 153 | | //NOT support in list when parser is FULLTEXT for expr inverted index evaluate. | 154 | 76 | return Status::OK(); | 155 | 76 | } | 156 | 542 | if (iter->has_null()) { | 157 | 542 | segment_v2::InvertedIndexQueryCacheHandle null_bitmap_cache_handle; | 158 | 542 | RETURN_IF_ERROR(iter->read_null_bitmap(&null_bitmap_cache_handle)); | 159 | 542 | null_bitmap = null_bitmap_cache_handle.get_bitmap(); | 160 | 542 | } | 161 | 652 | for (const auto& arg : arguments) { | 162 | 652 | Field param_value; | 163 | 652 | arg.column->get(0, param_value); | 164 | 652 | auto param_type = arg.type->get_primitive_type(); | 165 | 652 | if (param_value.is_null()) { | 166 | | // predicate like column NOT IN (NULL, '') should not push down to index. | 167 | 505 | if (negative) { | 168 | 505 | return Status::OK(); | 169 | 505 | } | 170 | 0 | *roaring |= *null_bitmap; | 171 | 0 | continue; | 172 | 505 | } | 173 | 147 | std::unique_ptr<InvertedIndexQueryParamFactory> query_param = nullptr; | 174 | 147 | RETURN_IF_ERROR(InvertedIndexQueryParamFactory::create_query_value( | 175 | 147 | param_type, ¶m_value, query_param)); | 176 | 147 | InvertedIndexQueryType query_type = InvertedIndexQueryType::EQUAL_QUERY; | 177 | 147 | segment_v2::InvertedIndexParam param; | 178 | 147 | param.column_name = data_type_with_name.first; | 179 | 147 | param.column_type = data_type_with_name.second; | 180 | 147 | param.query_value = query_param->get_value(); | 181 | 147 | param.query_type = query_type; | 182 | 147 | param.num_rows = num_rows; | 183 | 147 | param.roaring = std::make_shared<roaring::Roaring>(); | 184 | 147 | param.analyzer_ctx = analyzer_ctx; | 185 | 147 | RETURN_IF_ERROR(iter->read_from_index(segment_v2::IndexParam {¶m})); | 186 | 140 | *roaring |= *param.roaring; | 187 | 140 | } | 188 | 29 | segment_v2::InvertedIndexResultBitmap result(roaring, null_bitmap); | 189 | 29 | bitmap_result = result; | 190 | 29 | bitmap_result.mask_out_null(); | 191 | 29 | if constexpr (negative) { | 192 | 29 | roaring::Roaring full_result; | 193 | 29 | full_result.addRange(0, num_rows); | 194 | 29 | bitmap_result.op_not(&full_result); | 195 | 29 | } | 196 | 29 | return Status::OK(); | 197 | 541 | } |
|
198 | | |
199 | | Status execute_impl(FunctionContext* context, Block& block, const ColumnNumbers& arguments, |
200 | 18.2k | uint32_t result, size_t input_rows_count) const override { |
201 | 18.2k | auto* in_state = reinterpret_cast<InState*>( |
202 | 18.2k | context->get_function_state(FunctionContext::FRAGMENT_LOCAL)); |
203 | 18.2k | if (!in_state) { |
204 | 0 | return Status::RuntimeError("funciton context for function '{}' must have Set;", |
205 | 0 | get_name()); |
206 | 0 | } |
207 | 18.2k | auto res = ColumnUInt8::create(); |
208 | 18.2k | ColumnUInt8::Container& vec_res = res->get_data(); |
209 | 18.2k | vec_res.resize(input_rows_count); |
210 | | |
211 | 18.2k | ColumnUInt8::MutablePtr col_null_map_to; |
212 | 18.2k | col_null_map_to = ColumnUInt8::create(input_rows_count, false); |
213 | 18.2k | auto& vec_null_map_to = col_null_map_to->get_data(); |
214 | | |
215 | 18.2k | const ColumnWithTypeAndName& left_arg = block.get_by_position(arguments[0]); |
216 | 18.2k | const auto& [materialized_column, col_const] = unpack_if_const(left_arg.column); |
217 | | |
218 | 18.2k | if (in_state->use_set) { |
219 | 18.2k | if (materialized_column->is_nullable()) { |
220 | 17.6k | const auto* null_col_ptr = |
221 | 17.6k | check_and_get_column<ColumnNullable>(materialized_column.get()); |
222 | 17.6k | const auto& null_map = null_col_ptr->get_null_map_column().get_data(); |
223 | 17.6k | const auto* nested_col_ptr = null_col_ptr->get_nested_column_ptr().get(); |
224 | | |
225 | 17.6k | if (nested_col_ptr->is_column_string()) { |
226 | 1.97k | const auto* column_string_ptr = |
227 | 1.97k | assert_cast<const ColumnString*>(nested_col_ptr); |
228 | 1.97k | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, |
229 | 1.97k | column_string_ptr); |
230 | 15.6k | } else { |
231 | | //TODO: support other column type |
232 | 15.6k | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, |
233 | 15.6k | nested_col_ptr); |
234 | 15.6k | } |
235 | | |
236 | 17.6k | if (!in_state->hybrid_set->contain_null()) { |
237 | 3.17M | for (size_t i = 0; i < input_rows_count; ++i) { |
238 | 3.15M | vec_null_map_to[i] = null_map[i]; |
239 | 3.15M | } |
240 | 16.7k | } else { |
241 | 32.3k | for (size_t i = 0; i < input_rows_count; ++i) { |
242 | 31.5k | vec_null_map_to[i] = null_map[i] || negative == vec_res[i]; |
243 | 31.5k | } |
244 | 847 | } |
245 | | |
246 | 17.6k | } else { // non-nullable |
247 | 621 | if (is_string_type(left_arg.type->get_primitive_type())) { |
248 | 349 | const auto* column_string_ptr = |
249 | 349 | assert_cast<const ColumnString*>(materialized_column.get()); |
250 | 349 | search_hash_set(in_state, input_rows_count, vec_res, column_string_ptr); |
251 | 349 | } else { |
252 | 272 | search_hash_set(in_state, input_rows_count, vec_res, materialized_column.get()); |
253 | 272 | } |
254 | | |
255 | 621 | if (in_state->hybrid_set->contain_null()) { |
256 | 81 | for (size_t i = 0; i < input_rows_count; ++i) { |
257 | 51 | vec_null_map_to[i] = negative == vec_res[i]; |
258 | 51 | } |
259 | 30 | } |
260 | 621 | } |
261 | 18.2k | } else { //!in_state->use_set |
262 | 0 | std::vector<ColumnPtr> set_columns; |
263 | 2 | for (int i = 1; i < arguments.size(); ++i) { |
264 | 2 | set_columns.emplace_back(block.get_by_position(arguments[i]).column); |
265 | 2 | } |
266 | 0 | if (col_const) { |
267 | 0 | impl_without_set<true>(context, set_columns, input_rows_count, vec_res, |
268 | 0 | vec_null_map_to, materialized_column); |
269 | 0 | } else { |
270 | 0 | impl_without_set<false>(context, set_columns, input_rows_count, vec_res, |
271 | 0 | vec_null_map_to, materialized_column); |
272 | 0 | } |
273 | 0 | } |
274 | | |
275 | 18.2k | if (block.get_by_position(result).type->is_nullable()) { |
276 | 17.6k | block.replace_by_position( |
277 | 17.6k | result, ColumnNullable::create(std::move(res), std::move(col_null_map_to))); |
278 | 17.6k | } else { |
279 | 590 | block.replace_by_position(result, std::move(res)); |
280 | 590 | } |
281 | | |
282 | 18.2k | return Status::OK(); |
283 | 18.2k | } _ZNK5doris10FunctionInILb0EE12execute_implEPNS_15FunctionContextERNS_5BlockERKSt6vectorIjSaIjEEjm Line | Count | Source | 200 | 17.4k | uint32_t result, size_t input_rows_count) const override { | 201 | 17.4k | auto* in_state = reinterpret_cast<InState*>( | 202 | 17.4k | context->get_function_state(FunctionContext::FRAGMENT_LOCAL)); | 203 | 17.4k | if (!in_state) { | 204 | 0 | return Status::RuntimeError("funciton context for function '{}' must have Set;", | 205 | 0 | get_name()); | 206 | 0 | } | 207 | 17.4k | auto res = ColumnUInt8::create(); | 208 | 17.4k | ColumnUInt8::Container& vec_res = res->get_data(); | 209 | 17.4k | vec_res.resize(input_rows_count); | 210 | | | 211 | 17.4k | ColumnUInt8::MutablePtr col_null_map_to; | 212 | 17.4k | col_null_map_to = ColumnUInt8::create(input_rows_count, false); | 213 | 17.4k | auto& vec_null_map_to = col_null_map_to->get_data(); | 214 | | | 215 | 17.4k | const ColumnWithTypeAndName& left_arg = block.get_by_position(arguments[0]); | 216 | 17.4k | const auto& [materialized_column, col_const] = unpack_if_const(left_arg.column); | 217 | | | 218 | 17.4k | if (in_state->use_set) { | 219 | 17.4k | if (materialized_column->is_nullable()) { | 220 | 16.8k | const auto* null_col_ptr = | 221 | 16.8k | check_and_get_column<ColumnNullable>(materialized_column.get()); | 222 | 16.8k | const auto& null_map = null_col_ptr->get_null_map_column().get_data(); | 223 | 16.8k | const auto* nested_col_ptr = null_col_ptr->get_nested_column_ptr().get(); | 224 | | | 225 | 16.8k | if (nested_col_ptr->is_column_string()) { | 226 | 1.33k | const auto* column_string_ptr = | 227 | 1.33k | assert_cast<const ColumnString*>(nested_col_ptr); | 228 | 1.33k | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, | 229 | 1.33k | column_string_ptr); | 230 | 15.5k | } else { | 231 | | //TODO: support other column type | 232 | 15.5k | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, | 233 | 15.5k | nested_col_ptr); | 234 | 15.5k | } | 235 | | | 236 | 16.8k | if (!in_state->hybrid_set->contain_null()) { | 237 | 3.15M | for (size_t i = 0; i < input_rows_count; ++i) { | 238 | 3.13M | vec_null_map_to[i] = null_map[i]; | 239 | 3.13M | } | 240 | 16.5k | } else { | 241 | 20.5k | for (size_t i = 0; i < input_rows_count; ++i) { | 242 | 20.2k | vec_null_map_to[i] = null_map[i] || negative == vec_res[i]; | 243 | 20.2k | } | 244 | 342 | } | 245 | | | 246 | 16.8k | } else { // non-nullable | 247 | 588 | if (is_string_type(left_arg.type->get_primitive_type())) { | 248 | 349 | const auto* column_string_ptr = | 249 | 349 | assert_cast<const ColumnString*>(materialized_column.get()); | 250 | 349 | search_hash_set(in_state, input_rows_count, vec_res, column_string_ptr); | 251 | 349 | } else { | 252 | 239 | search_hash_set(in_state, input_rows_count, vec_res, materialized_column.get()); | 253 | 239 | } | 254 | | | 255 | 588 | if (in_state->hybrid_set->contain_null()) { | 256 | 2 | for (size_t i = 0; i < input_rows_count; ++i) { | 257 | 1 | vec_null_map_to[i] = negative == vec_res[i]; | 258 | 1 | } | 259 | 1 | } | 260 | 588 | } | 261 | 17.4k | } else { //!in_state->use_set | 262 | 0 | std::vector<ColumnPtr> set_columns; | 263 | 2 | for (int i = 1; i < arguments.size(); ++i) { | 264 | 2 | set_columns.emplace_back(block.get_by_position(arguments[i]).column); | 265 | 2 | } | 266 | 0 | if (col_const) { | 267 | 0 | impl_without_set<true>(context, set_columns, input_rows_count, vec_res, | 268 | 0 | vec_null_map_to, materialized_column); | 269 | 0 | } else { | 270 | 0 | impl_without_set<false>(context, set_columns, input_rows_count, vec_res, | 271 | 0 | vec_null_map_to, materialized_column); | 272 | 0 | } | 273 | 0 | } | 274 | | | 275 | 17.4k | if (block.get_by_position(result).type->is_nullable()) { | 276 | 16.8k | block.replace_by_position( | 277 | 16.8k | result, ColumnNullable::create(std::move(res), std::move(col_null_map_to))); | 278 | 16.8k | } else { | 279 | 586 | block.replace_by_position(result, std::move(res)); | 280 | 586 | } | 281 | | | 282 | 17.4k | return Status::OK(); | 283 | 17.4k | } |
_ZNK5doris10FunctionInILb1EE12execute_implEPNS_15FunctionContextERNS_5BlockERKSt6vectorIjSaIjEEjm Line | Count | Source | 200 | 806 | uint32_t result, size_t input_rows_count) const override { | 201 | 806 | auto* in_state = reinterpret_cast<InState*>( | 202 | 806 | context->get_function_state(FunctionContext::FRAGMENT_LOCAL)); | 203 | 806 | if (!in_state) { | 204 | 0 | return Status::RuntimeError("funciton context for function '{}' must have Set;", | 205 | 0 | get_name()); | 206 | 0 | } | 207 | 806 | auto res = ColumnUInt8::create(); | 208 | 806 | ColumnUInt8::Container& vec_res = res->get_data(); | 209 | 806 | vec_res.resize(input_rows_count); | 210 | | | 211 | 806 | ColumnUInt8::MutablePtr col_null_map_to; | 212 | 806 | col_null_map_to = ColumnUInt8::create(input_rows_count, false); | 213 | 806 | auto& vec_null_map_to = col_null_map_to->get_data(); | 214 | | | 215 | 806 | const ColumnWithTypeAndName& left_arg = block.get_by_position(arguments[0]); | 216 | 806 | const auto& [materialized_column, col_const] = unpack_if_const(left_arg.column); | 217 | | | 218 | 806 | if (in_state->use_set) { | 219 | 806 | if (materialized_column->is_nullable()) { | 220 | 773 | const auto* null_col_ptr = | 221 | 773 | check_and_get_column<ColumnNullable>(materialized_column.get()); | 222 | 773 | const auto& null_map = null_col_ptr->get_null_map_column().get_data(); | 223 | 773 | const auto* nested_col_ptr = null_col_ptr->get_nested_column_ptr().get(); | 224 | | | 225 | 773 | if (nested_col_ptr->is_column_string()) { | 226 | 643 | const auto* column_string_ptr = | 227 | 643 | assert_cast<const ColumnString*>(nested_col_ptr); | 228 | 643 | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, | 229 | 643 | column_string_ptr); | 230 | 643 | } else { | 231 | | //TODO: support other column type | 232 | 130 | search_hash_set_check_null(in_state, input_rows_count, vec_res, null_map, | 233 | 130 | nested_col_ptr); | 234 | 130 | } | 235 | | | 236 | 773 | if (!in_state->hybrid_set->contain_null()) { | 237 | 21.8k | for (size_t i = 0; i < input_rows_count; ++i) { | 238 | 21.5k | vec_null_map_to[i] = null_map[i]; | 239 | 21.5k | } | 240 | 505 | } else { | 241 | 11.7k | for (size_t i = 0; i < input_rows_count; ++i) { | 242 | 11.2k | vec_null_map_to[i] = null_map[i] || negative == vec_res[i]; | 243 | 11.2k | } | 244 | 505 | } | 245 | | | 246 | 773 | } else { // non-nullable | 247 | 33 | if (is_string_type(left_arg.type->get_primitive_type())) { | 248 | 0 | const auto* column_string_ptr = | 249 | 0 | assert_cast<const ColumnString*>(materialized_column.get()); | 250 | 0 | search_hash_set(in_state, input_rows_count, vec_res, column_string_ptr); | 251 | 33 | } else { | 252 | 33 | search_hash_set(in_state, input_rows_count, vec_res, materialized_column.get()); | 253 | 33 | } | 254 | | | 255 | 33 | if (in_state->hybrid_set->contain_null()) { | 256 | 79 | for (size_t i = 0; i < input_rows_count; ++i) { | 257 | 50 | vec_null_map_to[i] = negative == vec_res[i]; | 258 | 50 | } | 259 | 29 | } | 260 | 33 | } | 261 | 806 | } else { //!in_state->use_set | 262 | 0 | std::vector<ColumnPtr> set_columns; | 263 | 0 | for (int i = 1; i < arguments.size(); ++i) { | 264 | 0 | set_columns.emplace_back(block.get_by_position(arguments[i]).column); | 265 | 0 | } | 266 | 0 | if (col_const) { | 267 | 0 | impl_without_set<true>(context, set_columns, input_rows_count, vec_res, | 268 | 0 | vec_null_map_to, materialized_column); | 269 | 0 | } else { | 270 | 0 | impl_without_set<false>(context, set_columns, input_rows_count, vec_res, | 271 | 0 | vec_null_map_to, materialized_column); | 272 | 0 | } | 273 | 0 | } | 274 | | | 275 | 806 | if (block.get_by_position(result).type->is_nullable()) { | 276 | 802 | block.replace_by_position( | 277 | 802 | result, ColumnNullable::create(std::move(res), std::move(col_null_map_to))); | 278 | 802 | } else { | 279 | 4 | block.replace_by_position(result, std::move(res)); | 280 | 4 | } | 281 | | | 282 | 806 | return Status::OK(); | 283 | 806 | } |
|
284 | | |
285 | | private: |
286 | | template <typename T> |
287 | | static void search_hash_set_check_null(InState* in_state, size_t input_rows_count, |
288 | | ColumnUInt8::Container& vec_res, |
289 | 17.6k | const ColumnUInt8::Container& null_map, T* col_ptr) { |
290 | 17.6k | if constexpr (!negative) { |
291 | 16.8k | in_state->hybrid_set->find_batch_nullable(*col_ptr, input_rows_count, null_map, |
292 | 16.8k | vec_res); |
293 | 16.8k | } else { |
294 | 773 | in_state->hybrid_set->find_batch_nullable_negative(*col_ptr, input_rows_count, null_map, |
295 | 773 | vec_res); |
296 | 773 | } |
297 | 17.6k | } _ZN5doris10FunctionInILb0EE26search_hash_set_check_nullIKNS_9ColumnStrIjEEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEERKSC_PT_ Line | Count | Source | 289 | 1.33k | const ColumnUInt8::Container& null_map, T* col_ptr) { | 290 | 1.33k | if constexpr (!negative) { | 291 | 1.33k | in_state->hybrid_set->find_batch_nullable(*col_ptr, input_rows_count, null_map, | 292 | 1.33k | vec_res); | 293 | | } else { | 294 | | in_state->hybrid_set->find_batch_nullable_negative(*col_ptr, input_rows_count, null_map, | 295 | | vec_res); | 296 | | } | 297 | 1.33k | } |
_ZN5doris10FunctionInILb0EE26search_hash_set_check_nullIKNS_7IColumnEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEERKSB_PT_ Line | Count | Source | 289 | 15.5k | const ColumnUInt8::Container& null_map, T* col_ptr) { | 290 | 15.5k | if constexpr (!negative) { | 291 | 15.5k | in_state->hybrid_set->find_batch_nullable(*col_ptr, input_rows_count, null_map, | 292 | 15.5k | vec_res); | 293 | | } else { | 294 | | in_state->hybrid_set->find_batch_nullable_negative(*col_ptr, input_rows_count, null_map, | 295 | | vec_res); | 296 | | } | 297 | 15.5k | } |
_ZN5doris10FunctionInILb1EE26search_hash_set_check_nullIKNS_9ColumnStrIjEEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEERKSC_PT_ Line | Count | Source | 289 | 643 | const ColumnUInt8::Container& null_map, T* col_ptr) { | 290 | | if constexpr (!negative) { | 291 | | in_state->hybrid_set->find_batch_nullable(*col_ptr, input_rows_count, null_map, | 292 | | vec_res); | 293 | 643 | } else { | 294 | 643 | in_state->hybrid_set->find_batch_nullable_negative(*col_ptr, input_rows_count, null_map, | 295 | 643 | vec_res); | 296 | 643 | } | 297 | 643 | } |
_ZN5doris10FunctionInILb1EE26search_hash_set_check_nullIKNS_7IColumnEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEERKSB_PT_ Line | Count | Source | 289 | 130 | const ColumnUInt8::Container& null_map, T* col_ptr) { | 290 | | if constexpr (!negative) { | 291 | | in_state->hybrid_set->find_batch_nullable(*col_ptr, input_rows_count, null_map, | 292 | | vec_res); | 293 | 130 | } else { | 294 | 130 | in_state->hybrid_set->find_batch_nullable_negative(*col_ptr, input_rows_count, null_map, | 295 | 130 | vec_res); | 296 | 130 | } | 297 | 130 | } |
|
298 | | |
299 | | template <typename T> |
300 | | static void search_hash_set(InState* in_state, size_t input_rows_count, |
301 | 621 | ColumnUInt8::Container& vec_res, T* col_ptr) { |
302 | 621 | if constexpr (!negative) { |
303 | 588 | in_state->hybrid_set->find_batch(*col_ptr, input_rows_count, vec_res); |
304 | 588 | } else { |
305 | 33 | in_state->hybrid_set->find_batch_negative(*col_ptr, input_rows_count, vec_res); |
306 | 33 | } |
307 | 621 | } _ZN5doris10FunctionInILb0EE15search_hash_setIKNS_9ColumnStrIjEEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEPT_ Line | Count | Source | 301 | 349 | ColumnUInt8::Container& vec_res, T* col_ptr) { | 302 | 349 | if constexpr (!negative) { | 303 | 349 | in_state->hybrid_set->find_batch(*col_ptr, input_rows_count, vec_res); | 304 | | } else { | 305 | | in_state->hybrid_set->find_batch_negative(*col_ptr, input_rows_count, vec_res); | 306 | | } | 307 | 349 | } |
_ZN5doris10FunctionInILb0EE15search_hash_setIKNS_7IColumnEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEPT_ Line | Count | Source | 301 | 239 | ColumnUInt8::Container& vec_res, T* col_ptr) { | 302 | 239 | if constexpr (!negative) { | 303 | 239 | in_state->hybrid_set->find_batch(*col_ptr, input_rows_count, vec_res); | 304 | | } else { | 305 | | in_state->hybrid_set->find_batch_negative(*col_ptr, input_rows_count, vec_res); | 306 | | } | 307 | 239 | } |
Unexecuted instantiation: _ZN5doris10FunctionInILb1EE15search_hash_setIKNS_9ColumnStrIjEEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEPT_ _ZN5doris10FunctionInILb1EE15search_hash_setIKNS_7IColumnEEEvPNS_7InStateEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEEPT_ Line | Count | Source | 301 | 33 | ColumnUInt8::Container& vec_res, T* col_ptr) { | 302 | | if constexpr (!negative) { | 303 | | in_state->hybrid_set->find_batch(*col_ptr, input_rows_count, vec_res); | 304 | 33 | } else { | 305 | 33 | in_state->hybrid_set->find_batch_negative(*col_ptr, input_rows_count, vec_res); | 306 | 33 | } | 307 | 33 | } |
|
308 | | |
309 | | template <bool Const> |
310 | | static void impl_without_set(FunctionContext* context, |
311 | | const std::vector<ColumnPtr>& set_columns, size_t input_rows_count, |
312 | | ColumnUInt8::Container& vec_res, |
313 | | ColumnUInt8::Container& vec_null_map_to, |
314 | 1 | const ColumnPtr& materialized_column) { |
315 | 2 | for (size_t i = 0; i < input_rows_count; ++i) { |
316 | 1 | const auto& ref_data = materialized_column->get_data_at(index_check_const(i, Const)); |
317 | 1 | if (ref_data.data == nullptr) { |
318 | 0 | vec_null_map_to[i] = true; |
319 | 0 | continue; |
320 | 0 | } |
321 | | |
322 | 1 | std::vector<StringRef> set_datas; |
323 | | // To comply with the SQL standard, IN() returns NULL not only if the expression on the left hand side is NULL, |
324 | | // but also if no match is found in the list and one of the expressions in the list is NULL. |
325 | 1 | bool null_in_set = false; |
326 | | |
327 | 2 | for (const auto& set_column : set_columns) { |
328 | 2 | auto set_data = set_column->get_data_at(i); |
329 | 2 | if (set_data.data == nullptr) { |
330 | 0 | null_in_set = true; |
331 | 2 | } else { |
332 | 2 | set_datas.push_back(set_data); |
333 | 2 | } |
334 | 2 | } |
335 | 1 | std::unique_ptr<HybridSetBase> hybrid_set(create_set( |
336 | 1 | context->get_arg_type(0)->get_primitive_type(), set_datas.size(), true)); |
337 | 2 | for (auto& set_data : set_datas) { |
338 | 2 | hybrid_set->insert((void*)(set_data.data), set_data.size); |
339 | 2 | } |
340 | | |
341 | 1 | vec_res[i] = negative ^ hybrid_set->find((void*)ref_data.data, ref_data.size); |
342 | 1 | if (null_in_set) { |
343 | 0 | vec_null_map_to[i] = negative == vec_res[i]; |
344 | 1 | } else { |
345 | 1 | vec_null_map_to[i] = false; |
346 | 1 | } |
347 | 1 | } |
348 | 1 | } Unexecuted instantiation: _ZN5doris10FunctionInILb0EE16impl_without_setILb1EEEvPNS_15FunctionContextERKSt6vectorINS_3COWINS_7IColumnEE13immutable_ptrIS7_EESaISA_EEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEESK_RKSA_ _ZN5doris10FunctionInILb0EE16impl_without_setILb0EEEvPNS_15FunctionContextERKSt6vectorINS_3COWINS_7IColumnEE13immutable_ptrIS7_EESaISA_EEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEESK_RKSA_ Line | Count | Source | 314 | 1 | const ColumnPtr& materialized_column) { | 315 | 2 | for (size_t i = 0; i < input_rows_count; ++i) { | 316 | 1 | const auto& ref_data = materialized_column->get_data_at(index_check_const(i, Const)); | 317 | 1 | if (ref_data.data == nullptr) { | 318 | 0 | vec_null_map_to[i] = true; | 319 | 0 | continue; | 320 | 0 | } | 321 | | | 322 | 1 | std::vector<StringRef> set_datas; | 323 | | // To comply with the SQL standard, IN() returns NULL not only if the expression on the left hand side is NULL, | 324 | | // but also if no match is found in the list and one of the expressions in the list is NULL. | 325 | 1 | bool null_in_set = false; | 326 | | | 327 | 2 | for (const auto& set_column : set_columns) { | 328 | 2 | auto set_data = set_column->get_data_at(i); | 329 | 2 | if (set_data.data == nullptr) { | 330 | 0 | null_in_set = true; | 331 | 2 | } else { | 332 | 2 | set_datas.push_back(set_data); | 333 | 2 | } | 334 | 2 | } | 335 | 1 | std::unique_ptr<HybridSetBase> hybrid_set(create_set( | 336 | 1 | context->get_arg_type(0)->get_primitive_type(), set_datas.size(), true)); | 337 | 2 | for (auto& set_data : set_datas) { | 338 | 2 | hybrid_set->insert((void*)(set_data.data), set_data.size); | 339 | 2 | } | 340 | | | 341 | 1 | vec_res[i] = negative ^ hybrid_set->find((void*)ref_data.data, ref_data.size); | 342 | 1 | if (null_in_set) { | 343 | 0 | vec_null_map_to[i] = negative == vec_res[i]; | 344 | 1 | } else { | 345 | 1 | vec_null_map_to[i] = false; | 346 | 1 | } | 347 | 1 | } | 348 | 1 | } |
Unexecuted instantiation: _ZN5doris10FunctionInILb1EE16impl_without_setILb1EEEvPNS_15FunctionContextERKSt6vectorINS_3COWINS_7IColumnEE13immutable_ptrIS7_EESaISA_EEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEESK_RKSA_ Unexecuted instantiation: _ZN5doris10FunctionInILb1EE16impl_without_setILb0EEEvPNS_15FunctionContextERKSt6vectorINS_3COWINS_7IColumnEE13immutable_ptrIS7_EESaISA_EEmRNS_8PODArrayIhLm4096ENS_9AllocatorILb0ELb0ELb0ENS_22DefaultMemoryAllocatorELb1EEELm16ELm15EEESK_RKSA_ |
349 | | }; |
350 | | |
351 | | } // namespace doris |