Coverage Report

Created: 2026-05-24 00:06

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
be/src/format/parquet/vparquet_column_reader.cpp
Line
Count
Source
1
// Licensed to the Apache Software Foundation (ASF) under one
2
// or more contributor license agreements.  See the NOTICE file
3
// distributed with this work for additional information
4
// regarding copyright ownership.  The ASF licenses this file
5
// to you under the Apache License, Version 2.0 (the
6
// "License"); you may not use this file except in compliance
7
// with the License.  You may obtain a copy of the License at
8
//
9
//   http://www.apache.org/licenses/LICENSE-2.0
10
//
11
// Unless required by applicable law or agreed to in writing,
12
// software distributed under the License is distributed on an
13
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
// KIND, either express or implied.  See the License for the
15
// specific language governing permissions and limitations
16
// under the License.
17
18
#include "format/parquet/vparquet_column_reader.h"
19
20
#include <gen_cpp/parquet_types.h>
21
#include <limits.h>
22
#include <sys/types.h>
23
24
#include <algorithm>
25
#include <utility>
26
27
#include "common/status.h"
28
#include "core/column/column.h"
29
#include "core/column/column_array.h"
30
#include "core/column/column_map.h"
31
#include "core/column/column_nullable.h"
32
#include "core/column/column_struct.h"
33
#include "core/data_type/data_type_array.h"
34
#include "core/data_type/data_type_map.h"
35
#include "core/data_type/data_type_nullable.h"
36
#include "core/data_type/data_type_struct.h"
37
#include "core/data_type/define_primitive_type.h"
38
#include "format/parquet/level_decoder.h"
39
#include "format/parquet/schema_desc.h"
40
#include "format/parquet/vparquet_column_chunk_reader.h"
41
#include "io/fs/tracing_file_reader.h"
42
#include "runtime/runtime_profile.h"
43
44
namespace doris {
45
static void fill_struct_null_map(FieldSchema* field, NullMap& null_map,
46
                                 const std::vector<level_t>& rep_levels,
47
11
                                 const std::vector<level_t>& def_levels) {
48
11
    size_t num_levels = def_levels.size();
49
11
    DCHECK_EQ(num_levels, rep_levels.size());
50
11
    size_t origin_size = null_map.size();
51
11
    null_map.resize(origin_size + num_levels);
52
11
    size_t pos = origin_size;
53
26
    for (size_t i = 0; i < num_levels; ++i) {
54
        // skip the levels affect its ancestor or its descendants
55
15
        if (def_levels[i] < field->repeated_parent_def_level ||
56
15
            rep_levels[i] > field->repetition_level) {
57
0
            continue;
58
0
        }
59
15
        if (def_levels[i] >= field->definition_level) {
60
15
            null_map[pos++] = 0;
61
15
        } else {
62
0
            null_map[pos++] = 1;
63
0
        }
64
15
    }
65
11
    null_map.resize(pos);
66
11
}
67
68
static void fill_array_offset(FieldSchema* field, ColumnArray::Offsets64& offsets_data,
69
                              NullMap* null_map_ptr, const std::vector<level_t>& rep_levels,
70
2
                              const std::vector<level_t>& def_levels) {
71
2
    size_t num_levels = rep_levels.size();
72
2
    DCHECK_EQ(num_levels, def_levels.size());
73
2
    size_t origin_size = offsets_data.size();
74
2
    offsets_data.resize(origin_size + num_levels);
75
2
    if (null_map_ptr != nullptr) {
76
2
        null_map_ptr->resize(origin_size + num_levels);
77
2
    }
78
2
    size_t offset_pos = origin_size - 1;
79
8
    for (size_t i = 0; i < num_levels; ++i) {
80
        // skip the levels affect its ancestor or its descendants
81
6
        if (def_levels[i] < field->repeated_parent_def_level ||
82
6
            rep_levels[i] > field->repetition_level) {
83
0
            continue;
84
0
        }
85
6
        if (rep_levels[i] == field->repetition_level) {
86
4
            offsets_data[offset_pos]++;
87
4
            continue;
88
4
        }
89
2
        offset_pos++;
90
2
        offsets_data[offset_pos] = offsets_data[offset_pos - 1];
91
2
        if (def_levels[i] >= field->definition_level) {
92
2
            offsets_data[offset_pos]++;
93
2
        }
94
2
        if (def_levels[i] >= field->definition_level - 1) {
95
2
            (*null_map_ptr)[offset_pos] = 0;
96
2
        } else {
97
0
            (*null_map_ptr)[offset_pos] = 1;
98
0
        }
99
2
    }
100
2
    offsets_data.resize(offset_pos + 1);
101
2
    if (null_map_ptr != nullptr) {
102
2
        null_map_ptr->resize(offset_pos + 1);
103
2
    }
104
2
}
105
106
/**
 * Build the reader tree for `field` and store its root in `reader`.
 *
 * Dispatches on the field's primitive type:
 *  - TYPE_ARRAY:  one child reader for `children[0]`, wrapped in an ArrayColumnReader.
 *  - TYPE_MAP:    child readers for `children[0]` (key) and `children[1]` (value),
 *                 wrapped in a MapColumnReader.
 *  - TYPE_STRUCT: one child reader per child, keyed by child name, wrapped in a
 *                 StructColumnReader.
 *  - otherwise:   a ScalarColumnReader specialised on `in_collection` and on
 *                 whether `col_offsets` has an entry for the field's physical
 *                 column index.
 *
 * Array and map children are always created with `in_collection == true`;
 * struct children inherit the caller's `in_collection`.
 *
 * @param column_ids        When non-empty, map/struct children whose column id
 *                          is not in the set get a SkipReadingReader instead of
 *                          a real reader. An empty set selects every child.
 * @param filter_column_ids Copied into `_filter_column_ids` of the created readers.
 * @return The first non-OK status produced while creating or initialising a
 *         reader, otherwise Status::OK().
 */
Status ParquetColumnReader::create(io::FileReaderSPtr file, FieldSchema* field,
                                   const tparquet::RowGroup& row_group, const RowRanges& row_ranges,
                                   const cctz::time_zone* ctz, io::IOContext* io_ctx,
                                   std::unique_ptr<ParquetColumnReader>& reader,
                                   size_t max_buf_size,
                                   std::unordered_map<int, tparquet::OffsetIndex>& col_offsets,
                                   RuntimeState* state, bool in_collection,
                                   const std::set<uint64_t>& column_ids,
                                   const std::set<uint64_t>& filter_column_ids) {
    size_t total_rows = row_group.num_rows;
    const auto primitive_type = field->data_type->get_primitive_type();

    // A child is read for real when no projection is given or when it is projected.
    auto is_selected = [&column_ids](FieldSchema& child) {
        return column_ids.empty() || column_ids.find(child.get_column_id()) != column_ids.end();
    };

    if (primitive_type == TYPE_ARRAY) {
        std::unique_ptr<ParquetColumnReader> element_reader;
        RETURN_IF_ERROR(create(file, &field->children[0], row_group, row_ranges, ctz, io_ctx,
                               element_reader, max_buf_size, col_offsets, state, true, column_ids,
                               filter_column_ids));
        auto array_reader = ArrayColumnReader::create_unique(row_ranges, total_rows, ctz, io_ctx);
        element_reader->set_column_in_nested();
        RETURN_IF_ERROR(array_reader->init(std::move(element_reader), field));
        array_reader->_filter_column_ids = filter_column_ids;
        reader.reset(array_reader.release());
    } else if (primitive_type == TYPE_MAP) {
        // Builds the reader for one map child. Passing the child schema exactly once
        // guarantees that a skipped child's SkipReadingReader is bound to that child's
        // own schema (previously the skipped value reader was bound to the key schema).
        auto make_map_child = [&](FieldSchema& child,
                                  std::unique_ptr<ParquetColumnReader>& out) -> Status {
            if (is_selected(child)) {
                RETURN_IF_ERROR(create(file, &child, row_group, row_ranges, ctz, io_ctx, out,
                                       max_buf_size, col_offsets, state, true, column_ids,
                                       filter_column_ids));
            } else {
                out = std::make_unique<SkipReadingReader>(row_ranges, total_rows, ctz, io_ctx,
                                                          &child);
            }
            return Status::OK();
        };

        std::unique_ptr<ParquetColumnReader> key_reader;
        std::unique_ptr<ParquetColumnReader> value_reader;
        RETURN_IF_ERROR(make_map_child(field->children[0], key_reader));
        RETURN_IF_ERROR(make_map_child(field->children[1], value_reader));

        auto map_reader = MapColumnReader::create_unique(row_ranges, total_rows, ctz, io_ctx);
        key_reader->set_column_in_nested();
        value_reader->set_column_in_nested();
        RETURN_IF_ERROR(map_reader->init(std::move(key_reader), std::move(value_reader), field));
        map_reader->_filter_column_ids = filter_column_ids;
        reader.reset(map_reader.release());
    } else if (primitive_type == TYPE_STRUCT) {
        std::unordered_map<std::string, std::unique_ptr<ParquetColumnReader>> child_readers;
        child_readers.reserve(field->children.size());
        // Becomes true once at least one child got a real (non-skipping) reader.
        bool has_real_child_reader = false;
        for (auto& child : field->children) {
            if (is_selected(child)) {
                std::unique_ptr<ParquetColumnReader> child_reader;
                RETURN_IF_ERROR(create(file, &child, row_group, row_ranges, ctz, io_ctx,
                                       child_reader, max_buf_size, col_offsets, state,
                                       in_collection, column_ids, filter_column_ids));
                child_readers[child.name] = std::move(child_reader);
                has_real_child_reader = true;
            } else {
                auto skip_reader = std::make_unique<SkipReadingReader>(row_ranges, total_rows, ctz,
                                                                       io_ctx, &child);
                skip_reader->_filter_column_ids = filter_column_ids;
                child_readers[child.name] = std::move(skip_reader);
            }
            child_readers[child.name]->set_column_in_nested();
        }
        // If all children are SkipReadingReader, force the first child to be read for
        // real by replacing its skip reader with a reader built through create().
        if (!has_real_child_reader) {
            std::unique_ptr<ParquetColumnReader> child_reader;
            RETURN_IF_ERROR(create(file, &field->children[0], row_group, row_ranges, ctz, io_ctx,
                                   child_reader, max_buf_size, col_offsets, state, in_collection,
                                   column_ids, filter_column_ids));
            child_reader->set_column_in_nested();
            child_readers[field->children[0].name] = std::move(child_reader);
        }
        auto struct_reader = StructColumnReader::create_unique(row_ranges, total_rows, ctz, io_ctx);
        RETURN_IF_ERROR(struct_reader->init(std::move(child_readers), field));
        struct_reader->_filter_column_ids = filter_column_ids;
        reader.reset(struct_reader.release());
    } else {
        auto physical_index = field->physical_column_index;
        // Single lookup: a missing entry means the column has no offset index.
        const auto offset_it = col_offsets.find(physical_index);
        const tparquet::OffsetIndex* offset_index =
                offset_it != col_offsets.end() ? &offset_it->second : nullptr;

        const tparquet::ColumnChunk& chunk = row_group.columns[physical_index];

        // Shared tail for all four ScalarColumnReader specialisations:
        // initialise the reader, attach the filter columns and hand it to the caller.
        auto install_scalar_reader = [&](auto scalar_reader) -> Status {
            RETURN_IF_ERROR(scalar_reader->init(file, field, max_buf_size, state));
            scalar_reader->_filter_column_ids = filter_column_ids;
            reader.reset(scalar_reader.release());
            return Status::OK();
        };

        if (in_collection) {
            if (offset_index == nullptr) {
                RETURN_IF_ERROR(
                        install_scalar_reader(ScalarColumnReader<true, false>::create_unique(
                                row_ranges, total_rows, chunk, offset_index, ctz, io_ctx)));
            } else {
                RETURN_IF_ERROR(
                        install_scalar_reader(ScalarColumnReader<true, true>::create_unique(
                                row_ranges, total_rows, chunk, offset_index, ctz, io_ctx)));
            }
        } else {
            if (offset_index == nullptr) {
                RETURN_IF_ERROR(
                        install_scalar_reader(ScalarColumnReader<false, false>::create_unique(
                                row_ranges, total_rows, chunk, offset_index, ctz, io_ctx)));
            } else {
                RETURN_IF_ERROR(
                        install_scalar_reader(ScalarColumnReader<false, true>::create_unique(
                                row_ranges, total_rows, chunk, offset_index, ctz, io_ctx)));
            }
        }
    }
    return Status::OK();
}
240
241
void ParquetColumnReader::_generate_read_ranges(RowRange page_row_range,
242
274
                                                RowRanges* result_ranges) const {
243
274
    result_ranges->add(page_row_range);
244
274
    RowRanges::ranges_intersection(*result_ranges, _row_ranges, result_ranges);
245
274
}
246
247
template <bool IN_COLLECTION, bool OFFSET_INDEX>
248
Status ScalarColumnReader<IN_COLLECTION, OFFSET_INDEX>::init(io::FileReaderSPtr file,
249
                                                             FieldSchema* field,
250
                                                             size_t max_buf_size,
251
119
                                                             RuntimeState* state) {
252
119
    _field_schema = field;
253
119
    auto& chunk_meta = _chunk_meta.meta_data;
254
119
    int64_t chunk_start = has_dict_page(chunk_meta) ? chunk_meta.dictionary_page_offset
255
119
                                                    : chunk_meta.data_page_offset;
256
119
    size_t chunk_len = chunk_meta.total_compressed_size;
257
119
    size_t prefetch_buffer_size = std::min(chunk_len, max_buf_size);
258
119
    if ((typeid_cast<doris::io::TracingFileReader*>(file.get()) &&
259
119
         typeid_cast<io::MergeRangeFileReader*>(
260
53
                 ((doris::io::TracingFileReader*)(file.get()))->inner_reader().get())) ||
261
119
        typeid_cast<io::MergeRangeFileReader*>(file.get())) {
262
        // turn off prefetch data when using MergeRangeFileReader
263
119
        prefetch_buffer_size = 0;
264
119
    }
265
119
    _stream_reader = std::make_unique<io::BufferedFileStreamReader>(file, chunk_start, chunk_len,
266
119
                                                                    prefetch_buffer_size);
267
119
    ParquetPageReadContext ctx(
268
119
            (state == nullptr) ? true : state->query_options().enable_parquet_file_page_cache);
269
270
119
    _chunk_reader = std::make_unique<ColumnChunkReader<IN_COLLECTION, OFFSET_INDEX>>(
271
119
            _stream_reader.get(), &_chunk_meta, field, _offset_index, _total_rows, _io_ctx, ctx);
272
119
    RETURN_IF_ERROR(_chunk_reader->init());
273
119
    return Status::OK();
274
119
}
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb1ELb1EE4initESt10shared_ptrINS_2io10FileReaderEEPNS_11FieldSchemaEmPNS_12RuntimeStateE
_ZN5doris18ScalarColumnReaderILb1ELb0EE4initESt10shared_ptrINS_2io10FileReaderEEPNS_11FieldSchemaEmPNS_12RuntimeStateE
Line
Count
Source
251
3
                                                             RuntimeState* state) {
252
3
    _field_schema = field;
253
3
    auto& chunk_meta = _chunk_meta.meta_data;
254
3
    int64_t chunk_start = has_dict_page(chunk_meta) ? chunk_meta.dictionary_page_offset
255
3
                                                    : chunk_meta.data_page_offset;
256
3
    size_t chunk_len = chunk_meta.total_compressed_size;
257
3
    size_t prefetch_buffer_size = std::min(chunk_len, max_buf_size);
258
3
    if ((typeid_cast<doris::io::TracingFileReader*>(file.get()) &&
259
3
         typeid_cast<io::MergeRangeFileReader*>(
260
0
                 ((doris::io::TracingFileReader*)(file.get()))->inner_reader().get())) ||
261
3
        typeid_cast<io::MergeRangeFileReader*>(file.get())) {
262
        // turn off prefetch data when using MergeRangeFileReader
263
3
        prefetch_buffer_size = 0;
264
3
    }
265
3
    _stream_reader = std::make_unique<io::BufferedFileStreamReader>(file, chunk_start, chunk_len,
266
3
                                                                    prefetch_buffer_size);
267
3
    ParquetPageReadContext ctx(
268
3
            (state == nullptr) ? true : state->query_options().enable_parquet_file_page_cache);
269
270
3
    _chunk_reader = std::make_unique<ColumnChunkReader<IN_COLLECTION, OFFSET_INDEX>>(
271
3
            _stream_reader.get(), &_chunk_meta, field, _offset_index, _total_rows, _io_ctx, ctx);
272
3
    RETURN_IF_ERROR(_chunk_reader->init());
273
3
    return Status::OK();
274
3
}
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb0ELb1EE4initESt10shared_ptrINS_2io10FileReaderEEPNS_11FieldSchemaEmPNS_12RuntimeStateE
_ZN5doris18ScalarColumnReaderILb0ELb0EE4initESt10shared_ptrINS_2io10FileReaderEEPNS_11FieldSchemaEmPNS_12RuntimeStateE
Line
Count
Source
251
116
                                                             RuntimeState* state) {
252
116
    _field_schema = field;
253
116
    auto& chunk_meta = _chunk_meta.meta_data;
254
116
    int64_t chunk_start = has_dict_page(chunk_meta) ? chunk_meta.dictionary_page_offset
255
116
                                                    : chunk_meta.data_page_offset;
256
116
    size_t chunk_len = chunk_meta.total_compressed_size;
257
116
    size_t prefetch_buffer_size = std::min(chunk_len, max_buf_size);
258
116
    if ((typeid_cast<doris::io::TracingFileReader*>(file.get()) &&
259
116
         typeid_cast<io::MergeRangeFileReader*>(
260
53
                 ((doris::io::TracingFileReader*)(file.get()))->inner_reader().get())) ||
261
116
        typeid_cast<io::MergeRangeFileReader*>(file.get())) {
262
        // turn off prefetch data when using MergeRangeFileReader
263
116
        prefetch_buffer_size = 0;
264
116
    }
265
116
    _stream_reader = std::make_unique<io::BufferedFileStreamReader>(file, chunk_start, chunk_len,
266
116
                                                                    prefetch_buffer_size);
267
116
    ParquetPageReadContext ctx(
268
116
            (state == nullptr) ? true : state->query_options().enable_parquet_file_page_cache);
269
270
116
    _chunk_reader = std::make_unique<ColumnChunkReader<IN_COLLECTION, OFFSET_INDEX>>(
271
116
            _stream_reader.get(), &_chunk_meta, field, _offset_index, _total_rows, _io_ctx, ctx);
272
116
    RETURN_IF_ERROR(_chunk_reader->init());
273
116
    return Status::OK();
274
116
}
275
276
template <bool IN_COLLECTION, bool OFFSET_INDEX>
277
244
Status ScalarColumnReader<IN_COLLECTION, OFFSET_INDEX>::_skip_values(size_t num_values) {
278
244
    if (num_values == 0) {
279
142
        return Status::OK();
280
142
    }
281
102
    if (_chunk_reader->max_def_level() > 0) {
282
102
        LevelDecoder& def_decoder = _chunk_reader->def_level_decoder();
283
102
        size_t skipped = 0;
284
102
        size_t null_size = 0;
285
102
        size_t nonnull_size = 0;
286
217
        while (skipped < num_values) {
287
115
            level_t def_level = -1;
288
115
            size_t loop_skip = def_decoder.get_next_run(&def_level, num_values - skipped);
289
115
            if (loop_skip == 0) {
290
0
                std::stringstream ss;
291
0
                auto& bit_reader = def_decoder.rle_decoder().bit_reader();
292
0
                ss << "def_decoder buffer (hex): ";
293
0
                for (size_t i = 0; i < bit_reader.max_bytes(); ++i) {
294
0
                    ss << std::hex << std::setw(2) << std::setfill('0')
295
0
                       << static_cast<int>(bit_reader.buffer()[i]) << " ";
296
0
                }
297
0
                LOG(WARNING) << ss.str();
298
0
                return Status::InternalError("Failed to decode definition level.");
299
0
            }
300
115
            if (def_level < _field_schema->definition_level) {
301
8
                null_size += loop_skip;
302
107
            } else {
303
107
                nonnull_size += loop_skip;
304
107
            }
305
115
            skipped += loop_skip;
306
115
        }
307
102
        if (null_size > 0) {
308
5
            RETURN_IF_ERROR(_chunk_reader->skip_values(null_size, false));
309
5
        }
310
102
        if (nonnull_size > 0) {
311
101
            RETURN_IF_ERROR(_chunk_reader->skip_values(nonnull_size, true));
312
101
        }
313
102
    } else {
314
0
        RETURN_IF_ERROR(_chunk_reader->skip_values(num_values));
315
0
    }
316
102
    return Status::OK();
317
102
}
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb1ELb1EE12_skip_valuesEm
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb1ELb0EE12_skip_valuesEm
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb0ELb1EE12_skip_valuesEm
_ZN5doris18ScalarColumnReaderILb0ELb0EE12_skip_valuesEm
Line
Count
Source
277
244
Status ScalarColumnReader<IN_COLLECTION, OFFSET_INDEX>::_skip_values(size_t num_values) {
278
244
    if (num_values == 0) {
279
142
        return Status::OK();
280
142
    }
281
102
    if (_chunk_reader->max_def_level() > 0) {
282
102
        LevelDecoder& def_decoder = _chunk_reader->def_level_decoder();
283
102
        size_t skipped = 0;
284
102
        size_t null_size = 0;
285
102
        size_t nonnull_size = 0;
286
217
        while (skipped < num_values) {
287
115
            level_t def_level = -1;
288
115
            size_t loop_skip = def_decoder.get_next_run(&def_level, num_values - skipped);
289
115
            if (loop_skip == 0) {
290
0
                std::stringstream ss;
291
0
                auto& bit_reader = def_decoder.rle_decoder().bit_reader();
292
0
                ss << "def_decoder buffer (hex): ";
293
0
                for (size_t i = 0; i < bit_reader.max_bytes(); ++i) {
294
0
                    ss << std::hex << std::setw(2) << std::setfill('0')
295
0
                       << static_cast<int>(bit_reader.buffer()[i]) << " ";
296
0
                }
297
0
                LOG(WARNING) << ss.str();
298
0
                return Status::InternalError("Failed to decode definition level.");
299
0
            }
300
115
            if (def_level < _field_schema->definition_level) {
301
8
                null_size += loop_skip;
302
107
            } else {
303
107
                nonnull_size += loop_skip;
304
107
            }
305
115
            skipped += loop_skip;
306
115
        }
307
102
        if (null_size > 0) {
308
5
            RETURN_IF_ERROR(_chunk_reader->skip_values(null_size, false));
309
5
        }
310
102
        if (nonnull_size > 0) {
311
101
            RETURN_IF_ERROR(_chunk_reader->skip_values(nonnull_size, true));
312
101
        }
313
102
    } else {
314
0
        RETURN_IF_ERROR(_chunk_reader->skip_values(num_values));
315
0
    }
316
102
    return Status::OK();
317
102
}
318
319
template <bool IN_COLLECTION, bool OFFSET_INDEX>
320
Status ScalarColumnReader<IN_COLLECTION, OFFSET_INDEX>::_read_values(size_t num_values,
321
                                                                     ColumnPtr& doris_column,
322
                                                                     DataTypePtr& type,
323
                                                                     FilterMap& filter_map,
324
244
                                                                     bool is_dict_filter) {
325
244
    if (num_values == 0) {
326
0
        return Status::OK();
327
0
    }
328
244
    MutableColumnPtr data_column;
329
244
    std::vector<uint16_t> null_map;
330
244
    NullMap* map_data_column = nullptr;
331
244
    doris_column = IColumn::mutate(std::move(doris_column));
332
244
    if (doris_column->is_nullable()) {
333
242
        SCOPED_RAW_TIMER(&_decode_null_map_time);
334
242
        auto mutable_column = doris_column->assert_mutable();
335
242
        auto* nullable_column = assert_cast<ColumnNullable*>(mutable_column.get());
336
337
242
        data_column = nullable_column->get_nested_column_ptr();
338
242
        map_data_column = &(nullable_column->get_null_map_data());
339
242
        if (_chunk_reader->max_def_level() > 0) {
340
174
            LevelDecoder& def_decoder = _chunk_reader->def_level_decoder();
341
174
            size_t has_read = 0;
342
174
            bool prev_is_null = true;
343
348
            while (has_read < num_values) {
344
174
                level_t def_level;
345
174
                size_t loop_read = def_decoder.get_next_run(&def_level, num_values - has_read);
346
174
                if (loop_read == 0) {
347
0
                    std::stringstream ss;
348
0
                    auto& bit_reader = def_decoder.rle_decoder().bit_reader();
349
0
                    ss << "def_decoder buffer (hex): ";
350
0
                    for (size_t i = 0; i < bit_reader.max_bytes(); ++i) {
351
0
                        ss << std::hex << std::setw(2) << std::setfill('0')
352
0
                           << static_cast<int>(bit_reader.buffer()[i]) << " ";
353
0
                    }
354
0
                    LOG(WARNING) << ss.str();
355
0
                    return Status::InternalError("Failed to decode definition level.");
356
0
                }
357
358
174
                bool is_null = def_level < _field_schema->definition_level;
359
174
                if (!(prev_is_null ^ is_null)) {
360
57
                    null_map.emplace_back(0);
361
57
                }
362
174
                size_t remaining = loop_read;
363
174
                while (remaining > USHRT_MAX) {
364
0
                    null_map.emplace_back(USHRT_MAX);
365
0
                    null_map.emplace_back(0);
366
0
                    remaining -= USHRT_MAX;
367
0
                }
368
174
                null_map.emplace_back((u_short)remaining);
369
174
                prev_is_null = is_null;
370
174
                has_read += loop_read;
371
174
            }
372
174
        }
373
242
    } else {
374
2
        if (_chunk_reader->max_def_level() > 0) {
375
0
            return Status::Corruption("Not nullable column has null values in parquet file");
376
0
        }
377
2
        data_column = doris_column->assert_mutable();
378
2
    }
379
244
    if (null_map.size() == 0) {
380
70
        size_t remaining = num_values;
381
70
        while (remaining > USHRT_MAX) {
382
0
            null_map.emplace_back(USHRT_MAX);
383
0
            null_map.emplace_back(0);
384
0
            remaining -= USHRT_MAX;
385
0
        }
386
70
        null_map.emplace_back((u_short)remaining);
387
70
    }
388
244
    ColumnSelectVector select_vector;
389
244
    {
390
244
        SCOPED_RAW_TIMER(&_decode_null_map_time);
391
244
        RETURN_IF_ERROR(select_vector.init(null_map, num_values, map_data_column, &filter_map,
392
244
                                           _filter_map_index));
393
244
        _filter_map_index += num_values;
394
244
    }
395
0
    return _chunk_reader->decode_values(data_column, type, select_vector, is_dict_filter);
396
244
}
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb1ELb1EE12_read_valuesEmRNS_3COWINS_7IColumnEE13immutable_ptrIS3_EERSt10shared_ptrIKNS_9IDataTypeEERNS_9FilterMapEb
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb1ELb0EE12_read_valuesEmRNS_3COWINS_7IColumnEE13immutable_ptrIS3_EERSt10shared_ptrIKNS_9IDataTypeEERNS_9FilterMapEb
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb0ELb1EE12_read_valuesEmRNS_3COWINS_7IColumnEE13immutable_ptrIS3_EERSt10shared_ptrIKNS_9IDataTypeEERNS_9FilterMapEb
_ZN5doris18ScalarColumnReaderILb0ELb0EE12_read_valuesEmRNS_3COWINS_7IColumnEE13immutable_ptrIS3_EERSt10shared_ptrIKNS_9IDataTypeEERNS_9FilterMapEb
Line
Count
Source
324
244
                                                                     bool is_dict_filter) {
325
244
    if (num_values == 0) {
326
0
        return Status::OK();
327
0
    }
328
244
    MutableColumnPtr data_column;
329
244
    std::vector<uint16_t> null_map;
330
244
    NullMap* map_data_column = nullptr;
331
244
    doris_column = IColumn::mutate(std::move(doris_column));
332
244
    if (doris_column->is_nullable()) {
333
242
        SCOPED_RAW_TIMER(&_decode_null_map_time);
334
242
        auto mutable_column = doris_column->assert_mutable();
335
242
        auto* nullable_column = assert_cast<ColumnNullable*>(mutable_column.get());
336
337
242
        data_column = nullable_column->get_nested_column_ptr();
338
242
        map_data_column = &(nullable_column->get_null_map_data());
339
242
        if (_chunk_reader->max_def_level() > 0) {
340
174
            LevelDecoder& def_decoder = _chunk_reader->def_level_decoder();
341
174
            size_t has_read = 0;
342
174
            bool prev_is_null = true;
343
348
            while (has_read < num_values) {
344
174
                level_t def_level;
345
174
                size_t loop_read = def_decoder.get_next_run(&def_level, num_values - has_read);
346
174
                if (loop_read == 0) {
347
0
                    std::stringstream ss;
348
0
                    auto& bit_reader = def_decoder.rle_decoder().bit_reader();
349
0
                    ss << "def_decoder buffer (hex): ";
350
0
                    for (size_t i = 0; i < bit_reader.max_bytes(); ++i) {
351
0
                        ss << std::hex << std::setw(2) << std::setfill('0')
352
0
                           << static_cast<int>(bit_reader.buffer()[i]) << " ";
353
0
                    }
354
0
                    LOG(WARNING) << ss.str();
355
0
                    return Status::InternalError("Failed to decode definition level.");
356
0
                }
357
358
174
                bool is_null = def_level < _field_schema->definition_level;
359
174
                if (!(prev_is_null ^ is_null)) {
360
57
                    null_map.emplace_back(0);
361
57
                }
362
174
                size_t remaining = loop_read;
363
174
                while (remaining > USHRT_MAX) {
364
0
                    null_map.emplace_back(USHRT_MAX);
365
0
                    null_map.emplace_back(0);
366
0
                    remaining -= USHRT_MAX;
367
0
                }
368
174
                null_map.emplace_back((u_short)remaining);
369
174
                prev_is_null = is_null;
370
174
                has_read += loop_read;
371
174
            }
372
174
        }
373
242
    } else {
374
2
        if (_chunk_reader->max_def_level() > 0) {
375
0
            return Status::Corruption("Not nullable column has null values in parquet file");
376
0
        }
377
2
        data_column = doris_column->assert_mutable();
378
2
    }
379
244
    if (null_map.size() == 0) {
380
70
        size_t remaining = num_values;
381
70
        while (remaining > USHRT_MAX) {
382
0
            null_map.emplace_back(USHRT_MAX);
383
0
            null_map.emplace_back(0);
384
0
            remaining -= USHRT_MAX;
385
0
        }
386
70
        null_map.emplace_back((u_short)remaining);
387
70
    }
388
244
    ColumnSelectVector select_vector;
389
244
    {
390
244
        SCOPED_RAW_TIMER(&_decode_null_map_time);
391
244
        RETURN_IF_ERROR(select_vector.init(null_map, num_values, map_data_column, &filter_map,
392
244
                                           _filter_map_index));
393
244
        _filter_map_index += num_values;
394
244
    }
395
0
    return _chunk_reader->decode_values(data_column, type, select_vector, is_dict_filter);
396
244
}
397
398
/**
399
 * Load the nested column data of complex type.
400
 * A row of complex type may be stored across two(or more) pages, and the parameter `align_rows` indicates that
401
 * whether the reader should read the remaining value of the last row in previous page.
402
 */
403
template <bool IN_COLLECTION, bool OFFSET_INDEX>
404
Status ScalarColumnReader<IN_COLLECTION, OFFSET_INDEX>::_read_nested_column(
405
        ColumnPtr& doris_column, DataTypePtr& type, FilterMap& filter_map, size_t batch_size,
406
13
        size_t* read_rows, bool* eof, bool is_dict_filter) {
407
13
    _rep_levels.clear();
408
13
    _def_levels.clear();
409
410
    // Handle nullable columns
411
13
    MutableColumnPtr data_column;
412
13
    NullMap* map_data_column = nullptr;
413
13
    doris_column = IColumn::mutate(std::move(doris_column));
414
13
    if (doris_column->is_nullable()) {
415
13
        SCOPED_RAW_TIMER(&_decode_null_map_time);
416
13
        auto mutable_column = doris_column->assert_mutable();
417
13
        auto* nullable_column = assert_cast<ColumnNullable*>(mutable_column.get());
418
13
        data_column = nullable_column->get_nested_column_ptr();
419
13
        map_data_column = &(nullable_column->get_null_map_data());
420
13
    } else {
421
0
        if (_field_schema->data_type->is_nullable()) {
422
0
            return Status::Corruption("Not nullable column has null values in parquet file");
423
0
        }
424
0
        data_column = doris_column->assert_mutable();
425
0
    }
426
427
13
    std::vector<uint16_t> null_map;
428
13
    std::unordered_set<size_t> ancestor_null_indices;
429
13
    std::vector<uint8_t> nested_filter_map_data;
430
431
13
    auto read_and_fill_data = [&](size_t before_rep_level_sz, size_t filter_map_index) {
432
13
        RETURN_IF_ERROR(_chunk_reader->fill_def(_def_levels));
433
13
        std::unique_ptr<FilterMap> nested_filter_map = std::make_unique<FilterMap>();
434
13
        if (filter_map.has_filter()) {
435
0
            RETURN_IF_ERROR(gen_filter_map(filter_map, filter_map_index, before_rep_level_sz,
436
0
                                           _rep_levels.size(), nested_filter_map_data,
437
0
                                           &nested_filter_map));
438
0
        }
439
440
13
        null_map.clear();
441
13
        ancestor_null_indices.clear();
442
13
        RETURN_IF_ERROR(gen_nested_null_map(before_rep_level_sz, _rep_levels.size(), null_map,
443
13
                                            ancestor_null_indices));
444
445
13
        ColumnSelectVector select_vector;
446
13
        {
447
13
            SCOPED_RAW_TIMER(&_decode_null_map_time);
448
13
            RETURN_IF_ERROR(select_vector.init(
449
13
                    null_map,
450
13
                    _rep_levels.size() - before_rep_level_sz - ancestor_null_indices.size(),
451
13
                    map_data_column, nested_filter_map.get(), 0, &ancestor_null_indices));
452
13
        }
453
454
13
        RETURN_IF_ERROR(
455
13
                _chunk_reader->decode_values(data_column, type, select_vector, is_dict_filter));
456
13
        if (ancestor_null_indices.size() != 0) {
457
0
            RETURN_IF_ERROR(_chunk_reader->skip_values(ancestor_null_indices.size(), false));
458
0
        }
459
13
        if (filter_map.has_filter()) {
460
0
            auto new_rep_sz = before_rep_level_sz;
461
0
            for (size_t idx = before_rep_level_sz; idx < _rep_levels.size(); idx++) {
462
0
                if (nested_filter_map_data[idx - before_rep_level_sz]) {
463
0
                    _rep_levels[new_rep_sz] = _rep_levels[idx];
464
0
                    _def_levels[new_rep_sz] = _def_levels[idx];
465
0
                    new_rep_sz++;
466
0
                }
467
0
            }
468
0
            _rep_levels.resize(new_rep_sz);
469
0
            _def_levels.resize(new_rep_sz);
470
0
        }
471
13
        return Status::OK();
472
13
    };
Unexecuted instantiation: _ZZN5doris18ScalarColumnReaderILb1ELb1EE19_read_nested_columnERNS_3COWINS_7IColumnEE13immutable_ptrIS3_EERSt10shared_ptrIKNS_9IDataTypeEERNS_9FilterMapEmPmPbbENKUlmmE_clEmm
_ZZN5doris18ScalarColumnReaderILb1ELb0EE19_read_nested_columnERNS_3COWINS_7IColumnEE13immutable_ptrIS3_EERSt10shared_ptrIKNS_9IDataTypeEERNS_9FilterMapEmPmPbbENKUlmmE_clEmm
Line
Count
Source
431
3
    auto read_and_fill_data = [&](size_t before_rep_level_sz, size_t filter_map_index) {
432
3
        RETURN_IF_ERROR(_chunk_reader->fill_def(_def_levels));
433
3
        std::unique_ptr<FilterMap> nested_filter_map = std::make_unique<FilterMap>();
434
3
        if (filter_map.has_filter()) {
435
0
            RETURN_IF_ERROR(gen_filter_map(filter_map, filter_map_index, before_rep_level_sz,
436
0
                                           _rep_levels.size(), nested_filter_map_data,
437
0
                                           &nested_filter_map));
438
0
        }
439
440
3
        null_map.clear();
441
3
        ancestor_null_indices.clear();
442
3
        RETURN_IF_ERROR(gen_nested_null_map(before_rep_level_sz, _rep_levels.size(), null_map,
443
3
                                            ancestor_null_indices));
444
445
3
        ColumnSelectVector select_vector;
446
3
        {
447
3
            SCOPED_RAW_TIMER(&_decode_null_map_time);
448
3
            RETURN_IF_ERROR(select_vector.init(
449
3
                    null_map,
450
3
                    _rep_levels.size() - before_rep_level_sz - ancestor_null_indices.size(),
451
3
                    map_data_column, nested_filter_map.get(), 0, &ancestor_null_indices));
452
3
        }
453
454
3
        RETURN_IF_ERROR(
455
3
                _chunk_reader->decode_values(data_column, type, select_vector, is_dict_filter));
456
3
        if (ancestor_null_indices.size() != 0) {
457
0
            RETURN_IF_ERROR(_chunk_reader->skip_values(ancestor_null_indices.size(), false));
458
0
        }
459
3
        if (filter_map.has_filter()) {
460
0
            auto new_rep_sz = before_rep_level_sz;
461
0
            for (size_t idx = before_rep_level_sz; idx < _rep_levels.size(); idx++) {
462
0
                if (nested_filter_map_data[idx - before_rep_level_sz]) {
463
0
                    _rep_levels[new_rep_sz] = _rep_levels[idx];
464
0
                    _def_levels[new_rep_sz] = _def_levels[idx];
465
0
                    new_rep_sz++;
466
0
                }
467
0
            }
468
0
            _rep_levels.resize(new_rep_sz);
469
0
            _def_levels.resize(new_rep_sz);
470
0
        }
471
3
        return Status::OK();
472
3
    };
Unexecuted instantiation: _ZZN5doris18ScalarColumnReaderILb0ELb1EE19_read_nested_columnERNS_3COWINS_7IColumnEE13immutable_ptrIS3_EERSt10shared_ptrIKNS_9IDataTypeEERNS_9FilterMapEmPmPbbENKUlmmE_clEmm
_ZZN5doris18ScalarColumnReaderILb0ELb0EE19_read_nested_columnERNS_3COWINS_7IColumnEE13immutable_ptrIS3_EERSt10shared_ptrIKNS_9IDataTypeEERNS_9FilterMapEmPmPbbENKUlmmE_clEmm
Line
Count
Source
431
10
    auto read_and_fill_data = [&](size_t before_rep_level_sz, size_t filter_map_index) {
432
10
        RETURN_IF_ERROR(_chunk_reader->fill_def(_def_levels));
433
10
        std::unique_ptr<FilterMap> nested_filter_map = std::make_unique<FilterMap>();
434
10
        if (filter_map.has_filter()) {
435
0
            RETURN_IF_ERROR(gen_filter_map(filter_map, filter_map_index, before_rep_level_sz,
436
0
                                           _rep_levels.size(), nested_filter_map_data,
437
0
                                           &nested_filter_map));
438
0
        }
439
440
10
        null_map.clear();
441
10
        ancestor_null_indices.clear();
442
10
        RETURN_IF_ERROR(gen_nested_null_map(before_rep_level_sz, _rep_levels.size(), null_map,
443
10
                                            ancestor_null_indices));
444
445
10
        ColumnSelectVector select_vector;
446
10
        {
447
10
            SCOPED_RAW_TIMER(&_decode_null_map_time);
448
10
            RETURN_IF_ERROR(select_vector.init(
449
10
                    null_map,
450
10
                    _rep_levels.size() - before_rep_level_sz - ancestor_null_indices.size(),
451
10
                    map_data_column, nested_filter_map.get(), 0, &ancestor_null_indices));
452
10
        }
453
454
10
        RETURN_IF_ERROR(
455
10
                _chunk_reader->decode_values(data_column, type, select_vector, is_dict_filter));
456
10
        if (ancestor_null_indices.size() != 0) {
457
0
            RETURN_IF_ERROR(_chunk_reader->skip_values(ancestor_null_indices.size(), false));
458
0
        }
459
10
        if (filter_map.has_filter()) {
460
0
            auto new_rep_sz = before_rep_level_sz;
461
0
            for (size_t idx = before_rep_level_sz; idx < _rep_levels.size(); idx++) {
462
0
                if (nested_filter_map_data[idx - before_rep_level_sz]) {
463
0
                    _rep_levels[new_rep_sz] = _rep_levels[idx];
464
0
                    _def_levels[new_rep_sz] = _def_levels[idx];
465
0
                    new_rep_sz++;
466
0
                }
467
0
            }
468
0
            _rep_levels.resize(new_rep_sz);
469
0
            _def_levels.resize(new_rep_sz);
470
0
        }
471
10
        return Status::OK();
472
10
    };
473
474
15
    while (_current_range_idx < _row_ranges.range_size()) {
475
13
        size_t left_row =
476
13
                std::max(_current_row_index, _row_ranges.get_range_from(_current_range_idx));
477
13
        size_t right_row = std::min(left_row + batch_size - *read_rows,
478
13
                                    (size_t)_row_ranges.get_range_to(_current_range_idx));
479
13
        _current_row_index = left_row;
480
13
        RETURN_IF_ERROR(_chunk_reader->seek_to_nested_row(left_row));
481
13
        size_t load_rows = 0;
482
13
        bool cross_page = false;
483
13
        size_t before_rep_level_sz = _rep_levels.size();
484
13
        RETURN_IF_ERROR(_chunk_reader->load_page_nested_rows(_rep_levels, right_row - left_row,
485
13
                                                             &load_rows, &cross_page));
486
13
        RETURN_IF_ERROR(read_and_fill_data(before_rep_level_sz, _filter_map_index));
487
13
        _filter_map_index += load_rows;
488
13
        while (cross_page) {
489
0
            before_rep_level_sz = _rep_levels.size();
490
0
            RETURN_IF_ERROR(_chunk_reader->load_cross_page_nested_row(_rep_levels, &cross_page));
491
0
            RETURN_IF_ERROR(read_and_fill_data(before_rep_level_sz, _filter_map_index - 1));
492
0
        }
493
13
        *read_rows += load_rows;
494
13
        _current_row_index += load_rows;
495
13
        _current_range_idx += (_current_row_index == _row_ranges.get_range_to(_current_range_idx));
496
13
        if (*read_rows == batch_size) {
497
11
            break;
498
11
        }
499
13
    }
500
13
    *eof = _current_range_idx == _row_ranges.range_size();
501
13
    return Status::OK();
502
13
}
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb1ELb1EE19_read_nested_columnERNS_3COWINS_7IColumnEE13immutable_ptrIS3_EERSt10shared_ptrIKNS_9IDataTypeEERNS_9FilterMapEmPmPbb
_ZN5doris18ScalarColumnReaderILb1ELb0EE19_read_nested_columnERNS_3COWINS_7IColumnEE13immutable_ptrIS3_EERSt10shared_ptrIKNS_9IDataTypeEERNS_9FilterMapEmPmPbb
Line
Count
Source
406
3
        size_t* read_rows, bool* eof, bool is_dict_filter) {
407
3
    _rep_levels.clear();
408
3
    _def_levels.clear();
409
410
    // Handle nullable columns
411
3
    MutableColumnPtr data_column;
412
3
    NullMap* map_data_column = nullptr;
413
3
    doris_column = IColumn::mutate(std::move(doris_column));
414
3
    if (doris_column->is_nullable()) {
415
3
        SCOPED_RAW_TIMER(&_decode_null_map_time);
416
3
        auto mutable_column = doris_column->assert_mutable();
417
3
        auto* nullable_column = assert_cast<ColumnNullable*>(mutable_column.get());
418
3
        data_column = nullable_column->get_nested_column_ptr();
419
3
        map_data_column = &(nullable_column->get_null_map_data());
420
3
    } else {
421
0
        if (_field_schema->data_type->is_nullable()) {
422
0
            return Status::Corruption("Not nullable column has null values in parquet file");
423
0
        }
424
0
        data_column = doris_column->assert_mutable();
425
0
    }
426
427
3
    std::vector<uint16_t> null_map;
428
3
    std::unordered_set<size_t> ancestor_null_indices;
429
3
    std::vector<uint8_t> nested_filter_map_data;
430
431
3
    auto read_and_fill_data = [&](size_t before_rep_level_sz, size_t filter_map_index) {
432
3
        RETURN_IF_ERROR(_chunk_reader->fill_def(_def_levels));
433
3
        std::unique_ptr<FilterMap> nested_filter_map = std::make_unique<FilterMap>();
434
3
        if (filter_map.has_filter()) {
435
3
            RETURN_IF_ERROR(gen_filter_map(filter_map, filter_map_index, before_rep_level_sz,
436
3
                                           _rep_levels.size(), nested_filter_map_data,
437
3
                                           &nested_filter_map));
438
3
        }
439
440
3
        null_map.clear();
441
3
        ancestor_null_indices.clear();
442
3
        RETURN_IF_ERROR(gen_nested_null_map(before_rep_level_sz, _rep_levels.size(), null_map,
443
3
                                            ancestor_null_indices));
444
445
3
        ColumnSelectVector select_vector;
446
3
        {
447
3
            SCOPED_RAW_TIMER(&_decode_null_map_time);
448
3
            RETURN_IF_ERROR(select_vector.init(
449
3
                    null_map,
450
3
                    _rep_levels.size() - before_rep_level_sz - ancestor_null_indices.size(),
451
3
                    map_data_column, nested_filter_map.get(), 0, &ancestor_null_indices));
452
3
        }
453
454
3
        RETURN_IF_ERROR(
455
3
                _chunk_reader->decode_values(data_column, type, select_vector, is_dict_filter));
456
3
        if (ancestor_null_indices.size() != 0) {
457
3
            RETURN_IF_ERROR(_chunk_reader->skip_values(ancestor_null_indices.size(), false));
458
3
        }
459
3
        if (filter_map.has_filter()) {
460
3
            auto new_rep_sz = before_rep_level_sz;
461
3
            for (size_t idx = before_rep_level_sz; idx < _rep_levels.size(); idx++) {
462
3
                if (nested_filter_map_data[idx - before_rep_level_sz]) {
463
3
                    _rep_levels[new_rep_sz] = _rep_levels[idx];
464
3
                    _def_levels[new_rep_sz] = _def_levels[idx];
465
3
                    new_rep_sz++;
466
3
                }
467
3
            }
468
3
            _rep_levels.resize(new_rep_sz);
469
3
            _def_levels.resize(new_rep_sz);
470
3
        }
471
3
        return Status::OK();
472
3
    };
473
474
3
    while (_current_range_idx < _row_ranges.range_size()) {
475
3
        size_t left_row =
476
3
                std::max(_current_row_index, _row_ranges.get_range_from(_current_range_idx));
477
3
        size_t right_row = std::min(left_row + batch_size - *read_rows,
478
3
                                    (size_t)_row_ranges.get_range_to(_current_range_idx));
479
3
        _current_row_index = left_row;
480
3
        RETURN_IF_ERROR(_chunk_reader->seek_to_nested_row(left_row));
481
3
        size_t load_rows = 0;
482
3
        bool cross_page = false;
483
3
        size_t before_rep_level_sz = _rep_levels.size();
484
3
        RETURN_IF_ERROR(_chunk_reader->load_page_nested_rows(_rep_levels, right_row - left_row,
485
3
                                                             &load_rows, &cross_page));
486
3
        RETURN_IF_ERROR(read_and_fill_data(before_rep_level_sz, _filter_map_index));
487
3
        _filter_map_index += load_rows;
488
3
        while (cross_page) {
489
0
            before_rep_level_sz = _rep_levels.size();
490
0
            RETURN_IF_ERROR(_chunk_reader->load_cross_page_nested_row(_rep_levels, &cross_page));
491
0
            RETURN_IF_ERROR(read_and_fill_data(before_rep_level_sz, _filter_map_index - 1));
492
0
        }
493
3
        *read_rows += load_rows;
494
3
        _current_row_index += load_rows;
495
3
        _current_range_idx += (_current_row_index == _row_ranges.get_range_to(_current_range_idx));
496
3
        if (*read_rows == batch_size) {
497
3
            break;
498
3
        }
499
3
    }
500
3
    *eof = _current_range_idx == _row_ranges.range_size();
501
3
    return Status::OK();
502
3
}
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb0ELb1EE19_read_nested_columnERNS_3COWINS_7IColumnEE13immutable_ptrIS3_EERSt10shared_ptrIKNS_9IDataTypeEERNS_9FilterMapEmPmPbb
_ZN5doris18ScalarColumnReaderILb0ELb0EE19_read_nested_columnERNS_3COWINS_7IColumnEE13immutable_ptrIS3_EERSt10shared_ptrIKNS_9IDataTypeEERNS_9FilterMapEmPmPbb
Line
Count
Source
406
10
        size_t* read_rows, bool* eof, bool is_dict_filter) {
407
10
    _rep_levels.clear();
408
10
    _def_levels.clear();
409
410
    // Handle nullable columns
411
10
    MutableColumnPtr data_column;
412
10
    NullMap* map_data_column = nullptr;
413
10
    doris_column = IColumn::mutate(std::move(doris_column));
414
10
    if (doris_column->is_nullable()) {
415
10
        SCOPED_RAW_TIMER(&_decode_null_map_time);
416
10
        auto mutable_column = doris_column->assert_mutable();
417
10
        auto* nullable_column = assert_cast<ColumnNullable*>(mutable_column.get());
418
10
        data_column = nullable_column->get_nested_column_ptr();
419
10
        map_data_column = &(nullable_column->get_null_map_data());
420
10
    } else {
421
0
        if (_field_schema->data_type->is_nullable()) {
422
0
            return Status::Corruption("Not nullable column has null values in parquet file");
423
0
        }
424
0
        data_column = doris_column->assert_mutable();
425
0
    }
426
427
10
    std::vector<uint16_t> null_map;
428
10
    std::unordered_set<size_t> ancestor_null_indices;
429
10
    std::vector<uint8_t> nested_filter_map_data;
430
431
10
    auto read_and_fill_data = [&](size_t before_rep_level_sz, size_t filter_map_index) {
432
10
        RETURN_IF_ERROR(_chunk_reader->fill_def(_def_levels));
433
10
        std::unique_ptr<FilterMap> nested_filter_map = std::make_unique<FilterMap>();
434
10
        if (filter_map.has_filter()) {
435
10
            RETURN_IF_ERROR(gen_filter_map(filter_map, filter_map_index, before_rep_level_sz,
436
10
                                           _rep_levels.size(), nested_filter_map_data,
437
10
                                           &nested_filter_map));
438
10
        }
439
440
10
        null_map.clear();
441
10
        ancestor_null_indices.clear();
442
10
        RETURN_IF_ERROR(gen_nested_null_map(before_rep_level_sz, _rep_levels.size(), null_map,
443
10
                                            ancestor_null_indices));
444
445
10
        ColumnSelectVector select_vector;
446
10
        {
447
10
            SCOPED_RAW_TIMER(&_decode_null_map_time);
448
10
            RETURN_IF_ERROR(select_vector.init(
449
10
                    null_map,
450
10
                    _rep_levels.size() - before_rep_level_sz - ancestor_null_indices.size(),
451
10
                    map_data_column, nested_filter_map.get(), 0, &ancestor_null_indices));
452
10
        }
453
454
10
        RETURN_IF_ERROR(
455
10
                _chunk_reader->decode_values(data_column, type, select_vector, is_dict_filter));
456
10
        if (ancestor_null_indices.size() != 0) {
457
10
            RETURN_IF_ERROR(_chunk_reader->skip_values(ancestor_null_indices.size(), false));
458
10
        }
459
10
        if (filter_map.has_filter()) {
460
10
            auto new_rep_sz = before_rep_level_sz;
461
10
            for (size_t idx = before_rep_level_sz; idx < _rep_levels.size(); idx++) {
462
10
                if (nested_filter_map_data[idx - before_rep_level_sz]) {
463
10
                    _rep_levels[new_rep_sz] = _rep_levels[idx];
464
10
                    _def_levels[new_rep_sz] = _def_levels[idx];
465
10
                    new_rep_sz++;
466
10
                }
467
10
            }
468
10
            _rep_levels.resize(new_rep_sz);
469
10
            _def_levels.resize(new_rep_sz);
470
10
        }
471
10
        return Status::OK();
472
10
    };
473
474
12
    while (_current_range_idx < _row_ranges.range_size()) {
475
10
        size_t left_row =
476
10
                std::max(_current_row_index, _row_ranges.get_range_from(_current_range_idx));
477
10
        size_t right_row = std::min(left_row + batch_size - *read_rows,
478
10
                                    (size_t)_row_ranges.get_range_to(_current_range_idx));
479
10
        _current_row_index = left_row;
480
10
        RETURN_IF_ERROR(_chunk_reader->seek_to_nested_row(left_row));
481
10
        size_t load_rows = 0;
482
10
        bool cross_page = false;
483
10
        size_t before_rep_level_sz = _rep_levels.size();
484
10
        RETURN_IF_ERROR(_chunk_reader->load_page_nested_rows(_rep_levels, right_row - left_row,
485
10
                                                             &load_rows, &cross_page));
486
10
        RETURN_IF_ERROR(read_and_fill_data(before_rep_level_sz, _filter_map_index));
487
10
        _filter_map_index += load_rows;
488
10
        while (cross_page) {
489
0
            before_rep_level_sz = _rep_levels.size();
490
0
            RETURN_IF_ERROR(_chunk_reader->load_cross_page_nested_row(_rep_levels, &cross_page));
491
0
            RETURN_IF_ERROR(read_and_fill_data(before_rep_level_sz, _filter_map_index - 1));
492
0
        }
493
10
        *read_rows += load_rows;
494
10
        _current_row_index += load_rows;
495
10
        _current_range_idx += (_current_row_index == _row_ranges.get_range_to(_current_range_idx));
496
10
        if (*read_rows == batch_size) {
497
8
            break;
498
8
        }
499
10
    }
500
10
    *eof = _current_range_idx == _row_ranges.range_size();
501
10
    return Status::OK();
502
10
}
503
504
template <bool IN_COLLECTION, bool OFFSET_INDEX>
505
Status ScalarColumnReader<IN_COLLECTION, OFFSET_INDEX>::read_dict_values_to_column(
506
2
        MutableColumnPtr& doris_column, bool* has_dict) {
507
2
    bool loaded;
508
2
    RETURN_IF_ERROR(_try_load_dict_page(&loaded, has_dict));
509
2
    if (loaded && *has_dict) {
510
2
        return _chunk_reader->read_dict_values_to_column(doris_column);
511
2
    }
512
0
    return Status::OK();
513
2
}
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb1ELb1EE26read_dict_values_to_columnERNS_3COWINS_7IColumnEE11mutable_ptrIS3_EEPb
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb1ELb0EE26read_dict_values_to_columnERNS_3COWINS_7IColumnEE11mutable_ptrIS3_EEPb
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb0ELb1EE26read_dict_values_to_columnERNS_3COWINS_7IColumnEE11mutable_ptrIS3_EEPb
_ZN5doris18ScalarColumnReaderILb0ELb0EE26read_dict_values_to_columnERNS_3COWINS_7IColumnEE11mutable_ptrIS3_EEPb
Line
Count
Source
506
2
        MutableColumnPtr& doris_column, bool* has_dict) {
507
2
    bool loaded;
508
2
    RETURN_IF_ERROR(_try_load_dict_page(&loaded, has_dict));
509
2
    if (loaded && *has_dict) {
510
2
        return _chunk_reader->read_dict_values_to_column(doris_column);
511
2
    }
512
0
    return Status::OK();
513
2
}
514
template <bool IN_COLLECTION, bool OFFSET_INDEX>
515
Result<MutableColumnPtr>
516
ScalarColumnReader<IN_COLLECTION, OFFSET_INDEX>::convert_dict_column_to_string_column(
517
0
        const ColumnInt32* dict_column) {
518
0
    return _chunk_reader->convert_dict_column_to_string_column(dict_column);
519
0
}
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb1ELb1EE36convert_dict_column_to_string_columnEPKNS_12ColumnVectorILNS_13PrimitiveTypeE5EEE
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb1ELb0EE36convert_dict_column_to_string_columnEPKNS_12ColumnVectorILNS_13PrimitiveTypeE5EEE
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb0ELb1EE36convert_dict_column_to_string_columnEPKNS_12ColumnVectorILNS_13PrimitiveTypeE5EEE
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb0ELb0EE36convert_dict_column_to_string_columnEPKNS_12ColumnVectorILNS_13PrimitiveTypeE5EEE
520
521
template <bool IN_COLLECTION, bool OFFSET_INDEX>
522
Status ScalarColumnReader<IN_COLLECTION, OFFSET_INDEX>::_try_load_dict_page(bool* loaded,
523
2
                                                                            bool* has_dict) {
524
    // _chunk_reader init will load first page header to check whether has dict page
525
2
    *loaded = true;
526
2
    *has_dict = _chunk_reader->has_dict();
527
2
    return Status::OK();
528
2
}
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb1ELb1EE19_try_load_dict_pageEPbS2_
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb1ELb0EE19_try_load_dict_pageEPbS2_
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb0ELb1EE19_try_load_dict_pageEPbS2_
_ZN5doris18ScalarColumnReaderILb0ELb0EE19_try_load_dict_pageEPbS2_
Line
Count
Source
523
2
                                                                            bool* has_dict) {
524
    // _chunk_reader init will load first page header to check whether has dict page
525
2
    *loaded = true;
526
2
    *has_dict = _chunk_reader->has_dict();
527
2
    return Status::OK();
528
2
}
529
530
template <bool IN_COLLECTION, bool OFFSET_INDEX>
531
Status ScalarColumnReader<IN_COLLECTION, OFFSET_INDEX>::read_column_data(
532
        ColumnPtr& doris_column, const DataTypePtr& type,
533
        const std::shared_ptr<TableSchemaChangeHelper::Node>& root_node, FilterMap& filter_map,
534
        size_t batch_size, size_t* read_rows, bool* eof, bool is_dict_filter,
535
287
        int64_t real_column_size) {
536
287
    if (_converter == nullptr) {
537
114
        _converter = parquet::PhysicalToLogicalConverter::get_converter(
538
114
                _field_schema, _field_schema->data_type, type, _ctz, is_dict_filter);
539
114
        if (!_converter->support()) {
540
0
            return Status::InternalError(
541
0
                    "The column type of '{}' is not supported: {}, is_dict_filter: {}, "
542
0
                    "src_logical_type: {}, dst_logical_type: {}",
543
0
                    _field_schema->name, _converter->get_error_msg(), is_dict_filter,
544
0
                    _field_schema->data_type->get_name(), type->get_name());
545
0
        }
546
114
    }
547
    // !FIXME: We should verify whether the get_physical_column logic is correct, why do we return a doris_column?
548
287
    ColumnPtr resolved_column =
549
287
            _converter->get_physical_column(_field_schema->physical_type, _field_schema->data_type,
550
287
                                            doris_column, type, is_dict_filter);
551
287
    if (_converter->read_directly_into_dst_logical_column()) {
552
258
        DCHECK_EQ(resolved_column.get(), doris_column.get());
553
258
        resolved_column = std::move(doris_column);
554
258
    }
555
287
    DataTypePtr& resolved_type = _converter->get_physical_type();
556
557
287
    _def_levels.clear();
558
287
    _rep_levels.clear();
559
287
    *read_rows = 0;
560
561
287
    if (_in_nested) {
562
13
        RETURN_IF_ERROR(_read_nested_column(resolved_column, resolved_type, filter_map, batch_size,
563
13
                                            read_rows, eof, is_dict_filter));
564
13
        return _converter->convert(resolved_column, _field_schema->data_type, type, doris_column,
565
13
                                   is_dict_filter);
566
13
    }
567
568
274
    int64_t right_row = 0;
569
274
    if constexpr (OFFSET_INDEX == false) {
570
274
        RETURN_IF_ERROR(_chunk_reader->parse_page_header());
571
274
        right_row = _chunk_reader->page_end_row();
572
274
    } else {
573
0
        right_row = _chunk_reader->page_end_row();
574
0
    }
575
576
274
    do {
577
        // generate the row ranges that should be read
578
274
        RowRanges read_ranges;
579
274
        _generate_read_ranges(RowRange {_current_row_index, right_row}, &read_ranges);
580
274
        if (read_ranges.count() == 0) {
581
            // skip the whole page
582
63
            _current_row_index = right_row;
583
211
        } else {
584
211
            bool skip_whole_batch = false;
585
            // Determining whether to skip page or batch will increase the calculation time.
586
            // When the filtering effect is greater than 60%, it is possible to skip the page or batch.
587
211
            if (filter_map.has_filter() && filter_map.filter_ratio() > 0.6) {
588
                // lazy read
589
0
                size_t remaining_num_values = read_ranges.count();
590
0
                if (batch_size >= remaining_num_values &&
591
0
                    filter_map.can_filter_all(remaining_num_values, _filter_map_index)) {
592
                    // We can skip the whole page if the remaining values are filtered by predicate columns
593
0
                    _filter_map_index += remaining_num_values;
594
0
                    _current_row_index = right_row;
595
0
                    *read_rows = remaining_num_values;
596
0
                    break;
597
0
                }
598
0
                skip_whole_batch = batch_size <= remaining_num_values &&
599
0
                                   filter_map.can_filter_all(batch_size, _filter_map_index);
600
0
                if (skip_whole_batch) {
601
0
                    _filter_map_index += batch_size;
602
0
                }
603
0
            }
604
            // load page data to decode or skip values
605
211
            RETURN_IF_ERROR(_chunk_reader->parse_page_header());
606
211
            RETURN_IF_ERROR(_chunk_reader->load_page_data_idempotent());
607
211
            size_t has_read = 0;
608
344
            for (size_t idx = 0; idx < read_ranges.range_size(); idx++) {
609
244
                auto range = read_ranges.get_range(idx);
610
                // generate the skipped values
611
244
                size_t skip_values = range.from() - _current_row_index;
612
244
                RETURN_IF_ERROR(_skip_values(skip_values));
613
244
                _current_row_index += skip_values;
614
                // generate the read values
615
244
                size_t read_values =
616
244
                        std::min((size_t)(range.to() - range.from()), batch_size - has_read);
617
244
                if (skip_whole_batch) {
618
0
                    RETURN_IF_ERROR(_skip_values(read_values));
619
244
                } else {
620
244
                    RETURN_IF_ERROR(_read_values(read_values, resolved_column, resolved_type,
621
244
                                                 filter_map, is_dict_filter));
622
244
                }
623
244
                has_read += read_values;
624
244
                *read_rows += read_values;
625
244
                _current_row_index += read_values;
626
244
                if (has_read == batch_size) {
627
111
                    break;
628
111
                }
629
244
            }
630
211
        }
631
274
    } while (false);
632
633
274
    if (right_row == _current_row_index) {
634
101
        if (!_chunk_reader->has_next_page()) {
635
101
            *eof = true;
636
101
        } else {
637
0
            RETURN_IF_ERROR(_chunk_reader->next_page());
638
0
        }
639
101
    }
640
641
274
    {
642
274
        SCOPED_RAW_TIMER(&_convert_time);
643
274
        RETURN_IF_ERROR(_converter->convert(resolved_column, _field_schema->data_type, type,
644
274
                                            doris_column, is_dict_filter));
645
274
    }
646
274
    return Status::OK();
647
274
}
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb1ELb1EE16read_column_dataERNS_3COWINS_7IColumnEE13immutable_ptrIS3_EERKSt10shared_ptrIKNS_9IDataTypeEERKS8_INS_23TableSchemaChangeHelper4NodeEERNS_9FilterMapEmPmPbbl
_ZN5doris18ScalarColumnReaderILb1ELb0EE16read_column_dataERNS_3COWINS_7IColumnEE13immutable_ptrIS3_EERKSt10shared_ptrIKNS_9IDataTypeEERKS8_INS_23TableSchemaChangeHelper4NodeEERNS_9FilterMapEmPmPbbl
Line
Count
Source
535
3
        int64_t real_column_size) {
536
3
    if (_converter == nullptr) {
537
3
        _converter = parquet::PhysicalToLogicalConverter::get_converter(
538
3
                _field_schema, _field_schema->data_type, type, _ctz, is_dict_filter);
539
3
        if (!_converter->support()) {
540
0
            return Status::InternalError(
541
0
                    "The column type of '{}' is not supported: {}, is_dict_filter: {}, "
542
0
                    "src_logical_type: {}, dst_logical_type: {}",
543
0
                    _field_schema->name, _converter->get_error_msg(), is_dict_filter,
544
0
                    _field_schema->data_type->get_name(), type->get_name());
545
0
        }
546
3
    }
547
    // !FIXME: We should verify whether the get_physical_column logic is correct, why do we return a doris_column?
548
3
    ColumnPtr resolved_column =
549
3
            _converter->get_physical_column(_field_schema->physical_type, _field_schema->data_type,
550
3
                                            doris_column, type, is_dict_filter);
551
3
    if (_converter->read_directly_into_dst_logical_column()) {
552
3
        DCHECK_EQ(resolved_column.get(), doris_column.get());
553
3
        resolved_column = std::move(doris_column);
554
3
    }
555
3
    DataTypePtr& resolved_type = _converter->get_physical_type();
556
557
3
    _def_levels.clear();
558
3
    _rep_levels.clear();
559
3
    *read_rows = 0;
560
561
3
    if (_in_nested) {
562
3
        RETURN_IF_ERROR(_read_nested_column(resolved_column, resolved_type, filter_map, batch_size,
563
3
                                            read_rows, eof, is_dict_filter));
564
3
        return _converter->convert(resolved_column, _field_schema->data_type, type, doris_column,
565
3
                                   is_dict_filter);
566
3
    }
567
568
0
    int64_t right_row = 0;
569
0
    if constexpr (OFFSET_INDEX == false) {
570
0
        RETURN_IF_ERROR(_chunk_reader->parse_page_header());
571
0
        right_row = _chunk_reader->page_end_row();
572
    } else {
573
        right_row = _chunk_reader->page_end_row();
574
    }
575
576
0
    do {
577
        // generate the row ranges that should be read
578
0
        RowRanges read_ranges;
579
0
        _generate_read_ranges(RowRange {_current_row_index, right_row}, &read_ranges);
580
0
        if (read_ranges.count() == 0) {
581
            // skip the whole page
582
0
            _current_row_index = right_row;
583
0
        } else {
584
0
            bool skip_whole_batch = false;
585
            // Determining whether to skip page or batch will increase the calculation time.
586
            // When the filtering effect is greater than 60%, it is possible to skip the page or batch.
587
0
            if (filter_map.has_filter() && filter_map.filter_ratio() > 0.6) {
588
                // lazy read
589
0
                size_t remaining_num_values = read_ranges.count();
590
0
                if (batch_size >= remaining_num_values &&
591
0
                    filter_map.can_filter_all(remaining_num_values, _filter_map_index)) {
592
                    // We can skip the whole page if the remaining values are filtered by predicate columns
593
0
                    _filter_map_index += remaining_num_values;
594
0
                    _current_row_index = right_row;
595
0
                    *read_rows = remaining_num_values;
596
0
                    break;
597
0
                }
598
0
                skip_whole_batch = batch_size <= remaining_num_values &&
599
0
                                   filter_map.can_filter_all(batch_size, _filter_map_index);
600
0
                if (skip_whole_batch) {
601
0
                    _filter_map_index += batch_size;
602
0
                }
603
0
            }
604
            // load page data to decode or skip values
605
0
            RETURN_IF_ERROR(_chunk_reader->parse_page_header());
606
0
            RETURN_IF_ERROR(_chunk_reader->load_page_data_idempotent());
607
0
            size_t has_read = 0;
608
0
            for (size_t idx = 0; idx < read_ranges.range_size(); idx++) {
609
0
                auto range = read_ranges.get_range(idx);
610
                // generate the skipped values
611
0
                size_t skip_values = range.from() - _current_row_index;
612
0
                RETURN_IF_ERROR(_skip_values(skip_values));
613
0
                _current_row_index += skip_values;
614
                // generate the read values
615
0
                size_t read_values =
616
0
                        std::min((size_t)(range.to() - range.from()), batch_size - has_read);
617
0
                if (skip_whole_batch) {
618
0
                    RETURN_IF_ERROR(_skip_values(read_values));
619
0
                } else {
620
0
                    RETURN_IF_ERROR(_read_values(read_values, resolved_column, resolved_type,
621
0
                                                 filter_map, is_dict_filter));
622
0
                }
623
0
                has_read += read_values;
624
0
                *read_rows += read_values;
625
0
                _current_row_index += read_values;
626
0
                if (has_read == batch_size) {
627
0
                    break;
628
0
                }
629
0
            }
630
0
        }
631
0
    } while (false);
632
633
0
    if (right_row == _current_row_index) {
634
0
        if (!_chunk_reader->has_next_page()) {
635
0
            *eof = true;
636
0
        } else {
637
0
            RETURN_IF_ERROR(_chunk_reader->next_page());
638
0
        }
639
0
    }
640
641
0
    {
642
0
        SCOPED_RAW_TIMER(&_convert_time);
643
0
        RETURN_IF_ERROR(_converter->convert(resolved_column, _field_schema->data_type, type,
644
0
                                            doris_column, is_dict_filter));
645
0
    }
646
0
    return Status::OK();
647
0
}
Unexecuted instantiation: _ZN5doris18ScalarColumnReaderILb0ELb1EE16read_column_dataERNS_3COWINS_7IColumnEE13immutable_ptrIS3_EERKSt10shared_ptrIKNS_9IDataTypeEERKS8_INS_23TableSchemaChangeHelper4NodeEERNS_9FilterMapEmPmPbbl
_ZN5doris18ScalarColumnReaderILb0ELb0EE16read_column_dataERNS_3COWINS_7IColumnEE13immutable_ptrIS3_EERKSt10shared_ptrIKNS_9IDataTypeEERKS8_INS_23TableSchemaChangeHelper4NodeEERNS_9FilterMapEmPmPbbl
Line
Count
Source
535
284
        int64_t real_column_size) {
536
284
    if (_converter == nullptr) {
537
111
        _converter = parquet::PhysicalToLogicalConverter::get_converter(
538
111
                _field_schema, _field_schema->data_type, type, _ctz, is_dict_filter);
539
111
        if (!_converter->support()) {
540
0
            return Status::InternalError(
541
0
                    "The column type of '{}' is not supported: {}, is_dict_filter: {}, "
542
0
                    "src_logical_type: {}, dst_logical_type: {}",
543
0
                    _field_schema->name, _converter->get_error_msg(), is_dict_filter,
544
0
                    _field_schema->data_type->get_name(), type->get_name());
545
0
        }
546
111
    }
547
    // !FIXME: We should verify whether the get_physical_column logic is correct, why do we return a doris_column?
548
284
    ColumnPtr resolved_column =
549
284
            _converter->get_physical_column(_field_schema->physical_type, _field_schema->data_type,
550
284
                                            doris_column, type, is_dict_filter);
551
284
    if (_converter->read_directly_into_dst_logical_column()) {
552
255
        DCHECK_EQ(resolved_column.get(), doris_column.get());
553
255
        resolved_column = std::move(doris_column);
554
255
    }
555
284
    DataTypePtr& resolved_type = _converter->get_physical_type();
556
557
284
    _def_levels.clear();
558
284
    _rep_levels.clear();
559
284
    *read_rows = 0;
560
561
284
    if (_in_nested) {
562
10
        RETURN_IF_ERROR(_read_nested_column(resolved_column, resolved_type, filter_map, batch_size,
563
10
                                            read_rows, eof, is_dict_filter));
564
10
        return _converter->convert(resolved_column, _field_schema->data_type, type, doris_column,
565
10
                                   is_dict_filter);
566
10
    }
567
568
274
    int64_t right_row = 0;
569
274
    if constexpr (OFFSET_INDEX == false) {
570
274
        RETURN_IF_ERROR(_chunk_reader->parse_page_header());
571
274
        right_row = _chunk_reader->page_end_row();
572
    } else {
573
        right_row = _chunk_reader->page_end_row();
574
    }
575
576
274
    do {
577
        // generate the row ranges that should be read
578
274
        RowRanges read_ranges;
579
274
        _generate_read_ranges(RowRange {_current_row_index, right_row}, &read_ranges);
580
274
        if (read_ranges.count() == 0) {
581
            // skip the whole page
582
63
            _current_row_index = right_row;
583
211
        } else {
584
211
            bool skip_whole_batch = false;
585
            // Determining whether to skip page or batch will increase the calculation time.
586
            // When the filtering effect is greater than 60%, it is possible to skip the page or batch.
587
211
            if (filter_map.has_filter() && filter_map.filter_ratio() > 0.6) {
588
                // lazy read
589
0
                size_t remaining_num_values = read_ranges.count();
590
0
                if (batch_size >= remaining_num_values &&
591
0
                    filter_map.can_filter_all(remaining_num_values, _filter_map_index)) {
592
                    // We can skip the whole page if the remaining values are filtered by predicate columns
593
0
                    _filter_map_index += remaining_num_values;
594
0
                    _current_row_index = right_row;
595
0
                    *read_rows = remaining_num_values;
596
0
                    break;
597
0
                }
598
0
                skip_whole_batch = batch_size <= remaining_num_values &&
599
0
                                   filter_map.can_filter_all(batch_size, _filter_map_index);
600
0
                if (skip_whole_batch) {
601
0
                    _filter_map_index += batch_size;
602
0
                }
603
0
            }
604
            // load page data to decode or skip values
605
211
            RETURN_IF_ERROR(_chunk_reader->parse_page_header());
606
211
            RETURN_IF_ERROR(_chunk_reader->load_page_data_idempotent());
607
211
            size_t has_read = 0;
608
344
            for (size_t idx = 0; idx < read_ranges.range_size(); idx++) {
609
244
                auto range = read_ranges.get_range(idx);
610
                // generate the skipped values
611
244
                size_t skip_values = range.from() - _current_row_index;
612
244
                RETURN_IF_ERROR(_skip_values(skip_values));
613
244
                _current_row_index += skip_values;
614
                // generate the read values
615
244
                size_t read_values =
616
244
                        std::min((size_t)(range.to() - range.from()), batch_size - has_read);
617
244
                if (skip_whole_batch) {
618
0
                    RETURN_IF_ERROR(_skip_values(read_values));
619
244
                } else {
620
244
                    RETURN_IF_ERROR(_read_values(read_values, resolved_column, resolved_type,
621
244
                                                 filter_map, is_dict_filter));
622
244
                }
623
244
                has_read += read_values;
624
244
                *read_rows += read_values;
625
244
                _current_row_index += read_values;
626
244
                if (has_read == batch_size) {
627
111
                    break;
628
111
                }
629
244
            }
630
211
        }
631
274
    } while (false);
632
633
274
    if (right_row == _current_row_index) {
634
101
        if (!_chunk_reader->has_next_page()) {
635
101
            *eof = true;
636
101
        } else {
637
0
            RETURN_IF_ERROR(_chunk_reader->next_page());
638
0
        }
639
101
    }
640
641
274
    {
642
274
        SCOPED_RAW_TIMER(&_convert_time);
643
274
        RETURN_IF_ERROR(_converter->convert(resolved_column, _field_schema->data_type, type,
644
274
                                            doris_column, is_dict_filter));
645
274
    }
646
274
    return Status::OK();
647
274
}
648
649
// Binds this reader to the parquet field `field` and takes ownership of the
// reader used for the array's element column. Always returns Status::OK().
Status ArrayColumnReader::init(std::unique_ptr<ParquetColumnReader> element_reader,
650
2
                               FieldSchema* field) {
651
2
    _field_schema = field;
652
2
    _element_reader = std::move(element_reader);
653
2
    return Status::OK();
654
2
}
655
656
// Reads one batch of an array column.
// The element values are read by `_element_reader` into the array's data column;
// afterwards the array offsets (and the null map, when the destination column is
// nullable) are filled by fill_array_offset() from the element reader's repetition
// and definition levels.
//   doris_column : destination column; re-assigned to the result of IColumn::mutate.
//   type         : requested Doris type, must report TYPE_ARRAY.
//   read_rows/eof: outputs, written by the element reader's read_column_data call.
// `real_column_size` is not referenced in this body.
// Returns Status::Corruption on a nullability or type mismatch, otherwise forwards
// the element reader's status.
Status ArrayColumnReader::read_column_data(
657
        ColumnPtr& doris_column, const DataTypePtr& type,
658
        const std::shared_ptr<TableSchemaChangeHelper::Node>& root_node, FilterMap& filter_map,
659
        size_t batch_size, size_t* read_rows, bool* eof, bool is_dict_filter,
660
2
        int64_t real_column_size) {
661
2
    MutableColumnPtr data_column;
662
2
    NullMap* null_map_ptr = nullptr;
663
2
    // Replace the destination with the result of IColumn::mutate so it can be modified below
    // (presumably detaches any shared copy - confirm against the COW implementation).
    doris_column = IColumn::mutate(std::move(doris_column));
664
2
    if (doris_column->is_nullable()) {
665
2
        // Nullable destination: remember its null map and operate on the nested column.
        auto mutable_column = doris_column->assert_mutable();
666
2
        auto* nullable_column = assert_cast<ColumnNullable*>(mutable_column.get());
667
2
        null_map_ptr = &nullable_column->get_null_map_data();
668
2
        data_column = nullable_column->get_nested_column_ptr();
669
2
    } else {
670
0
        // Non-nullable destination cannot receive a field whose file type is nullable.
        if (_field_schema->data_type->is_nullable()) {
671
0
            return Status::Corruption("Not nullable column has null values in parquet file");
672
0
        }
673
0
        data_column = doris_column->assert_mutable();
674
0
    }
675
2
    // NOTE(review): MapColumnReader checks remove_nullable(type)->get_primitive_type();
    // here get_primitive_type() is called on `type` directly. Confirm it looks through
    // a Nullable wrapper, otherwise nullable array types would be rejected.
    if (type->get_primitive_type() != PrimitiveType::TYPE_ARRAY) {
676
0
        return Status::Corruption(
677
0
                "Wrong data type for column '{}', expected Array type, actual type: {}.",
678
0
                _field_schema->name, type->get_name());
679
0
    }
680
681
2
    // Reference to the array's element data column; the element reader appends into it.
    ColumnPtr& element_column = assert_cast<ColumnArray&>(*data_column).get_data_ptr();
682
2
    const DataTypePtr& element_type =
683
2
            (assert_cast<const DataTypeArray*>(remove_nullable(type).get()))->get_nested_type();
684
    // read nested column
685
2
    RETURN_IF_ERROR(_element_reader->read_column_data(element_column, element_type,
686
2
                                                      root_node->get_element_node(), filter_map,
687
2
                                                      batch_size, read_rows, eof, is_dict_filter));
688
2
    // Nothing was read: leave offsets and null map untouched.
    if (*read_rows == 0) {
689
0
        return Status::OK();
690
0
    }
691
692
2
    ColumnArray::Offsets64& offsets_data = assert_cast<ColumnArray&>(*data_column).get_offsets();
693
    // fill offset and null map
694
2
    fill_array_offset(_field_schema, offsets_data, null_map_ptr, _element_reader->get_rep_level(),
695
2
                      _element_reader->get_def_level());
696
2
    // Debug-only consistency check: the last offset must equal the number of elements.
    DCHECK_EQ(element_column->size(), offsets_data.back());
697
2
#ifndef NDEBUG
698
2
    doris_column->sanity_check();
699
2
#endif
700
2
    return Status::OK();
701
2
}
702
703
// Binds this reader to the parquet field `field` and takes ownership of the
// readers used for the map's key and value columns. Always returns Status::OK().
Status MapColumnReader::init(std::unique_ptr<ParquetColumnReader> key_reader,
704
                             std::unique_ptr<ParquetColumnReader> value_reader,
705
0
                             FieldSchema* field) {
706
0
    _field_schema = field;
707
0
    _key_reader = std::move(key_reader);
708
0
    _value_reader = std::move(value_reader);
709
0
    return Status::OK();
710
0
}
711
712
// Reads one batch of a map column.
// Keys are read first with `batch_size`; values are then read in a loop until the
// value reader has produced as many rows as the key reader or reports eof.
// `*read_rows` and `*eof` are taken from the key reader. The map offsets (and the
// null map, when the destination column is nullable) are filled by
// fill_array_offset() from the key reader's repetition and definition levels.
// The incoming `real_column_size` argument is not referenced in this body; the value
// reader instead receives the number of key entries appended by this call.
// Returns Status::Corruption on a nullability or type mismatch, otherwise forwards
// the child readers' status.
Status MapColumnReader::read_column_data(
713
        ColumnPtr& doris_column, const DataTypePtr& type,
714
        const std::shared_ptr<TableSchemaChangeHelper::Node>& root_node, FilterMap& filter_map,
715
        size_t batch_size, size_t* read_rows, bool* eof, bool is_dict_filter,
716
0
        int64_t real_column_size) {
717
0
    MutableColumnPtr data_column;
718
0
    NullMap* null_map_ptr = nullptr;
719
0
    // Replace the destination with the result of IColumn::mutate so it can be modified below
    // (presumably detaches any shared copy - confirm against the COW implementation).
    doris_column = IColumn::mutate(std::move(doris_column));
720
0
    if (doris_column->is_nullable()) {
721
0
        // Nullable destination: remember its null map and operate on the nested column.
        auto mutable_column = doris_column->assert_mutable();
722
0
        auto* nullable_column = assert_cast<ColumnNullable*>(mutable_column.get());
723
0
        null_map_ptr = &nullable_column->get_null_map_data();
724
0
        data_column = nullable_column->get_nested_column_ptr();
725
0
    } else {
726
0
        // Non-nullable destination cannot receive a field whose file type is nullable.
        if (_field_schema->data_type->is_nullable()) {
727
0
            return Status::Corruption("Not nullable column has null values in parquet file");
728
0
        }
729
0
        data_column = doris_column->assert_mutable();
730
0
    }
731
0
    // NOTE(review): the message below says "actual type id" but the value formatted is
    // type->get_name(); the array reader words the same message as "actual type".
    if (remove_nullable(type)->get_primitive_type() != PrimitiveType::TYPE_MAP) {
732
0
        return Status::Corruption(
733
0
                "Wrong data type for column '{}', expected Map type, actual type id {}.",
734
0
                _field_schema->name, type->get_name());
735
0
    }
736
737
0
    auto& map = assert_cast<ColumnMap&>(*data_column);
738
0
    const DataTypePtr& key_type =
739
0
            assert_cast<const DataTypeMap*>(remove_nullable(type).get())->get_key_type();
740
0
    const DataTypePtr& value_type =
741
0
            assert_cast<const DataTypeMap*>(remove_nullable(type).get())->get_value_type();
742
0
    ColumnPtr& key_column = map.get_keys_ptr();
743
0
    ColumnPtr& value_column = map.get_values_ptr();
744
745
0
    size_t key_rows = 0;
746
0
    size_t value_rows = 0;
747
0
    bool key_eof = false;
748
0
    bool value_eof = false;
749
0
    // Size of the key column before this call; used below to compute how many key
    // entries this call appended.
    int64_t orig_col_column_size = key_column->size();
750
751
0
    RETURN_IF_ERROR(_key_reader->read_column_data(key_column, key_type, root_node->get_key_node(),
752
0
                                                  filter_map, batch_size, &key_rows, &key_eof,
753
0
                                                  is_dict_filter));
754
755
0
    // Read values until they cover the same number of rows as the keys, or the value
    // reader reports eof. Each iteration asks only for the rows still outstanding and
    // passes the number of appended key entries as real_column_size.
    while (value_rows < key_rows && !value_eof) {
756
0
        size_t loop_rows = 0;
757
0
        RETURN_IF_ERROR(_value_reader->read_column_data(
758
0
                value_column, value_type, root_node->get_value_node(), filter_map,
759
0
                key_rows - value_rows, &loop_rows, &value_eof, is_dict_filter,
760
0
                key_column->size() - orig_col_column_size));
761
0
        value_rows += loop_rows;
762
0
    }
763
0
    // NOTE(review): the key/value row-count match is only asserted via DCHECK_EQ; if
    // DCHECK is compiled out in release builds, an early value eof is not reported here.
    DCHECK_EQ(key_rows, value_rows);
764
0
    *read_rows = key_rows;
765
0
    *eof = key_eof;
766
767
0
    // Nothing was read: leave offsets and null map untouched.
    if (*read_rows == 0) {
768
0
        return Status::OK();
769
0
    }
770
771
0
    DCHECK_EQ(key_column->size(), value_column->size());
772
    // fill offset and null map
773
0
    fill_array_offset(_field_schema, map.get_offsets(), null_map_ptr, _key_reader->get_rep_level(),
774
0
                      _key_reader->get_def_level());
775
0
    // Debug-only consistency check: the last offset must equal the number of keys.
    DCHECK_EQ(key_column->size(), map.get_offsets().back());
776
0
#ifndef NDEBUG
777
0
    doris_column->sanity_check();
778
0
#endif
779
0
    return Status::OK();
780
0
}
781
782
// Binds this reader to the parquet field `field` and takes ownership of the
// per-child readers, keyed by string (looked up by file column name in
// read_column_data). Always returns Status::OK().
Status StructColumnReader::init(
783
        std::unordered_map<std::string, std::unique_ptr<ParquetColumnReader>>&& child_readers,
784
11
        FieldSchema* field) {
785
11
    _field_schema = field;
786
11
    _child_readers = std::move(child_readers);
787
11
    return Status::OK();
788
11
}
789
// Reads one batch of a struct column, child by child.
//  - Children whose name does not exist in `root_node` are recorded as missing and
//    filled with default values at the end.
//  - Children backed by a SkipReadingReader are deferred and filled once the number
//    of values appended by this call is known.
//  - The first remaining child is read with `batch_size` and determines
//    `*read_rows` / `*eof`; every later child is read in a loop until it has produced
//    the same number of rows or reports eof.
//  - If no child was read that way, a reference child taken from the file schema is
//    read into a temporary column to obtain the row count and appended value count.
// Finally, when the destination is nullable, the struct null map is filled from this
// reader's repetition/definition levels.
// `real_column_size` is not referenced in this body.
// Returns Status::Corruption on nullability/type mismatch or when no reference child
// exists, Status::InternalError when the reference child's schema cannot be found,
// otherwise forwards the child readers' status.
Status StructColumnReader::read_column_data(
790
        ColumnPtr& doris_column, const DataTypePtr& type,
791
        const std::shared_ptr<TableSchemaChangeHelper::Node>& root_node, FilterMap& filter_map,
792
        size_t batch_size, size_t* read_rows, bool* eof, bool is_dict_filter,
793
11
        int64_t real_column_size) {
794
11
    MutableColumnPtr data_column;
795
11
    NullMap* null_map_ptr = nullptr;
796
11
    // Replace the destination with the result of IColumn::mutate so it can be modified below
    // (presumably detaches any shared copy - confirm against the COW implementation).
    doris_column = IColumn::mutate(std::move(doris_column));
797
11
    if (doris_column->is_nullable()) {
798
11
        // Nullable destination: remember its null map and operate on the nested column.
        auto mutable_column = doris_column->assert_mutable();
799
11
        auto* nullable_column = assert_cast<ColumnNullable*>(mutable_column.get());
800
11
        null_map_ptr = &nullable_column->get_null_map_data();
801
11
        data_column = nullable_column->get_nested_column_ptr();
802
11
    } else {
803
0
        // Non-nullable destination cannot receive a field whose file type is nullable.
        if (_field_schema->data_type->is_nullable()) {
804
0
            return Status::Corruption("Not nullable column has null values in parquet file");
805
0
        }
806
0
        data_column = doris_column->assert_mutable();
807
0
    }
808
11
    // NOTE(review): get_primitive_type() is called on `type` directly (the map reader
    // applies remove_nullable first), and the message says "actual type id" while the
    // value formatted is type->get_name().
    if (type->get_primitive_type() != PrimitiveType::TYPE_STRUCT) {
809
0
        return Status::Corruption(
810
0
                "Wrong data type for column '{}', expected Struct type, actual type id {}.",
811
0
                _field_schema->name, type->get_name());
812
0
    }
813
814
11
    auto& doris_struct = assert_cast<ColumnStruct&>(*data_column);
815
11
    const auto* doris_struct_type = assert_cast<const DataTypeStruct*>(remove_nullable(type).get());
816
817
11
    // Index of the first child actually read (-1 while none has been read), and that
    // child's size before reading, used to derive how many values this call appended.
    int64_t not_missing_column_id = -1;
818
11
    size_t not_missing_orig_column_size = 0;
819
11
    // Children to be filled after the main loop: absent from root_node / skip readers.
    std::vector<size_t> missing_column_idxs {};
820
11
    std::vector<size_t> skip_reading_column_idxs {};
821
822
11
    _read_column_names.clear();
823
824
37
    for (size_t i = 0; i < doris_struct.tuple_size(); ++i) {
825
26
        ColumnPtr& doris_field = doris_struct.get_column_ptr(i);
826
26
        auto& doris_type = doris_struct_type->get_element(i);
827
26
        auto& doris_name = doris_struct_type->get_element_name(i);
828
26
        if (!root_node->children_column_exists(doris_name)) {
829
0
            missing_column_idxs.push_back(i);
830
0
            VLOG_DEBUG << "[ParquetReader] Missing column in schema: column_idx[" << i
831
0
                       << "], doris_name: " << doris_name << " (column not exists in root node)";
832
0
            continue;
833
0
        }
834
26
        auto file_name = root_node->children_file_column_name(doris_name);
835
836
        // Check if this is a SkipReadingReader - we should skip it when choosing reference column
837
        // because SkipReadingReader doesn't know the actual data size in nested context
838
26
        // NOTE(review): if _child_readers is the std::unordered_map handed to init(),
        // operator[] default-inserts a null reader for an unknown file_name; the
        // dynamic_cast would then yield nullptr and the read below would dereference
        // null. Confirm every file_name is guaranteed to be present.
        bool is_skip_reader =
839
26
                dynamic_cast<SkipReadingReader*>(_child_readers[file_name].get()) != nullptr;
840
841
26
        if (is_skip_reader) {
842
            // Store SkipReadingReader columns to fill them later based on reference column size
843
4
            skip_reading_column_idxs.push_back(i);
844
4
            continue;
845
4
        }
846
847
        // Only add non-SkipReadingReader columns to _read_column_names
848
        // This ensures get_rep_level() and get_def_level() return valid levels
849
22
        _read_column_names.emplace_back(file_name);
850
851
22
        size_t field_rows = 0;
852
22
        bool field_eof = false;
853
22
        if (not_missing_column_id == -1) {
854
11
            // First readable child: it is read with the caller's batch_size and its
            // row count / eof become the result reported for the whole struct.
            not_missing_column_id = i;
855
11
            not_missing_orig_column_size = doris_field->size();
856
11
            RETURN_IF_ERROR(_child_readers[file_name]->read_column_data(
857
11
                    doris_field, doris_type, root_node->get_children_node(doris_name), filter_map,
858
11
                    batch_size, &field_rows, &field_eof, is_dict_filter));
859
11
            *read_rows = field_rows;
860
11
            *eof = field_eof;
861
            /*
862
             * Considering the issue in the `_read_nested_column` function where data may span across pages, leading
863
             * to missing definition and repetition levels, when filling the null_map of the struct later, it is
864
             * crucial to use the definition and repetition levels from the first read column
865
             * (since `_read_nested_column` is not called repeatedly).
866
             *
867
             *  It is worth mentioning that, theoretically, any sub-column can be chosen to fill the null_map,
868
             *  and selecting the shortest one will offer better performance
869
             */
870
11
        } else {
871
22
            // Later children: keep reading the outstanding rows until this child has
            // produced *read_rows rows or its reader reports eof.
            while (field_rows < *read_rows && !field_eof) {
872
11
                size_t loop_rows = 0;
873
11
                RETURN_IF_ERROR(_child_readers[file_name]->read_column_data(
874
11
                        doris_field, doris_type, root_node->get_children_node(doris_name),
875
11
                        filter_map, *read_rows - field_rows, &loop_rows, &field_eof,
876
11
                        is_dict_filter));
877
11
                field_rows += loop_rows;
878
11
            }
879
11
            DCHECK_EQ(*read_rows, field_rows);
880
            //            DCHECK_EQ(*eof, field_eof);
881
11
        }
882
22
    }
883
884
11
    // Number of values to append to skipped/missing children; -1 means "not computed yet".
    int64_t missing_column_sz = -1;
885
886
11
    if (not_missing_column_id == -1) {
887
        // All queried columns are missing in the file (e.g., all added after schema change)
888
        // We need to pick a column from _field_schema children that exists in the file for RL/DL reference
889
0
        std::string reference_file_column_name;
890
0
        std::unique_ptr<ParquetColumnReader>* reference_reader = nullptr;
891
892
0
        // Pick the first file-schema child that has a reader which is not a SkipReadingReader.
        for (const auto& child : _field_schema->children) {
893
0
            auto it = _child_readers.find(child.name);
894
0
            if (it != _child_readers.end()) {
895
                // Skip SkipReadingReader as they don't have valid RL/DL
896
0
                bool is_skip_reader = dynamic_cast<SkipReadingReader*>(it->second.get()) != nullptr;
897
0
                if (!is_skip_reader) {
898
0
                    reference_file_column_name = child.name;
899
0
                    reference_reader = &(it->second);
900
0
                    break;
901
0
                }
902
0
            }
903
0
        }
904
905
0
        if (reference_reader != nullptr) {
906
            // Read the reference column to get correct RL/DL information
907
            // TODO: Optimize by only reading RL/DL without actual data decoding
908
909
            // We need to find the FieldSchema for the reference column from _field_schema children
910
0
            FieldSchema* ref_field_schema = nullptr;
911
0
            for (auto& child : _field_schema->children) {
912
0
                if (child.name == reference_file_column_name) {
913
0
                    ref_field_schema = &child;
914
0
                    break;
915
0
                }
916
0
            }
917
918
0
            if (ref_field_schema == nullptr) {
919
0
                return Status::InternalError(
920
0
                        "Cannot find field schema for reference column '{}' in struct '{}'",
921
0
                        reference_file_column_name, _field_schema->name);
922
0
            }
923
924
            // Create a temporary column to hold the data (we'll use its size for missing_column_sz)
925
0
            ColumnPtr temp_column = ref_field_schema->data_type->create_column();
926
0
            auto temp_type = ref_field_schema->data_type;
927
928
0
            size_t field_rows = 0;
929
0
            bool field_eof = false;
930
931
            // Use ConstNode for the reference column instead of looking up from root_node.
932
            // The reference column is only used to get RL/DL information for determining the number
933
            // of elements in the struct. It may be a column that has been dropped from the table
934
            // schema (e.g., 'removed' field), but still exists in older parquet files.
935
            // Since we don't need schema mapping for this column (we just need its RL/DL levels),
936
            // using ConstNode is safe and avoids the issue where the reference column doesn't exist
937
            // in root_node (because it was dropped from table schema).
938
0
            auto ref_child_node = TableSchemaChangeHelper::ConstNode::get_instance();
939
0
            not_missing_orig_column_size = temp_column->size();
940
941
0
            RETURN_IF_ERROR((*reference_reader)
942
0
                                    ->read_column_data(temp_column, temp_type, ref_child_node,
943
0
                                                       filter_map, batch_size, &field_rows,
944
0
                                                       &field_eof, is_dict_filter));
945
946
0
            *read_rows = field_rows;
947
0
            *eof = field_eof;
948
949
            // Store this reference column name for get_rep_level/get_def_level to use
950
0
            _read_column_names.emplace_back(reference_file_column_name);
951
952
0
            // Values appended to the temporary column by the reference read.
            missing_column_sz = temp_column->size() - not_missing_orig_column_size;
953
0
        } else {
954
0
            return Status::Corruption(
955
0
                    "Cannot read struct '{}': all queried columns are missing and no reference "
956
0
                    "column found in file",
957
0
                    _field_schema->name);
958
0
        }
959
0
    }
960
961
    //  This missing_column_sz is not *read_rows. Because read_rows returns the number of rows.
962
    //  For example: suppose we have a column array<struct<a:int,b:string>>,
963
    //  where b is a newly added column, that is, a missing column.
964
    //  There are two rows of data in this column,
965
    //      [{1,null},{2,null},{3,null}]
966
    //      [{4,null},{5,null}]
967
    //  When you first read subcolumn a, you read 5 data items and the value of *read_rows is 2.
968
    //  You should insert 5 records into subcolumn b instead of 2.
969
11
    // Not set by the reference-column path above: derive it from the growth of the
    // first child that was read in the main loop.
    if (missing_column_sz == -1) {
970
11
        missing_column_sz = doris_struct.get_column(not_missing_column_id).size() -
971
11
                            not_missing_orig_column_size;
972
11
    }
973
974
    // Fill SkipReadingReader columns with the correct amount of data based on reference column
975
    // Let SkipReadingReader handle the data filling through its read_column_data method
976
11
    for (auto idx : skip_reading_column_idxs) {
977
4
        auto& doris_field = doris_struct.get_column_ptr(idx);
978
4
        // NOTE(review): the const_casts only bind non-const references; nothing visible
        // in this loop writes through them - presumably plain const references would do.
        auto& doris_type = const_cast<DataTypePtr&>(doris_struct_type->get_element(idx));
979
4
        auto& doris_name = const_cast<String&>(doris_struct_type->get_element_name(idx));
980
4
        auto file_name = root_node->children_file_column_name(doris_name);
981
982
4
        size_t field_rows = 0;
983
4
        bool field_eof = false;
984
4
        // missing_column_sz is passed both as the batch size and as real_column_size;
        // field_rows / field_eof are not read afterwards.
        RETURN_IF_ERROR(_child_readers[file_name]->read_column_data(
985
4
                doris_field, doris_type, root_node->get_children_node(doris_name), filter_map,
986
4
                missing_column_sz, &field_rows, &field_eof, is_dict_filter, missing_column_sz));
987
4
    }
988
989
    // Fill truly missing columns (not in root_node) with null or default value
990
11
    for (auto idx : missing_column_idxs) {
991
0
        auto& doris_field = doris_struct.get_column_ptr(idx);
992
0
        auto& doris_type = doris_struct_type->get_element(idx);
993
0
        // NOTE(review): nullability is only asserted via DCHECK; the static_cast below is
        // unchecked, so a non-nullable missing child would be misinterpreted if DCHECK is
        // compiled out.
        DCHECK(doris_type->is_nullable());
994
0
        doris_field = IColumn::mutate(std::move(doris_field));
995
0
        auto mutable_column = doris_field->assert_mutable();
996
0
        auto* nullable_column = static_cast<ColumnNullable*>(mutable_column.get());
997
0
        nullable_column->insert_many_defaults(missing_column_sz);
998
0
    }
999
1000
11
    // Only a nullable destination has a struct-level null map to fill.
    if (null_map_ptr != nullptr) {
1001
11
        fill_struct_null_map(_field_schema, *null_map_ptr, this->get_rep_level(),
1002
11
                             this->get_def_level());
1003
11
    }
1004
11
#ifndef NDEBUG
1005
11
    doris_column->sanity_check();
1006
11
#endif
1007
11
    return Status::OK();
1008
11
}
1009
1010
// Explicit instantiations of ScalarColumnReader for all four combinations of its two
// boolean template arguments, so the member definitions in this file are emitted here.
template class ScalarColumnReader<true, true>;
1011
template class ScalarColumnReader<true, false>;
1012
template class ScalarColumnReader<false, true>;
1013
template class ScalarColumnReader<false, false>;
1014
1015
}; // namespace doris