Coverage Report

Created: 2026-06-04 13:48

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
be/src/storage/segment/binary_plain_page.h
Line
Count
Source
1
// Licensed to the Apache Software Foundation (ASF) under one
2
// or more contributor license agreements.  See the NOTICE file
3
// distributed with this work for additional information
4
// regarding copyright ownership.  The ASF licenses this file
5
// to you under the Apache License, Version 2.0 (the
6
// "License"); you may not use this file except in compliance
7
// with the License.  You may obtain a copy of the License at
8
//
9
//   http://www.apache.org/licenses/LICENSE-2.0
10
//
11
// Unless required by applicable law or agreed to in writing,
12
// software distributed under the License is distributed on an
13
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
// KIND, either express or implied.  See the License for the
15
// specific language governing permissions and limitations
16
// under the License.
17
18
// Simplistic page encoding for strings.
19
//
20
// The page consists of:
21
// Strings:
22
//   raw strings that were written
23
// Trailer
24
//  Offsets:
25
//    offsets pointing to the beginning of each string
26
//  num_elems (32-bit fixed)
27
//
28
29
#pragma once
30
31
#include "common/logging.h"
32
#include "core/column/column_complex.h"
33
#include "storage/olap_common.h"
34
#include "storage/segment/options.h"
35
#include "storage/segment/page_builder.h"
36
#include "storage/segment/page_decoder.h"
37
#include "storage/types.h"
38
#include "util/coding.h"
39
#include "util/faststring.h"
40
41
namespace doris {
42
namespace segment_v2 {
43
44
template <FieldType Type>
45
class BinaryPlainPageBuilder : public PageBuilderHelper<BinaryPlainPageBuilder<Type>> {
46
public:
47
    using Self = BinaryPlainPageBuilder<Type>;
48
    friend class PageBuilderHelper<Self>;
49
50
15.3k
    Status init() override { return reset(); }
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE13EE4initEv
Line
Count
Source
50
1
    Status init() override { return reset(); }
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE17EE4initEv
Line
Count
Source
50
4.92k
    Status init() override { return reset(); }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE26EE4initEv
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE34EE4initEv
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE35EE4initEv
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE23EE4initEv
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE25EE4initEv
Line
Count
Source
50
10.4k
    Status init() override { return reset(); }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE27EE4initEv
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE36EE4initEv
51
52
1.22M
    bool is_page_full() override {
53
1.22M
        bool ret = false;
54
1.22M
        if (_options.is_dict_page) {
55
            // dict_page_size is 0, do not limit the page size
56
831k
            ret = _options.dict_page_size != 0 && _size_estimate > _options.dict_page_size;
57
831k
        } else {
58
391k
            ret = _options.data_page_size != 0 && _size_estimate > _options.data_page_size;
59
391k
        }
60
1.22M
        return ret;
61
1.22M
    }
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE13EE12is_page_fullEv
Line
Count
Source
52
6
    bool is_page_full() override {
53
6
        bool ret = false;
54
6
        if (_options.is_dict_page) {
55
            // dict_page_size is 0, do not limit the page size
56
0
            ret = _options.dict_page_size != 0 && _size_estimate > _options.dict_page_size;
57
6
        } else {
58
6
            ret = _options.data_page_size != 0 && _size_estimate > _options.data_page_size;
59
6
        }
60
6
        return ret;
61
6
    }
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE17EE12is_page_fullEv
Line
Count
Source
52
1.17M
    bool is_page_full() override {
53
1.17M
        bool ret = false;
54
1.17M
        if (_options.is_dict_page) {
55
            // dict_page_size is 0, do not limit the page size
56
831k
            ret = _options.dict_page_size != 0 && _size_estimate > _options.dict_page_size;
57
831k
        } else {
58
347k
            ret = _options.data_page_size != 0 && _size_estimate > _options.data_page_size;
59
347k
        }
60
1.17M
        return ret;
61
1.17M
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE26EE12is_page_fullEv
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE34EE12is_page_fullEv
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE35EE12is_page_fullEv
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE23EE12is_page_fullEv
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE25EE12is_page_fullEv
Line
Count
Source
52
43.3k
    bool is_page_full() override {
53
43.3k
        bool ret = false;
54
43.3k
        if (_options.is_dict_page) {
55
            // dict_page_size is 0, do not limit the page size
56
0
            ret = _options.dict_page_size != 0 && _size_estimate > _options.dict_page_size;
57
43.3k
        } else {
58
43.3k
            ret = _options.data_page_size != 0 && _size_estimate > _options.data_page_size;
59
43.3k
        }
60
43.3k
        return ret;
61
43.3k
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE27EE12is_page_fullEv
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE36EE12is_page_fullEv
62
63
205k
    Status add(const uint8_t* vals, size_t* count) override {
64
205k
        DCHECK(!_finished);
65
205k
        DCHECK_GT(*count, 0);
66
205k
        size_t i = 0;
67
68
        // If the page is full, should stop adding more items.
69
448k
        while (!is_page_full() && i < *count) {
70
242k
            const auto* src = reinterpret_cast<const Slice*>(vals);
71
242k
            if constexpr (Type == FieldType::OLAP_FIELD_TYPE_BITMAP) {
72
14.4k
                if (_options.need_check_bitmap) {
73
0
                    RETURN_IF_ERROR(BitmapTypeCode::validate(*(src->data)));
74
0
                }
75
14.4k
            }
76
14.4k
            size_t offset = _buffer.size();
77
242k
            _offsets.push_back(cast_set<uint32_t>(offset));
78
            // This may need a large memory, should return error if could not allocated
79
            // successfully, to avoid BE OOM.
80
242k
            RETURN_IF_CATCH_EXCEPTION(_buffer.append(src->data, src->size));
81
82
242k
            _last_value_size = cast_set<uint32_t>(src->size);
83
242k
            _size_estimate += src->size;
84
242k
            _size_estimate += sizeof(uint32_t);
85
242k
            _raw_data_size += src->size;
86
87
242k
            i++;
88
242k
            vals += sizeof(Slice);
89
242k
        }
90
91
205k
        *count = i;
92
205k
        return Status::OK();
93
205k
    }
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE13EE3addEPKhPm
Line
Count
Source
63
1
    Status add(const uint8_t* vals, size_t* count) override {
64
1
        DCHECK(!_finished);
65
1
        DCHECK_GT(*count, 0);
66
1
        size_t i = 0;
67
68
        // If the page is full, should stop adding more items.
69
6
        while (!is_page_full() && i < *count) {
70
5
            const auto* src = reinterpret_cast<const Slice*>(vals);
71
            if constexpr (Type == FieldType::OLAP_FIELD_TYPE_BITMAP) {
72
                if (_options.need_check_bitmap) {
73
                    RETURN_IF_ERROR(BitmapTypeCode::validate(*(src->data)));
74
                }
75
            }
76
5
            size_t offset = _buffer.size();
77
5
            _offsets.push_back(cast_set<uint32_t>(offset));
78
            // This may need a large memory, should return error if could not allocated
79
            // successfully, to avoid BE OOM.
80
5
            RETURN_IF_CATCH_EXCEPTION(_buffer.append(src->data, src->size));
81
82
5
            _last_value_size = cast_set<uint32_t>(src->size);
83
5
            _size_estimate += src->size;
84
5
            _size_estimate += sizeof(uint32_t);
85
5
            _raw_data_size += src->size;
86
87
5
            i++;
88
5
            vals += sizeof(Slice);
89
5
        }
90
91
1
        *count = i;
92
1
        return Status::OK();
93
1
    }
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE17EE3addEPKhPm
Line
Count
Source
63
191k
    Status add(const uint8_t* vals, size_t* count) override {
64
191k
        DCHECK(!_finished);
65
191k
        DCHECK_GT(*count, 0);
66
191k
        size_t i = 0;
67
68
        // If the page is full, should stop adding more items.
69
419k
        while (!is_page_full() && i < *count) {
70
228k
            const auto* src = reinterpret_cast<const Slice*>(vals);
71
            if constexpr (Type == FieldType::OLAP_FIELD_TYPE_BITMAP) {
72
                if (_options.need_check_bitmap) {
73
                    RETURN_IF_ERROR(BitmapTypeCode::validate(*(src->data)));
74
                }
75
            }
76
228k
            size_t offset = _buffer.size();
77
228k
            _offsets.push_back(cast_set<uint32_t>(offset));
78
            // This may need a large memory, should return error if could not allocated
79
            // successfully, to avoid BE OOM.
80
228k
            RETURN_IF_CATCH_EXCEPTION(_buffer.append(src->data, src->size));
81
82
228k
            _last_value_size = cast_set<uint32_t>(src->size);
83
228k
            _size_estimate += src->size;
84
228k
            _size_estimate += sizeof(uint32_t);
85
228k
            _raw_data_size += src->size;
86
87
228k
            i++;
88
228k
            vals += sizeof(Slice);
89
228k
        }
90
91
191k
        *count = i;
92
191k
        return Status::OK();
93
191k
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE26EE3addEPKhPm
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE34EE3addEPKhPm
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE35EE3addEPKhPm
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE23EE3addEPKhPm
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE25EE3addEPKhPm
Line
Count
Source
63
14.4k
    Status add(const uint8_t* vals, size_t* count) override {
64
14.4k
        DCHECK(!_finished);
65
14.4k
        DCHECK_GT(*count, 0);
66
14.4k
        size_t i = 0;
67
68
        // If the page is full, should stop adding more items.
69
28.9k
        while (!is_page_full() && i < *count) {
70
14.4k
            const auto* src = reinterpret_cast<const Slice*>(vals);
71
14.4k
            if constexpr (Type == FieldType::OLAP_FIELD_TYPE_BITMAP) {
72
14.4k
                if (_options.need_check_bitmap) {
73
0
                    RETURN_IF_ERROR(BitmapTypeCode::validate(*(src->data)));
74
0
                }
75
14.4k
            }
76
14.4k
            size_t offset = _buffer.size();
77
14.4k
            _offsets.push_back(cast_set<uint32_t>(offset));
78
            // This may need a large memory, should return error if could not allocated
79
            // successfully, to avoid BE OOM.
80
14.4k
            RETURN_IF_CATCH_EXCEPTION(_buffer.append(src->data, src->size));
81
82
14.4k
            _last_value_size = cast_set<uint32_t>(src->size);
83
14.4k
            _size_estimate += src->size;
84
14.4k
            _size_estimate += sizeof(uint32_t);
85
14.4k
            _raw_data_size += src->size;
86
87
14.4k
            i++;
88
14.4k
            vals += sizeof(Slice);
89
14.4k
        }
90
91
14.4k
        *count = i;
92
14.4k
        return Status::OK();
93
14.4k
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE27EE3addEPKhPm
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE36EE3addEPKhPm
94
95
17.2k
    Status finish(OwnedSlice* slice) override {
96
17.2k
        DCHECK(!_finished);
97
17.2k
        _finished = true;
98
17.2k
        RETURN_IF_CATCH_EXCEPTION({
99
            // Set up trailer
100
17.2k
            for (uint32_t _offset : _offsets) {
101
17.2k
                put_fixed32_le(&_buffer, _offset);
102
17.2k
            }
103
17.2k
            put_fixed32_le(&_buffer, cast_set<uint32_t>(_offsets.size()));
104
17.2k
            *slice = _buffer.build();
105
17.2k
        });
106
17.2k
        return Status::OK();
107
17.2k
    }
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE13EE6finishEPNS_10OwnedSliceE
Line
Count
Source
95
1
    Status finish(OwnedSlice* slice) override {
96
1
        DCHECK(!_finished);
97
1
        _finished = true;
98
1
        RETURN_IF_CATCH_EXCEPTION({
99
            // Set up trailer
100
1
            for (uint32_t _offset : _offsets) {
101
1
                put_fixed32_le(&_buffer, _offset);
102
1
            }
103
1
            put_fixed32_le(&_buffer, cast_set<uint32_t>(_offsets.size()));
104
1
            *slice = _buffer.build();
105
1
        });
106
1
        return Status::OK();
107
1
    }
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE17EE6finishEPNS_10OwnedSliceE
Line
Count
Source
95
6.85k
    Status finish(OwnedSlice* slice) override {
96
6.85k
        DCHECK(!_finished);
97
6.85k
        _finished = true;
98
6.85k
        RETURN_IF_CATCH_EXCEPTION({
99
            // Set up trailer
100
6.85k
            for (uint32_t _offset : _offsets) {
101
6.85k
                put_fixed32_le(&_buffer, _offset);
102
6.85k
            }
103
6.85k
            put_fixed32_le(&_buffer, cast_set<uint32_t>(_offsets.size()));
104
6.85k
            *slice = _buffer.build();
105
6.85k
        });
106
6.85k
        return Status::OK();
107
6.85k
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE26EE6finishEPNS_10OwnedSliceE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE34EE6finishEPNS_10OwnedSliceE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE35EE6finishEPNS_10OwnedSliceE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE23EE6finishEPNS_10OwnedSliceE
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE25EE6finishEPNS_10OwnedSliceE
Line
Count
Source
95
10.4k
    Status finish(OwnedSlice* slice) override {
96
10.4k
        DCHECK(!_finished);
97
10.4k
        _finished = true;
98
10.4k
        RETURN_IF_CATCH_EXCEPTION({
99
            // Set up trailer
100
10.4k
            for (uint32_t _offset : _offsets) {
101
10.4k
                put_fixed32_le(&_buffer, _offset);
102
10.4k
            }
103
10.4k
            put_fixed32_le(&_buffer, cast_set<uint32_t>(_offsets.size()));
104
10.4k
            *slice = _buffer.build();
105
10.4k
        });
106
10.4k
        return Status::OK();
107
10.4k
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE27EE6finishEPNS_10OwnedSliceE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE36EE6finishEPNS_10OwnedSliceE
108
109
29.3k
    Status reset() override {
110
29.3k
        RETURN_IF_CATCH_EXCEPTION({
111
29.3k
            _offsets.clear();
112
29.3k
            _buffer.clear();
113
29.3k
            _buffer.reserve(_options.data_page_size == 0
114
29.3k
                                    ? 1024
115
29.3k
                                    : std::min(_options.data_page_size, _options.dict_page_size));
116
29.3k
            _size_estimate = sizeof(uint32_t);
117
29.3k
            _finished = false;
118
29.3k
            _last_value_size = 0;
119
29.3k
            _raw_data_size = 0;
120
29.3k
        });
121
29.3k
        return Status::OK();
122
29.3k
    }
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE13EE5resetEv
Line
Count
Source
109
1
    Status reset() override {
110
1
        RETURN_IF_CATCH_EXCEPTION({
111
1
            _offsets.clear();
112
1
            _buffer.clear();
113
1
            _buffer.reserve(_options.data_page_size == 0
114
1
                                    ? 1024
115
1
                                    : std::min(_options.data_page_size, _options.dict_page_size));
116
1
            _size_estimate = sizeof(uint32_t);
117
1
            _finished = false;
118
1
            _last_value_size = 0;
119
1
            _raw_data_size = 0;
120
1
        });
121
1
        return Status::OK();
122
1
    }
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE17EE5resetEv
Line
Count
Source
109
8.56k
    Status reset() override {
110
8.56k
        RETURN_IF_CATCH_EXCEPTION({
111
8.56k
            _offsets.clear();
112
8.56k
            _buffer.clear();
113
8.56k
            _buffer.reserve(_options.data_page_size == 0
114
8.56k
                                    ? 1024
115
8.56k
                                    : std::min(_options.data_page_size, _options.dict_page_size));
116
8.56k
            _size_estimate = sizeof(uint32_t);
117
8.56k
            _finished = false;
118
8.56k
            _last_value_size = 0;
119
8.56k
            _raw_data_size = 0;
120
8.56k
        });
121
8.56k
        return Status::OK();
122
8.56k
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE26EE5resetEv
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE34EE5resetEv
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE35EE5resetEv
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE23EE5resetEv
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE25EE5resetEv
Line
Count
Source
109
20.8k
    Status reset() override {
110
20.8k
        RETURN_IF_CATCH_EXCEPTION({
111
20.8k
            _offsets.clear();
112
20.8k
            _buffer.clear();
113
20.8k
            _buffer.reserve(_options.data_page_size == 0
114
20.8k
                                    ? 1024
115
20.8k
                                    : std::min(_options.data_page_size, _options.dict_page_size));
116
20.8k
            _size_estimate = sizeof(uint32_t);
117
20.8k
            _finished = false;
118
20.8k
            _last_value_size = 0;
119
20.8k
            _raw_data_size = 0;
120
20.8k
        });
121
20.8k
        return Status::OK();
122
20.8k
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE27EE5resetEv
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE36EE5resetEv
123
124
10.5k
    size_t count() const override { return _offsets.size(); }
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE13EE5countEv
_ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE17EE5countEv
Line
Count
Source
124
118
    size_t count() const override { return _offsets.size(); }
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE26EE5countEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE34EE5countEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE35EE5countEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE23EE5countEv
_ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE25EE5countEv
Line
Count
Source
124
10.4k
    size_t count() const override { return _offsets.size(); }
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE27EE5countEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE36EE5countEv
125
126
1.02k
    uint64_t size() const override { return _size_estimate; }
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE13EE4sizeEv
_ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE17EE4sizeEv
Line
Count
Source
126
1.02k
    uint64_t size() const override { return _size_estimate; }
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE26EE4sizeEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE34EE4sizeEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE35EE4sizeEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE23EE4sizeEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE25EE4sizeEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE27EE4sizeEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE36EE4sizeEv
127
128
0
    uint64_t get_raw_data_size() const override { return _raw_data_size; }
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE13EE17get_raw_data_sizeEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE17EE17get_raw_data_sizeEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE26EE17get_raw_data_sizeEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE34EE17get_raw_data_sizeEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE35EE17get_raw_data_sizeEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE23EE17get_raw_data_sizeEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE25EE17get_raw_data_sizeEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE27EE17get_raw_data_sizeEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE36EE17get_raw_data_sizeEv
129
130
private:
131
    BinaryPlainPageBuilder(const PageBuilderOptions& options)
132
15.3k
            : _size_estimate(0), _options(options) {}
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE13EEC2ERKNS0_18PageBuilderOptionsE
Line
Count
Source
132
1
            : _size_estimate(0), _options(options) {}
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE17EEC2ERKNS0_18PageBuilderOptionsE
Line
Count
Source
132
4.92k
            : _size_estimate(0), _options(options) {}
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE26EEC2ERKNS0_18PageBuilderOptionsE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE34EEC2ERKNS0_18PageBuilderOptionsE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE35EEC2ERKNS0_18PageBuilderOptionsE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE23EEC2ERKNS0_18PageBuilderOptionsE
_ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE25EEC2ERKNS0_18PageBuilderOptionsE
Line
Count
Source
132
10.4k
            : _size_estimate(0), _options(options) {}
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE27EEC2ERKNS0_18PageBuilderOptionsE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageBuilderILNS_9FieldTypeE36EEC2ERKNS0_18PageBuilderOptionsE
133
134
    faststring _buffer;
135
    size_t _size_estimate;
136
    // Offsets of each entry, relative to the start of the page
137
    std::vector<uint32_t> _offsets;
138
    bool _finished;
139
    PageBuilderOptions _options;
140
    // size of last added value
141
    uint32_t _last_value_size = 0;
142
    uint64_t _raw_data_size = 0;
143
};
144
145
template <FieldType Type>
146
class BinaryPlainPageDecoder : public PageDecoder {
147
public:
148
    BinaryPlainPageDecoder(Slice data) : BinaryPlainPageDecoder(data, PageDecoderOptions()) {}
149
150
    BinaryPlainPageDecoder(Slice data, const PageDecoderOptions& options)
151
4.96k
            : _data(data),
152
4.96k
              _options(options),
153
4.96k
              _parsed(false),
154
4.96k
              _num_elems(0),
155
4.96k
              _offsets_pos(0),
156
4.96k
              _cur_idx(0) {}
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE17EEC2ENS_5SliceERKNS0_18PageDecoderOptionsE
Line
Count
Source
151
2.14k
            : _data(data),
152
2.14k
              _options(options),
153
2.14k
              _parsed(false),
154
2.14k
              _num_elems(0),
155
2.14k
              _offsets_pos(0),
156
2.14k
              _cur_idx(0) {}
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE26EEC2ENS_5SliceERKNS0_18PageDecoderOptionsE
Line
Count
Source
151
2.67k
            : _data(data),
152
2.67k
              _options(options),
153
2.67k
              _parsed(false),
154
2.67k
              _num_elems(0),
155
2.67k
              _offsets_pos(0),
156
2.67k
              _cur_idx(0) {}
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE13EEC2ENS_5SliceERKNS0_18PageDecoderOptionsE
Line
Count
Source
151
9
            : _data(data),
152
9
              _options(options),
153
9
              _parsed(false),
154
9
              _num_elems(0),
155
9
              _offsets_pos(0),
156
9
              _cur_idx(0) {}
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE36EEC2ENS_5SliceERKNS0_18PageDecoderOptionsE
Line
Count
Source
151
1
            : _data(data),
152
1
              _options(options),
153
1
              _parsed(false),
154
1
              _num_elems(0),
155
1
              _offsets_pos(0),
156
1
              _cur_idx(0) {}
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE34EEC2ENS_5SliceERKNS0_18PageDecoderOptionsE
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE35EEC2ENS_5SliceERKNS0_18PageDecoderOptionsE
Line
Count
Source
151
117
            : _data(data),
152
117
              _options(options),
153
117
              _parsed(false),
154
117
              _num_elems(0),
155
117
              _offsets_pos(0),
156
117
              _cur_idx(0) {}
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE23EEC2ENS_5SliceERKNS0_18PageDecoderOptionsE
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE25EEC2ENS_5SliceERKNS0_18PageDecoderOptionsE
Line
Count
Source
151
21
            : _data(data),
152
21
              _options(options),
153
21
              _parsed(false),
154
21
              _num_elems(0),
155
21
              _offsets_pos(0),
156
21
              _cur_idx(0) {}
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE27EEC2ENS_5SliceERKNS0_18PageDecoderOptionsE
157
158
4.96k
    Status init() override {
159
4.96k
        CHECK(!_parsed);
160
161
4.96k
        if (_data.size < sizeof(uint32_t)) {
162
0
            return Status::Corruption(
163
0
                    "file corruption: not enough bytes for trailer in BinaryPlainPageDecoder ."
164
0
                    "invalid data size:{}, trailer size:{}",
165
0
                    _data.size, sizeof(uint32_t));
166
0
        }
167
168
        // Decode trailer
169
4.96k
        _num_elems = decode_fixed32_le((const uint8_t*)&_data[_data.get_size() - sizeof(uint32_t)]);
170
4.96k
        _offsets_pos = cast_set<uint32_t>(_data.get_size() - ((_num_elems + 1) * sizeof(uint32_t)));
171
172
4.96k
        if (_offsets_pos > _data.get_size() - sizeof(uint32_t)) {
173
0
            return Status::Corruption(
174
0
                    "file corruption: offsets pos beyonds data_size: {}, num_element: {}"
175
0
                    ", offset_pos: {}",
176
0
                    _data.size, _num_elems, _offsets_pos);
177
0
        }
178
4.96k
        _parsed = true;
179
180
4.96k
        return Status::OK();
181
4.96k
    }
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE17EE4initEv
Line
Count
Source
158
2.14k
    Status init() override {
159
2.14k
        CHECK(!_parsed);
160
161
2.14k
        if (_data.size < sizeof(uint32_t)) {
162
0
            return Status::Corruption(
163
0
                    "file corruption: not enough bytes for trailer in BinaryPlainPageDecoder ."
164
0
                    "invalid data size:{}, trailer size:{}",
165
0
                    _data.size, sizeof(uint32_t));
166
0
        }
167
168
        // Decode trailer
169
2.14k
        _num_elems = decode_fixed32_le((const uint8_t*)&_data[_data.get_size() - sizeof(uint32_t)]);
170
2.14k
        _offsets_pos = cast_set<uint32_t>(_data.get_size() - ((_num_elems + 1) * sizeof(uint32_t)));
171
172
2.14k
        if (_offsets_pos > _data.get_size() - sizeof(uint32_t)) {
173
0
            return Status::Corruption(
174
0
                    "file corruption: offsets pos beyonds data_size: {}, num_element: {}"
175
0
                    ", offset_pos: {}",
176
0
                    _data.size, _num_elems, _offsets_pos);
177
0
        }
178
2.14k
        _parsed = true;
179
180
2.14k
        return Status::OK();
181
2.14k
    }
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE26EE4initEv
Line
Count
Source
158
2.67k
    Status init() override {
159
2.67k
        CHECK(!_parsed);
160
161
2.67k
        if (_data.size < sizeof(uint32_t)) {
162
0
            return Status::Corruption(
163
0
                    "file corruption: not enough bytes for trailer in BinaryPlainPageDecoder ."
164
0
                    "invalid data size:{}, trailer size:{}",
165
0
                    _data.size, sizeof(uint32_t));
166
0
        }
167
168
        // Decode trailer
169
2.67k
        _num_elems = decode_fixed32_le((const uint8_t*)&_data[_data.get_size() - sizeof(uint32_t)]);
170
2.67k
        _offsets_pos = cast_set<uint32_t>(_data.get_size() - ((_num_elems + 1) * sizeof(uint32_t)));
171
172
2.67k
        if (_offsets_pos > _data.get_size() - sizeof(uint32_t)) {
173
0
            return Status::Corruption(
174
0
                    "file corruption: offsets pos beyonds data_size: {}, num_element: {}"
175
0
                    ", offset_pos: {}",
176
0
                    _data.size, _num_elems, _offsets_pos);
177
0
        }
178
2.67k
        _parsed = true;
179
180
2.67k
        return Status::OK();
181
2.67k
    }
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE13EE4initEv
Line
Count
Source
158
9
    Status init() override {
159
9
        CHECK(!_parsed);
160
161
9
        if (_data.size < sizeof(uint32_t)) {
162
0
            return Status::Corruption(
163
0
                    "file corruption: not enough bytes for trailer in BinaryPlainPageDecoder ."
164
0
                    "invalid data size:{}, trailer size:{}",
165
0
                    _data.size, sizeof(uint32_t));
166
0
        }
167
168
        // Decode trailer
169
9
        _num_elems = decode_fixed32_le((const uint8_t*)&_data[_data.get_size() - sizeof(uint32_t)]);
170
9
        _offsets_pos = cast_set<uint32_t>(_data.get_size() - ((_num_elems + 1) * sizeof(uint32_t)));
171
172
9
        if (_offsets_pos > _data.get_size() - sizeof(uint32_t)) {
173
0
            return Status::Corruption(
174
0
                    "file corruption: offsets pos beyonds data_size: {}, num_element: {}"
175
0
                    ", offset_pos: {}",
176
0
                    _data.size, _num_elems, _offsets_pos);
177
0
        }
178
9
        _parsed = true;
179
180
9
        return Status::OK();
181
9
    }
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE36EE4initEv
Line
Count
Source
158
1
    Status init() override {
159
1
        CHECK(!_parsed);
160
161
1
        if (_data.size < sizeof(uint32_t)) {
162
0
            return Status::Corruption(
163
0
                    "file corruption: not enough bytes for trailer in BinaryPlainPageDecoder ."
164
0
                    "invalid data size:{}, trailer size:{}",
165
0
                    _data.size, sizeof(uint32_t));
166
0
        }
167
168
        // Decode trailer
169
1
        _num_elems = decode_fixed32_le((const uint8_t*)&_data[_data.get_size() - sizeof(uint32_t)]);
170
1
        _offsets_pos = cast_set<uint32_t>(_data.get_size() - ((_num_elems + 1) * sizeof(uint32_t)));
171
172
1
        if (_offsets_pos > _data.get_size() - sizeof(uint32_t)) {
173
0
            return Status::Corruption(
174
0
                    "file corruption: offsets pos beyonds data_size: {}, num_element: {}"
175
0
                    ", offset_pos: {}",
176
0
                    _data.size, _num_elems, _offsets_pos);
177
0
        }
178
1
        _parsed = true;
179
180
1
        return Status::OK();
181
1
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE34EE4initEv
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE35EE4initEv
Line
Count
Source
158
117
    Status init() override {
159
117
        CHECK(!_parsed);
160
161
117
        if (_data.size < sizeof(uint32_t)) {
162
0
            return Status::Corruption(
163
0
                    "file corruption: not enough bytes for trailer in BinaryPlainPageDecoder ."
164
0
                    "invalid data size:{}, trailer size:{}",
165
0
                    _data.size, sizeof(uint32_t));
166
0
        }
167
168
        // Decode trailer
169
117
        _num_elems = decode_fixed32_le((const uint8_t*)&_data[_data.get_size() - sizeof(uint32_t)]);
170
117
        _offsets_pos = cast_set<uint32_t>(_data.get_size() - ((_num_elems + 1) * sizeof(uint32_t)));
171
172
117
        if (_offsets_pos > _data.get_size() - sizeof(uint32_t)) {
173
0
            return Status::Corruption(
174
0
                    "file corruption: offsets pos beyonds data_size: {}, num_element: {}"
175
0
                    ", offset_pos: {}",
176
0
                    _data.size, _num_elems, _offsets_pos);
177
0
        }
178
117
        _parsed = true;
179
180
117
        return Status::OK();
181
117
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE23EE4initEv
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE25EE4initEv
Line
Count
Source
158
21
    Status init() override {
159
21
        CHECK(!_parsed);
160
161
21
        if (_data.size < sizeof(uint32_t)) {
162
0
            return Status::Corruption(
163
0
                    "file corruption: not enough bytes for trailer in BinaryPlainPageDecoder ."
164
0
                    "invalid data size:{}, trailer size:{}",
165
0
                    _data.size, sizeof(uint32_t));
166
0
        }
167
168
        // Decode trailer
169
21
        _num_elems = decode_fixed32_le((const uint8_t*)&_data[_data.get_size() - sizeof(uint32_t)]);
170
21
        _offsets_pos = cast_set<uint32_t>(_data.get_size() - ((_num_elems + 1) * sizeof(uint32_t)));
171
172
21
        if (_offsets_pos > _data.get_size() - sizeof(uint32_t)) {
173
0
            return Status::Corruption(
174
0
                    "file corruption: offsets pos beyonds data_size: {}, num_element: {}"
175
0
                    ", offset_pos: {}",
176
0
                    _data.size, _num_elems, _offsets_pos);
177
0
        }
178
21
        _parsed = true;
179
180
21
        return Status::OK();
181
21
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE27EE4initEv
182
183
293
    Status seek_to_position_in_page(size_t pos) override {
184
293
        if (_num_elems == 0) [[unlikely]] {
185
0
            if (pos != 0) {
186
0
                return Status::Error<ErrorCode::INTERNAL_ERROR, false>(
187
0
                        "seek pos {} is larger than total elements  {}", pos, _num_elems);
188
0
            }
189
0
        }
190
293
        DCHECK_LE(pos, _num_elems);
191
293
        _cur_idx = pos;
192
293
        return Status::OK();
193
293
    }
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE17EE24seek_to_position_in_pageEm
Line
Count
Source
183
242
    Status seek_to_position_in_page(size_t pos) override {
184
242
        if (_num_elems == 0) [[unlikely]] {
185
0
            if (pos != 0) {
186
0
                return Status::Error<ErrorCode::INTERNAL_ERROR, false>(
187
0
                        "seek pos {} is larger than total elements  {}", pos, _num_elems);
188
0
            }
189
0
        }
190
242
        DCHECK_LE(pos, _num_elems);
191
242
        _cur_idx = pos;
192
242
        return Status::OK();
193
242
    }
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE26EE24seek_to_position_in_pageEm
Line
Count
Source
183
4
    Status seek_to_position_in_page(size_t pos) override {
184
4
        if (_num_elems == 0) [[unlikely]] {
185
0
            if (pos != 0) {
186
0
                return Status::Error<ErrorCode::INTERNAL_ERROR, false>(
187
0
                        "seek pos {} is larger than total elements  {}", pos, _num_elems);
188
0
            }
189
0
        }
190
4
        DCHECK_LE(pos, _num_elems);
191
4
        _cur_idx = pos;
192
4
        return Status::OK();
193
4
    }
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE13EE24seek_to_position_in_pageEm
Line
Count
Source
183
4
    Status seek_to_position_in_page(size_t pos) override {
184
4
        if (_num_elems == 0) [[unlikely]] {
185
0
            if (pos != 0) {
186
0
                return Status::Error<ErrorCode::INTERNAL_ERROR, false>(
187
0
                        "seek pos {} is larger than total elements  {}", pos, _num_elems);
188
0
            }
189
0
        }
190
4
        DCHECK_LE(pos, _num_elems);
191
4
        _cur_idx = pos;
192
4
        return Status::OK();
193
4
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE36EE24seek_to_position_in_pageEm
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE34EE24seek_to_position_in_pageEm
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE35EE24seek_to_position_in_pageEm
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE23EE24seek_to_position_in_pageEm
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE25EE24seek_to_position_in_pageEm
Line
Count
Source
183
43
    Status seek_to_position_in_page(size_t pos) override {
184
43
        if (_num_elems == 0) [[unlikely]] {
185
0
            if (pos != 0) {
186
0
                return Status::Error<ErrorCode::INTERNAL_ERROR, false>(
187
0
                        "seek pos {} is larger than total elements  {}", pos, _num_elems);
188
0
            }
189
0
        }
190
43
        DCHECK_LE(pos, _num_elems);
191
43
        _cur_idx = pos;
192
43
        return Status::OK();
193
43
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE27EE24seek_to_position_in_pageEm
194
195
1.68k
    Status next_batch(size_t* n, MutableColumnPtr& dst) override {
196
1.68k
        DCHECK(_parsed);
197
1.68k
        if (*n == 0 || _cur_idx >= _num_elems) [[unlikely]] {
198
3
            *n = 0;
199
3
            return Status::OK();
200
3
        }
201
1.68k
        const size_t max_fetch = std::min(*n, static_cast<size_t>(_num_elems - _cur_idx));
202
203
1.68k
        if (_options.only_read_offsets) {
204
            // OFFSET_ONLY mode: read string lengths from page offset trailer
205
            // without copying actual char data. This allows length() to work.
206
0
            _offsets.resize(max_fetch);
207
0
            for (size_t i = 0; i < max_fetch; ++i) {
208
0
                uint32_t str_start = offset(_cur_idx + i);
209
0
                uint32_t str_end = offset(_cur_idx + i + 1);
210
0
                _offsets[i] = str_end - str_start;
211
0
            }
212
0
            dst->insert_offsets_from_lengths(_offsets.data(), max_fetch);
213
0
            _cur_idx += max_fetch;
214
0
            *n = max_fetch;
215
0
            return Status::OK();
216
0
        }
217
218
1.68k
        uint32_t last_offset = guarded_offset(_cur_idx);
219
1.68k
        _offsets.resize(max_fetch + 1);
220
1.68k
        _offsets[0] = last_offset;
221
456k
        for (int i = 0; i < max_fetch - 1; i++, _cur_idx++) {
222
454k
            const uint32_t start_offset = last_offset;
223
454k
            last_offset = guarded_offset(_cur_idx + 1);
224
454k
            _offsets[i + 1] = last_offset;
225
454k
            if constexpr (Type == FieldType::OLAP_FIELD_TYPE_BITMAP) {
226
0
                if (_options.need_check_bitmap) {
227
0
                    RETURN_IF_ERROR(BitmapTypeCode::validate(*(_data.data + start_offset)));
228
0
                }
229
0
            }
230
454k
        }
231
1.68k
        _cur_idx++;
232
1.68k
        _offsets[max_fetch] = offset(_cur_idx);
233
1.68k
        if constexpr (Type == FieldType::OLAP_FIELD_TYPE_BITMAP) {
234
43
            if (_options.need_check_bitmap) {
235
0
                RETURN_IF_ERROR(BitmapTypeCode::validate(*(_data.data + last_offset)));
236
0
            }
237
43
        }
238
43
        dst->insert_many_continuous_binary_data(_data.data, _offsets.data(), max_fetch);
239
240
1.68k
        *n = max_fetch;
241
1.68k
        return Status::OK();
242
1.68k
    }
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE17EE10next_batchEPmRNS_3COWINS_7IColumnEE11mutable_ptrIS6_EE
Line
Count
Source
195
1.62k
    Status next_batch(size_t* n, MutableColumnPtr& dst) override {
196
1.62k
        DCHECK(_parsed);
197
1.62k
        if (*n == 0 || _cur_idx >= _num_elems) [[unlikely]] {
198
2
            *n = 0;
199
2
            return Status::OK();
200
2
        }
201
1.62k
        const size_t max_fetch = std::min(*n, static_cast<size_t>(_num_elems - _cur_idx));
202
203
1.62k
        if (_options.only_read_offsets) {
204
            // OFFSET_ONLY mode: read string lengths from page offset trailer
205
            // without copying actual char data. This allows length() to work.
206
0
            _offsets.resize(max_fetch);
207
0
            for (size_t i = 0; i < max_fetch; ++i) {
208
0
                uint32_t str_start = offset(_cur_idx + i);
209
0
                uint32_t str_end = offset(_cur_idx + i + 1);
210
0
                _offsets[i] = str_end - str_start;
211
0
            }
212
0
            dst->insert_offsets_from_lengths(_offsets.data(), max_fetch);
213
0
            _cur_idx += max_fetch;
214
0
            *n = max_fetch;
215
0
            return Status::OK();
216
0
        }
217
218
1.62k
        uint32_t last_offset = guarded_offset(_cur_idx);
219
1.62k
        _offsets.resize(max_fetch + 1);
220
1.62k
        _offsets[0] = last_offset;
221
456k
        for (int i = 0; i < max_fetch - 1; i++, _cur_idx++) {
222
454k
            const uint32_t start_offset = last_offset;
223
454k
            last_offset = guarded_offset(_cur_idx + 1);
224
454k
            _offsets[i + 1] = last_offset;
225
            if constexpr (Type == FieldType::OLAP_FIELD_TYPE_BITMAP) {
226
                if (_options.need_check_bitmap) {
227
                    RETURN_IF_ERROR(BitmapTypeCode::validate(*(_data.data + start_offset)));
228
                }
229
            }
230
454k
        }
231
1.62k
        _cur_idx++;
232
1.62k
        _offsets[max_fetch] = offset(_cur_idx);
233
        if constexpr (Type == FieldType::OLAP_FIELD_TYPE_BITMAP) {
234
            if (_options.need_check_bitmap) {
235
                RETURN_IF_ERROR(BitmapTypeCode::validate(*(_data.data + last_offset)));
236
            }
237
        }
238
1.62k
        dst->insert_many_continuous_binary_data(_data.data, _offsets.data(), max_fetch);
239
240
1.62k
        *n = max_fetch;
241
1.62k
        return Status::OK();
242
1.62k
    }
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE26EE10next_batchEPmRNS_3COWINS_7IColumnEE11mutable_ptrIS6_EE
Line
Count
Source
195
8
    Status next_batch(size_t* n, MutableColumnPtr& dst) override {
196
8
        DCHECK(_parsed);
197
8
        if (*n == 0 || _cur_idx >= _num_elems) [[unlikely]] {
198
1
            *n = 0;
199
1
            return Status::OK();
200
1
        }
201
7
        const size_t max_fetch = std::min(*n, static_cast<size_t>(_num_elems - _cur_idx));
202
203
7
        if (_options.only_read_offsets) {
204
            // OFFSET_ONLY mode: read string lengths from page offset trailer
205
            // without copying actual char data. This allows length() to work.
206
0
            _offsets.resize(max_fetch);
207
0
            for (size_t i = 0; i < max_fetch; ++i) {
208
0
                uint32_t str_start = offset(_cur_idx + i);
209
0
                uint32_t str_end = offset(_cur_idx + i + 1);
210
0
                _offsets[i] = str_end - str_start;
211
0
            }
212
0
            dst->insert_offsets_from_lengths(_offsets.data(), max_fetch);
213
0
            _cur_idx += max_fetch;
214
0
            *n = max_fetch;
215
0
            return Status::OK();
216
0
        }
217
218
7
        uint32_t last_offset = guarded_offset(_cur_idx);
219
7
        _offsets.resize(max_fetch + 1);
220
7
        _offsets[0] = last_offset;
221
18
        for (int i = 0; i < max_fetch - 1; i++, _cur_idx++) {
222
11
            const uint32_t start_offset = last_offset;
223
11
            last_offset = guarded_offset(_cur_idx + 1);
224
11
            _offsets[i + 1] = last_offset;
225
            if constexpr (Type == FieldType::OLAP_FIELD_TYPE_BITMAP) {
226
                if (_options.need_check_bitmap) {
227
                    RETURN_IF_ERROR(BitmapTypeCode::validate(*(_data.data + start_offset)));
228
                }
229
            }
230
11
        }
231
7
        _cur_idx++;
232
7
        _offsets[max_fetch] = offset(_cur_idx);
233
        if constexpr (Type == FieldType::OLAP_FIELD_TYPE_BITMAP) {
234
            if (_options.need_check_bitmap) {
235
                RETURN_IF_ERROR(BitmapTypeCode::validate(*(_data.data + last_offset)));
236
            }
237
        }
238
7
        dst->insert_many_continuous_binary_data(_data.data, _offsets.data(), max_fetch);
239
240
7
        *n = max_fetch;
241
7
        return Status::OK();
242
7
    }
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE13EE10next_batchEPmRNS_3COWINS_7IColumnEE11mutable_ptrIS6_EE
Line
Count
Source
195
11
    Status next_batch(size_t* n, MutableColumnPtr& dst) override {
196
11
        DCHECK(_parsed);
197
11
        if (*n == 0 || _cur_idx >= _num_elems) [[unlikely]] {
198
0
            *n = 0;
199
0
            return Status::OK();
200
0
        }
201
11
        const size_t max_fetch = std::min(*n, static_cast<size_t>(_num_elems - _cur_idx));
202
203
11
        if (_options.only_read_offsets) {
204
            // OFFSET_ONLY mode: read string lengths from page offset trailer
205
            // without copying actual char data. This allows length() to work.
206
0
            _offsets.resize(max_fetch);
207
0
            for (size_t i = 0; i < max_fetch; ++i) {
208
0
                uint32_t str_start = offset(_cur_idx + i);
209
0
                uint32_t str_end = offset(_cur_idx + i + 1);
210
0
                _offsets[i] = str_end - str_start;
211
0
            }
212
0
            dst->insert_offsets_from_lengths(_offsets.data(), max_fetch);
213
0
            _cur_idx += max_fetch;
214
0
            *n = max_fetch;
215
0
            return Status::OK();
216
0
        }
217
218
11
        uint32_t last_offset = guarded_offset(_cur_idx);
219
11
        _offsets.resize(max_fetch + 1);
220
11
        _offsets[0] = last_offset;
221
36
        for (int i = 0; i < max_fetch - 1; i++, _cur_idx++) {
222
25
            const uint32_t start_offset = last_offset;
223
25
            last_offset = guarded_offset(_cur_idx + 1);
224
25
            _offsets[i + 1] = last_offset;
225
            if constexpr (Type == FieldType::OLAP_FIELD_TYPE_BITMAP) {
226
                if (_options.need_check_bitmap) {
227
                    RETURN_IF_ERROR(BitmapTypeCode::validate(*(_data.data + start_offset)));
228
                }
229
            }
230
25
        }
231
11
        _cur_idx++;
232
11
        _offsets[max_fetch] = offset(_cur_idx);
233
        if constexpr (Type == FieldType::OLAP_FIELD_TYPE_BITMAP) {
234
            if (_options.need_check_bitmap) {
235
                RETURN_IF_ERROR(BitmapTypeCode::validate(*(_data.data + last_offset)));
236
            }
237
        }
238
11
        dst->insert_many_continuous_binary_data(_data.data, _offsets.data(), max_fetch);
239
240
11
        *n = max_fetch;
241
11
        return Status::OK();
242
11
    }
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE36EE10next_batchEPmRNS_3COWINS_7IColumnEE11mutable_ptrIS6_EE
Line
Count
Source
195
1
    Status next_batch(size_t* n, MutableColumnPtr& dst) override {
196
1
        DCHECK(_parsed);
197
1
        if (*n == 0 || _cur_idx >= _num_elems) [[unlikely]] {
198
0
            *n = 0;
199
0
            return Status::OK();
200
0
        }
201
1
        const size_t max_fetch = std::min(*n, static_cast<size_t>(_num_elems - _cur_idx));
202
203
1
        if (_options.only_read_offsets) {
204
            // OFFSET_ONLY mode: read string lengths from page offset trailer
205
            // without copying actual char data. This allows length() to work.
206
0
            _offsets.resize(max_fetch);
207
0
            for (size_t i = 0; i < max_fetch; ++i) {
208
0
                uint32_t str_start = offset(_cur_idx + i);
209
0
                uint32_t str_end = offset(_cur_idx + i + 1);
210
0
                _offsets[i] = str_end - str_start;
211
0
            }
212
0
            dst->insert_offsets_from_lengths(_offsets.data(), max_fetch);
213
0
            _cur_idx += max_fetch;
214
0
            *n = max_fetch;
215
0
            return Status::OK();
216
0
        }
217
218
1
        uint32_t last_offset = guarded_offset(_cur_idx);
219
1
        _offsets.resize(max_fetch + 1);
220
1
        _offsets[0] = last_offset;
221
4
        for (int i = 0; i < max_fetch - 1; i++, _cur_idx++) {
222
3
            const uint32_t start_offset = last_offset;
223
3
            last_offset = guarded_offset(_cur_idx + 1);
224
3
            _offsets[i + 1] = last_offset;
225
            if constexpr (Type == FieldType::OLAP_FIELD_TYPE_BITMAP) {
226
                if (_options.need_check_bitmap) {
227
                    RETURN_IF_ERROR(BitmapTypeCode::validate(*(_data.data + start_offset)));
228
                }
229
            }
230
3
        }
231
1
        _cur_idx++;
232
1
        _offsets[max_fetch] = offset(_cur_idx);
233
        if constexpr (Type == FieldType::OLAP_FIELD_TYPE_BITMAP) {
234
            if (_options.need_check_bitmap) {
235
                RETURN_IF_ERROR(BitmapTypeCode::validate(*(_data.data + last_offset)));
236
            }
237
        }
238
1
        dst->insert_many_continuous_binary_data(_data.data, _offsets.data(), max_fetch);
239
240
1
        *n = max_fetch;
241
1
        return Status::OK();
242
1
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE34EE10next_batchEPmRNS_3COWINS_7IColumnEE11mutable_ptrIS6_EE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE35EE10next_batchEPmRNS_3COWINS_7IColumnEE11mutable_ptrIS6_EE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE23EE10next_batchEPmRNS_3COWINS_7IColumnEE11mutable_ptrIS6_EE
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE25EE10next_batchEPmRNS_3COWINS_7IColumnEE11mutable_ptrIS6_EE
Line
Count
Source
195
43
    Status next_batch(size_t* n, MutableColumnPtr& dst) override {
196
43
        DCHECK(_parsed);
197
43
        if (*n == 0 || _cur_idx >= _num_elems) [[unlikely]] {
198
0
            *n = 0;
199
0
            return Status::OK();
200
0
        }
201
43
        const size_t max_fetch = std::min(*n, static_cast<size_t>(_num_elems - _cur_idx));
202
203
43
        if (_options.only_read_offsets) {
204
            // OFFSET_ONLY mode: read string lengths from page offset trailer
205
            // without copying actual char data. This allows length() to work.
206
0
            _offsets.resize(max_fetch);
207
0
            for (size_t i = 0; i < max_fetch; ++i) {
208
0
                uint32_t str_start = offset(_cur_idx + i);
209
0
                uint32_t str_end = offset(_cur_idx + i + 1);
210
0
                _offsets[i] = str_end - str_start;
211
0
            }
212
0
            dst->insert_offsets_from_lengths(_offsets.data(), max_fetch);
213
0
            _cur_idx += max_fetch;
214
0
            *n = max_fetch;
215
0
            return Status::OK();
216
0
        }
217
218
43
        uint32_t last_offset = guarded_offset(_cur_idx);
219
43
        _offsets.resize(max_fetch + 1);
220
43
        _offsets[0] = last_offset;
221
43
        for (int i = 0; i < max_fetch - 1; i++, _cur_idx++) {
222
0
            const uint32_t start_offset = last_offset;
223
0
            last_offset = guarded_offset(_cur_idx + 1);
224
0
            _offsets[i + 1] = last_offset;
225
0
            if constexpr (Type == FieldType::OLAP_FIELD_TYPE_BITMAP) {
226
0
                if (_options.need_check_bitmap) {
227
0
                    RETURN_IF_ERROR(BitmapTypeCode::validate(*(_data.data + start_offset)));
228
0
                }
229
0
            }
230
0
        }
231
43
        _cur_idx++;
232
43
        _offsets[max_fetch] = offset(_cur_idx);
233
43
        if constexpr (Type == FieldType::OLAP_FIELD_TYPE_BITMAP) {
234
43
            if (_options.need_check_bitmap) {
235
0
                RETURN_IF_ERROR(BitmapTypeCode::validate(*(_data.data + last_offset)));
236
0
            }
237
43
        }
238
43
        dst->insert_many_continuous_binary_data(_data.data, _offsets.data(), max_fetch);
239
240
43
        *n = max_fetch;
241
43
        return Status::OK();
242
43
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE27EE10next_batchEPmRNS_3COWINS_7IColumnEE11mutable_ptrIS6_EE
243
244
    Status read_by_rowids(const rowid_t* rowids, ordinal_t page_first_ordinal, size_t* n,
245
558
                          MutableColumnPtr& dst) override {
246
558
        DCHECK(_parsed);
247
558
        if (*n == 0) [[unlikely]] {
248
0
            *n = 0;
249
0
            return Status::OK();
250
0
        }
251
252
558
        auto total = *n;
253
254
558
        if (_options.only_read_offsets) {
255
            // OFFSET_ONLY mode: read string lengths from page offset trailer
256
            // without copying actual char data. This allows length() to work.
257
0
            size_t read_count = 0;
258
0
            _offsets.resize(total);
259
0
            for (size_t i = 0; i < total; ++i) {
260
0
                ordinal_t ord = rowids[i] - page_first_ordinal;
261
0
                if (UNLIKELY(ord >= _num_elems)) {
262
0
                    break;
263
0
                }
264
0
                uint32_t str_start = offset(ord);
265
0
                uint32_t str_end = offset(ord + 1);
266
0
                _offsets[read_count] = str_end - str_start;
267
0
                read_count++;
268
0
            }
269
0
            if (read_count > 0) {
270
0
                dst->insert_offsets_from_lengths(_offsets.data(), read_count);
271
0
            }
272
0
            *n = read_count;
273
0
            return Status::OK();
274
0
        }
275
276
558
        size_t read_count = 0;
277
558
        _binary_data.resize(total);
278
2.51k
        for (size_t i = 0; i < total; ++i) {
279
1.96k
            ordinal_t ord = rowids[i] - page_first_ordinal;
280
1.96k
            if (UNLIKELY(ord >= _num_elems)) {
281
0
                break;
282
0
            }
283
284
1.96k
            const uint32_t start_offset = offset(ord);
285
1.96k
            _binary_data[read_count].data = _data.mutable_data() + start_offset;
286
1.96k
            _binary_data[read_count].size = offset(ord + 1) - start_offset;
287
1.96k
            read_count++;
288
1.96k
        }
289
290
558
        if (LIKELY(read_count > 0)) {
291
558
            dst->insert_many_strings(_binary_data.data(), read_count);
292
558
        }
293
294
558
        *n = read_count;
295
558
        return Status::OK();
296
558
    }
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE17EE14read_by_rowidsEPKjmPmRNS_3COWINS_7IColumnEE11mutable_ptrIS8_EE
Line
Count
Source
245
556
                          MutableColumnPtr& dst) override {
246
556
        DCHECK(_parsed);
247
556
        if (*n == 0) [[unlikely]] {
248
0
            *n = 0;
249
0
            return Status::OK();
250
0
        }
251
252
556
        auto total = *n;
253
254
556
        if (_options.only_read_offsets) {
255
            // OFFSET_ONLY mode: read string lengths from page offset trailer
256
            // without copying actual char data. This allows length() to work.
257
0
            size_t read_count = 0;
258
0
            _offsets.resize(total);
259
0
            for (size_t i = 0; i < total; ++i) {
260
0
                ordinal_t ord = rowids[i] - page_first_ordinal;
261
0
                if (UNLIKELY(ord >= _num_elems)) {
262
0
                    break;
263
0
                }
264
0
                uint32_t str_start = offset(ord);
265
0
                uint32_t str_end = offset(ord + 1);
266
0
                _offsets[read_count] = str_end - str_start;
267
0
                read_count++;
268
0
            }
269
0
            if (read_count > 0) {
270
0
                dst->insert_offsets_from_lengths(_offsets.data(), read_count);
271
0
            }
272
0
            *n = read_count;
273
0
            return Status::OK();
274
0
        }
275
276
556
        size_t read_count = 0;
277
556
        _binary_data.resize(total);
278
2.50k
        for (size_t i = 0; i < total; ++i) {
279
1.95k
            ordinal_t ord = rowids[i] - page_first_ordinal;
280
1.95k
            if (UNLIKELY(ord >= _num_elems)) {
281
0
                break;
282
0
            }
283
284
1.95k
            const uint32_t start_offset = offset(ord);
285
1.95k
            _binary_data[read_count].data = _data.mutable_data() + start_offset;
286
1.95k
            _binary_data[read_count].size = offset(ord + 1) - start_offset;
287
1.95k
            read_count++;
288
1.95k
        }
289
290
556
        if (LIKELY(read_count > 0)) {
291
556
            dst->insert_many_strings(_binary_data.data(), read_count);
292
556
        }
293
294
556
        *n = read_count;
295
556
        return Status::OK();
296
556
    }
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE26EE14read_by_rowidsEPKjmPmRNS_3COWINS_7IColumnEE11mutable_ptrIS8_EE
Line
Count
Source
245
1
                          MutableColumnPtr& dst) override {
246
1
        DCHECK(_parsed);
247
1
        if (*n == 0) [[unlikely]] {
248
0
            *n = 0;
249
0
            return Status::OK();
250
0
        }
251
252
1
        auto total = *n;
253
254
1
        if (_options.only_read_offsets) {
255
            // OFFSET_ONLY mode: read string lengths from page offset trailer
256
            // without copying actual char data. This allows length() to work.
257
0
            size_t read_count = 0;
258
0
            _offsets.resize(total);
259
0
            for (size_t i = 0; i < total; ++i) {
260
0
                ordinal_t ord = rowids[i] - page_first_ordinal;
261
0
                if (UNLIKELY(ord >= _num_elems)) {
262
0
                    break;
263
0
                }
264
0
                uint32_t str_start = offset(ord);
265
0
                uint32_t str_end = offset(ord + 1);
266
0
                _offsets[read_count] = str_end - str_start;
267
0
                read_count++;
268
0
            }
269
0
            if (read_count > 0) {
270
0
                dst->insert_offsets_from_lengths(_offsets.data(), read_count);
271
0
            }
272
0
            *n = read_count;
273
0
            return Status::OK();
274
0
        }
275
276
1
        size_t read_count = 0;
277
1
        _binary_data.resize(total);
278
5
        for (size_t i = 0; i < total; ++i) {
279
4
            ordinal_t ord = rowids[i] - page_first_ordinal;
280
4
            if (UNLIKELY(ord >= _num_elems)) {
281
0
                break;
282
0
            }
283
284
4
            const uint32_t start_offset = offset(ord);
285
4
            _binary_data[read_count].data = _data.mutable_data() + start_offset;
286
4
            _binary_data[read_count].size = offset(ord + 1) - start_offset;
287
4
            read_count++;
288
4
        }
289
290
1
        if (LIKELY(read_count > 0)) {
291
1
            dst->insert_many_strings(_binary_data.data(), read_count);
292
1
        }
293
294
1
        *n = read_count;
295
1
        return Status::OK();
296
1
    }
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE13EE14read_by_rowidsEPKjmPmRNS_3COWINS_7IColumnEE11mutable_ptrIS8_EE
Line
Count
Source
245
1
                          MutableColumnPtr& dst) override {
246
1
        DCHECK(_parsed);
247
1
        if (*n == 0) [[unlikely]] {
248
0
            *n = 0;
249
0
            return Status::OK();
250
0
        }
251
252
1
        auto total = *n;
253
254
1
        if (_options.only_read_offsets) {
255
            // OFFSET_ONLY mode: read string lengths from page offset trailer
256
            // without copying actual char data. This allows length() to work.
257
0
            size_t read_count = 0;
258
0
            _offsets.resize(total);
259
0
            for (size_t i = 0; i < total; ++i) {
260
0
                ordinal_t ord = rowids[i] - page_first_ordinal;
261
0
                if (UNLIKELY(ord >= _num_elems)) {
262
0
                    break;
263
0
                }
264
0
                uint32_t str_start = offset(ord);
265
0
                uint32_t str_end = offset(ord + 1);
266
0
                _offsets[read_count] = str_end - str_start;
267
0
                read_count++;
268
0
            }
269
0
            if (read_count > 0) {
270
0
                dst->insert_offsets_from_lengths(_offsets.data(), read_count);
271
0
            }
272
0
            *n = read_count;
273
0
            return Status::OK();
274
0
        }
275
276
1
        size_t read_count = 0;
277
1
        _binary_data.resize(total);
278
5
        for (size_t i = 0; i < total; ++i) {
279
4
            ordinal_t ord = rowids[i] - page_first_ordinal;
280
4
            if (UNLIKELY(ord >= _num_elems)) {
281
0
                break;
282
0
            }
283
284
4
            const uint32_t start_offset = offset(ord);
285
4
            _binary_data[read_count].data = _data.mutable_data() + start_offset;
286
4
            _binary_data[read_count].size = offset(ord + 1) - start_offset;
287
4
            read_count++;
288
4
        }
289
290
1
        if (LIKELY(read_count > 0)) {
291
1
            dst->insert_many_strings(_binary_data.data(), read_count);
292
1
        }
293
294
1
        *n = read_count;
295
1
        return Status::OK();
296
1
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE36EE14read_by_rowidsEPKjmPmRNS_3COWINS_7IColumnEE11mutable_ptrIS8_EE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE34EE14read_by_rowidsEPKjmPmRNS_3COWINS_7IColumnEE11mutable_ptrIS8_EE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE35EE14read_by_rowidsEPKjmPmRNS_3COWINS_7IColumnEE11mutable_ptrIS8_EE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE23EE14read_by_rowidsEPKjmPmRNS_3COWINS_7IColumnEE11mutable_ptrIS8_EE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE25EE14read_by_rowidsEPKjmPmRNS_3COWINS_7IColumnEE11mutable_ptrIS8_EE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE27EE14read_by_rowidsEPKjmPmRNS_3COWINS_7IColumnEE11mutable_ptrIS8_EE
297
298
5.62k
    size_t count() const override {
299
5.62k
        DCHECK(_parsed);
300
5.62k
        return _num_elems;
301
5.62k
    }
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE17EE5countEv
Line
Count
Source
298
45
    size_t count() const override {
299
        DCHECK(_parsed);
300
45
        return _num_elems;
301
45
    }
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE26EE5countEv
Line
Count
Source
298
5.34k
    size_t count() const override {
299
        DCHECK(_parsed);
300
5.34k
        return _num_elems;
301
5.34k
    }
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE13EE5countEv
Line
Count
Source
298
7
    size_t count() const override {
299
        DCHECK(_parsed);
300
7
        return _num_elems;
301
7
    }
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE36EE5countEv
Line
Count
Source
298
1
    size_t count() const override {
299
        DCHECK(_parsed);
300
1
        return _num_elems;
301
1
    }
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE34EE5countEv
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE35EE5countEv
Line
Count
Source
298
234
    size_t count() const override {
299
        DCHECK(_parsed);
300
234
        return _num_elems;
301
234
    }
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE23EE5countEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE25EE5countEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE27EE5countEv
302
303
146
    size_t current_index() const override {
304
146
        DCHECK(_parsed);
305
146
        return _cur_idx;
306
146
    }
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE17EE13current_indexEv
Line
Count
Source
303
95
    size_t current_index() const override {
304
        DCHECK(_parsed);
305
95
        return _cur_idx;
306
95
    }
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE26EE13current_indexEv
Line
Count
Source
303
4
    size_t current_index() const override {
304
        DCHECK(_parsed);
305
4
        return _cur_idx;
306
4
    }
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE13EE13current_indexEv
Line
Count
Source
303
4
    size_t current_index() const override {
304
        DCHECK(_parsed);
305
4
        return _cur_idx;
306
4
    }
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE36EE13current_indexEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE34EE13current_indexEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE35EE13current_indexEv
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE23EE13current_indexEv
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE25EE13current_indexEv
Line
Count
Source
303
43
    size_t current_index() const override {
304
        DCHECK(_parsed);
305
43
        return _cur_idx;
306
43
    }
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE27EE13current_indexEv
307
308
2.79k
    Status get_dict_word_info(StringRef* dict_word_info) override {
309
2.79k
        if (UNLIKELY(_num_elems <= 0)) {
310
0
            return Status::OK();
311
0
        }
312
313
2.79k
        char* data_begin = (char*)&_data[0];
314
2.79k
        char* offset_ptr = (char*)&_data[_offsets_pos];
315
316
76.6k
        for (uint32_t i = 0; i < _num_elems; ++i) {
317
73.8k
            uint32_t offset = decode_fixed32_le((uint8_t*)offset_ptr);
318
73.8k
            if (offset > _offsets_pos) {
319
0
                return Status::Corruption(
320
0
                        "file corruption: offsets pos beyonds data_size: {}, num_element: {}"
321
0
                        ", offset_pos: {}, offset: {}",
322
0
                        _data.size, _num_elems, _offsets_pos, offset);
323
0
            }
324
73.8k
            dict_word_info[i].data = data_begin + offset;
325
73.8k
            offset_ptr += sizeof(uint32_t);
326
73.8k
        }
327
328
73.8k
        for (int i = 0; i < (int)_num_elems - 1; ++i) {
329
71.0k
            dict_word_info[i].size =
330
71.0k
                    (char*)dict_word_info[i + 1].data - (char*)dict_word_info[i].data;
331
71.0k
        }
332
333
2.79k
        dict_word_info[_num_elems - 1].size =
334
2.79k
                (data_begin + _offsets_pos) - (char*)dict_word_info[_num_elems - 1].data;
335
2.79k
        return Status::OK();
336
2.79k
    }
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE17EE18get_dict_word_infoEPNS_9StringRefE
Line
Count
Source
308
9
    Status get_dict_word_info(StringRef* dict_word_info) override {
309
9
        if (UNLIKELY(_num_elems <= 0)) {
310
0
            return Status::OK();
311
0
        }
312
313
9
        char* data_begin = (char*)&_data[0];
314
9
        char* offset_ptr = (char*)&_data[_offsets_pos];
315
316
3.27k
        for (uint32_t i = 0; i < _num_elems; ++i) {
317
3.26k
            uint32_t offset = decode_fixed32_le((uint8_t*)offset_ptr);
318
3.26k
            if (offset > _offsets_pos) {
319
0
                return Status::Corruption(
320
0
                        "file corruption: offsets pos beyonds data_size: {}, num_element: {}"
321
0
                        ", offset_pos: {}, offset: {}",
322
0
                        _data.size, _num_elems, _offsets_pos, offset);
323
0
            }
324
3.26k
            dict_word_info[i].data = data_begin + offset;
325
3.26k
            offset_ptr += sizeof(uint32_t);
326
3.26k
        }
327
328
3.26k
        for (int i = 0; i < (int)_num_elems - 1; ++i) {
329
3.25k
            dict_word_info[i].size =
330
3.25k
                    (char*)dict_word_info[i + 1].data - (char*)dict_word_info[i].data;
331
3.25k
        }
332
333
9
        dict_word_info[_num_elems - 1].size =
334
9
                (data_begin + _offsets_pos) - (char*)dict_word_info[_num_elems - 1].data;
335
9
        return Status::OK();
336
9
    }
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE26EE18get_dict_word_infoEPNS_9StringRefE
Line
Count
Source
308
2.66k
    Status get_dict_word_info(StringRef* dict_word_info) override {
309
2.66k
        if (UNLIKELY(_num_elems <= 0)) {
310
0
            return Status::OK();
311
0
        }
312
313
2.66k
        char* data_begin = (char*)&_data[0];
314
2.66k
        char* offset_ptr = (char*)&_data[_offsets_pos];
315
316
73.1k
        for (uint32_t i = 0; i < _num_elems; ++i) {
317
70.4k
            uint32_t offset = decode_fixed32_le((uint8_t*)offset_ptr);
318
70.4k
            if (offset > _offsets_pos) {
319
0
                return Status::Corruption(
320
0
                        "file corruption: offsets pos beyonds data_size: {}, num_element: {}"
321
0
                        ", offset_pos: {}, offset: {}",
322
0
                        _data.size, _num_elems, _offsets_pos, offset);
323
0
            }
324
70.4k
            dict_word_info[i].data = data_begin + offset;
325
70.4k
            offset_ptr += sizeof(uint32_t);
326
70.4k
        }
327
328
70.4k
        for (int i = 0; i < (int)_num_elems - 1; ++i) {
329
67.8k
            dict_word_info[i].size =
330
67.8k
                    (char*)dict_word_info[i + 1].data - (char*)dict_word_info[i].data;
331
67.8k
        }
332
333
2.66k
        dict_word_info[_num_elems - 1].size =
334
2.66k
                (data_begin + _offsets_pos) - (char*)dict_word_info[_num_elems - 1].data;
335
2.66k
        return Status::OK();
336
2.66k
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE13EE18get_dict_word_infoEPNS_9StringRefE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE36EE18get_dict_word_infoEPNS_9StringRefE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE34EE18get_dict_word_infoEPNS_9StringRefE
_ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE35EE18get_dict_word_infoEPNS_9StringRefE
Line
Count
Source
308
117
    Status get_dict_word_info(StringRef* dict_word_info) override {
309
117
        if (UNLIKELY(_num_elems <= 0)) {
310
0
            return Status::OK();
311
0
        }
312
313
117
        char* data_begin = (char*)&_data[0];
314
117
        char* offset_ptr = (char*)&_data[_offsets_pos];
315
316
234
        for (uint32_t i = 0; i < _num_elems; ++i) {
317
117
            uint32_t offset = decode_fixed32_le((uint8_t*)offset_ptr);
318
117
            if (offset > _offsets_pos) {
319
0
                return Status::Corruption(
320
0
                        "file corruption: offsets pos beyonds data_size: {}, num_element: {}"
321
0
                        ", offset_pos: {}, offset: {}",
322
0
                        _data.size, _num_elems, _offsets_pos, offset);
323
0
            }
324
117
            dict_word_info[i].data = data_begin + offset;
325
117
            offset_ptr += sizeof(uint32_t);
326
117
        }
327
328
117
        for (int i = 0; i < (int)_num_elems - 1; ++i) {
329
0
            dict_word_info[i].size =
330
0
                    (char*)dict_word_info[i + 1].data - (char*)dict_word_info[i].data;
331
0
        }
332
333
117
        dict_word_info[_num_elems - 1].size =
334
117
                (data_begin + _offsets_pos) - (char*)dict_word_info[_num_elems - 1].data;
335
117
        return Status::OK();
336
117
    }
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE23EE18get_dict_word_infoEPNS_9StringRefE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE25EE18get_dict_word_infoEPNS_9StringRefE
Unexecuted instantiation: _ZN5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE27EE18get_dict_word_infoEPNS_9StringRefE
337
338
private:
339
    static constexpr size_t SIZE_OF_INT32 = sizeof(uint32_t);
340
    // Return the offset within '_data' where the string value with index 'idx' can be found.
341
5.60k
    uint32_t offset(size_t idx) const {
342
5.60k
        if (idx >= _num_elems) {
343
2.13k
            return _offsets_pos;
344
2.13k
        }
345
3.47k
        return guarded_offset(idx);
346
5.60k
    }
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE17EE6offsetEm
Line
Count
Source
341
5.52k
    uint32_t offset(size_t idx) const {
342
5.52k
        if (idx >= _num_elems) {
343
2.09k
            return _offsets_pos;
344
2.09k
        }
345
3.42k
        return guarded_offset(idx);
346
5.52k
    }
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE26EE6offsetEm
Line
Count
Source
341
15
    uint32_t offset(size_t idx) const {
342
15
        if (idx >= _num_elems) {
343
6
            return _offsets_pos;
344
6
        }
345
9
        return guarded_offset(idx);
346
15
    }
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE13EE6offsetEm
Line
Count
Source
341
19
    uint32_t offset(size_t idx) const {
342
19
        if (idx >= _num_elems) {
343
9
            return _offsets_pos;
344
9
        }
345
10
        return guarded_offset(idx);
346
19
    }
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE36EE6offsetEm
Line
Count
Source
341
1
    uint32_t offset(size_t idx) const {
342
1
        if (idx >= _num_elems) {
343
1
            return _offsets_pos;
344
1
        }
345
0
        return guarded_offset(idx);
346
1
    }
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE34EE6offsetEm
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE35EE6offsetEm
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE23EE6offsetEm
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE25EE6offsetEm
Line
Count
Source
341
43
    uint32_t offset(size_t idx) const {
342
43
        if (idx >= _num_elems) {
343
21
            return _offsets_pos;
344
21
        }
345
22
        return guarded_offset(idx);
346
43
    }
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE27EE6offsetEm
347
348
459k
    uint32_t guarded_offset(size_t idx) const {
349
459k
        const auto* p =
350
459k
                reinterpret_cast<const uint8_t*>(&_data[_offsets_pos + idx * SIZE_OF_INT32]);
351
459k
        return decode_fixed32_le(p);
352
459k
    }
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE17EE14guarded_offsetEm
Line
Count
Source
348
459k
    uint32_t guarded_offset(size_t idx) const {
349
459k
        const auto* p =
350
459k
                reinterpret_cast<const uint8_t*>(&_data[_offsets_pos + idx * SIZE_OF_INT32]);
351
459k
        return decode_fixed32_le(p);
352
459k
    }
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE26EE14guarded_offsetEm
Line
Count
Source
348
27
    uint32_t guarded_offset(size_t idx) const {
349
27
        const auto* p =
350
27
                reinterpret_cast<const uint8_t*>(&_data[_offsets_pos + idx * SIZE_OF_INT32]);
351
27
        return decode_fixed32_le(p);
352
27
    }
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE13EE14guarded_offsetEm
Line
Count
Source
348
46
    uint32_t guarded_offset(size_t idx) const {
349
46
        const auto* p =
350
46
                reinterpret_cast<const uint8_t*>(&_data[_offsets_pos + idx * SIZE_OF_INT32]);
351
46
        return decode_fixed32_le(p);
352
46
    }
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE36EE14guarded_offsetEm
Line
Count
Source
348
4
    uint32_t guarded_offset(size_t idx) const {
349
4
        const auto* p =
350
4
                reinterpret_cast<const uint8_t*>(&_data[_offsets_pos + idx * SIZE_OF_INT32]);
351
4
        return decode_fixed32_le(p);
352
4
    }
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE34EE14guarded_offsetEm
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE35EE14guarded_offsetEm
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE23EE14guarded_offsetEm
_ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE25EE14guarded_offsetEm
Line
Count
Source
348
65
    uint32_t guarded_offset(size_t idx) const {
349
65
        const auto* p =
350
65
                reinterpret_cast<const uint8_t*>(&_data[_offsets_pos + idx * SIZE_OF_INT32]);
351
65
        return decode_fixed32_le(p);
352
65
    }
Unexecuted instantiation: _ZNK5doris10segment_v222BinaryPlainPageDecoderILNS_9FieldTypeE27EE14guarded_offsetEm
353
354
    Slice _data;
355
    PageDecoderOptions _options;
356
    bool _parsed;
357
358
    uint32_t _num_elems;
359
    uint32_t _offsets_pos;
360
361
    std::vector<uint32_t> _offsets;
362
    std::vector<StringRef> _binary_data;
363
364
    // Index of the currently seeked element in the page.
365
    size_t _cur_idx;
366
    friend class BinaryDictPageDecoder;
367
    friend class FileColumnIterator;
368
};
369
370
} // namespace segment_v2
371
} // namespace doris