be/src/util/jsonb_document.h
Line | Count | Source |
1 | | /* |
2 | | * Copyright (c) 2014, Facebook, Inc. |
3 | | * All rights reserved. |
4 | | * |
5 | | * This source code is licensed under the BSD-style license found in the |
6 | | * LICENSE file in the root directory of this source tree. An additional grant |
7 | | * of patent rights can be found in the PATENTS file in the same directory. |
8 | | * |
9 | | */ |
10 | | |
11 | | /* |
12 | | * This header defines JsonbDocument, JsonbKeyValue, and various value classes |
13 | | * which are derived from JsonbValue, and a forward iterator for container |
14 | | * values - essentially everything that is related to JSONB binary data |
15 | | * structures. |
16 | | * |
17 | | * Implementation notes: |
18 | | * |
19 | | * None of the classes in this header file can be instantiated directly (i.e. |
20 | | * you cannot create a JsonbKeyValue or JsonbValue object - all constructors |
21 | | * are declared non-public). We use the classes as wrappers on the packed JSONB |
22 | | * bytes (serialized), and cast the classes (types) to the underlying packed |
23 | | * byte array. |
24 | | * |
25 | | * For the same reason, we cannot define any JSONB value class to be virtual, |
26 | | * since we never call constructors, and will not instantiate vtbl and vptrs. |
27 | | * |
28 | | * Therefore, the classes are defined as packed structures (i.e. no data |
29 | | * alignment and padding), and the private member variables of the classes are |
30 | | * defined precisely in the same order as the JSONB spec. This ensures we |
31 | | * access the packed JSONB bytes correctly. |
32 | | * |
33 | | * The packed structures are highly optimized for in-place operations with low |
34 | | * overhead. The reads (and in-place writes) are performed directly on packed |
35 | | * bytes. There is no memory allocation at all at runtime. |
36 | | * |
37 | | * For updates/writes of values that will expand the original JSONB size, the |
38 | | * write will fail, and the caller needs to handle buffer increase. |
39 | | * |
40 | | * ** Iterator ** |
41 | | * Both ObjectVal class and ArrayVal class have iterator type that you can use |
42 | | * to declare an iterator on a container object to go through the key-value |
43 | | * pairs or value list. The iterator has both non-const and const types. |
44 | | * |
45 | | * Note: iterators are forward direction only. |
46 | | * |
47 | | * ** Query ** |
48 | | * Querying into containers is through the member functions find (for key/value |
49 | | * pairs) and get (for array elements), and is in streaming style. We don't |
50 | | * need to read/scan the whole JSONB packed bytes in order to return results. |
51 | | * Once the key/index is found, we will stop search. You can use text to query |
52 | | * both objects and array (for array, text will be converted to integer index), |
53 | | * and use index to retrieve from array. Array index is 0-based. |
54 | | * |
55 | | * ** External dictionary ** |
56 | | * During query processing, you can also pass a call-back function, so the |
57 | | * search will first try to check if the key string exists in the dictionary. |
58 | | * If so, search will be based on the id instead of the key string. |
59 | | * @author Tian Xia <tianx@fb.com> |
60 | | * |
61 | | * this file is copied from |
62 | | * https://github.com/facebook/mysql-5.6/blob/fb-mysql-5.6.35/fbson/FbsonDocument.h |
63 | | * and modified by Doris |
64 | | */ |
65 | | |
66 | | #ifndef JSONB_JSONBDOCUMENT_H |
67 | | #define JSONB_JSONBDOCUMENT_H |
68 | | |
69 | | #include <algorithm> |
70 | | #include <array> |
71 | | #include <cctype> |
72 | | #include <charconv> |
73 | | #include <cmath> |
74 | | #include <cstddef> |
75 | | #include <cstdint> |
76 | | #include <limits> |
77 | | #include <string> |
78 | | #include <string_view> |
79 | | #include <type_traits> |
80 | | |
81 | | #include "common/compiler_util.h" // IWYU pragma: keep |
82 | | #include "common/status.h" |
83 | | #include "core/data_type/define_primitive_type.h" |
84 | | #include "core/string_ref.h" |
85 | | #include "core/types.h" |
86 | | #include "util/string_util.h" |
87 | | |
88 | | // #include "util/string_parser.hpp" |
89 | | |
90 | | // Concept to check for supported decimal types |
91 | | template <typename T> |
92 | | concept JsonbDecimalType = |
93 | | std::same_as<T, doris::Decimal256> || std::same_as<T, doris::Decimal64> || |
94 | | std::same_as<T, doris::Decimal128V3> || std::same_as<T, doris::Decimal32>; |
95 | | |
96 | | namespace doris { |
97 | | |
98 | | template <typename T> |
99 | | constexpr bool is_pod_v = std::is_trivial_v<T> && std::is_standard_layout_v<T>; |
100 | | |
101 | | struct JsonbStringVal; |
102 | | struct ObjectVal; |
103 | | struct ArrayVal; |
104 | | struct JsonbBinaryVal; |
105 | | struct ContainerVal; |
106 | | |
107 | | template <JsonbDecimalType T> |
108 | | struct JsonbDecimalVal; |
109 | | |
110 | | using JsonbDecimal256 = JsonbDecimalVal<Decimal256>; |
111 | | using JsonbDecimal128 = JsonbDecimalVal<Decimal128V3>; |
112 | | using JsonbDecimal64 = JsonbDecimalVal<Decimal64>; |
113 | | using JsonbDecimal32 = JsonbDecimalVal<Decimal32>; |
114 | | |
115 | | template <typename T> |
116 | | requires std::is_integral_v<T> || std::is_floating_point_v<T> |
117 | | struct NumberValT; |
118 | | |
119 | | using JsonbInt8Val = NumberValT<int8_t>; |
120 | | using JsonbInt16Val = NumberValT<int16_t>; |
121 | | using JsonbInt32Val = NumberValT<int32_t>; |
122 | | using JsonbInt64Val = NumberValT<int64_t>; |
123 | | using JsonbInt128Val = NumberValT<int128_t>; |
124 | | using JsonbDoubleVal = NumberValT<double>; |
125 | | using JsonbFloatVal = NumberValT<float>; |
126 | | |
127 | | template <typename T> |
128 | | concept JsonbPodType = (std::same_as<T, JsonbStringVal> || std::same_as<T, ObjectVal> || |
129 | | std::same_as<T, ContainerVal> || std::same_as<T, ArrayVal> || |
130 | | std::same_as<T, JsonbBinaryVal> || std::same_as<T, JsonbDecimal32> || |
131 | | std::same_as<T, JsonbDecimal64> || std::same_as<T, JsonbDecimal128> || |
132 | | std::same_as<T, JsonbDecimal256> || std::same_as<T, JsonbDecimal32> || |
133 | | std::same_as<T, JsonbInt8Val> || std::same_as<T, JsonbInt16Val> || |
134 | | std::same_as<T, JsonbInt32Val> || std::same_as<T, JsonbInt64Val> || |
135 | | std::same_as<T, JsonbInt128Val> || std::same_as<T, JsonbFloatVal> || |
136 | | std::same_as<T, JsonbFloatVal> || std::same_as<T, JsonbDoubleVal>); |
137 | | |
138 | 1.21M | #define JSONB_VER 1 |
139 | | |
140 | | using int128_t = __int128; |
141 | | |
142 | | // forward declaration |
143 | | struct JsonbValue; |
144 | | |
145 | | class JsonbOutStream; |
146 | | |
147 | | template <class OS_TYPE> |
148 | | class JsonbWriterT; |
149 | | |
150 | | using JsonbWriter = JsonbWriterT<JsonbOutStream>; |
151 | | |
152 | | const int MaxNestingLevel = 100; |
153 | | |
154 | | /* |
155 | | * JsonbType defines 10 primitive types and 2 container types, as described |
156 | | * below. |
157 | | * NOTE: Do NOT modify the existing values or their order in this enum. |
158 | | * You may only append new entries at the end before `NUM_TYPES`. |
159 | | * This enum will be used in serialized data and/or persisted data. |
160 | | * Changing existing values may break backward compatibility |
161 | | * with previously stored or transmitted data. |
162 | | * |
163 | | * primitive_value ::= |
164 | | * 0x00 //null value (0 byte) |
165 | | * | 0x01 //boolean true (0 byte) |
166 | | * | 0x02 //boolean false (0 byte) |
167 | | * | 0x03 int8 //char/int8 (1 byte) |
168 | | * | 0x04 int16 //int16 (2 bytes) |
169 | | * | 0x05 int32 //int32 (4 bytes) |
170 | | * | 0x06 int64 //int64 (8 bytes) |
171 | | * | 0x07 double //floating point (8 bytes) |
172 | | * | 0x08 string //variable length string |
173 | | * | 0x09 binary //variable length binary |
174 | | * |
175 | | * container ::= |
176 | | * 0x0A int32 key_value_list //object, int32 is the total bytes of the object |
177 | | * | 0x0B int32 value_list //array, int32 is the total bytes of the array |
178 | | */ |
179 | | enum class JsonbType : char { |
180 | | T_Null = 0x00, |
181 | | T_True = 0x01, |
182 | | T_False = 0x02, |
183 | | T_Int8 = 0x03, |
184 | | T_Int16 = 0x04, |
185 | | T_Int32 = 0x05, |
186 | | T_Int64 = 0x06, |
187 | | T_Double = 0x07, |
188 | | T_String = 0x08, |
189 | | T_Binary = 0x09, |
190 | | T_Object = 0x0A, |
191 | | T_Array = 0x0B, |
192 | | T_Int128 = 0x0C, |
193 | | T_Float = 0x0D, |
194 | | T_Decimal32 = 0x0E, // DecimalV3 only |
195 | | T_Decimal64 = 0x0F, // DecimalV3 only |
196 | | T_Decimal128 = 0x10, // DecimalV3 only |
197 | | T_Decimal256 = 0x11, // DecimalV3 only |
198 | | NUM_TYPES, |
199 | | }; |
200 | | |
201 | 11 | inline PrimitiveType get_primitive_type_from_json_type(JsonbType json_type) { |
202 | 11 | switch (json_type) { |
203 | 1 | case JsonbType::T_Null: |
204 | 1 | return TYPE_NULL; |
205 | 1 | case JsonbType::T_True: |
206 | 2 | case JsonbType::T_False: |
207 | 2 | return TYPE_BOOLEAN; |
208 | 0 | case JsonbType::T_Int8: |
209 | 0 | return TYPE_TINYINT; |
210 | 0 | case JsonbType::T_Int16: |
211 | 0 | return TYPE_SMALLINT; |
212 | 0 | case JsonbType::T_Int32: |
213 | 0 | return TYPE_INT; |
214 | 0 | case JsonbType::T_Int64: |
215 | 0 | return TYPE_BIGINT; |
216 | 0 | case JsonbType::T_Double: |
217 | 0 | return TYPE_DOUBLE; |
218 | 1 | case JsonbType::T_String: |
219 | 1 | return TYPE_STRING; |
220 | 0 | case JsonbType::T_Binary: |
221 | 0 | return TYPE_BINARY; |
222 | 0 | case JsonbType::T_Object: |
223 | 0 | return TYPE_STRUCT; |
224 | 1 | case JsonbType::T_Array: |
225 | 1 | return TYPE_ARRAY; |
226 | 1 | case JsonbType::T_Int128: |
227 | 1 | return TYPE_LARGEINT; |
228 | 1 | case JsonbType::T_Float: |
229 | 1 | return TYPE_FLOAT; |
230 | 1 | case JsonbType::T_Decimal32: |
231 | 1 | return TYPE_DECIMAL32; |
232 | 1 | case JsonbType::T_Decimal64: |
233 | 1 | return TYPE_DECIMAL64; |
234 | 1 | case JsonbType::T_Decimal128: |
235 | 1 | return TYPE_DECIMAL128I; |
236 | 1 | case JsonbType::T_Decimal256: |
237 | 1 | return TYPE_DECIMAL256; |
238 | 0 | default: |
239 | 0 | throw Exception(ErrorCode::INTERNAL_ERROR, "Unsupported JsonbType: {}", |
240 | 0 | static_cast<int>(json_type)); |
241 | 11 | } |
242 | 11 | } |
243 | | |
244 | | //for parse json path |
245 | | constexpr char SCOPE = '$'; |
246 | | constexpr char BEGIN_MEMBER = '.'; |
247 | | constexpr char BEGIN_ARRAY = '['; |
248 | | constexpr char END_ARRAY = ']'; |
249 | | constexpr char DOUBLE_QUOTE = '"'; |
250 | | constexpr char WILDCARD = '*'; |
251 | | constexpr char MINUS = '-'; |
252 | | constexpr char LAST[] = "last"; |
253 | | constexpr char ESCAPE = '\\'; |
254 | | constexpr unsigned int MEMBER_CODE = 0; |
255 | | constexpr unsigned int ARRAY_CODE = 1; |
256 | | |
257 | | /// A simple input stream class for the JSON path parser. |
258 | | class Stream { |
259 | | public: |
260 | | /// Creates an input stream reading from a character string. |
261 | | /// @param string the input string |
262 | | /// @param length the length of the input string |
263 | 109 | Stream(const char* string, size_t length) : m_position(string), m_end(string + length) {} |
264 | | |
265 | | /// Returns a pointer to the current position in the stream. |
266 | 99 | const char* position() const { return m_position; } |
267 | | |
268 | | /// Returns a pointer to the position just after the end of the stream. |
269 | 0 | const char* end() const { return m_end; } |
270 | | |
271 | | /// Returns the number of bytes remaining in the stream. |
272 | 2.01k | size_t remaining() const { |
273 | 2.01k | assert(m_position <= m_end); |
274 | 2.01k | return m_end - m_position; |
275 | 2.01k | } |
276 | | |
277 | | /// Tells if the stream has been exhausted. |
278 | 1.84k | bool exhausted() const { return remaining() == 0; } |
279 | | |
280 | | /// Reads the next byte from the stream and moves the position forward. |
281 | 101 | char read() { |
282 | 101 | assert(!exhausted()); |
283 | 101 | return *m_position++; |
284 | 101 | } |
285 | | |
286 | | /// Reads the next byte from the stream without moving the position forward. |
287 | 986 | char peek() const { |
288 | 986 | assert(!exhausted()); |
289 | 986 | return *m_position; |
290 | 986 | } |
291 | | |
292 | | /// Moves the position to the next non-whitespace character. |
293 | 365 | void skip_whitespace() { |
294 | 365 | m_position = std::find_if_not(m_position, m_end, [](char c) { return std::isspace(c); }); |
295 | 365 | } |
296 | | |
297 | | /// Moves the position n bytes forward. |
298 | 169 | void skip(size_t n) { |
299 | 169 | assert(remaining() >= n); |
300 | 169 | m_position += n; |
301 | 169 | skip_whitespace(); |
302 | 169 | } |
303 | | |
304 | 160 | void advance() { m_position++; } |
305 | | |
306 | 200 | void clear_leg_ptr() { leg_ptr = nullptr; } |
307 | | |
308 | 105 | void set_leg_ptr(char* ptr) { |
309 | 105 | clear_leg_ptr(); |
310 | 105 | leg_ptr = ptr; |
311 | 105 | } |
312 | | |
313 | 132 | char* get_leg_ptr() { return leg_ptr; } |
314 | | |
315 | 103 | void clear_leg_len() { leg_len = 0; } |
316 | | |
317 | 245 | void add_leg_len() { leg_len++; } |
318 | | |
319 | 198 | unsigned int get_leg_len() const { return leg_len; } |
320 | | |
321 | 10 | void remove_escapes() { |
322 | 10 | unsigned int new_len = 0; |
323 | 78 | for (unsigned int i = 0; i < leg_len; ++i) { |
324 | 69 | if (leg_ptr[i] != ESCAPE) { |
325 | 41 | leg_ptr[new_len++] = leg_ptr[i]; |
326 | 41 | continue; |
327 | 41 | } |
328 | | |
329 | 28 | ++i; |
330 | 28 | if (i >= leg_len) { |
331 | 1 | break; |
332 | 1 | } |
333 | | |
334 | 27 | switch (leg_ptr[i]) { |
335 | 2 | case 'b': |
336 | 2 | leg_ptr[new_len++] = '\b'; |
337 | 2 | break; |
338 | 2 | case 'f': |
339 | 2 | leg_ptr[new_len++] = '\f'; |
340 | 2 | break; |
341 | 2 | case 'n': |
342 | 2 | leg_ptr[new_len++] = '\n'; |
343 | 2 | break; |
344 | 2 | case 'r': |
345 | 2 | leg_ptr[new_len++] = '\r'; |
346 | 2 | break; |
347 | 2 | case 't': |
348 | 2 | leg_ptr[new_len++] = '\t'; |
349 | 2 | break; |
350 | 11 | case 'u': { |
351 | 11 | if (i + 4 >= leg_len || leg_ptr[i + 1] != '0' || leg_ptr[i + 2] != '0') { |
352 | 2 | leg_ptr[new_len++] = leg_ptr[i]; |
353 | 2 | break; |
354 | 2 | } |
355 | | |
356 | 18 | auto hex_to_int = [](char c) -> int { |
357 | 18 | if (c >= '0' && c <= '9') { |
358 | 12 | return c - '0'; |
359 | 12 | } |
360 | 6 | if (c >= 'a' && c <= 'f') { |
361 | 2 | return c - 'a' + 10; |
362 | 2 | } |
363 | 4 | if (c >= 'A' && c <= 'F') { |
364 | 1 | return c - 'A' + 10; |
365 | 1 | } |
366 | 3 | return -1; |
367 | 4 | }; |
368 | 9 | int high = hex_to_int(leg_ptr[i + 3]); |
369 | 9 | int low = hex_to_int(leg_ptr[i + 4]); |
370 | 9 | if (high < 0 || low < 0) { |
371 | 3 | leg_ptr[new_len++] = leg_ptr[i]; |
372 | 3 | break; |
373 | 3 | } |
374 | 6 | leg_ptr[new_len++] = static_cast<char>((high << 4) | low); |
375 | 6 | i += 4; |
376 | 6 | break; |
377 | 9 | } |
378 | 6 | default: |
379 | 6 | leg_ptr[new_len++] = leg_ptr[i]; |
380 | 6 | break; |
381 | 27 | } |
382 | 27 | } |
383 | 10 | leg_ptr[new_len] = '\0'; |
384 | 10 | leg_len = new_len; |
385 | 10 | } |
386 | | |
387 | 10 | void set_has_escapes(bool has) { has_escapes = has; } |
388 | | |
389 | 37 | bool get_has_escapes() const { return has_escapes; } |
390 | | |
391 | | private: |
392 | | /// The current position in the stream. |
393 | | const char* m_position = nullptr; |
394 | | |
395 | | /// The end of the stream. |
396 | | const char* const m_end; |
397 | | |
398 | | ///path leg ptr |
399 | | char* leg_ptr = nullptr; |
400 | | |
401 | | ///path leg len |
402 | | unsigned int leg_len; |
403 | | |
404 | | ///Whether to contain escape characters |
405 | | bool has_escapes = false; |
406 | | }; |
407 | | |
408 | | struct leg_info { |
409 | | ///path leg ptr |
410 | | char* leg_ptr = nullptr; |
411 | | |
412 | | ///path leg len |
413 | | unsigned int leg_len; |
414 | | |
415 | | ///array_index |
416 | | int array_index; |
417 | | |
418 | | ///type: 0 is member 1 is array |
419 | | unsigned int type; |
420 | | |
421 | | // NOLINTNEXTLINE(readability-non-const-parameter): str is an output parameter. |
422 | 4 | bool to_string(std::string* str) const { |
423 | 4 | if (type == MEMBER_CODE) { |
424 | 4 | str->push_back(BEGIN_MEMBER); |
425 | 4 | bool contains_space = false; |
426 | 4 | std::string tmp; |
427 | 46 | for (auto* it = leg_ptr; it != (leg_ptr + leg_len); ++it) { |
428 | 42 | auto c = static_cast<unsigned char>(*it); |
429 | 42 | if (std::isspace(c)) { |
430 | 8 | contains_space = true; |
431 | 8 | } |
432 | | |
433 | 42 | switch (*it) { |
434 | 2 | case '"': |
435 | 2 | tmp.append("\\\""); |
436 | 2 | break; |
437 | 2 | case ESCAPE: |
438 | 2 | tmp.append("\\\\"); |
439 | 2 | break; |
440 | 2 | case '\b': |
441 | 2 | tmp.append("\\b"); |
442 | 2 | break; |
443 | 2 | case '\f': |
444 | 2 | tmp.append("\\f"); |
445 | 2 | break; |
446 | 2 | case '\n': |
447 | 2 | tmp.append("\\n"); |
448 | 2 | break; |
449 | 2 | case '\r': |
450 | 2 | tmp.append("\\r"); |
451 | 2 | break; |
452 | 2 | case '\t': |
453 | 2 | tmp.append("\\t"); |
454 | 2 | break; |
455 | 28 | default: |
456 | 28 | if (c < 0x20) { |
457 | 6 | constexpr char hex[] = "0123456789abcdef"; |
458 | 6 | tmp.append("\\u00"); |
459 | 6 | tmp.push_back(hex[c >> 4]); |
460 | 6 | tmp.push_back(hex[c & 0x0F]); |
461 | 22 | } else { |
462 | 22 | tmp.push_back(*it); |
463 | 22 | } |
464 | 28 | break; |
465 | 42 | } |
466 | 42 | } |
467 | 4 | if (contains_space) { |
468 | 4 | str->push_back(DOUBLE_QUOTE); |
469 | 4 | } |
470 | 4 | str->append(tmp); |
471 | 4 | if (contains_space) { |
472 | 4 | str->push_back(DOUBLE_QUOTE); |
473 | 4 | } |
474 | 4 | return true; |
475 | 4 | } else if (type == ARRAY_CODE) { |
476 | 0 | str->push_back(BEGIN_ARRAY); |
477 | 0 | std::string int_str = std::to_string(array_index); |
478 | 0 | str->append(int_str); |
479 | 0 | str->push_back(END_ARRAY); |
480 | 0 | return true; |
481 | 0 | } else { |
482 | 0 | return false; |
483 | 0 | } |
484 | 4 | } |
485 | | }; |
486 | | |
487 | | class JsonbPath { |
488 | | public: |
489 | | // parse json path |
490 | | static bool parsePath(Stream* stream, JsonbPath* path); |
491 | | |
492 | | static bool parse_array(Stream* stream, JsonbPath* path); |
493 | | static bool parse_member(Stream* stream, JsonbPath* path); |
494 | | |
495 | | //return true if json path valid else return false |
496 | | bool seek(const char* string, size_t length); |
497 | | |
498 | 95 | void add_leg_to_leg_vector(std::unique_ptr<leg_info> leg) { |
499 | 95 | leg_vector.emplace_back(leg.release()); |
500 | 95 | } |
501 | | |
502 | 0 | void pop_leg_from_leg_vector() { leg_vector.pop_back(); } |
503 | | |
504 | | // NOLINTNEXTLINE(readability-non-const-parameter): res is an output parameter. |
505 | 2 | bool to_string(std::string* res) const { |
506 | 2 | res->push_back(SCOPE); |
507 | 2 | for (const auto& leg : leg_vector) { |
508 | 2 | auto valid = leg->to_string(res); |
509 | 2 | if (!valid) { |
510 | 0 | return false; |
511 | 0 | } |
512 | 2 | } |
513 | 2 | return true; |
514 | 2 | } |
515 | | |
516 | 187 | size_t get_leg_vector_size() const { return leg_vector.size(); } |
517 | | |
518 | 300 | leg_info* get_leg_from_leg_vector(size_t i) const { return leg_vector[i].get(); } |
519 | | |
520 | 3 | bool is_wildcard() const { return _is_wildcard; } |
521 | 99 | bool is_supper_wildcard() const { return _is_supper_wildcard; } |
522 | | |
523 | 6 | void clean() { leg_vector.clear(); } |
524 | | |
525 | | private: |
526 | | std::vector<std::unique_ptr<leg_info>> leg_vector; |
527 | | bool _is_wildcard = false; // whether the path is a wildcard path |
528 | | bool _is_supper_wildcard = false; // supper wildcard likes '$**.a' or '$**[1]' |
529 | | }; |
530 | | |
531 | | /* |
532 | | * JsonbFwdIteratorT implements JSONB's iterator template. |
533 | | * |
534 | | * Note: it is an FORWARD iterator only due to the design of JSONB format. |
535 | | */ |
536 | | template <class Iter_Type, class Cont_Type> |
537 | | class JsonbFwdIteratorT { |
538 | | public: |
539 | | using iterator = Iter_Type; |
540 | | using pointer = typename std::iterator_traits<Iter_Type>::pointer; |
541 | | using reference = typename std::iterator_traits<Iter_Type>::reference; |
542 | | |
543 | | explicit JsonbFwdIteratorT() : current_(nullptr) {} |
544 | 20.5k | explicit JsonbFwdIteratorT(const iterator& i) : current_(i) {}_ZN5doris17JsonbFwdIteratorTIPKNS_13JsonbKeyValueENS_9ObjectValEEC2ERKS3_ Line | Count | Source | 544 | 20.4k | explicit JsonbFwdIteratorT(const iterator& i) : current_(i) {} |
_ZN5doris17JsonbFwdIteratorTIPKNS_10JsonbValueENS_8ArrayValEEC2ERKS3_ Line | Count | Source | 544 | 147 | explicit JsonbFwdIteratorT(const iterator& i) : current_(i) {} |
|
545 | | |
546 | | // allow non-const to const iterator conversion (same container type) |
547 | | template <class Iter_Ty> |
548 | | JsonbFwdIteratorT(const JsonbFwdIteratorT<Iter_Ty, Cont_Type>& rhs) : current_(rhs.base()) {} |
549 | | |
550 | 20.7k | bool operator==(const JsonbFwdIteratorT& rhs) const { return (current_ == rhs.current_); }_ZNK5doris17JsonbFwdIteratorTIPKNS_13JsonbKeyValueENS_9ObjectValEEeqERKS5_ Line | Count | Source | 550 | 19.3k | bool operator==(const JsonbFwdIteratorT& rhs) const { return (current_ == rhs.current_); } |
_ZNK5doris17JsonbFwdIteratorTIPKNS_10JsonbValueENS_8ArrayValEEeqERKS5_ Line | Count | Source | 550 | 1.37k | bool operator==(const JsonbFwdIteratorT& rhs) const { return (current_ == rhs.current_); } |
|
551 | | |
552 | 20.1k | bool operator!=(const JsonbFwdIteratorT& rhs) const { return !operator==(rhs); }_ZNK5doris17JsonbFwdIteratorTIPKNS_13JsonbKeyValueENS_9ObjectValEEneERKS5_ Line | Count | Source | 552 | 18.8k | bool operator!=(const JsonbFwdIteratorT& rhs) const { return !operator==(rhs); } |
_ZNK5doris17JsonbFwdIteratorTIPKNS_10JsonbValueENS_8ArrayValEEneERKS5_ Line | Count | Source | 552 | 1.30k | bool operator!=(const JsonbFwdIteratorT& rhs) const { return !operator==(rhs); } |
|
553 | | |
554 | 1.14k | bool operator<(const JsonbFwdIteratorT& rhs) const { return (current_ < rhs.current_); } |
555 | | |
556 | | bool operator>(const JsonbFwdIteratorT& rhs) const { return !operator<(rhs); } |
557 | | |
558 | 18.2k | JsonbFwdIteratorT& operator++() { |
559 | 18.2k | current_ = (iterator)(((char*)current_) + current_->numPackedBytes()); |
560 | 18.2k | return *this; |
561 | 18.2k | } _ZN5doris17JsonbFwdIteratorTIPKNS_13JsonbKeyValueENS_9ObjectValEEppEv Line | Count | Source | 558 | 17.6k | JsonbFwdIteratorT& operator++() { | 559 | 17.6k | current_ = (iterator)(((char*)current_) + current_->numPackedBytes()); | 560 | 17.6k | return *this; | 561 | 17.6k | } |
_ZN5doris17JsonbFwdIteratorTIPKNS_10JsonbValueENS_8ArrayValEEppEv Line | Count | Source | 558 | 616 | JsonbFwdIteratorT& operator++() { | 559 | 616 | current_ = (iterator)(((char*)current_) + current_->numPackedBytes()); | 560 | 616 | return *this; | 561 | 616 | } |
|
562 | | |
563 | | JsonbFwdIteratorT operator++(int) { |
564 | | auto tmp = *this; |
565 | | current_ = (iterator)(((char*)current_) + current_->numPackedBytes()); |
566 | | return tmp; |
567 | | } |
568 | | |
569 | 616 | explicit operator pointer() { return current_; } |
570 | | |
571 | 39 | reference operator*() const { return *current_; }Unexecuted instantiation: _ZNK5doris17JsonbFwdIteratorTIPKNS_10JsonbValueENS_8ArrayValEEdeEv _ZNK5doris17JsonbFwdIteratorTIPKNS_13JsonbKeyValueENS_9ObjectValEEdeEv Line | Count | Source | 571 | 39 | reference operator*() const { return *current_; } |
|
572 | | |
573 | 29.0k | pointer operator->() const { return current_; }_ZNK5doris17JsonbFwdIteratorTIPKNS_13JsonbKeyValueENS_9ObjectValEEptEv Line | Count | Source | 573 | 29.0k | pointer operator->() const { return current_; } |
_ZNK5doris17JsonbFwdIteratorTIPKNS_10JsonbValueENS_8ArrayValEEptEv Line | Count | Source | 573 | 3 | pointer operator->() const { return current_; } |
|
574 | | |
575 | | iterator base() const { return current_; } |
576 | | |
577 | | private: |
578 | | iterator current_; |
579 | | }; |
580 | | using JsonbTypeUnder = std::underlying_type_t<JsonbType>; |
581 | | |
582 | | #if defined(__clang__) |
583 | | #pragma clang diagnostic push |
584 | | #pragma clang diagnostic ignored "-Wzero-length-array" |
585 | | #endif |
586 | | #pragma pack(push, 1) |
587 | | |
588 | | /* |
589 | | * JsonbDocument is the main object that accesses and queries JSONB packed |
590 | | * bytes. NOTE: JsonbDocument only allows object container as the top level |
591 | | * JSONB value. However, you can use the static method "createValue" to get any |
592 | | * JsonbValue object from the packed bytes. |
593 | | * |
594 | | * JsonbDocument object also dereferences to an object container value |
595 | | * (ObjectVal) once JSONB is loaded. |
596 | | * |
597 | | * ** Load ** |
598 | | * JsonbDocument is usable after loading packed bytes (memory location) into |
599 | | * the object. We only need the header and first few bytes of the payload after |
600 | | * header to verify the JSONB. |
601 | | * |
602 | | * Note: creating an JsonbDocument (through createDocument) does not allocate |
603 | | * any memory. The document object is an efficient wrapper on the packed bytes |
604 | | * which is accessed directly. |
605 | | * |
606 | | * ** Query ** |
607 | | * Query is through dereferencing into ObjectVal. |
608 | | */ |
609 | | class JsonbDocument { |
610 | | public: |
611 | | // create an JsonbDocument object from JSONB packed bytes |
612 | | [[nodiscard]] static Status checkAndCreateDocument(const char* pb, size_t size, |
613 | | const JsonbDocument** doc); |
614 | | |
615 | | // create an JsonbValue from JSONB packed bytes |
616 | | static const JsonbValue* createValue(const char* pb, size_t size); |
617 | | |
618 | 0 | uint8_t version() const { return header_.ver_; } |
619 | | |
620 | 26.4k | const JsonbValue* getValue() const { return ((const JsonbValue*)payload_); } |
621 | | |
622 | | unsigned int numPackedBytes() const; |
623 | | |
624 | | const ObjectVal* operator->() const; |
625 | | |
626 | | private: |
627 | | /* |
628 | | * JsonbHeader class defines JSONB header (internal to JsonbDocument). |
629 | | * |
630 | | * Currently it only contains version information (1-byte). We may expand the |
631 | | * header to include checksum of the JSONB binary for more security. |
632 | | */ |
633 | | struct JsonbHeader { |
634 | | uint8_t ver_; |
635 | | } header_; |
636 | | |
637 | | char payload_[0]; |
638 | | }; |
639 | | |
640 | | /* |
641 | | * JsonbKeyValue class defines JSONB key type, as described below. |
642 | | * |
643 | | * key ::= |
644 | | * 0x00 int8 //1-byte dictionary id |
645 | | * | int8 (byte*) //int8 (>0) is the size of the key string |
646 | | * |
647 | | * value ::= primitive_value | container |
648 | | * |
649 | | * JsonbKeyValue can be either an id mapping to the key string in an external |
650 | | * dictionary, or it is the original key string. Whether to read an id or a |
651 | | * string is decided by the first byte (size). |
652 | | * |
653 | | * Note: a key object must be followed by a value object. Therefore, a key |
654 | | * object implicitly refers to a key-value pair, and you can get the value |
655 | | * object right after the key object. The function numPackedBytes hence |
656 | | * indicates the total size of the key-value pair, so that we will be able go |
657 | | * to next pair from the key. |
658 | | * |
659 | | * ** Dictionary size ** |
660 | | * By default, the dictionary size is 255 (1-byte). Users can define |
661 | | * "USE_LARGE_DICT" to increase the dictionary size to 655535 (2-byte). |
662 | | */ |
663 | | class JsonbKeyValue { |
664 | | public: |
665 | | // now we use sMaxKeyId to represent an empty key |
666 | | static const int sMaxKeyId = 65535; |
667 | | using keyid_type = uint16_t; |
668 | | |
669 | | static const uint8_t sMaxKeyLen = 64; |
670 | | |
671 | | // size of the key. 0 indicates it is stored as id |
672 | 1.42k | uint8_t klen() const { return size; } |
673 | | |
674 | | // get the key string. Note the string may not be null terminated. |
675 | 767 | const char* getKeyStr() const { return key.str_; } |
676 | | |
677 | 9.33k | keyid_type getKeyId() const { return key.id_; } |
678 | | |
679 | 35.4k | unsigned int keyPackedBytes() const { |
680 | 35.4k | return size ? (sizeof(size) + size) : (sizeof(size) + sizeof(keyid_type)); |
681 | 35.4k | } |
682 | | |
683 | 17.7k | const JsonbValue* value() const { |
684 | 17.7k | return (const JsonbValue*)(((char*)this) + keyPackedBytes()); |
685 | 17.7k | } |
686 | | |
687 | | // size of the total packed bytes (key+value) |
688 | | unsigned int numPackedBytes() const; |
689 | | |
690 | | uint8_t size; |
691 | | |
692 | | union key_ { |
693 | | keyid_type id_; |
694 | | char str_[1]; |
695 | | } key; |
696 | | }; |
697 | | |
698 | | struct JsonbFindResult { |
699 | | const JsonbValue* value = nullptr; // found value |
700 | | std::unique_ptr<JsonbWriter> writer; // writer to write the value |
701 | | bool is_wildcard = false; // whether the path is a wildcard path |
702 | | }; |
703 | | |
704 | | /* |
705 | | * JsonbValue is the base class of all JSONB types. It contains only one member |
706 | | * variable - type info, which can be retrieved by member functions is[Type]() |
707 | | * or type(). |
708 | | */ |
709 | | struct JsonbValue { |
710 | | static const uint32_t sMaxValueLen = 1 << 24; // 16M |
711 | | |
712 | 4.27k | bool isNull() const { return (type == JsonbType::T_Null); } |
713 | 21 | bool isTrue() const { return (type == JsonbType::T_True); } |
714 | 1 | bool isFalse() const { return (type == JsonbType::T_False); } |
715 | 54 | bool isInt() const { return isInt8() || isInt16() || isInt32() || isInt64() || isInt128(); } |
716 | 54 | bool isInt8() const { return (type == JsonbType::T_Int8); } |
717 | 30 | bool isInt16() const { return (type == JsonbType::T_Int16); } |
718 | 28 | bool isInt32() const { return (type == JsonbType::T_Int32); } |
719 | 31 | bool isInt64() const { return (type == JsonbType::T_Int64); } |
720 | 190 | bool isDouble() const { return (type == JsonbType::T_Double); } |
721 | 153 | bool isFloat() const { return (type == JsonbType::T_Float); } |
722 | 45 | bool isString() const { return (type == JsonbType::T_String); } |
723 | 1.09k | bool isBinary() const { return (type == JsonbType::T_Binary); } |
724 | 97 | bool isObject() const { return (type == JsonbType::T_Object); } |
725 | 15 | bool isArray() const { return (type == JsonbType::T_Array); } |
726 | 31 | bool isInt128() const { return (type == JsonbType::T_Int128); } |
727 | 74 | bool isDecimal() const { |
728 | 74 | return (type == JsonbType::T_Decimal32 || type == JsonbType::T_Decimal64 || |
729 | 74 | type == JsonbType::T_Decimal128 || type == JsonbType::T_Decimal256); |
730 | 74 | } |
731 | 1 | bool isDecimal32() const { return (type == JsonbType::T_Decimal32); } |
732 | 1 | bool isDecimal64() const { return (type == JsonbType::T_Decimal64); } |
733 | 1 | bool isDecimal128() const { return (type == JsonbType::T_Decimal128); } |
734 | 1 | bool isDecimal256() const { return (type == JsonbType::T_Decimal256); } |
735 | | |
736 | 11 | PrimitiveType get_primitive_type() const { return get_primitive_type_from_json_type(type); } |
737 | | |
738 | 0 | const char* typeName() const { |
739 | 0 | switch (type) { |
740 | 0 | case JsonbType::T_Null: |
741 | 0 | return "null"; |
742 | 0 | case JsonbType::T_True: |
743 | 0 | case JsonbType::T_False: |
744 | 0 | return "bool"; |
745 | 0 | case JsonbType::T_Int8: |
746 | 0 | case JsonbType::T_Int16: |
747 | 0 | case JsonbType::T_Int32: |
748 | 0 | return "int"; |
749 | 0 | case JsonbType::T_Int64: |
750 | 0 | return "bigint"; |
751 | 0 | case JsonbType::T_Int128: |
752 | 0 | return "largeint"; |
753 | 0 | case JsonbType::T_Double: |
754 | 0 | return "double"; |
755 | 0 | case JsonbType::T_Float: |
756 | 0 | return "float"; |
757 | 0 | case JsonbType::T_String: |
758 | 0 | return "string"; |
759 | 0 | case JsonbType::T_Binary: |
760 | 0 | return "binary"; |
761 | 0 | case JsonbType::T_Object: |
762 | 0 | return "object"; |
763 | 0 | case JsonbType::T_Array: |
764 | 0 | return "array"; |
765 | 0 | case JsonbType::T_Decimal32: |
766 | 0 | return "Decimal32"; |
767 | 0 | case JsonbType::T_Decimal64: |
768 | 0 | return "Decimal64"; |
769 | 0 | case JsonbType::T_Decimal128: |
770 | 0 | return "Decimal128"; |
771 | 0 | case JsonbType::T_Decimal256: |
772 | 0 | return "Decimal256"; |
773 | 0 | default: |
774 | 0 | return "unknown"; |
775 | 0 | } |
776 | 0 | } |
777 | | |
778 | | // size of the total packed bytes |
779 | | unsigned int numPackedBytes() const; |
780 | | |
781 | | // size of the value in bytes |
782 | | unsigned int size() const; |
783 | | |
784 | | //Get the number of jsonbvalue elements |
785 | | int numElements() const; |
786 | | |
787 | | //Whether to include the jsonbvalue rhs |
788 | | bool contains(const JsonbValue* rhs) const; |
789 | | |
790 | | // find the JSONB value by JsonbPath |
791 | | JsonbFindResult findValue(JsonbPath& path) const; |
792 | | friend class JsonbDocument; |
793 | | |
794 | | JsonbType type; // type info |
795 | | |
796 | | char payload[0]; // payload, which is the packed bytes of the value |
797 | | |
798 | | /** |
799 | | * @brief Unpacks the underlying Jsonb binary content as a pointer to type `T`. |
800 | | * |
801 | | * @tparam T A POD (Plain Old Data) type that must satisfy the `JsonbPodType` concept. |
802 | | * This ensures that `T` is trivially copyable, standard-layout, and safe to |
803 | | * reinterpret from raw bytes without invoking undefined behavior. |
804 | | * |
805 | | * @return A pointer to a `const T` object, interpreted from the internal buffer. |
806 | | * |
807 | | * @note The caller must ensure that the current JsonbValue actually contains data |
808 | | * compatible with type `T`, otherwise the result is undefined. |
809 | | */ |
810 | | template <JsonbPodType T> |
811 | 52.6k | const T* unpack() const { |
812 | 52.6k | static_assert(is_pod_v<T>, "T must be a POD type"); |
813 | 52.6k | return reinterpret_cast<const T*>(payload); |
814 | 52.6k | } _ZNK5doris10JsonbValue6unpackITkNS_12JsonbPodTypeENS_9ObjectValEEEPKT_v Line | Count | Source | 811 | 19.8k | const T* unpack() const { | 812 | 19.8k | static_assert(is_pod_v<T>, "T must be a POD type"); | 813 | 19.8k | return reinterpret_cast<const T*>(payload); | 814 | 19.8k | } |
_ZNK5doris10JsonbValue6unpackITkNS_12JsonbPodTypeENS_10NumberValTIaEEEEPKT_v Line | Count | Source | 811 | 740 | const T* unpack() const { | 812 | 740 | static_assert(is_pod_v<T>, "T must be a POD type"); | 813 | 740 | return reinterpret_cast<const T*>(payload); | 814 | 740 | } |
_ZNK5doris10JsonbValue6unpackITkNS_12JsonbPodTypeENS_10NumberValTIsEEEEPKT_v Line | Count | Source | 811 | 108 | const T* unpack() const { | 812 | 108 | static_assert(is_pod_v<T>, "T must be a POD type"); | 813 | 108 | return reinterpret_cast<const T*>(payload); | 814 | 108 | } |
_ZNK5doris10JsonbValue6unpackITkNS_12JsonbPodTypeENS_10NumberValTIiEEEEPKT_v Line | Count | Source | 811 | 3.48k | const T* unpack() const { | 812 | 3.48k | static_assert(is_pod_v<T>, "T must be a POD type"); | 813 | 3.48k | return reinterpret_cast<const T*>(payload); | 814 | 3.48k | } |
_ZNK5doris10JsonbValue6unpackITkNS_12JsonbPodTypeENS_10NumberValTIlEEEEPKT_v Line | Count | Source | 811 | 1.91k | const T* unpack() const { | 812 | 1.91k | static_assert(is_pod_v<T>, "T must be a POD type"); | 813 | 1.91k | return reinterpret_cast<const T*>(payload); | 814 | 1.91k | } |
_ZNK5doris10JsonbValue6unpackITkNS_12JsonbPodTypeENS_10NumberValTInEEEEPKT_v Line | Count | Source | 811 | 4.17k | const T* unpack() const { | 812 | 4.17k | static_assert(is_pod_v<T>, "T must be a POD type"); | 813 | 4.17k | return reinterpret_cast<const T*>(payload); | 814 | 4.17k | } |
_ZNK5doris10JsonbValue6unpackITkNS_12JsonbPodTypeENS_10NumberValTIdEEEEPKT_v Line | Count | Source | 811 | 184 | const T* unpack() const { | 812 | 184 | static_assert(is_pod_v<T>, "T must be a POD type"); | 813 | 184 | return reinterpret_cast<const T*>(payload); | 814 | 184 | } |
_ZNK5doris10JsonbValue6unpackITkNS_12JsonbPodTypeENS_10NumberValTIfEEEEPKT_v Line | Count | Source | 811 | 28 | const T* unpack() const { | 812 | 28 | static_assert(is_pod_v<T>, "T must be a POD type"); | 813 | 28 | return reinterpret_cast<const T*>(payload); | 814 | 28 | } |
_ZNK5doris10JsonbValue6unpackITkNS_12JsonbPodTypeENS_15JsonbDecimalValINS_7DecimalIiEEEEEEPKT_v Line | Count | Source | 811 | 25 | const T* unpack() const { | 812 | 25 | static_assert(is_pod_v<T>, "T must be a POD type"); | 813 | 25 | return reinterpret_cast<const T*>(payload); | 814 | 25 | } |
_ZNK5doris10JsonbValue6unpackITkNS_12JsonbPodTypeENS_15JsonbDecimalValINS_7DecimalIlEEEEEEPKT_v Line | Count | Source | 811 | 15 | const T* unpack() const { | 812 | 15 | static_assert(is_pod_v<T>, "T must be a POD type"); | 813 | 15 | return reinterpret_cast<const T*>(payload); | 814 | 15 | } |
_ZNK5doris10JsonbValue6unpackITkNS_12JsonbPodTypeENS_15JsonbDecimalValINS_12Decimal128V3EEEEEPKT_v Line | Count | Source | 811 | 23 | const T* unpack() const { | 812 | 23 | static_assert(is_pod_v<T>, "T must be a POD type"); | 813 | 23 | return reinterpret_cast<const T*>(payload); | 814 | 23 | } |
_ZNK5doris10JsonbValue6unpackITkNS_12JsonbPodTypeENS_15JsonbDecimalValINS_7DecimalIN4wide7integerILm256EiEEEEEEEEPKT_v Line | Count | Source | 811 | 13 | const T* unpack() const { | 812 | 13 | static_assert(is_pod_v<T>, "T must be a POD type"); | 813 | 13 | return reinterpret_cast<const T*>(payload); | 814 | 13 | } |
_ZNK5doris10JsonbValue6unpackITkNS_12JsonbPodTypeENS_14JsonbBinaryValEEEPKT_v Line | Count | Source | 811 | 19.7k | const T* unpack() const { | 812 | 19.7k | static_assert(is_pod_v<T>, "T must be a POD type"); | 813 | 19.7k | return reinterpret_cast<const T*>(payload); | 814 | 19.7k | } |
_ZNK5doris10JsonbValue6unpackITkNS_12JsonbPodTypeENS_12ContainerValEEEPKT_v Line | Count | Source | 811 | 1.96k | const T* unpack() const { | 812 | 1.96k | static_assert(is_pod_v<T>, "T must be a POD type"); | 813 | 1.96k | return reinterpret_cast<const T*>(payload); | 814 | 1.96k | } |
_ZNK5doris10JsonbValue6unpackITkNS_12JsonbPodTypeENS_8ArrayValEEEPKT_v Line | Count | Source | 811 | 121 | const T* unpack() const { | 812 | 121 | static_assert(is_pod_v<T>, "T must be a POD type"); | 813 | 121 | return reinterpret_cast<const T*>(payload); | 814 | 121 | } |
_ZNK5doris10JsonbValue6unpackITkNS_12JsonbPodTypeENS_14JsonbStringValEEEPKT_v Line | Count | Source | 811 | 339 | const T* unpack() const { | 812 | 339 | static_assert(is_pod_v<T>, "T must be a POD type"); | 813 | 339 | return reinterpret_cast<const T*>(payload); | 814 | 339 | } |
|
815 | | |
816 | | // /** |
817 | | // * @brief Unpacks the underlying Jsonb binary content as a pointer to type `T`. |
818 | | // * |
819 | | // * @tparam T A POD (Plain Old Data) type that must satisfy the `JsonbPodType` concept. |
820 | | // * This ensures that `T` is trivially copyable, standard-layout, and safe to |
821 | | // * reinterpret from raw bytes without invoking undefined behavior. |
822 | | // * |
823 | | // * @return A pointer to a `T` object, interpreted from the internal buffer. |
824 | | // * |
825 | | // * @note The caller must ensure that the current JsonbValue actually contains data |
826 | | // * compatible with type `T`, otherwise the result is undefined. |
827 | | // */ |
828 | | // template <JsonbPodType T> |
829 | | // T* unpack() { |
830 | | // static_assert(is_pod_v<T>, "T must be a POD type"); |
831 | | // return reinterpret_cast<T*>(payload); |
832 | | // } |
833 | | |
834 | | int128_t int_val() const; |
835 | | }; |
836 | | |
837 | | // inline ObjectVal* JsonbDocument::operator->() { |
838 | | // return (((JsonbValue*)payload_)->unpack<ObjectVal>()); |
839 | | // } |
840 | | |
841 | 19.2k | inline const ObjectVal* JsonbDocument::operator->() const { |
842 | 19.2k | return (((const JsonbValue*)payload_)->unpack<ObjectVal>()); |
843 | 19.2k | } |
844 | | |
845 | | /* |
846 | | * NumerValT is the template class (derived from JsonbValue) of all number |
847 | | * types (integers and double). |
848 | | */ |
849 | | template <typename T> |
850 | | requires std::is_integral_v<T> || std::is_floating_point_v<T> |
851 | | struct NumberValT { |
852 | | public: |
853 | 10.6k | T val() const { return num; }_ZNK5doris10NumberValTIaE3valEv Line | Count | Source | 853 | 740 | T val() const { return num; } |
_ZNK5doris10NumberValTIsE3valEv Line | Count | Source | 853 | 108 | T val() const { return num; } |
_ZNK5doris10NumberValTIiE3valEv Line | Count | Source | 853 | 3.48k | T val() const { return num; } |
_ZNK5doris10NumberValTIlE3valEv Line | Count | Source | 853 | 1.91k | T val() const { return num; } |
_ZNK5doris10NumberValTInE3valEv Line | Count | Source | 853 | 4.17k | T val() const { return num; } |
_ZNK5doris10NumberValTIdE3valEv Line | Count | Source | 853 | 184 | T val() const { return num; } |
_ZNK5doris10NumberValTIfE3valEv Line | Count | Source | 853 | 28 | T val() const { return num; } |
|
854 | | |
855 | | static unsigned int numPackedBytes() { return sizeof(JsonbValue) + sizeof(T); } |
856 | | |
857 | | T num; |
858 | | }; |
859 | | |
860 | 49 | inline int128_t JsonbValue::int_val() const { |
861 | 49 | switch (type) { |
862 | 42 | case JsonbType::T_Int8: |
863 | 42 | return unpack<JsonbInt8Val>()->val(); |
864 | 1 | case JsonbType::T_Int16: |
865 | 1 | return unpack<JsonbInt16Val>()->val(); |
866 | 0 | case JsonbType::T_Int32: |
867 | 0 | return unpack<JsonbInt32Val>()->val(); |
868 | 3 | case JsonbType::T_Int64: |
869 | 3 | return unpack<JsonbInt64Val>()->val(); |
870 | 3 | case JsonbType::T_Int128: |
871 | 3 | return unpack<JsonbInt128Val>()->val(); |
872 | 0 | default: |
873 | 0 | throw Exception(ErrorCode::INTERNAL_ERROR, "Invalid JSONB value type: {}", |
874 | 0 | static_cast<int32_t>(type)); |
875 | 49 | } |
876 | 49 | } |
877 | | |
878 | | template <JsonbDecimalType T> |
879 | | struct JsonbDecimalVal { |
880 | | public: |
881 | | using NativeType = typename T::NativeType; |
882 | | |
883 | | // get the decimal value |
884 | 44 | NativeType val() const { |
885 | | // to avoid memory alignment issues, we use memcpy to copy the value |
886 | 44 | NativeType tmp; |
887 | 44 | memcpy(&tmp, &value, sizeof(NativeType)); |
888 | 44 | return tmp; |
889 | 44 | } _ZNK5doris15JsonbDecimalValINS_7DecimalIiEEE3valEv Line | Count | Source | 884 | 16 | NativeType val() const { | 885 | | // to avoid memory alignment issues, we use memcpy to copy the value | 886 | 16 | NativeType tmp; | 887 | 16 | memcpy(&tmp, &value, sizeof(NativeType)); | 888 | 16 | return tmp; | 889 | 16 | } |
_ZNK5doris15JsonbDecimalValINS_7DecimalIlEEE3valEv Line | Count | Source | 884 | 8 | NativeType val() const { | 885 | | // to avoid memory alignment issues, we use memcpy to copy the value | 886 | 8 | NativeType tmp; | 887 | 8 | memcpy(&tmp, &value, sizeof(NativeType)); | 888 | 8 | return tmp; | 889 | 8 | } |
_ZNK5doris15JsonbDecimalValINS_12Decimal128V3EE3valEv Line | Count | Source | 884 | 14 | NativeType val() const { | 885 | | // to avoid memory alignment issues, we use memcpy to copy the value | 886 | 14 | NativeType tmp; | 887 | 14 | memcpy(&tmp, &value, sizeof(NativeType)); | 888 | 14 | return tmp; | 889 | 14 | } |
_ZNK5doris15JsonbDecimalValINS_7DecimalIN4wide7integerILm256EiEEEEE3valEv Line | Count | Source | 884 | 6 | NativeType val() const { | 885 | | // to avoid memory alignment issues, we use memcpy to copy the value | 886 | 6 | NativeType tmp; | 887 | 6 | memcpy(&tmp, &value, sizeof(NativeType)); | 888 | 6 | return tmp; | 889 | 6 | } |
|
890 | | |
891 | 49 | static constexpr int numPackedBytes() { |
892 | 49 | return sizeof(JsonbValue) + sizeof(precision) + sizeof(scale) + sizeof(value); |
893 | 49 | } _ZN5doris15JsonbDecimalValINS_7DecimalIiEEE14numPackedBytesEv Line | Count | Source | 891 | 19 | static constexpr int numPackedBytes() { | 892 | 19 | return sizeof(JsonbValue) + sizeof(precision) + sizeof(scale) + sizeof(value); | 893 | 19 | } |
_ZN5doris15JsonbDecimalValINS_7DecimalIlEEE14numPackedBytesEv Line | Count | Source | 891 | 9 | static constexpr int numPackedBytes() { | 892 | 9 | return sizeof(JsonbValue) + sizeof(precision) + sizeof(scale) + sizeof(value); | 893 | 9 | } |
_ZN5doris15JsonbDecimalValINS_12Decimal128V3EE14numPackedBytesEv Line | Count | Source | 891 | 15 | static constexpr int numPackedBytes() { | 892 | 15 | return sizeof(JsonbValue) + sizeof(precision) + sizeof(scale) + sizeof(value); | 893 | 15 | } |
_ZN5doris15JsonbDecimalValINS_7DecimalIN4wide7integerILm256EiEEEEE14numPackedBytesEv Line | Count | Source | 891 | 6 | static constexpr int numPackedBytes() { | 892 | 6 | return sizeof(JsonbValue) + sizeof(precision) + sizeof(scale) + sizeof(value); | 893 | 6 | } |
|
894 | | |
895 | | uint32_t precision; |
896 | | uint32_t scale; |
897 | | NativeType value; |
898 | | }; |
899 | | |
900 | | /* |
901 | | * BlobVal is the base class (derived from JsonbValue) for string and binary |
902 | | * types. The size indicates the total bytes of the payload. |
903 | | */ |
904 | | struct JsonbBinaryVal { |
905 | | public: |
906 | | // size of the blob payload only |
907 | 2.14k | unsigned int getBlobLen() const { return size; } |
908 | | |
909 | | // return the blob as byte array |
910 | 4.59k | const char* getBlob() const { return payload; } |
911 | | |
912 | | // size of the total packed bytes |
913 | 15.2k | unsigned int numPackedBytes() const { return sizeof(JsonbValue) + sizeof(size) + size; } |
914 | | friend class JsonbDocument; |
915 | | |
916 | | uint32_t size; |
917 | | char payload[0]; |
918 | | }; |
919 | | |
920 | | /* |
921 | | * String type |
922 | | * Note: JSONB string may not be a c-string (NULL-terminated) |
923 | | */ |
924 | | struct JsonbStringVal : public JsonbBinaryVal { |
925 | | public: |
926 | | /* |
927 | | This function return the actual size of a string. Since for |
928 | | a string, it can be null-terminated with null paddings or it |
929 | | can take all the space in the payload without null in the end. |
930 | | So we need to check it to get the true actual length of a string. |
931 | | */ |
932 | 170 | size_t length() const { |
933 | | // It's an empty string |
934 | 170 | if (0 == size) { |
935 | 0 | return size; |
936 | 0 | } |
937 | | // The string stored takes all the spaces in payload |
938 | 170 | if (payload[size - 1] != 0) { |
939 | 170 | return size; |
940 | 170 | } |
941 | | // It's shorter than the size of payload |
942 | 0 | return strnlen(payload, size); |
943 | 170 | } |
944 | | }; |
945 | | |
946 | | /* |
947 | | * ContainerVal is the base class (derived from JsonbValue) for object and |
948 | | * array types. The size indicates the total bytes of the payload. |
949 | | */ |
950 | | struct ContainerVal { |
951 | | // size of the container payload only |
952 | 0 | unsigned int getContainerSize() const { return size; } |
953 | | |
954 | | // return the container payload as byte array |
955 | 0 | const char* getPayload() const { return payload; } |
956 | | |
957 | | // size of the total packed bytes |
958 | 1.96k | unsigned int numPackedBytes() const { return sizeof(JsonbValue) + sizeof(size) + size; } |
959 | | friend class JsonbDocument; |
960 | | |
961 | | uint32_t size; |
962 | | char payload[0]; |
963 | | }; |
964 | | |
965 | | /* |
966 | | * Object type |
967 | | */ |
968 | | struct ObjectVal : public ContainerVal { |
969 | | using value_type = JsonbKeyValue; |
970 | | using pointer = value_type*; |
971 | | using const_pointer = const value_type*; |
972 | | using const_iterator = JsonbFwdIteratorT<const_pointer, ObjectVal>; |
973 | | |
974 | 1 | const_iterator search(const char* key) const { |
975 | 1 | if (!key) { |
976 | 0 | return end(); |
977 | 0 | } |
978 | 1 | return search(key, (unsigned int)strlen(key)); |
979 | 1 | } |
980 | | |
981 | 32 | const_iterator search(const char* key, unsigned int klen) const { |
982 | 32 | if (!key || !klen) { |
983 | 0 | return end(); |
984 | 0 | } |
985 | 32 | return internalSearch(key, klen); |
986 | 32 | } |
987 | | |
988 | | // Get number of elements in object |
989 | 57 | int numElem() const { |
990 | 57 | const char* pch = payload; |
991 | 57 | const char* fence = payload + size; |
992 | | |
993 | 57 | unsigned int num = 0; |
994 | 149 | while (pch < fence) { |
995 | 92 | auto* pkey = (JsonbKeyValue*)(pch); |
996 | 92 | ++num; |
997 | 92 | pch += pkey->numPackedBytes(); |
998 | 92 | } |
999 | | |
1000 | 57 | assert(pch == fence); |
1001 | | |
1002 | 57 | return num; |
1003 | 57 | } |
1004 | | |
1005 | | // find the JSONB value by a key string (null terminated) |
1006 | 1 | const JsonbValue* find(const char* key) const { |
1007 | 1 | if (!key) { |
1008 | 0 | return nullptr; |
1009 | 0 | } |
1010 | 1 | return find(key, (unsigned int)strlen(key)); |
1011 | 1 | } |
1012 | | |
1013 | | // find the JSONB value by a key string (with length) |
1014 | 30 | const JsonbValue* find(const char* key, unsigned int klen) const { |
1015 | 30 | const_iterator kv = search(key, klen); |
1016 | 30 | if (end() == kv) { |
1017 | 2 | return nullptr; |
1018 | 2 | } |
1019 | 28 | return kv->value(); |
1020 | 30 | } |
1021 | | |
1022 | 1.69k | const_iterator begin() const { return const_iterator((pointer)payload); } |
1023 | | |
1024 | 18.7k | const_iterator end() const { return const_iterator((pointer)(payload + size)); } |
1025 | | |
1026 | | std::vector<std::pair<StringRef, const JsonbValue*>> get_ordered_key_value_pairs() const; |
1027 | | |
1028 | | private: |
1029 | 32 | const_iterator internalSearch(const char* key, unsigned int klen) const { |
1030 | 32 | const char* pch = payload; |
1031 | 32 | const char* fence = payload + size; |
1032 | | |
1033 | 42 | while (pch < fence) { |
1034 | 40 | const auto* pkey = (const JsonbKeyValue*)(pch); |
1035 | 40 | if (klen == pkey->klen() && strncmp(key, pkey->getKeyStr(), klen) == 0) { |
1036 | 30 | return const_iterator(pkey); |
1037 | 30 | } |
1038 | 10 | pch += pkey->numPackedBytes(); |
1039 | 10 | } |
1040 | | |
1041 | 32 | assert(pch == fence); |
1042 | | |
1043 | 2 | return end(); |
1044 | 2 | } |
1045 | | }; |
1046 | | |
1047 | | /* |
1048 | | * Array type |
1049 | | */ |
1050 | | struct ArrayVal : public ContainerVal { |
1051 | | using value_type = JsonbValue; |
1052 | | using pointer = value_type*; |
1053 | | using const_pointer = const value_type*; |
1054 | | using const_iterator = JsonbFwdIteratorT<const_pointer, ArrayVal>; |
1055 | | |
1056 | | // get the JSONB value at index |
1057 | 64 | const JsonbValue* get(int idx) const { |
1058 | 64 | if (idx < 0) { |
1059 | 0 | return nullptr; |
1060 | 0 | } |
1061 | | |
1062 | 64 | const char* pch = payload; |
1063 | 64 | const char* fence = payload + size; |
1064 | | |
1065 | 119 | while (pch < fence && idx-- > 0) { |
1066 | 55 | pch += ((const JsonbValue*)pch)->numPackedBytes(); |
1067 | 55 | } |
1068 | 64 | if (idx > 0 || pch == fence) { |
1069 | 7 | return nullptr; |
1070 | 7 | } |
1071 | | |
1072 | 57 | return (const JsonbValue*)pch; |
1073 | 64 | } |
1074 | | |
1075 | | // Get number of elements in array |
1076 | 28 | int numElem() const { |
1077 | 28 | const char* pch = payload; |
1078 | 28 | const char* fence = payload + size; |
1079 | | |
1080 | 28 | unsigned int num = 0; |
1081 | 91 | while (pch < fence) { |
1082 | 63 | ++num; |
1083 | 63 | pch += ((const JsonbValue*)pch)->numPackedBytes(); |
1084 | 63 | } |
1085 | | |
1086 | 28 | assert(pch == fence); |
1087 | | |
1088 | 28 | return num; |
1089 | 28 | } |
1090 | | |
1091 | 74 | const_iterator begin() const { return const_iterator((pointer)payload); } |
1092 | | |
1093 | 73 | const_iterator end() const { return const_iterator((pointer)(payload + size)); } |
1094 | | }; |
1095 | | |
1096 | | namespace jsonb_detail { |
1097 | | |
1098 | | struct JsonbScaledDecimal { |
1099 | | wide::Int256 value; |
1100 | | uint32_t scale; |
1101 | | }; |
1102 | | |
1103 | 26 | inline void validate_decimal_scale(uint32_t scale) { |
1104 | 26 | if (scale > static_cast<uint32_t>(BeConsts::MAX_DECIMALV3_SCALE)) { |
1105 | 2 | throw Exception(ErrorCode::INTERNAL_ERROR, |
1106 | 2 | "Invalid JSONB decimal scale: {}, max allowed scale: {}", scale, |
1107 | 2 | BeConsts::MAX_DECIMALV3_SCALE); |
1108 | 2 | } |
1109 | 26 | } |
1110 | | |
1111 | 39 | inline bool is_numeric(const JsonbValue* value) { |
1112 | 39 | return value->isInt() || value->isDouble() || value->isFloat() || value->isDecimal(); |
1113 | 39 | } |
1114 | | |
1115 | 10 | inline double floating_value(const JsonbValue* value) { |
1116 | 10 | if (value->isDouble()) { |
1117 | 10 | return value->unpack<JsonbDoubleVal>()->val(); |
1118 | 10 | } |
1119 | 0 | return value->unpack<JsonbFloatVal>()->val(); |
1120 | 10 | } |
1121 | | |
1122 | 20 | inline JsonbScaledDecimal get_scaled_decimal(const JsonbValue* value) { |
1123 | 20 | switch (value->type) { |
1124 | 12 | case JsonbType::T_Decimal32: { |
1125 | 12 | const auto* decimal = value->unpack<JsonbDecimal32>(); |
1126 | 12 | validate_decimal_scale(decimal->scale); |
1127 | 12 | return {wide::Int256(decimal->val()), decimal->scale}; |
1128 | 0 | } |
1129 | 2 | case JsonbType::T_Decimal64: { |
1130 | 2 | const auto* decimal = value->unpack<JsonbDecimal64>(); |
1131 | 2 | validate_decimal_scale(decimal->scale); |
1132 | 2 | return {wide::Int256(decimal->val()), decimal->scale}; |
1133 | 0 | } |
1134 | 6 | case JsonbType::T_Decimal128: { |
1135 | 6 | const auto* decimal = value->unpack<JsonbDecimal128>(); |
1136 | 6 | validate_decimal_scale(decimal->scale); |
1137 | 6 | return {wide::Int256(decimal->val()), decimal->scale}; |
1138 | 0 | } |
1139 | 0 | case JsonbType::T_Decimal256: { |
1140 | 0 | const auto* decimal = value->unpack<JsonbDecimal256>(); |
1141 | 0 | validate_decimal_scale(decimal->scale); |
1142 | 0 | return {decimal->val(), decimal->scale}; |
1143 | 0 | } |
1144 | 0 | default: |
1145 | 0 | throw Exception(ErrorCode::INTERNAL_ERROR, "Invalid JSONB decimal value type: {}", |
1146 | 0 | static_cast<int32_t>(value->type)); |
1147 | 20 | } |
1148 | 20 | } |
1149 | | |
1150 | | inline bool scaled_decimal_equal_decimal(const JsonbScaledDecimal& lhs, |
1151 | 4 | const JsonbScaledDecimal& rhs) { |
1152 | 4 | if (lhs.scale == rhs.scale) { |
1153 | 0 | return lhs.value == rhs.value; |
1154 | 0 | } |
1155 | | |
1156 | 4 | if (lhs.scale < rhs.scale) { |
1157 | 2 | const auto scale_multiplier = decimal_scale_multiplier<wide::Int256>(rhs.scale - lhs.scale); |
1158 | 2 | return rhs.value % scale_multiplier == 0 && lhs.value == rhs.value / scale_multiplier; |
1159 | 2 | } |
1160 | | |
1161 | 2 | const auto scale_multiplier = decimal_scale_multiplier<wide::Int256>(lhs.scale - rhs.scale); |
1162 | 2 | return lhs.value % scale_multiplier == 0 && lhs.value / scale_multiplier == rhs.value; |
1163 | 4 | } |
1164 | | |
1165 | 4 | inline bool scaled_decimal_equal_integer(const JsonbScaledDecimal& decimal, int128_t integer) { |
1166 | 4 | const auto integer_value = wide::Int256(integer); |
1167 | 4 | if (decimal.scale == 0) { |
1168 | 0 | return decimal.value == integer_value; |
1169 | 0 | } |
1170 | | |
1171 | 4 | const auto scale_multiplier = decimal_scale_multiplier<wide::Int256>(decimal.scale); |
1172 | 4 | return decimal.value % scale_multiplier == 0 && |
1173 | 4 | decimal.value / scale_multiplier == integer_value; |
1174 | 4 | } |
1175 | | |
1176 | | inline constexpr auto kPowersOfFive = [] { |
1177 | | std::array<wide::Int256, BeConsts::MAX_DECIMALV3_SCALE + 1> powers {}; |
1178 | | powers[0] = 1; |
1179 | | for (size_t i = 1; i < powers.size(); ++i) { |
1180 | | powers[i] = powers[i - 1] * 5; |
1181 | | } |
1182 | | return powers; |
1183 | | }(); |
1184 | | |
1185 | 6 | inline wide::Int256 power_of_five(uint32_t exponent) { |
1186 | 6 | validate_decimal_scale(exponent); |
1187 | 6 | return kPowersOfFive[exponent]; |
1188 | 6 | } |
1189 | | |
1190 | 6 | inline bool scaled_binary_equal(wide::Int256 value, int exponent, wide::Int256 significand) { |
1191 | 6 | if (exponent < 0) { |
1192 | 4 | const int divisor_exponent = -exponent; |
1193 | 4 | if (divisor_exponent >= std::numeric_limits<int64_t>::digits) { |
1194 | 0 | return false; |
1195 | 0 | } |
1196 | 4 | const auto divisor = wide::Int256(1) << divisor_exponent; |
1197 | 4 | return significand % divisor == 0 && value == significand / divisor; |
1198 | 4 | } |
1199 | 2 | constexpr int max_positive_int256_shift = std::numeric_limits<wide::Int256>::digits; |
1200 | | // wide::Int256 is signed, so shifting 1 by 255 reaches the sign bit. |
1201 | 2 | if (exponent >= max_positive_int256_shift) { |
1202 | 0 | return false; |
1203 | 0 | } |
1204 | 2 | const auto multiplier = wide::Int256(1) << exponent; |
1205 | 2 | return value % multiplier == 0 && value / multiplier == significand; |
1206 | 2 | } |
1207 | | |
1208 | 4 | inline bool floating_equal_integer(const JsonbValue* floating, int128_t integer) { |
1209 | 4 | const double value = floating_value(floating); |
1210 | 4 | int exponent = 0; |
1211 | 4 | std::frexp(value, &exponent); |
1212 | 4 | if (!std::isfinite(value) || std::trunc(value) != value) { |
1213 | 1 | return false; |
1214 | 1 | } |
1215 | 3 | if (exponent >= 128) { |
1216 | 0 | return value == -std::ldexp(1.0, 127) && integer == std::numeric_limits<int128_t>::min(); |
1217 | 0 | } |
1218 | 3 | if (exponent <= -1) { |
1219 | 0 | return false; |
1220 | 0 | } |
1221 | 3 | return static_cast<int128_t>(value) == integer; |
1222 | 3 | } |
1223 | | |
1224 | 6 | inline bool floating_equal_decimal(const JsonbValue* floating, const JsonbScaledDecimal& decimal) { |
1225 | 6 | const double value = floating_value(floating); |
1226 | 6 | if (!std::isfinite(value)) { |
1227 | 0 | return false; |
1228 | 0 | } |
1229 | 6 | if (value == 0) { |
1230 | 0 | return decimal.value == 0; |
1231 | 0 | } |
1232 | | |
1233 | 6 | int exponent = 0; |
1234 | 6 | const double significand_fraction = std::frexp(value, &exponent); |
1235 | 6 | const double significand_double = |
1236 | 6 | std::ldexp(significand_fraction, std::numeric_limits<double>::digits); |
1237 | 6 | auto significand = wide::Int256(static_cast<int64_t>(significand_double)); |
1238 | 6 | exponent -= std::numeric_limits<double>::digits; |
1239 | | |
1240 | 6 | const auto five_multiplier = power_of_five(decimal.scale); |
1241 | 6 | if (decimal.value % five_multiplier != 0) { |
1242 | 0 | return false; |
1243 | 0 | } |
1244 | 6 | const auto binary_scaled_decimal = decimal.value / five_multiplier; |
1245 | 6 | return scaled_binary_equal(binary_scaled_decimal, exponent + decimal.scale, significand); |
1246 | 6 | } |
1247 | | |
1248 | 39 | inline bool numeric_equal(const JsonbValue* lhs, const JsonbValue* rhs) { |
1249 | 39 | if (!is_numeric(rhs)) { |
1250 | 2 | return false; |
1251 | 2 | } |
1252 | | |
1253 | 37 | if ((lhs->isDouble() || lhs->isFloat()) && rhs->isInt()) { |
1254 | 1 | return floating_equal_integer(lhs, rhs->int_val()); |
1255 | 1 | } |
1256 | | |
1257 | 36 | if ((rhs->isDouble() || rhs->isFloat()) && lhs->isInt()) { |
1258 | 3 | return floating_equal_integer(rhs, lhs->int_val()); |
1259 | 3 | } |
1260 | | |
1261 | 33 | if ((lhs->isDouble() || lhs->isFloat()) && rhs->isDecimal()) { |
1262 | 4 | return floating_equal_decimal(lhs, get_scaled_decimal(rhs)); |
1263 | 4 | } |
1264 | | |
1265 | 29 | if ((rhs->isDouble() || rhs->isFloat()) && lhs->isDecimal()) { |
1266 | 4 | return floating_equal_decimal(rhs, get_scaled_decimal(lhs)); |
1267 | 4 | } |
1268 | | |
1269 | 25 | if (lhs->isDouble() || lhs->isFloat()) { |
1270 | 0 | return (rhs->isDouble() || rhs->isFloat()) && floating_value(lhs) == floating_value(rhs); |
1271 | 0 | } |
1272 | | |
1273 | 25 | if (lhs->isDecimal()) { |
1274 | 6 | const auto lhs_decimal = get_scaled_decimal(lhs); |
1275 | 6 | if (rhs->isDecimal()) { |
1276 | 4 | return scaled_decimal_equal_decimal(lhs_decimal, get_scaled_decimal(rhs)); |
1277 | 4 | } |
1278 | 2 | return scaled_decimal_equal_integer(lhs_decimal, rhs->int_val()); |
1279 | 6 | } |
1280 | | |
1281 | 19 | if (rhs->isDecimal()) { |
1282 | 2 | return scaled_decimal_equal_integer(get_scaled_decimal(rhs), lhs->int_val()); |
1283 | 2 | } |
1284 | | |
1285 | 17 | return lhs->int_val() == rhs->int_val(); |
1286 | 19 | } |
1287 | | |
1288 | 14 | inline bool array_contains_value(const ArrayVal* target_array, const JsonbValue* candidate) { |
1289 | 14 | const int target_num = target_array->numElem(); |
1290 | 25 | for (int i = 0; i < target_num; ++i) { |
1291 | 22 | if (target_array->get(i)->contains(candidate)) { |
1292 | 11 | return true; |
1293 | 11 | } |
1294 | 22 | } |
1295 | 3 | return false; |
1296 | 14 | } |
1297 | | |
1298 | 7 | inline bool array_contains_array(const ArrayVal* target_array, const ArrayVal* candidate_array) { |
1299 | 7 | const int candidate_num = candidate_array->numElem(); |
1300 | 17 | for (int i = 0; i < candidate_num; ++i) { |
1301 | 12 | if (!array_contains_value(target_array, candidate_array->get(i))) { |
1302 | 2 | return false; |
1303 | 2 | } |
1304 | 12 | } |
1305 | 5 | return true; |
1306 | 7 | } |
1307 | | |
1308 | | } // namespace jsonb_detail |
1309 | | |
1310 | 12 | inline const JsonbValue* JsonbDocument::createValue(const char* pb, size_t size) { |
1311 | 12 | if (!pb || size < sizeof(JsonbHeader) + sizeof(JsonbValue)) { |
1312 | 0 | return nullptr; |
1313 | 0 | } |
1314 | | |
1315 | 12 | auto* doc = (JsonbDocument*)pb; |
1316 | 12 | if (doc->header_.ver_ != JSONB_VER) { |
1317 | 0 | return nullptr; |
1318 | 0 | } |
1319 | | |
1320 | 12 | const auto* val = (const JsonbValue*)doc->payload_; |
1321 | | // Same as checkAndCreateDocument(), this is intentionally a lightweight structural check for |
1322 | | // hot paths. Do not recursively validate container bodies here unless the caller is a clearly |
1323 | | // untrusted raw binary boundary and accepts the O(document size) cost. |
1324 | 12 | if (size != sizeof(JsonbHeader) + val->numPackedBytes()) { |
1325 | 0 | return nullptr; |
1326 | 0 | } |
1327 | | |
1328 | 12 | return val; |
1329 | 12 | } |
1330 | | |
1331 | 0 | inline unsigned int JsonbDocument::numPackedBytes() const { |
1332 | 0 | return ((const JsonbValue*)payload_)->numPackedBytes() + sizeof(header_); |
1333 | 0 | } |
1334 | | |
1335 | 17.7k | inline unsigned int JsonbKeyValue::numPackedBytes() const { |
1336 | 17.7k | unsigned int ks = keyPackedBytes(); |
1337 | 17.7k | const auto* val = (const JsonbValue*)(((char*)this) + ks); |
1338 | 17.7k | return ks + val->numPackedBytes(); |
1339 | 17.7k | } |
1340 | | |
1341 | | // Poor man's "virtual" function JsonbValue::numPackedBytes |
1342 | 71.4k | inline unsigned int JsonbValue::numPackedBytes() const { |
1343 | 71.4k | switch (type) { |
1344 | 2.77k | case JsonbType::T_Null: |
1345 | 12.2k | case JsonbType::T_True: |
1346 | 12.8k | case JsonbType::T_False: { |
1347 | 12.8k | return sizeof(type); |
1348 | 12.2k | } |
1349 | | |
1350 | 854 | case JsonbType::T_Int8: { |
1351 | 854 | return sizeof(type) + sizeof(int8_t); |
1352 | 12.2k | } |
1353 | 125 | case JsonbType::T_Int16: { |
1354 | 125 | return sizeof(type) + sizeof(int16_t); |
1355 | 12.2k | } |
1356 | 3.51k | case JsonbType::T_Int32: { |
1357 | 3.51k | return sizeof(type) + sizeof(int32_t); |
1358 | 12.2k | } |
1359 | 12.1k | case JsonbType::T_Int64: { |
1360 | 12.1k | return sizeof(type) + sizeof(int64_t); |
1361 | 12.2k | } |
1362 | 10.6k | case JsonbType::T_Double: { |
1363 | 10.6k | return sizeof(type) + sizeof(double); |
1364 | 12.2k | } |
1365 | 29 | case JsonbType::T_Float: { |
1366 | 29 | return sizeof(type) + sizeof(float); |
1367 | 12.2k | } |
1368 | 13.9k | case JsonbType::T_Int128: { |
1369 | 13.9k | return sizeof(type) + sizeof(int128_t); |
1370 | 12.2k | } |
1371 | 10.8k | case JsonbType::T_String: |
1372 | 15.2k | case JsonbType::T_Binary: { |
1373 | 15.2k | return unpack<JsonbBinaryVal>()->numPackedBytes(); |
1374 | 10.8k | } |
1375 | | |
1376 | 1.77k | case JsonbType::T_Object: |
1377 | 1.96k | case JsonbType::T_Array: { |
1378 | 1.96k | return unpack<ContainerVal>()->numPackedBytes(); |
1379 | 1.77k | } |
1380 | 19 | case JsonbType::T_Decimal32: { |
1381 | 19 | return JsonbDecimal32::numPackedBytes(); |
1382 | 1.77k | } |
1383 | 9 | case JsonbType::T_Decimal64: { |
1384 | 9 | return JsonbDecimal64::numPackedBytes(); |
1385 | 1.77k | } |
1386 | 15 | case JsonbType::T_Decimal128: { |
1387 | 15 | return JsonbDecimal128::numPackedBytes(); |
1388 | 1.77k | } |
1389 | 6 | case JsonbType::T_Decimal256: { |
1390 | 6 | return JsonbDecimal256::numPackedBytes(); |
1391 | 1.77k | } |
1392 | 0 | case JsonbType::NUM_TYPES: |
1393 | 0 | break; |
1394 | 71.4k | } |
1395 | | |
1396 | 0 | throw Exception(ErrorCode::INTERNAL_ERROR, "Invalid JSONB value type: {}", |
1397 | 0 | static_cast<int32_t>(type)); |
1398 | 71.4k | } |
1399 | | |
1400 | 6 | inline int JsonbValue::numElements() const { |
1401 | 6 | switch (type) { |
1402 | 0 | case JsonbType::T_Int8: |
1403 | 0 | case JsonbType::T_Int16: |
1404 | 0 | case JsonbType::T_Int32: |
1405 | 0 | case JsonbType::T_Int64: |
1406 | 0 | case JsonbType::T_Double: |
1407 | 0 | case JsonbType::T_Float: |
1408 | 0 | case JsonbType::T_Int128: |
1409 | 1 | case JsonbType::T_String: |
1410 | 1 | case JsonbType::T_Binary: |
1411 | 2 | case JsonbType::T_Null: |
1412 | 2 | case JsonbType::T_True: |
1413 | 2 | case JsonbType::T_False: |
1414 | 2 | case JsonbType::T_Decimal32: |
1415 | 2 | case JsonbType::T_Decimal64: |
1416 | 2 | case JsonbType::T_Decimal128: |
1417 | 2 | case JsonbType::T_Decimal256: { |
1418 | 2 | return 1; |
1419 | 2 | } |
1420 | 0 | case JsonbType::T_Object: { |
1421 | 0 | return unpack<ObjectVal>()->numElem(); |
1422 | 2 | } |
1423 | 4 | case JsonbType::T_Array: { |
1424 | 4 | return unpack<ArrayVal>()->numElem(); |
1425 | 2 | } |
1426 | 0 | case JsonbType::NUM_TYPES: |
1427 | 0 | break; |
1428 | 6 | } |
1429 | 0 | throw Exception(ErrorCode::INTERNAL_ERROR, "Invalid JSONB value type: {}", |
1430 | 0 | static_cast<int32_t>(type)); |
1431 | 6 | } |
1432 | | |
1433 | 52 | inline bool JsonbValue::contains(const JsonbValue* rhs) const { |
1434 | 52 | switch (type) { |
1435 | 23 | case JsonbType::T_Int8: |
1436 | 23 | case JsonbType::T_Int16: |
1437 | 23 | case JsonbType::T_Int32: |
1438 | 23 | case JsonbType::T_Int64: |
1439 | 24 | case JsonbType::T_Int128: |
1440 | 29 | case JsonbType::T_Double: |
1441 | 29 | case JsonbType::T_Float: |
1442 | 35 | case JsonbType::T_Decimal32: |
1443 | 36 | case JsonbType::T_Decimal64: |
1444 | 39 | case JsonbType::T_Decimal128: |
1445 | 39 | case JsonbType::T_Decimal256: { |
1446 | 39 | return jsonb_detail::numeric_equal(this, rhs); |
1447 | 39 | } |
1448 | 1 | case JsonbType::T_String: |
1449 | 1 | case JsonbType::T_Binary: { |
1450 | 1 | if (rhs->isString() || rhs->isBinary()) { |
1451 | 1 | const auto* str_value1 = unpack<JsonbStringVal>(); |
1452 | 1 | const auto* str_value2 = rhs->unpack<JsonbStringVal>(); |
1453 | 1 | return str_value1->length() == str_value2->length() && |
1454 | 1 | std::memcmp(str_value1->getBlob(), str_value2->getBlob(), |
1455 | 1 | str_value1->length()) == 0; |
1456 | 1 | } |
1457 | 0 | return false; |
1458 | 1 | } |
1459 | 9 | case JsonbType::T_Array: { |
1460 | 9 | const auto* lhs_array = unpack<ArrayVal>(); |
1461 | 9 | if (rhs->isArray()) { |
1462 | 7 | return jsonb_detail::array_contains_array(lhs_array, rhs->unpack<ArrayVal>()); |
1463 | 7 | } |
1464 | 2 | return jsonb_detail::array_contains_value(lhs_array, rhs); |
1465 | 9 | } |
1466 | 3 | case JsonbType::T_Object: { |
1467 | 3 | if (rhs->isObject()) { |
1468 | 2 | const auto* obj_value1 = unpack<ObjectVal>(); |
1469 | 2 | const auto* obj_value2 = rhs->unpack<ObjectVal>(); |
1470 | 3 | for (auto it = obj_value2->begin(); it != obj_value2->end(); ++it) { |
1471 | 2 | const JsonbValue* value = obj_value1->find(it->getKeyStr(), it->klen()); |
1472 | 2 | if (value == nullptr || !value->contains(it->value())) { |
1473 | 1 | return false; |
1474 | 1 | } |
1475 | 2 | } |
1476 | 1 | return true; |
1477 | 2 | } |
1478 | 1 | return false; |
1479 | 3 | } |
1480 | 0 | case JsonbType::T_Null: { |
1481 | 0 | return rhs->isNull(); |
1482 | 3 | } |
1483 | 0 | case JsonbType::T_True: { |
1484 | 0 | return rhs->isTrue(); |
1485 | 3 | } |
1486 | 0 | case JsonbType::T_False: { |
1487 | 0 | return rhs->isFalse(); |
1488 | 3 | } |
1489 | 0 | case JsonbType::NUM_TYPES: |
1490 | 0 | break; |
1491 | 52 | } |
1492 | | |
1493 | 0 | throw Exception(ErrorCode::INTERNAL_ERROR, "Invalid JSONB value type: {}", |
1494 | 0 | static_cast<int32_t>(type)); |
1495 | 52 | } |
1496 | | |
1497 | 101 | inline bool JsonbPath::seek(const char* key_path, size_t kp_len) { |
1498 | 101 | while (kp_len > 0 && std::isspace(key_path[kp_len - 1])) { |
1499 | 0 | --kp_len; |
1500 | 0 | } |
1501 | | |
1502 | | //path invalid |
1503 | 101 | if (!key_path || kp_len == 0) { |
1504 | 0 | return false; |
1505 | 0 | } |
1506 | 101 | Stream stream(key_path, kp_len); |
1507 | 101 | stream.skip_whitespace(); |
1508 | 101 | if (stream.exhausted() || stream.read() != SCOPE) { |
1509 | | //path invalid |
1510 | 0 | return false; |
1511 | 0 | } |
1512 | | |
1513 | 196 | while (!stream.exhausted()) { |
1514 | 95 | stream.skip_whitespace(); |
1515 | 95 | stream.clear_leg_ptr(); |
1516 | 95 | stream.clear_leg_len(); |
1517 | | |
1518 | 95 | if (!JsonbPath::parsePath(&stream, this)) { |
1519 | | //path invalid |
1520 | 0 | return false; |
1521 | 0 | } |
1522 | 95 | } |
1523 | 101 | return true; |
1524 | 101 | } |
1525 | | |
1526 | 95 | inline bool JsonbPath::parsePath(Stream* stream, JsonbPath* path) { |
1527 | | // $[0] |
1528 | 95 | if (stream->peek() == BEGIN_ARRAY) { |
1529 | 58 | return parse_array(stream, path); |
1530 | 58 | } |
1531 | | // $.a or $.[0] |
1532 | | // Keep $.[0] for backward compatibility: although the dot before an array |
1533 | | // leg is non-standard, existing JSONB users may rely on it. |
1534 | 37 | else if (stream->peek() == BEGIN_MEMBER) { |
1535 | | // advance past the . |
1536 | 35 | stream->skip(1); |
1537 | | |
1538 | 35 | if (stream->exhausted()) { |
1539 | 0 | return false; |
1540 | 0 | } |
1541 | | |
1542 | | // $.[0] |
1543 | 35 | if (stream->peek() == BEGIN_ARRAY) { |
1544 | 0 | return parse_array(stream, path); |
1545 | 0 | } |
1546 | | // $.a |
1547 | 35 | else { |
1548 | 35 | return parse_member(stream, path); |
1549 | 35 | } |
1550 | 35 | } else if (stream->peek() == WILDCARD) { |
1551 | 2 | stream->skip(1); |
1552 | 2 | if (stream->exhausted()) { |
1553 | 0 | return false; |
1554 | 0 | } |
1555 | | |
1556 | | // $** |
1557 | 2 | if (stream->peek() == WILDCARD) { |
1558 | 2 | path->_is_supper_wildcard = true; |
1559 | 2 | } |
1560 | | |
1561 | 2 | stream->skip(1); |
1562 | 2 | if (stream->exhausted()) { |
1563 | 0 | return false; |
1564 | 0 | } |
1565 | | |
1566 | 2 | if (stream->peek() == BEGIN_ARRAY) { |
1567 | 0 | return parse_array(stream, path); |
1568 | 2 | } else if (stream->peek() == BEGIN_MEMBER) { |
1569 | | // advance past the . |
1570 | 2 | stream->skip(1); |
1571 | | |
1572 | 2 | if (stream->exhausted()) { |
1573 | 0 | return false; |
1574 | 0 | } |
1575 | | |
1576 | | // $**.[0] |
1577 | | // Keep the dot-array form compatible with the root path behavior. |
1578 | 2 | if (stream->peek() == BEGIN_ARRAY) { |
1579 | 0 | return parse_array(stream, path); |
1580 | 0 | } |
1581 | | // $.a |
1582 | 2 | else { |
1583 | 2 | return parse_member(stream, path); |
1584 | 2 | } |
1585 | 2 | } |
1586 | 0 | return false; |
1587 | 2 | } else { |
1588 | 0 | return false; //invalid json path |
1589 | 0 | } |
1590 | 95 | } |
1591 | | |
1592 | 58 | inline bool JsonbPath::parse_array(Stream* stream, JsonbPath* path) { |
1593 | 58 | assert(stream->peek() == BEGIN_ARRAY); |
1594 | 58 | stream->skip(1); |
1595 | 58 | if (stream->exhausted()) { |
1596 | 0 | return false; |
1597 | 0 | } |
1598 | | |
1599 | 58 | if (stream->peek() == WILDCARD) { |
1600 | | // Called by function_jsonb.cpp, the variables passed in originate from a mutable block; |
1601 | | // using const_cast is acceptable. |
1602 | 0 | stream->set_leg_ptr(const_cast<char*>(stream->position())); |
1603 | 0 | stream->add_leg_len(); |
1604 | 0 | stream->skip(1); |
1605 | 0 | if (stream->exhausted()) { |
1606 | 0 | return false; |
1607 | 0 | } |
1608 | | |
1609 | 0 | if (stream->peek() == END_ARRAY) { |
1610 | 0 | std::unique_ptr<leg_info> leg( |
1611 | 0 | new leg_info(stream->get_leg_ptr(), stream->get_leg_len(), 0, ARRAY_CODE)); |
1612 | 0 | path->add_leg_to_leg_vector(std::move(leg)); |
1613 | 0 | stream->skip(1); |
1614 | 0 | path->_is_wildcard = true; |
1615 | 0 | return true; |
1616 | 0 | } else { |
1617 | 0 | return false; |
1618 | 0 | } |
1619 | 0 | } |
1620 | | |
1621 | | // Called by function_jsonb.cpp, the variables passed in originate from a mutable block; |
1622 | | // using const_cast is acceptable. |
1623 | 58 | stream->set_leg_ptr(const_cast<char*>(stream->position())); |
1624 | | |
1625 | 116 | for (; !stream->exhausted() && stream->peek() != END_ARRAY; stream->advance()) { |
1626 | 58 | stream->add_leg_len(); |
1627 | 58 | } |
1628 | | |
1629 | 58 | if (stream->exhausted() || stream->peek() != END_ARRAY) { |
1630 | 0 | return false; |
1631 | 58 | } else { |
1632 | 58 | stream->skip(1); |
1633 | 58 | } |
1634 | | |
1635 | | //parse array index to int |
1636 | | |
1637 | 58 | std::string_view idx_string(stream->get_leg_ptr(), stream->get_leg_len()); |
1638 | 58 | int index = 0; |
1639 | | |
1640 | | // Match "last" case-insensitively for compatibility with existing JSONB |
1641 | | // paths such as [Last] and [LAST]. |
1642 | 58 | if (stream->get_leg_len() >= 4 && |
1643 | 58 | std::equal(LAST, LAST + 4, stream->get_leg_ptr(), |
1644 | 0 | [](char c1, char c2) { return std::tolower(c1) == std::tolower(c2); })) { |
1645 | 0 | auto pos = idx_string.find(MINUS); |
1646 | |
|
1647 | 0 | if (pos != std::string::npos) { |
1648 | 0 | for (size_t i = 4; i < pos; ++i) { |
1649 | 0 | if (std::isspace(idx_string[i])) { |
1650 | 0 | continue; |
1651 | 0 | } else { |
1652 | | // leading zeroes are not allowed |
1653 | 0 | LOG(WARNING) << "Non-space char in idx_string: '" << idx_string << "'"; |
1654 | 0 | return false; |
1655 | 0 | } |
1656 | 0 | } |
1657 | 0 | idx_string = idx_string.substr(pos + 1); |
1658 | 0 | idx_string = trim(idx_string); |
1659 | | |
1660 | | // Keep numeric-prefix parsing for last-N offsets as existing JSONB |
1661 | | // path behavior. |
1662 | 0 | auto result = std::from_chars(idx_string.data(), idx_string.data() + idx_string.size(), |
1663 | 0 | index); |
1664 | 0 | if (result.ec != std::errc()) { |
1665 | 0 | LOG(WARNING) << "Invalid index in JSON path: '" << idx_string << "'"; |
1666 | 0 | return false; |
1667 | 0 | } |
1668 | |
|
1669 | 0 | } else if (stream->get_leg_len() > 4) { |
1670 | 0 | return false; |
1671 | 0 | } |
1672 | | |
1673 | 0 | std::unique_ptr<leg_info> leg(new leg_info(nullptr, 0, -index - 1, ARRAY_CODE)); |
1674 | 0 | path->add_leg_to_leg_vector(std::move(leg)); |
1675 | |
|
1676 | 0 | return true; |
1677 | 0 | } |
1678 | | |
1679 | | // Preserve legacy numeric-prefix parsing for array indexes. std::from_chars |
1680 | | // may stop before the end (for example [1.5] is parsed as index 1), and |
1681 | | // current JSONB path semantics treat that as supported behavior. |
1682 | 58 | auto result = std::from_chars(idx_string.data(), idx_string.data() + idx_string.size(), index); |
1683 | | |
1684 | 58 | if (result.ec != std::errc()) { |
1685 | 0 | return false; |
1686 | 0 | } |
1687 | | |
1688 | 58 | std::unique_ptr<leg_info> leg(new leg_info(nullptr, 0, index, ARRAY_CODE)); |
1689 | 58 | path->add_leg_to_leg_vector(std::move(leg)); |
1690 | | |
1691 | 58 | return true; |
1692 | 58 | } |
1693 | | |
1694 | 37 | inline bool JsonbPath::parse_member(Stream* stream, JsonbPath* path) { |
1695 | 37 | if (stream->exhausted()) { |
1696 | 0 | return false; |
1697 | 0 | } |
1698 | | |
1699 | 37 | if (stream->peek() == WILDCARD) { |
1700 | | // Called by function_jsonb.cpp, the variables passed in originate from a mutable block; |
1701 | | // using const_cast is acceptable. |
1702 | 0 | stream->set_leg_ptr(const_cast<char*>(stream->position())); |
1703 | 0 | stream->add_leg_len(); |
1704 | 0 | stream->skip(1); |
1705 | 0 | std::unique_ptr<leg_info> leg( |
1706 | 0 | new leg_info(stream->get_leg_ptr(), stream->get_leg_len(), 0, MEMBER_CODE)); |
1707 | 0 | path->add_leg_to_leg_vector(std::move(leg)); |
1708 | 0 | path->_is_wildcard = true; |
1709 | 0 | return true; |
1710 | 0 | } |
1711 | | |
1712 | | // Called by function_jsonb.cpp, the variables passed in originate from a mutable block; |
1713 | | // using const_cast is acceptable. |
1714 | 37 | stream->set_leg_ptr(const_cast<char*>(stream->position())); |
1715 | | |
1716 | 37 | const char* left_quotation_marks = nullptr; |
1717 | 37 | const char* right_quotation_marks = nullptr; |
1718 | | |
1719 | 139 | for (; !stream->exhausted(); stream->advance()) { |
1720 | | // Only accept space characters quoted by double quotes. |
1721 | 104 | if (std::isspace(stream->peek()) && left_quotation_marks == nullptr) { |
1722 | 0 | return false; |
1723 | 104 | } else if (stream->peek() == ESCAPE) { |
1724 | 10 | stream->add_leg_len(); |
1725 | 10 | stream->skip(1); |
1726 | 10 | stream->add_leg_len(); |
1727 | 10 | stream->set_has_escapes(true); |
1728 | 10 | if (stream->exhausted()) { |
1729 | 0 | return false; |
1730 | 0 | } |
1731 | 10 | continue; |
1732 | 94 | } else if (stream->peek() == DOUBLE_QUOTE) { |
1733 | 4 | if (left_quotation_marks == nullptr) { |
1734 | 2 | left_quotation_marks = stream->position(); |
1735 | | // Called by function_jsonb.cpp, the variables passed in originate from a mutable block; |
1736 | | // using const_cast is acceptable. |
1737 | 2 | stream->set_leg_ptr(const_cast<char*>(++left_quotation_marks)); |
1738 | 2 | continue; |
1739 | 2 | } else { |
1740 | 2 | right_quotation_marks = stream->position(); |
1741 | 2 | stream->skip(1); |
1742 | 2 | break; |
1743 | 2 | } |
1744 | 90 | } else if (stream->peek() == BEGIN_MEMBER || stream->peek() == BEGIN_ARRAY) { |
1745 | 0 | if (left_quotation_marks == nullptr) { |
1746 | 0 | break; |
1747 | 0 | } |
1748 | 0 | } |
1749 | | |
1750 | 90 | stream->add_leg_len(); |
1751 | 90 | } |
1752 | | |
1753 | 37 | if ((left_quotation_marks != nullptr && right_quotation_marks == nullptr) || |
1754 | 37 | stream->get_leg_ptr() == nullptr || stream->get_leg_len() == 0) { |
1755 | 0 | return false; //invalid json path |
1756 | 0 | } |
1757 | | |
1758 | 37 | if (stream->get_has_escapes()) { |
1759 | 2 | stream->remove_escapes(); |
1760 | 2 | } |
1761 | | |
1762 | 37 | std::unique_ptr<leg_info> leg( |
1763 | 37 | new leg_info(stream->get_leg_ptr(), stream->get_leg_len(), 0, MEMBER_CODE)); |
1764 | 37 | path->add_leg_to_leg_vector(std::move(leg)); |
1765 | | |
1766 | 37 | return true; |
1767 | 37 | } |
1768 | | |
1769 | | static_assert(is_pod_v<JsonbDocument>, "JsonbDocument must be standard layout and trivial"); |
1770 | | static_assert(is_pod_v<JsonbValue>, "JsonbValue must be standard layout and trivial"); |
1771 | | static_assert(is_pod_v<JsonbDecimal32>, "JsonbDecimal32 must be standard layout and trivial"); |
1772 | | static_assert(is_pod_v<JsonbDecimal64>, "JsonbDecimal64 must be standard layout and trivial"); |
1773 | | static_assert(is_pod_v<JsonbDecimal128>, "JsonbDecimal128 must be standard layout and trivial"); |
1774 | | static_assert(is_pod_v<JsonbDecimal256>, "JsonbDecimal256 must be standard layout and trivial"); |
1775 | | static_assert(is_pod_v<JsonbInt8Val>, "JsonbInt8Val must be standard layout and trivial"); |
1776 | | static_assert(is_pod_v<JsonbInt32Val>, "JsonbInt32Val must be standard layout and trivial"); |
1777 | | static_assert(is_pod_v<JsonbInt64Val>, "JsonbInt64Val must be standard layout and trivial"); |
1778 | | static_assert(is_pod_v<JsonbInt128Val>, "JsonbInt128Val must be standard layout and trivial"); |
1779 | | static_assert(is_pod_v<JsonbDoubleVal>, "JsonbDoubleVal must be standard layout and trivial"); |
1780 | | static_assert(is_pod_v<JsonbFloatVal>, "JsonbFloatVal must be standard layout and trivial"); |
1781 | | static_assert(is_pod_v<JsonbBinaryVal>, "JsonbBinaryVal must be standard layout and trivial"); |
1782 | | static_assert(is_pod_v<ContainerVal>, "ContainerVal must be standard layout and trivial"); |
1783 | | |
1784 | | #define ASSERT_DECIMAL_LAYOUT(type) \ |
1785 | | static_assert(offsetof(type, precision) == 0); \ |
1786 | | static_assert(offsetof(type, scale) == 4); \ |
1787 | | static_assert(offsetof(type, value) == 8); |
1788 | | |
1789 | | ASSERT_DECIMAL_LAYOUT(JsonbDecimal32) |
1790 | | ASSERT_DECIMAL_LAYOUT(JsonbDecimal64) |
1791 | | ASSERT_DECIMAL_LAYOUT(JsonbDecimal128) |
1792 | | ASSERT_DECIMAL_LAYOUT(JsonbDecimal256) |
1793 | | |
1794 | | #define ASSERT_NUMERIC_LAYOUT(type) static_assert(offsetof(type, num) == 0); |
1795 | | |
1796 | | ASSERT_NUMERIC_LAYOUT(JsonbInt8Val) |
1797 | | ASSERT_NUMERIC_LAYOUT(JsonbInt32Val) |
1798 | | ASSERT_NUMERIC_LAYOUT(JsonbInt64Val) |
1799 | | ASSERT_NUMERIC_LAYOUT(JsonbInt128Val) |
1800 | | ASSERT_NUMERIC_LAYOUT(JsonbDoubleVal) |
1801 | | |
1802 | | static_assert(offsetof(JsonbBinaryVal, size) == 0); |
1803 | | static_assert(offsetof(JsonbBinaryVal, payload) == 4); |
1804 | | |
1805 | | static_assert(offsetof(ContainerVal, size) == 0); |
1806 | | static_assert(offsetof(ContainerVal, payload) == 4); |
1807 | | |
1808 | | #pragma pack(pop) |
1809 | | #if defined(__clang__) |
1810 | | #pragma clang diagnostic pop |
1811 | | #endif |
1812 | | } // namespace doris |
1813 | | |
1814 | | #endif // JSONB_JSONBDOCUMENT_H |