/root/doris/be/src/util/jsonb_utils.h
Line | Count | Source |
1 | | /* |
2 | | * Copyright (c) 2014, Facebook, Inc. |
3 | | * All rights reserved. |
4 | | * |
5 | | * This source code is licensed under the BSD-style license found in the |
6 | | * LICENSE file in the root directory of this source tree. An additional grant |
7 | | * of patent rights can be found in the PATENTS file in the same directory. |
8 | | * |
9 | | */ |
10 | | |
11 | | /* |
12 | | * This header file defines miscellaneous utility classes. |
13 | | * |
14 | | * @author Tian Xia <tianx@fb.com> |
15 | | * |
16 | | * this file is copied from |
17 | | * https://github.com/facebook/mysql-5.6/blob/fb-mysql-5.6.35/fbson/FbsonUtil.h |
18 | | * and modified by Doris |
19 | | */ |
20 | | |
21 | | #ifndef JSONB_JSONBUTIL_H |
22 | | #define JSONB_JSONBUTIL_H |
23 | | |
24 | | #include "common/status.h" |
25 | | #include "jsonb_document.h" |
26 | | #include "jsonb_stream.h" |
27 | | |
28 | | namespace doris { |
29 | | |
30 | 218 | #define OUT_BUF_SIZE 1024 |
31 | | |
32 | | /* |
33 | | * JsonbToJson converts an JsonbValue object to a JSON string. |
34 | | */ |
35 | | class JsonbToJson { |
36 | | public: |
37 | 218 | JsonbToJson() : os_(buffer_, OUT_BUF_SIZE) {} |
38 | | |
39 | | // get json string |
40 | 218 | std::string to_json_string(const char* data, size_t size) { |
41 | 218 | JsonbDocument* pdoc; |
42 | 218 | THROW_IF_ERROR(doris::JsonbDocument::checkAndCreateDocument(data, size, &pdoc)); |
43 | 218 | return to_json_string(pdoc->getValue()); |
44 | 218 | } |
45 | | |
46 | 218 | std::string to_json_string(const JsonbValue* val) { |
47 | 218 | os_.clear(); |
48 | 218 | os_.seekp(0); |
49 | | |
50 | 218 | if (val) { |
51 | 218 | intern_json(val); |
52 | 218 | } |
53 | | |
54 | 218 | os_.put(0); |
55 | | |
56 | 218 | std::string json_string {os_.getBuffer()}; |
57 | 218 | return json_string; |
58 | 218 | } |
59 | | |
60 | 218 | static std::string jsonb_to_json_string(const char* data, size_t size) { |
61 | 218 | JsonbToJson jsonb_to_json; |
62 | 218 | return jsonb_to_json.to_json_string(data, size); |
63 | 218 | } |
64 | | |
65 | | private: |
66 | | // recursively convert JsonbValue |
67 | 1.47k | void intern_json(const JsonbValue* val) { |
68 | 1.47k | switch (val->type) { |
69 | 40 | case JsonbType::T_Null: { |
70 | 40 | os_.write("null", 4); |
71 | 40 | break; |
72 | 0 | } |
73 | 47 | case JsonbType::T_True: { |
74 | 47 | os_.write("true", 4); |
75 | 47 | break; |
76 | 0 | } |
77 | 14 | case JsonbType::T_False: { |
78 | 14 | os_.write("false", 5); |
79 | 14 | break; |
80 | 0 | } |
81 | 605 | case JsonbType::T_Int8: { |
82 | 605 | os_.write(val->unpack<JsonbInt8Val>()->val()); |
83 | 605 | break; |
84 | 0 | } |
85 | 8 | case JsonbType::T_Int16: { |
86 | 8 | os_.write(val->unpack<JsonbInt16Val>()->val()); |
87 | 8 | break; |
88 | 0 | } |
89 | 13 | case JsonbType::T_Int32: { |
90 | 13 | os_.write(val->unpack<JsonbInt32Val>()->val()); |
91 | 13 | break; |
92 | 0 | } |
93 | 5 | case JsonbType::T_Int64: { |
94 | 5 | os_.write(val->unpack<JsonbInt64Val>()->val()); |
95 | 5 | break; |
96 | 0 | } |
97 | 38 | case JsonbType::T_Double: { |
98 | 38 | os_.write(val->unpack<JsonbDoubleVal>()->val()); |
99 | 38 | break; |
100 | 0 | } |
101 | 2 | case JsonbType::T_Float: { |
102 | 2 | os_.write(val->unpack<JsonbFloatVal>()->val()); |
103 | 2 | break; |
104 | 0 | } |
105 | 1 | case JsonbType::T_Int128: { |
106 | 1 | os_.write(val->unpack<JsonbInt128Val>()->val()); |
107 | 1 | break; |
108 | 0 | } |
109 | 126 | case JsonbType::T_String: { |
110 | 126 | string_to_json(val->unpack<JsonbStringVal>()->getBlob(), |
111 | 126 | val->unpack<JsonbStringVal>()->length()); |
112 | 126 | break; |
113 | 0 | } |
114 | 0 | case JsonbType::T_Binary: { |
115 | 0 | os_.write("\"<BINARY>", 9); |
116 | 0 | os_.write(val->unpack<JsonbBinaryVal>()->getBlob(), |
117 | 0 | val->unpack<JsonbBinaryVal>()->getBlobLen()); |
118 | 0 | os_.write("<BINARY>\"", 9); |
119 | 0 | break; |
120 | 0 | } |
121 | 507 | case JsonbType::T_Object: { |
122 | 507 | object_to_json(val->unpack<ObjectVal>()); |
123 | 507 | break; |
124 | 0 | } |
125 | 63 | case JsonbType::T_Array: { |
126 | 63 | array_to_json(val->unpack<ArrayVal>()); |
127 | 63 | break; |
128 | 0 | } |
129 | 1 | case JsonbType::T_Decimal32: { |
130 | 1 | const auto* decimal_val = val->unpack<JsonbDecimal32>(); |
131 | 1 | decimal_to_json(vectorized::Decimal32 {decimal_val->val()}, decimal_val->precision, |
132 | 1 | decimal_val->scale); |
133 | 1 | break; |
134 | 0 | } |
135 | 1 | case JsonbType::T_Decimal64: { |
136 | 1 | const auto* decimal_val = val->unpack<JsonbDecimal64>(); |
137 | 1 | decimal_to_json(vectorized::Decimal64 {decimal_val->val()}, decimal_val->precision, |
138 | 1 | decimal_val->scale); |
139 | 1 | break; |
140 | 0 | } |
141 | 2 | case JsonbType::T_Decimal128: { |
142 | 2 | const auto* decimal_val = val->unpack<JsonbDecimal128>(); |
143 | 2 | decimal_to_json(vectorized::Decimal128V3 {decimal_val->val()}, decimal_val->precision, |
144 | 2 | decimal_val->scale); |
145 | 2 | break; |
146 | 0 | } |
147 | 1 | case JsonbType::T_Decimal256: { |
148 | 1 | const auto* decimal_val = val->unpack<JsonbDecimal256>(); |
149 | 1 | decimal_to_json(vectorized::Decimal256 {decimal_val->val()}, decimal_val->precision, |
150 | 1 | decimal_val->scale); |
151 | 1 | break; |
152 | 0 | } |
153 | 0 | default: |
154 | 0 | break; |
155 | 1.47k | } |
156 | 1.47k | } |
157 | | |
158 | 742 | void string_to_json(const char* str, size_t len) { |
159 | 742 | os_.put('"'); |
160 | 742 | if (nullptr == str) { |
161 | 1 | os_.put('"'); |
162 | 1 | return; |
163 | 1 | } |
164 | 741 | char char_buffer[16]; |
165 | 1.00M | for (const char* ptr = str; ptr != str + len && *ptr; ++ptr) { |
166 | 1.00M | if ((unsigned char)*ptr > 31 && *ptr != '\"' && *ptr != '\\') { |
167 | 1.00M | os_.put(*ptr); |
168 | 1.00M | } else { |
169 | 6 | os_.put('\\'); |
170 | 6 | unsigned char token; |
171 | 6 | switch (token = *ptr) { |
172 | 0 | case '\\': |
173 | 0 | os_.put('\\'); |
174 | 0 | break; |
175 | 1 | case '\"': |
176 | 1 | os_.put('\"'); |
177 | 1 | break; |
178 | 1 | case '\b': |
179 | 1 | os_.put('b'); |
180 | 1 | break; |
181 | 1 | case '\f': |
182 | 1 | os_.put('f'); |
183 | 1 | break; |
184 | 1 | case '\n': |
185 | 1 | os_.put('n'); |
186 | 1 | break; |
187 | 1 | case '\r': |
188 | 1 | os_.put('r'); |
189 | 1 | break; |
190 | 1 | case '\t': |
191 | 1 | os_.put('t'); |
192 | 1 | break; |
193 | 0 | default: { |
194 | 0 | int char_num = snprintf(char_buffer, sizeof(char_buffer), "u%04x", token); |
195 | 0 | os_.write(char_buffer, char_num); |
196 | 0 | break; |
197 | 0 | } |
198 | 6 | } |
199 | 6 | } |
200 | 1.00M | } |
201 | 741 | os_.put('"'); |
202 | 741 | } |
203 | | |
204 | | // convert object |
205 | 507 | void object_to_json(const ObjectVal* val) { |
206 | 507 | os_.put('{'); |
207 | | |
208 | 507 | auto iter = val->begin(); |
209 | 507 | auto iter_fence = val->end(); |
210 | | |
211 | 1.12k | while (iter < iter_fence) { |
212 | | // write key |
213 | 616 | if (iter->klen()) { |
214 | 615 | string_to_json(iter->getKeyStr(), iter->klen()); |
215 | 615 | } else { |
216 | | // NOTE: we use sMaxKeyId to represent an empty key. see jsonb_writer.h |
217 | 1 | if (iter->getKeyId() == JsonbKeyValue::sMaxKeyId) { |
218 | 1 | string_to_json(nullptr, 0); |
219 | 1 | } else { |
220 | 0 | os_.write(iter->getKeyId()); |
221 | 0 | } |
222 | 1 | } |
223 | 616 | os_.put(':'); |
224 | | |
225 | | // convert value |
226 | 616 | intern_json(iter->value()); |
227 | | |
228 | 616 | ++iter; |
229 | 616 | if (iter != iter_fence) { |
230 | 121 | os_.put(','); |
231 | 121 | } |
232 | 616 | } |
233 | | |
234 | 507 | assert(iter == iter_fence); |
235 | | |
236 | 507 | os_.put('}'); |
237 | 507 | } |
238 | | |
239 | | // convert array to json |
240 | 63 | void array_to_json(const ArrayVal* val) { |
241 | 63 | os_.put('['); |
242 | | |
243 | 63 | auto iter = val->begin(); |
244 | 63 | auto iter_fence = val->end(); |
245 | | |
246 | 703 | while (iter != iter_fence) { |
247 | | // convert value |
248 | 640 | intern_json((const JsonbValue*)iter); |
249 | 640 | ++iter; |
250 | 640 | if (iter != iter_fence) { |
251 | 588 | os_.put(','); |
252 | 588 | } |
253 | 640 | } |
254 | | |
255 | 63 | assert(iter == iter_fence); |
256 | | |
257 | 63 | os_.put(']'); |
258 | 63 | } |
259 | | |
260 | | template <JsonbDecimalType T> |
261 | | void decimal_to_json(const T& value, const uint32_t precision, const uint32_t scale); |
262 | | |
263 | | JsonbOutStream os_; |
264 | | char buffer_[OUT_BUF_SIZE]; |
265 | | }; |
266 | | |
267 | | } // namespace doris |
268 | | |
269 | | #endif // JSONB_JSONBUTIL_H |