|
1 /* |
|
2 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER. |
|
3 * |
|
4 * Copyright 2024 Mike Becker, Olaf Wintermann All rights reserved. |
|
5 * |
|
6 * Redistribution and use in source and binary forms, with or without |
|
7 * modification, are permitted provided that the following conditions are met: |
|
8 * |
|
9 * 1. Redistributions of source code must retain the above copyright |
|
10 * notice, this list of conditions and the following disclaimer. |
|
11 * |
|
12 * 2. Redistributions in binary form must reproduce the above copyright |
|
13 * notice, this list of conditions and the following disclaimer in the |
|
14 * documentation and/or other materials provided with the distribution. |
|
15 * |
|
16 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" |
|
17 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
|
18 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |
|
19 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE |
|
20 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR |
|
21 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF |
|
22 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS |
|
23 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN |
|
24 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) |
|
25 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE |
|
26 * POSSIBILITY OF SUCH DAMAGE. |
|
27 */ |
|
28 |
|
29 #include "cx/json.h" |
|
30 |
|
31 #include <string.h> |
|
32 #include <assert.h> |
|
33 #include <stdio.h> |
|
34 #include <inttypes.h> |
|
35 |
|
36 /* |
|
37 * RFC 8259 |
|
38 * https://tools.ietf.org/html/rfc8259 |
|
39 */ |
|
40 |
|
41 static CxJsonValue cx_json_value_nothing = {.type = CX_JSON_NOTHING}; |
|
42 |
|
43 static int json_cmp_objvalue(const void *l, const void *r) { |
|
44 const CxJsonObjValue *left = l; |
|
45 const CxJsonObjValue *right = r; |
|
46 return cx_strcmp(cx_strcast(left->name), cx_strcast(right->name)); |
|
47 } |
|
48 |
|
49 static CxJsonObjValue *json_find_objvalue(const CxJsonValue *obj, cxstring name) { |
|
50 assert(obj->type == CX_JSON_OBJECT); |
|
51 CxJsonObjValue kv_dummy; |
|
52 kv_dummy.name = cx_mutstrn((char*) name.ptr, name.length); |
|
53 size_t index = cx_array_binary_search( |
|
54 obj->value.object.values, |
|
55 obj->value.object.values_size, |
|
56 sizeof(CxJsonObjValue), |
|
57 &kv_dummy, |
|
58 json_cmp_objvalue |
|
59 ); |
|
60 if (index == obj->value.object.values_size) { |
|
61 return NULL; |
|
62 } else { |
|
63 return &obj->value.object.values[index]; |
|
64 } |
|
65 } |
|
66 |
|
67 static int json_add_objvalue(CxJsonValue *objv, CxJsonObjValue member) { |
|
68 assert(objv->type == CX_JSON_OBJECT); |
|
69 const CxAllocator * const al = objv->allocator; |
|
70 CxJsonObject *obj = &(objv->value.object); |
|
71 |
|
72 // determine the index where we need to insert the new member |
|
73 size_t index = cx_array_binary_search_sup( |
|
74 obj->values, |
|
75 obj->values_size, |
|
76 sizeof(CxJsonObjValue), |
|
77 &member, json_cmp_objvalue |
|
78 ); |
|
79 |
|
80 // is the name already present? |
|
81 if (index < obj->values_size && 0 == json_cmp_objvalue(&member, &obj->values[index])) { |
|
82 // free the original value |
|
83 cx_strfree_a(al, &obj->values[index].name); |
|
84 cxJsonValueFree(obj->values[index].value); |
|
85 // replace the item |
|
86 obj->values[index] = member; |
|
87 |
|
88 // nothing more to do |
|
89 return 0; |
|
90 } |
|
91 |
|
92 // determine the old capacity and reserve for one more element |
|
93 CxArrayReallocator arealloc = cx_array_reallocator(al, NULL); |
|
94 size_t oldcap = obj->values_capacity; |
|
95 if (cx_array_simple_reserve_a(&arealloc, obj->values, 1)) return 1; |
|
96 |
|
97 // check the new capacity, if we need to realloc the index array |
|
98 size_t newcap = obj->values_capacity; |
|
99 if (newcap > oldcap) { |
|
100 if (cxReallocateArray(al, &obj->indices, newcap, sizeof(size_t))) { |
|
101 return 1; |
|
102 } |
|
103 } |
|
104 |
|
105 // check if append or insert |
|
106 if (index < obj->values_size) { |
|
107 // move the other elements |
|
108 memmove( |
|
109 &obj->values[index+1], |
|
110 &obj->values[index], |
|
111 (obj->values_size - index) * sizeof(CxJsonObjValue) |
|
112 ); |
|
113 // increase indices for the moved elements |
|
114 for (size_t i = 0; i < obj->values_size ; i++) { |
|
115 if (obj->indices[i] >= index) { |
|
116 obj->indices[i]++; |
|
117 } |
|
118 } |
|
119 } |
|
120 |
|
121 // insert the element and set the index |
|
122 obj->values[index] = member; |
|
123 obj->indices[obj->values_size] = index; |
|
124 obj->values_size++; |
|
125 |
|
126 return 0; |
|
127 } |
|
128 |
|
129 static void token_destroy(CxJsonToken *token) { |
|
130 if (token->allocated) { |
|
131 cx_strfree(&token->content); |
|
132 } |
|
133 } |
|
134 |
|
/**
 * Tests whether a character is one of the ASCII digits '0' to '9'.
 *
 * @param c the character to test
 * @return true if c is a decimal digit
 */
static bool json_isdigit(char c) {
    // TODO: remove once UCX has public API for this
    return !(c < '0' || c > '9');
}
|
139 |
|
/**
 * Tests whether a character is treated as white space by the tokenizer.
 *
 * Accepted are space, horizontal tab, carriage return, line feed,
 * vertical tab and form feed.
 *
 * @param c the character to test
 * @return true if c is one of the characters listed above
 */
static bool json_isspace(char c) {
    // TODO: remove once UCX has public API for this
    switch (c) {
        case ' ':
        case '\t':
        case '\r':
        case '\n':
        case '\v':
        case '\f':
            return true;
        default:
            return false;
    }
}
|
144 |
|
/**
 * Checks whether the tail of a number token is a valid exponent body,
 * i.e. an optional sign ('+' or '-') followed by one or more decimal digits
 * that reach up to the end of the token.
 *
 * @param content the token text
 * @param length  the length of the token text
 * @param pos     index of the first character after the 'e' / 'E'
 * @return 1 if the characters from pos to the end form a valid exponent body,
 *         0 otherwise (including when pos is not inside the token)
 */
static int num_isexp(const char *content, size_t length, size_t pos) {
    if (pos >= length) {
        return 0;
    }

    // a sign is only permitted as the very first character
    size_t i = pos;
    if (content[i] == '+' || content[i] == '-') {
        i++;
    }

    // everything that follows must be a digit, and there must be at least one
    int digits_seen = 0;
    for (; i < length; i++) {
        if (content[i] < '0' || content[i] > '9') {
            return 0;
        }
        digits_seen = 1;
    }

    return digits_seen;
}
|
166 |
|
167 static CxJsonTokenType token_numbertype(const char *content, size_t length) { |
|
168 if (length == 0) return CX_JSON_TOKEN_ERROR; |
|
169 |
|
170 if (content[0] != '-' && !json_isdigit(content[0])) { |
|
171 return CX_JSON_TOKEN_ERROR; |
|
172 } |
|
173 |
|
174 CxJsonTokenType type = CX_JSON_TOKEN_INTEGER; |
|
175 for (size_t i = 1; i < length; i++) { |
|
176 if (content[i] == '.') { |
|
177 if (type == CX_JSON_TOKEN_NUMBER) { |
|
178 return CX_JSON_TOKEN_ERROR; // more than one decimal separator |
|
179 } |
|
180 type = CX_JSON_TOKEN_NUMBER; |
|
181 } else if (content[i] == 'e' || content[i] == 'E') { |
|
182 return num_isexp(content, length, i + 1) ? CX_JSON_TOKEN_NUMBER : CX_JSON_TOKEN_ERROR; |
|
183 } else if (!json_isdigit(content[i])) { |
|
184 return CX_JSON_TOKEN_ERROR; // char is not a digit, decimal separator or exponent sep |
|
185 } |
|
186 } |
|
187 |
|
188 return type; |
|
189 } |
|
190 |
|
191 static CxJsonToken token_create(CxJson *json, bool isstring, size_t start, size_t end) { |
|
192 cxmutstr str = cx_mutstrn(json->buffer.space + start, end - start); |
|
193 bool allocated = false; |
|
194 if (json->uncompleted.tokentype != CX_JSON_NO_TOKEN) { |
|
195 allocated = true; |
|
196 str = cx_strcat_m(json->uncompleted.content, 1, str); |
|
197 if (str.ptr == NULL) { // LCOV_EXCL_START |
|
198 return (CxJsonToken){CX_JSON_NO_TOKEN, false, {NULL, 0}}; |
|
199 } // LCOV_EXCL_STOP |
|
200 } |
|
201 json->uncompleted = (CxJsonToken){0}; |
|
202 CxJsonTokenType ttype; |
|
203 if (isstring) { |
|
204 ttype = CX_JSON_TOKEN_STRING; |
|
205 } else { |
|
206 cxstring s = cx_strcast(str); |
|
207 if (!cx_strcmp(s, CX_STR("true")) || !cx_strcmp(s, CX_STR("false")) |
|
208 || !cx_strcmp(s, CX_STR("null"))) { |
|
209 ttype = CX_JSON_TOKEN_LITERAL; |
|
210 } else { |
|
211 ttype = token_numbertype(str.ptr, str.length); |
|
212 } |
|
213 } |
|
214 if (ttype == CX_JSON_TOKEN_ERROR) { |
|
215 if (allocated) { |
|
216 cx_strfree(&str); |
|
217 } |
|
218 return (CxJsonToken){CX_JSON_TOKEN_ERROR, false, {NULL, 0}}; |
|
219 } |
|
220 return (CxJsonToken){ttype, allocated, str}; |
|
221 } |
|
222 |
|
223 static CxJsonTokenType char2ttype(char c) { |
|
224 switch (c) { |
|
225 case '[': { |
|
226 return CX_JSON_TOKEN_BEGIN_ARRAY; |
|
227 } |
|
228 case '{': { |
|
229 return CX_JSON_TOKEN_BEGIN_OBJECT; |
|
230 } |
|
231 case ']': { |
|
232 return CX_JSON_TOKEN_END_ARRAY; |
|
233 } |
|
234 case '}': { |
|
235 return CX_JSON_TOKEN_END_OBJECT; |
|
236 } |
|
237 case ':': { |
|
238 return CX_JSON_TOKEN_NAME_SEPARATOR; |
|
239 } |
|
240 case ',': { |
|
241 return CX_JSON_TOKEN_VALUE_SEPARATOR; |
|
242 } |
|
243 case '"': { |
|
244 return CX_JSON_TOKEN_STRING; |
|
245 } |
|
246 default: { |
|
247 if (json_isspace(c)) { |
|
248 return CX_JSON_TOKEN_SPACE; |
|
249 } |
|
250 } |
|
251 } |
|
252 return CX_JSON_NO_TOKEN; |
|
253 } |
|
254 |
|
255 static enum cx_json_status token_parse_next(CxJson *json, CxJsonToken *result) { |
|
256 // check if there is data in the buffer |
|
257 if (cxBufferEof(&json->buffer)) { |
|
258 return json->uncompleted.tokentype == CX_JSON_NO_TOKEN ? |
|
259 CX_JSON_NO_DATA : CX_JSON_INCOMPLETE_DATA; |
|
260 } |
|
261 |
|
262 // current token type and start index |
|
263 CxJsonTokenType ttype = json->uncompleted.tokentype; |
|
264 size_t token_part_start = json->buffer.pos; |
|
265 |
|
266 bool escape_end_of_string = ttype == CX_JSON_TOKEN_STRING |
|
267 && json->uncompleted.content.ptr[json->uncompleted.content.length-1] == '\\'; |
|
268 |
|
269 for (size_t i = json->buffer.pos; i < json->buffer.size; i++) { |
|
270 char c = json->buffer.space[i]; |
|
271 if (ttype != CX_JSON_TOKEN_STRING) { |
|
272 // currently non-string token |
|
273 CxJsonTokenType ctype = char2ttype(c); // start of new token? |
|
274 if (ttype == CX_JSON_NO_TOKEN) { |
|
275 if (ctype == CX_JSON_TOKEN_SPACE) { |
|
276 json->buffer.pos++; |
|
277 continue; |
|
278 } else if (ctype == CX_JSON_TOKEN_STRING) { |
|
279 // begin string |
|
280 ttype = CX_JSON_TOKEN_STRING; |
|
281 token_part_start = i; |
|
282 } else if (ctype != CX_JSON_NO_TOKEN) { |
|
283 // single-char token |
|
284 json->buffer.pos = i + 1; |
|
285 *result = (CxJsonToken){ctype, false, {NULL, 0}}; |
|
286 return CX_JSON_NO_ERROR; |
|
287 } else { |
|
288 ttype = CX_JSON_TOKEN_LITERAL; // number or literal |
|
289 token_part_start = i; |
|
290 } |
|
291 } else { |
|
292 // finish token |
|
293 if (ctype != CX_JSON_NO_TOKEN) { |
|
294 *result = token_create(json, false, token_part_start, i); |
|
295 if (result->tokentype == CX_JSON_NO_TOKEN) { |
|
296 return CX_JSON_BUFFER_ALLOC_FAILED; // LCOV_EXCL_LINE |
|
297 } |
|
298 if (result->tokentype == CX_JSON_TOKEN_ERROR) { |
|
299 return CX_JSON_FORMAT_ERROR_NUMBER; |
|
300 } |
|
301 json->buffer.pos = i; |
|
302 return CX_JSON_NO_ERROR; |
|
303 } |
|
304 } |
|
305 } else { |
|
306 // currently inside a string |
|
307 if (escape_end_of_string) { |
|
308 escape_end_of_string = false; |
|
309 } else { |
|
310 if (c == '"') { |
|
311 *result = token_create(json, true, token_part_start, i + 1); |
|
312 if (result->tokentype == CX_JSON_NO_TOKEN) { |
|
313 return CX_JSON_BUFFER_ALLOC_FAILED; // LCOV_EXCL_LINE |
|
314 } |
|
315 json->buffer.pos = i + 1; |
|
316 return CX_JSON_NO_ERROR; |
|
317 } else if (c == '\\') { |
|
318 escape_end_of_string = true; |
|
319 } |
|
320 } |
|
321 } |
|
322 } |
|
323 |
|
324 if (ttype != CX_JSON_NO_TOKEN) { |
|
325 // uncompleted token |
|
326 size_t uncompleted_len = json->buffer.size - token_part_start; |
|
327 if (json->uncompleted.tokentype == CX_JSON_NO_TOKEN) { |
|
328 // current token is uncompleted |
|
329 // save current token content |
|
330 CxJsonToken uncompleted = { |
|
331 ttype, true, |
|
332 cx_strdup(cx_strn(json->buffer.space + token_part_start, uncompleted_len)) |
|
333 }; |
|
334 if (uncompleted.content.ptr == NULL) { |
|
335 return CX_JSON_BUFFER_ALLOC_FAILED; // LCOV_EXCL_LINE |
|
336 } |
|
337 json->uncompleted = uncompleted; |
|
338 } else { |
|
339 // previously we also had an uncompleted token |
|
340 // combine the uncompleted token with the current token |
|
341 assert(json->uncompleted.allocated); |
|
342 cxmutstr str = cx_strcat_m(json->uncompleted.content, 1, |
|
343 cx_strn(json->buffer.space + token_part_start, uncompleted_len)); |
|
344 if (str.ptr == NULL) { |
|
345 return CX_JSON_BUFFER_ALLOC_FAILED; // LCOV_EXCL_LINE |
|
346 } |
|
347 json->uncompleted.content = str; |
|
348 } |
|
349 // advance the buffer position - we saved the stuff in the uncompleted token |
|
350 json->buffer.pos += uncompleted_len; |
|
351 } |
|
352 |
|
353 return CX_JSON_INCOMPLETE_DATA; |
|
354 } |
|
355 |
|
/**
 * Encodes a Unicode code point as UTF-8.
 *
 * @param codepoint  the code point to encode
 * @param output_buf destination for the encoded bytes; up to four bytes are
 *                   written, no terminator is added
 * @return the number of bytes written (1 to 4), or zero if the code point is
 *         larger than 0x10FFFF (nothing is written in that case)
 */
static unsigned codepoint_to_utf8(uint32_t codepoint, char *output_buf) {
    if (codepoint > 0x10FFFF) {
        return 0; // LCOV_EXCL_LINE
    }

    if (codepoint >= 0x10000) {
        // four bytes: 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
        output_buf[0] = (char)(0xF0 | ((codepoint >> 18) & 0x07));
        output_buf[1] = (char)(0x80 | ((codepoint >> 12) & 0x3F));
        output_buf[2] = (char)(0x80 | ((codepoint >> 6) & 0x3F));
        output_buf[3] = (char)(0x80 | (codepoint & 0x3F));
        return 4;
    }

    if (codepoint >= 0x800) {
        // three bytes: 1110xxxx 10xxxxxx 10xxxxxx
        output_buf[0] = (char)(0xE0 | ((codepoint >> 12) & 0x0F));
        output_buf[1] = (char)(0x80 | ((codepoint >> 6) & 0x3F));
        output_buf[2] = (char)(0x80 | (codepoint & 0x3F));
        return 3;
    }

    if (codepoint >= 0x80) {
        // two bytes: 110xxxxx 10xxxxxx
        output_buf[0] = (char)(0xC0 | ((codepoint >> 6) & 0x1F));
        output_buf[1] = (char)(0x80 | (codepoint & 0x3F));
        return 2;
    }

    // plain ASCII
    output_buf[0] = (char)codepoint;
    return 1;
}
|
380 |
|
/**
 * Combines a UTF-16 surrogate pair into the Unicode code point it encodes.
 *
 * No range checks are performed here; the caller is expected to pass a high
 * surrogate (0xD800..0xDBFF) as c0 and a low surrogate (0xDC00..0xDFFF) as c1.
 *
 * @param c0 the high (leading) surrogate
 * @param c1 the low (trailing) surrogate
 * @return the code point
 */
static inline uint32_t utf16pair_to_codepoint(uint16_t c0, uint16_t c1) {
    // each surrogate contributes ten bits; the pair is offset by 0x10000
    int upper_bits = (c0 - 0xD800) << 10;
    int lower_bits = c1 - 0xDC00;
    return upper_bits + lower_bits + 0x10000;
}
|
385 |
|
386 static unsigned unescape_unicode_string(cxstring str, char *utf8buf) { |
|
387 // str is supposed to start with "\uXXXX" or "\uXXXX\uXXXX" |
|
388 // remaining bytes in the string are ignored (str may be larger!) |
|
389 |
|
390 if (str.length < 6 || str.ptr[0] != '\\' || str.ptr[1] != 'u') { |
|
391 return 0; |
|
392 } |
|
393 |
|
394 unsigned utf8len = 0; |
|
395 cxstring ustr1 = { str.ptr + 2, 4}; |
|
396 uint16_t utf16a, utf16b; |
|
397 if (!cx_strtou16_lc(ustr1, &utf16a, 16, "")) { |
|
398 uint32_t codepoint; |
|
399 if (utf16a < 0xD800 || utf16a > 0xE000) { |
|
400 // character is in the Basic Multilingual Plane |
|
401 // and encoded as a single utf16 char |
|
402 codepoint = utf16a; |
|
403 utf8len = codepoint_to_utf8(codepoint, utf8buf); |
|
404 } else if (utf16a >= 0xD800 && utf16a <= 0xDBFF) { |
|
405 // character is encoded as a surrogate pair |
|
406 // get next 6 bytes |
|
407 if (str.length >= 12) { |
|
408 if (str.ptr[6] == '\\' && str.ptr[7] == 'u') { |
|
409 cxstring ustr2 = { str.ptr+8, 4 }; |
|
410 if (!cx_strtou16_lc(ustr2, &utf16b, 16, "") |
|
411 && utf16b >= 0xDC00 && utf16b <= 0xDFFF) { |
|
412 codepoint = utf16pair_to_codepoint(utf16a, utf16b); |
|
413 utf8len = codepoint_to_utf8(codepoint, utf8buf); |
|
414 } |
|
415 } |
|
416 } |
|
417 } |
|
418 } |
|
419 return utf8len; |
|
420 } |
|
421 |
|
422 static cxmutstr unescape_string(const CxAllocator *a, cxmutstr str) { |
|
423 // note: this function expects that str contains the enclosing quotes! |
|
424 |
|
425 cxmutstr result; |
|
426 result.length = 0; |
|
427 result.ptr = cxMalloc(a, str.length - 1); |
|
428 if (result.ptr == NULL) return result; // LCOV_EXCL_LINE |
|
429 |
|
430 bool u = false; |
|
431 for (size_t i = 1; i < str.length - 1; i++) { |
|
432 char c = str.ptr[i]; |
|
433 if (u) { |
|
434 u = false; |
|
435 if (c == 'n') { |
|
436 c = '\n'; |
|
437 } else if (c == '"') { |
|
438 c = '"'; |
|
439 } else if (c == 't') { |
|
440 c = '\t'; |
|
441 } else if (c == 'r') { |
|
442 c = '\r'; |
|
443 } else if (c == '\\') { |
|
444 c = '\\'; |
|
445 } else if (c == '/') { |
|
446 c = '/'; // always unescape, we don't need settings here |
|
447 } else if (c == 'f') { |
|
448 c = '\f'; |
|
449 } else if (c == 'b') { |
|
450 c = '\b'; |
|
451 } else if (c == 'u') { |
|
452 char utf8buf[4]; |
|
453 unsigned utf8len = unescape_unicode_string( |
|
454 cx_strn(str.ptr + i - 1, str.length + 1 - i), |
|
455 utf8buf |
|
456 ); |
|
457 if(utf8len > 0) { |
|
458 i += utf8len < 4 ? 4 : 10; |
|
459 // add all bytes from utf8buf except the last char |
|
460 // to the result (last char will be added below) |
|
461 utf8len--; |
|
462 c = utf8buf[utf8len]; |
|
463 for (unsigned x = 0; x < utf8len; x++) { |
|
464 result.ptr[result.length++] = utf8buf[x]; |
|
465 } |
|
466 } else { |
|
467 // decoding failed, ignore the entire sequence |
|
468 result.ptr[result.length++] = '\\'; |
|
469 } |
|
470 } else { |
|
471 // TODO: discuss the behavior for unrecognized escape sequences |
|
472 // most parsers throw an error here - we just ignore it |
|
473 result.ptr[result.length++] = '\\'; |
|
474 } |
|
475 |
|
476 result.ptr[result.length++] = c; |
|
477 } else { |
|
478 if (c == '\\') { |
|
479 u = true; |
|
480 } else { |
|
481 result.ptr[result.length++] = c; |
|
482 } |
|
483 } |
|
484 } |
|
485 result.ptr[result.length] = 0; |
|
486 |
|
487 return result; |
|
488 } |
|
489 |
|
490 static cxmutstr escape_string(cxmutstr str, bool escape_slash) { |
|
491 // note: this function produces the string without enclosing quotes |
|
492 // the reason is that we don't want to allocate memory just for that |
|
493 CxBuffer buf = {0}; |
|
494 |
|
495 bool all_printable = true; |
|
496 for (size_t i = 0; i < str.length; i++) { |
|
497 unsigned char c = str.ptr[i]; |
|
498 bool escape = c < 0x20 || c == '\\' || c == '"' |
|
499 || (escape_slash && c == '/'); |
|
500 |
|
501 if (all_printable && escape) { |
|
502 size_t capa = str.length + 32; |
|
503 char *space = malloc(capa); |
|
504 if (space == NULL) return cx_mutstrn(NULL, 0); |
|
505 cxBufferInit(&buf, space, capa, NULL, CX_BUFFER_AUTO_EXTEND); |
|
506 cxBufferWrite(str.ptr, 1, i, &buf); |
|
507 all_printable = false; |
|
508 } |
|
509 if (escape) { |
|
510 cxBufferPut(&buf, '\\'); |
|
511 if (c == '\"') { |
|
512 cxBufferPut(&buf, '\"'); |
|
513 } else if (c == '\n') { |
|
514 cxBufferPut(&buf, 'n'); |
|
515 } else if (c == '\t') { |
|
516 cxBufferPut(&buf, 't'); |
|
517 } else if (c == '\r') { |
|
518 cxBufferPut(&buf, 'r'); |
|
519 } else if (c == '\\') { |
|
520 cxBufferPut(&buf, '\\'); |
|
521 } else if (c == '/') { |
|
522 cxBufferPut(&buf, '/'); |
|
523 } else if (c == '\f') { |
|
524 cxBufferPut(&buf, 'f'); |
|
525 } else if (c == '\b') { |
|
526 cxBufferPut(&buf, 'b'); |
|
527 } else { |
|
528 char code[6]; |
|
529 snprintf(code, sizeof(code), "u%04x", (unsigned int) c); |
|
530 cxBufferPutString(&buf, code); |
|
531 } |
|
532 } else if (!all_printable) { |
|
533 cxBufferPut(&buf, c); |
|
534 } |
|
535 } |
|
536 if (!all_printable) { |
|
537 str = cx_mutstrn(buf.space, buf.size); |
|
538 } |
|
539 cxBufferDestroy(&buf); |
|
540 return str; |
|
541 } |
|
542 |
|
543 static CxJsonValue* json_create_value(CxJson *json, CxJsonValueType type) { |
|
544 CxJsonValue *v = cxCalloc(json->allocator, 1, sizeof(CxJsonValue)); |
|
545 if (v == NULL) return NULL; // LCOV_EXCL_LINE |
|
546 |
|
547 // initialize the value |
|
548 v->type = type; |
|
549 v->allocator = json->allocator; |
|
550 if (type == CX_JSON_ARRAY) { |
|
551 cx_array_initialize_a(json->allocator, v->value.array.array, 16); |
|
552 if (v->value.array.array == NULL) goto create_json_value_exit_error; // LCOV_EXCL_LINE |
|
553 } else if (type == CX_JSON_OBJECT) { |
|
554 cx_array_initialize_a(json->allocator, v->value.object.values, 16); |
|
555 v->value.object.indices = cxCalloc(json->allocator, 16, sizeof(size_t)); |
|
556 if (v->value.object.values == NULL || |
|
557 v->value.object.indices == NULL) |
|
558 goto create_json_value_exit_error; // LCOV_EXCL_LINE |
|
559 } |
|
560 |
|
561 // add the new value to a possible parent |
|
562 if (json->vbuf_size > 0) { |
|
563 CxJsonValue *parent = json->vbuf[json->vbuf_size - 1]; |
|
564 assert(parent != NULL); |
|
565 if (parent->type == CX_JSON_ARRAY) { |
|
566 CxArrayReallocator value_realloc = cx_array_reallocator(json->allocator, NULL); |
|
567 if (cx_array_simple_add_a(&value_realloc, parent->value.array.array, v)) { |
|
568 goto create_json_value_exit_error; // LCOV_EXCL_LINE |
|
569 } |
|
570 } else if (parent->type == CX_JSON_OBJECT) { |
|
571 // the member was already created after parsing the name |
|
572 assert(json->uncompleted_member.name.ptr != NULL); |
|
573 json->uncompleted_member.value = v; |
|
574 if (json_add_objvalue(parent, json->uncompleted_member)) { |
|
575 goto create_json_value_exit_error; // LCOV_EXCL_LINE |
|
576 } |
|
577 json->uncompleted_member.name = (cxmutstr) {NULL, 0}; |
|
578 } else { |
|
579 assert(false); // LCOV_EXCL_LINE |
|
580 } |
|
581 } |
|
582 |
|
583 // add the new value to the stack, if it is an array or object |
|
584 if (type == CX_JSON_ARRAY || type == CX_JSON_OBJECT) { |
|
585 CxArrayReallocator vbuf_realloc = cx_array_reallocator(NULL, json->vbuf_internal); |
|
586 if (cx_array_simple_add_a(&vbuf_realloc, json->vbuf, v)) { |
|
587 goto create_json_value_exit_error; // LCOV_EXCL_LINE |
|
588 } |
|
589 } |
|
590 |
|
591 // if currently no value is parsed, this is now the value of interest |
|
592 if (json->parsed == NULL) { |
|
593 json->parsed = v; |
|
594 } |
|
595 |
|
596 return v; |
|
597 // LCOV_EXCL_START |
|
598 create_json_value_exit_error: |
|
599 cxJsonValueFree(v); |
|
600 return NULL; |
|
601 // LCOV_EXCL_STOP |
|
602 } |
|
603 |
|
/*
 * Parser states.
 *
 * The three "value begin" states are the only ones below 3, and each of them
 * has its "end" counterpart at exactly (begin state + 10); json_parse()
 * relies on both properties.
 */

// value begin (top level)
#define JP_STATE_VALUE_BEGIN         0
// value begin (inside object)
#define JP_STATE_VALUE_BEGIN_OBJ     1
// value begin (inside array)
#define JP_STATE_VALUE_BEGIN_AR      2

// object, expect name or objclose
#define JP_STATE_OBJ_NAME_OR_CLOSE   5
// object, expect name
#define JP_STATE_OBJ_NAME            6
// object, expect ':'
#define JP_STATE_OBJ_COLON           7

// expect value end (top level)
#define JP_STATE_VALUE_END          10
// object, expect separator or objclose
#define JP_STATE_OBJ_SEP_OR_CLOSE   11
// array, expect separator or arrayclose
#define JP_STATE_ARRAY_SEP_OR_CLOSE 12
|
613 |
|
614 void cxJsonInit(CxJson *json, const CxAllocator *allocator) { |
|
615 if (allocator == NULL) { |
|
616 allocator = cxDefaultAllocator; |
|
617 } |
|
618 |
|
619 memset(json, 0, sizeof(CxJson)); |
|
620 json->allocator = allocator; |
|
621 |
|
622 json->states = json->states_internal; |
|
623 json->states_capacity = cx_nmemb(json->states_internal); |
|
624 json->states[0] = JP_STATE_VALUE_BEGIN; |
|
625 json->states_size = 1; |
|
626 |
|
627 json->vbuf = json->vbuf_internal; |
|
628 json->vbuf_capacity = cx_nmemb(json->vbuf_internal); |
|
629 } |
|
630 |
|
631 void cxJsonDestroy(CxJson *json) { |
|
632 cxBufferDestroy(&json->buffer); |
|
633 if (json->states != json->states_internal) { |
|
634 free(json->states); |
|
635 } |
|
636 if (json->vbuf != json->vbuf_internal) { |
|
637 free(json->vbuf); |
|
638 } |
|
639 cxJsonValueFree(json->parsed); |
|
640 json->parsed = NULL; |
|
641 if (json->uncompleted_member.name.ptr != NULL) { |
|
642 cx_strfree_a(json->allocator, &json->uncompleted_member.name); |
|
643 json->uncompleted_member = (CxJsonObjValue){{NULL, 0}, NULL}; |
|
644 } |
|
645 } |
|
646 |
|
647 int cxJsonFilln(CxJson *json, const char *buf, size_t size) { |
|
648 if (cxBufferEof(&json->buffer)) { |
|
649 // reinitialize the buffer |
|
650 cxBufferDestroy(&json->buffer); |
|
651 cxBufferInit(&json->buffer, (char*) buf, size, |
|
652 NULL, CX_BUFFER_AUTO_EXTEND | CX_BUFFER_COPY_ON_WRITE); |
|
653 json->buffer.size = size; |
|
654 return 0; |
|
655 } else { |
|
656 return size != cxBufferAppend(buf, 1, size, &json->buffer); |
|
657 } |
|
658 } |
|
659 |
|
660 static void json_add_state(CxJson *json, int state) { |
|
661 // we have guaranteed the necessary space with cx_array_simple_reserve() |
|
662 // therefore, we can safely add the state in the simplest way possible |
|
663 json->states[json->states_size++] = state; |
|
664 } |
|
665 |
|
/*
 * Destroys the local variable `token` and returns the given code.
 *
 * Wrapped in do { } while (0) so that the macro expands to exactly one
 * statement and stays correct when used as the body of an unbraced if/else.
 */
#define return_rec(code) \
    do { \
        token_destroy(&token); \
        return code; \
    } while (0)
|
669 |
|
670 static enum cx_json_status json_parse(CxJson *json) { |
|
671 // Reserve a pointer for a possibly read value |
|
672 CxJsonValue *vbuf = NULL; |
|
673 |
|
674 // grab the next token |
|
675 CxJsonToken token; |
|
676 { |
|
677 enum cx_json_status ret = token_parse_next(json, &token); |
|
678 if (ret != CX_JSON_NO_ERROR) { |
|
679 return ret; |
|
680 } |
|
681 } |
|
682 |
|
683 // pop the current state |
|
684 assert(json->states_size > 0); |
|
685 int state = json->states[--json->states_size]; |
|
686 |
|
687 // guarantee that at least two more states fit on the stack |
|
688 CxArrayReallocator state_realloc = cx_array_reallocator(NULL, json->states_internal); |
|
689 if (cx_array_simple_reserve_a(&state_realloc, json->states, 2)) { |
|
690 return CX_JSON_BUFFER_ALLOC_FAILED; // LCOV_EXCL_LINE |
|
691 } |
|
692 |
|
693 |
|
694 // 0 JP_STATE_VALUE_BEGIN value begin |
|
695 // 10 JP_STATE_VALUE_END expect value end |
|
696 // 1 JP_STATE_VALUE_BEGIN_OBJ value begin (inside object) |
|
697 // 11 JP_STATE_OBJ_SEP_OR_CLOSE object, expect separator, objclose |
|
698 // 2 JP_STATE_VALUE_BEGIN_AR value begin (inside array) |
|
699 // 12 JP_STATE_ARRAY_SEP_OR_CLOSE array, expect separator or arrayclose |
|
700 // 5 JP_STATE_OBJ_NAME_OR_CLOSE object, expect name or objclose |
|
701 // 6 JP_STATE_OBJ_NAME object, expect name |
|
702 // 7 JP_STATE_OBJ_COLON object, expect ':' |
|
703 |
|
704 if (state < 3) { |
|
705 // push expected end state to the stack |
|
706 json_add_state(json, 10 + state); |
|
707 switch (token.tokentype) { |
|
708 case CX_JSON_TOKEN_BEGIN_ARRAY: { |
|
709 if (json_create_value(json, CX_JSON_ARRAY) == NULL) { |
|
710 return_rec(CX_JSON_VALUE_ALLOC_FAILED); // LCOV_EXCL_LINE |
|
711 } |
|
712 json_add_state(json, JP_STATE_VALUE_BEGIN_AR); |
|
713 return_rec(CX_JSON_NO_ERROR); |
|
714 } |
|
715 case CX_JSON_TOKEN_BEGIN_OBJECT: { |
|
716 if (json_create_value(json, CX_JSON_OBJECT) == NULL) { |
|
717 return_rec(CX_JSON_VALUE_ALLOC_FAILED); // LCOV_EXCL_LINE |
|
718 } |
|
719 json_add_state(json, JP_STATE_OBJ_NAME_OR_CLOSE); |
|
720 return_rec(CX_JSON_NO_ERROR); |
|
721 } |
|
722 case CX_JSON_TOKEN_STRING: { |
|
723 if ((vbuf = json_create_value(json, CX_JSON_STRING)) == NULL) { |
|
724 return_rec(CX_JSON_VALUE_ALLOC_FAILED); // LCOV_EXCL_LINE |
|
725 } |
|
726 cxmutstr str = unescape_string(json->allocator, token.content); |
|
727 if (str.ptr == NULL) { |
|
728 return_rec(CX_JSON_VALUE_ALLOC_FAILED); // LCOV_EXCL_LINE |
|
729 } |
|
730 vbuf->value.string = str; |
|
731 return_rec(CX_JSON_NO_ERROR); |
|
732 } |
|
733 case CX_JSON_TOKEN_INTEGER: |
|
734 case CX_JSON_TOKEN_NUMBER: { |
|
735 int type = token.tokentype == CX_JSON_TOKEN_INTEGER ? CX_JSON_INTEGER : CX_JSON_NUMBER; |
|
736 if (NULL == (vbuf = json_create_value(json, type))) { |
|
737 return_rec(CX_JSON_VALUE_ALLOC_FAILED); // LCOV_EXCL_LINE |
|
738 } |
|
739 if (type == CX_JSON_INTEGER) { |
|
740 if (cx_strtoi64(token.content, &vbuf->value.integer, 10)) { |
|
741 return_rec(CX_JSON_FORMAT_ERROR_NUMBER); |
|
742 } |
|
743 } else { |
|
744 if (cx_strtod(token.content, &vbuf->value.number)) { |
|
745 return_rec(CX_JSON_FORMAT_ERROR_NUMBER); |
|
746 } |
|
747 } |
|
748 return_rec(CX_JSON_NO_ERROR); |
|
749 } |
|
750 case CX_JSON_TOKEN_LITERAL: { |
|
751 if ((vbuf = json_create_value(json, CX_JSON_LITERAL)) == NULL) { |
|
752 return_rec(CX_JSON_VALUE_ALLOC_FAILED); // LCOV_EXCL_LINE |
|
753 } |
|
754 if (0 == cx_strcmp(cx_strcast(token.content), cx_str("true"))) { |
|
755 vbuf->value.literal = CX_JSON_TRUE; |
|
756 } else if (0 == cx_strcmp(cx_strcast(token.content), cx_str("false"))) { |
|
757 vbuf->value.literal = CX_JSON_FALSE; |
|
758 } else { |
|
759 vbuf->value.literal = CX_JSON_NULL; |
|
760 } |
|
761 return_rec(CX_JSON_NO_ERROR); |
|
762 } |
|
763 default: { |
|
764 return_rec(CX_JSON_FORMAT_ERROR_UNEXPECTED_TOKEN); |
|
765 } |
|
766 } |
|
767 } else if (state == JP_STATE_ARRAY_SEP_OR_CLOSE) { |
|
768 // expect ',' or ']' |
|
769 if (token.tokentype == CX_JSON_TOKEN_VALUE_SEPARATOR) { |
|
770 json_add_state(json, JP_STATE_VALUE_BEGIN_AR); |
|
771 return_rec(CX_JSON_NO_ERROR); |
|
772 } else if (token.tokentype == CX_JSON_TOKEN_END_ARRAY) { |
|
773 // discard the array from the value buffer |
|
774 json->vbuf_size--; |
|
775 return_rec(CX_JSON_NO_ERROR); |
|
776 } else { |
|
777 return_rec(CX_JSON_FORMAT_ERROR_UNEXPECTED_TOKEN); |
|
778 } |
|
779 } else if (state == JP_STATE_OBJ_NAME_OR_CLOSE || state == JP_STATE_OBJ_NAME) { |
|
780 if (state == JP_STATE_OBJ_NAME_OR_CLOSE && token.tokentype == CX_JSON_TOKEN_END_OBJECT) { |
|
781 // discard the obj from the value buffer |
|
782 json->vbuf_size--; |
|
783 return_rec(CX_JSON_NO_ERROR); |
|
784 } else { |
|
785 // expect string |
|
786 if (token.tokentype != CX_JSON_TOKEN_STRING) { |
|
787 return_rec(CX_JSON_FORMAT_ERROR_UNEXPECTED_TOKEN); |
|
788 } |
|
789 |
|
790 // add new entry |
|
791 cxmutstr name = unescape_string(json->allocator, token.content); |
|
792 if (name.ptr == NULL) { |
|
793 return_rec(CX_JSON_VALUE_ALLOC_FAILED); // LCOV_EXCL_LINE |
|
794 } |
|
795 assert(json->uncompleted_member.name.ptr == NULL); |
|
796 json->uncompleted_member.name = name; |
|
797 assert(json->vbuf_size > 0); |
|
798 |
|
799 // next state |
|
800 json_add_state(json, JP_STATE_OBJ_COLON); |
|
801 return_rec(CX_JSON_NO_ERROR); |
|
802 } |
|
803 } else if (state == JP_STATE_OBJ_COLON) { |
|
804 // expect ':' |
|
805 if (token.tokentype != CX_JSON_TOKEN_NAME_SEPARATOR) { |
|
806 return_rec(CX_JSON_FORMAT_ERROR_UNEXPECTED_TOKEN); |
|
807 } |
|
808 // next state |
|
809 json_add_state(json, JP_STATE_VALUE_BEGIN_OBJ); |
|
810 return_rec(CX_JSON_NO_ERROR); |
|
811 } else if (state == JP_STATE_OBJ_SEP_OR_CLOSE) { |
|
812 // expect ',' or '}' |
|
813 if (token.tokentype == CX_JSON_TOKEN_VALUE_SEPARATOR) { |
|
814 json_add_state(json, JP_STATE_OBJ_NAME); |
|
815 return_rec(CX_JSON_NO_ERROR); |
|
816 } else if (token.tokentype == CX_JSON_TOKEN_END_OBJECT) { |
|
817 // discard the obj from the value buffer |
|
818 json->vbuf_size--; |
|
819 return_rec(CX_JSON_NO_ERROR); |
|
820 } else { |
|
821 return_rec(CX_JSON_FORMAT_ERROR_UNEXPECTED_TOKEN); |
|
822 } |
|
823 } else { |
|
824 // should be unreachable |
|
825 assert(false); |
|
826 return_rec(-1); |
|
827 } |
|
828 } |
|
829 |
|
830 CxJsonStatus cxJsonNext(CxJson *json, CxJsonValue **value) { |
|
831 // check if buffer has been filled |
|
832 if (json->buffer.space == NULL) { |
|
833 return CX_JSON_NULL_DATA; |
|
834 } |
|
835 |
|
836 // initialize output value |
|
837 *value = &cx_json_value_nothing; |
|
838 |
|
839 // parse data |
|
840 CxJsonStatus result; |
|
841 do { |
|
842 result = json_parse(json); |
|
843 if (result == CX_JSON_NO_ERROR && json->states_size == 1) { |
|
844 // final state reached |
|
845 assert(json->states[0] == JP_STATE_VALUE_END); |
|
846 assert(json->vbuf_size == 0); |
|
847 |
|
848 // write output value |
|
849 *value = json->parsed; |
|
850 json->parsed = NULL; |
|
851 |
|
852 // re-initialize state machine |
|
853 json->states[0] = JP_STATE_VALUE_BEGIN; |
|
854 |
|
855 return CX_JSON_NO_ERROR; |
|
856 } |
|
857 } while (result == CX_JSON_NO_ERROR); |
|
858 |
|
859 // the parser might think there is no data |
|
860 // but when we did not reach the final state, |
|
861 // we know that there must be more to come |
|
862 if (result == CX_JSON_NO_DATA && json->states_size > 1) { |
|
863 return CX_JSON_INCOMPLETE_DATA; |
|
864 } |
|
865 |
|
866 return result; |
|
867 } |
|
868 |
|
869 void cxJsonValueFree(CxJsonValue *value) { |
|
870 if (value == NULL || value->type == CX_JSON_NOTHING) return; |
|
871 switch (value->type) { |
|
872 case CX_JSON_OBJECT: { |
|
873 CxJsonObject obj = value->value.object; |
|
874 for (size_t i = 0; i < obj.values_size; i++) { |
|
875 cxJsonValueFree(obj.values[i].value); |
|
876 cx_strfree_a(value->allocator, &obj.values[i].name); |
|
877 } |
|
878 cxFree(value->allocator, obj.values); |
|
879 cxFree(value->allocator, obj.indices); |
|
880 break; |
|
881 } |
|
882 case CX_JSON_ARRAY: { |
|
883 CxJsonArray array = value->value.array; |
|
884 for (size_t i = 0; i < array.array_size; i++) { |
|
885 cxJsonValueFree(array.array[i]); |
|
886 } |
|
887 cxFree(value->allocator, array.array); |
|
888 break; |
|
889 } |
|
890 case CX_JSON_STRING: { |
|
891 cxFree(value->allocator, value->value.string.ptr); |
|
892 break; |
|
893 } |
|
894 default: { |
|
895 break; |
|
896 } |
|
897 } |
|
898 cxFree(value->allocator, value); |
|
899 } |
|
900 |
|
901 CxJsonValue* cxJsonCreateObj(const CxAllocator* allocator) { |
|
902 if (allocator == NULL) allocator = cxDefaultAllocator; |
|
903 CxJsonValue* v = cxMalloc(allocator, sizeof(CxJsonValue)); |
|
904 if (v == NULL) return NULL; |
|
905 v->allocator = allocator; |
|
906 v->type = CX_JSON_OBJECT; |
|
907 cx_array_initialize_a(allocator, v->value.object.values, 16); |
|
908 if (v->value.object.values == NULL) { // LCOV_EXCL_START |
|
909 cxFree(allocator, v); |
|
910 return NULL; |
|
911 // LCOV_EXCL_STOP |
|
912 } |
|
913 v->value.object.indices = cxCalloc(allocator, 16, sizeof(size_t)); |
|
914 if (v->value.object.indices == NULL) { // LCOV_EXCL_START |
|
915 cxFree(allocator, v->value.object.values); |
|
916 cxFree(allocator, v); |
|
917 return NULL; |
|
918 // LCOV_EXCL_STOP |
|
919 } |
|
920 return v; |
|
921 } |
|
922 |
|
923 CxJsonValue* cxJsonCreateArr(const CxAllocator* allocator) { |
|
924 if (allocator == NULL) allocator = cxDefaultAllocator; |
|
925 CxJsonValue* v = cxMalloc(allocator, sizeof(CxJsonValue)); |
|
926 if (v == NULL) return NULL; |
|
927 v->allocator = allocator; |
|
928 v->type = CX_JSON_ARRAY; |
|
929 cx_array_initialize_a(allocator, v->value.array.array, 16); |
|
930 if (v->value.array.array == NULL) { cxFree(allocator, v); return NULL; } |
|
931 return v; |
|
932 } |
|
933 |
|
934 CxJsonValue* cxJsonCreateNumber(const CxAllocator* allocator, double num) { |
|
935 if (allocator == NULL) allocator = cxDefaultAllocator; |
|
936 CxJsonValue* v = cxMalloc(allocator, sizeof(CxJsonValue)); |
|
937 if (v == NULL) return NULL; |
|
938 v->allocator = allocator; |
|
939 v->type = CX_JSON_NUMBER; |
|
940 v->value.number = num; |
|
941 return v; |
|
942 } |
|
943 |
|
944 CxJsonValue* cxJsonCreateInteger(const CxAllocator* allocator, int64_t num) { |
|
945 if (allocator == NULL) allocator = cxDefaultAllocator; |
|
946 CxJsonValue* v = cxMalloc(allocator, sizeof(CxJsonValue)); |
|
947 if (v == NULL) return NULL; |
|
948 v->allocator = allocator; |
|
949 v->type = CX_JSON_INTEGER; |
|
950 v->value.integer = num; |
|
951 return v; |
|
952 } |
|
953 |
|
954 CxJsonValue* cxJsonCreateString(const CxAllocator* allocator, const char* str) { |
|
955 return cxJsonCreateCxString(allocator, cx_str(str)); |
|
956 } |
|
957 |
|
958 CxJsonValue* cxJsonCreateCxString(const CxAllocator* allocator, cxstring str) { |
|
959 if (allocator == NULL) allocator = cxDefaultAllocator; |
|
960 CxJsonValue* v = cxMalloc(allocator, sizeof(CxJsonValue)); |
|
961 if (v == NULL) return NULL; |
|
962 v->allocator = allocator; |
|
963 v->type = CX_JSON_STRING; |
|
964 cxmutstr s = cx_strdup_a(allocator, str); |
|
965 if (s.ptr == NULL) { cxFree(allocator, v); return NULL; } |
|
966 v->value.string = s; |
|
967 return v; |
|
968 } |
|
969 |
|
970 CxJsonValue* cxJsonCreateLiteral(const CxAllocator* allocator, CxJsonLiteral lit) { |
|
971 if (allocator == NULL) allocator = cxDefaultAllocator; |
|
972 CxJsonValue* v = cxMalloc(allocator, sizeof(CxJsonValue)); |
|
973 if (v == NULL) return NULL; |
|
974 v->allocator = allocator; |
|
975 v->type = CX_JSON_LITERAL; |
|
976 v->value.literal = lit; |
|
977 return v; |
|
978 } |
|
979 |
|
980 // LCOV_EXCL_START |
|
981 // never called as long as malloc() does not return NULL |
|
982 static void json_arr_free_temp(CxJsonValue** values, size_t count) { |
|
983 for (size_t i = 0; i < count; i++) { |
|
984 if (values[i] == NULL) break; |
|
985 cxJsonValueFree(values[i]); |
|
986 } |
|
987 free(values); |
|
988 } |
|
989 // LCOV_EXCL_STOP |
|
990 |
|
991 int cxJsonArrAddNumbers(CxJsonValue* arr, const double* num, size_t count) { |
|
992 CxJsonValue** values = calloc(count, sizeof(CxJsonValue*)); |
|
993 if (values == NULL) return -1; |
|
994 for (size_t i = 0; i < count; i++) { |
|
995 values[i] = cxJsonCreateNumber(arr->allocator, num[i]); |
|
996 if (values[i] == NULL) { json_arr_free_temp(values, count); return -1; } |
|
997 } |
|
998 int ret = cxJsonArrAddValues(arr, values, count); |
|
999 free(values); |
|
1000 return ret; |
|
1001 } |
|
1002 |
|
1003 int cxJsonArrAddIntegers(CxJsonValue* arr, const int64_t* num, size_t count) { |
|
1004 CxJsonValue** values = calloc(count, sizeof(CxJsonValue*)); |
|
1005 if (values == NULL) return -1; |
|
1006 for (size_t i = 0; i < count; i++) { |
|
1007 values[i] = cxJsonCreateInteger(arr->allocator, num[i]); |
|
1008 if (values[i] == NULL) { json_arr_free_temp(values, count); return -1; } |
|
1009 } |
|
1010 int ret = cxJsonArrAddValues(arr, values, count); |
|
1011 free(values); |
|
1012 return ret; |
|
1013 } |
|
1014 |
|
1015 int cxJsonArrAddStrings(CxJsonValue* arr, const char* const* str, size_t count) { |
|
1016 CxJsonValue** values = calloc(count, sizeof(CxJsonValue*)); |
|
1017 if (values == NULL) return -1; |
|
1018 for (size_t i = 0; i < count; i++) { |
|
1019 values[i] = cxJsonCreateString(arr->allocator, str[i]); |
|
1020 if (values[i] == NULL) { json_arr_free_temp(values, count); return -1; } |
|
1021 } |
|
1022 int ret = cxJsonArrAddValues(arr, values, count); |
|
1023 free(values); |
|
1024 return ret; |
|
1025 } |
|
1026 |
|
1027 int cxJsonArrAddCxStrings(CxJsonValue* arr, const cxstring* str, size_t count) { |
|
1028 CxJsonValue** values = calloc(count, sizeof(CxJsonValue*)); |
|
1029 if (values == NULL) return -1; |
|
1030 for (size_t i = 0; i < count; i++) { |
|
1031 values[i] = cxJsonCreateCxString(arr->allocator, str[i]); |
|
1032 if (values[i] == NULL) { json_arr_free_temp(values, count); return -1; } |
|
1033 } |
|
1034 int ret = cxJsonArrAddValues(arr, values, count); |
|
1035 free(values); |
|
1036 return ret; |
|
1037 } |
|
1038 |
|
1039 int cxJsonArrAddLiterals(CxJsonValue* arr, const CxJsonLiteral* lit, size_t count) { |
|
1040 CxJsonValue** values = calloc(count, sizeof(CxJsonValue*)); |
|
1041 if (values == NULL) return -1; |
|
1042 for (size_t i = 0; i < count; i++) { |
|
1043 values[i] = cxJsonCreateLiteral(arr->allocator, lit[i]); |
|
1044 if (values[i] == NULL) { json_arr_free_temp(values, count); return -1; } |
|
1045 } |
|
1046 int ret = cxJsonArrAddValues(arr, values, count); |
|
1047 free(values); |
|
1048 return ret; |
|
1049 } |
|
1050 |
|
1051 int cxJsonArrAddValues(CxJsonValue* arr, CxJsonValue* const* val, size_t count) { |
|
1052 CxArrayReallocator value_realloc = cx_array_reallocator(arr->allocator, NULL); |
|
1053 assert(arr->type == CX_JSON_ARRAY); |
|
1054 return cx_array_simple_copy_a(&value_realloc, |
|
1055 arr->value.array.array, |
|
1056 arr->value.array.array_size, |
|
1057 val, count |
|
1058 ); |
|
1059 } |
|
1060 |
|
1061 int cxJsonObjPut(CxJsonValue* obj, cxstring name, CxJsonValue* child) { |
|
1062 cxmutstr k = cx_strdup_a(obj->allocator, name); |
|
1063 if (k.ptr == NULL) return -1; |
|
1064 CxJsonObjValue kv = {k, child}; |
|
1065 if (json_add_objvalue(obj, kv)) { |
|
1066 cx_strfree_a(obj->allocator, &k); |
|
1067 return 1; |
|
1068 } else { |
|
1069 return 0; |
|
1070 } |
|
1071 } |
|
1072 |
|
1073 CxJsonValue* cxJsonObjPutObj(CxJsonValue* obj, cxstring name) { |
|
1074 CxJsonValue* v = cxJsonCreateObj(obj->allocator); |
|
1075 if (v == NULL) return NULL; |
|
1076 if (cxJsonObjPut(obj, name, v)) { cxJsonValueFree(v); return NULL; } |
|
1077 return v; |
|
1078 } |
|
1079 |
|
1080 CxJsonValue* cxJsonObjPutArr(CxJsonValue* obj, cxstring name) { |
|
1081 CxJsonValue* v = cxJsonCreateArr(obj->allocator); |
|
1082 if (v == NULL) return NULL; |
|
1083 if (cxJsonObjPut(obj, name, v)) { cxJsonValueFree(v); return NULL; } |
|
1084 return v; |
|
1085 } |
|
1086 |
|
1087 CxJsonValue* cxJsonObjPutNumber(CxJsonValue* obj, cxstring name, double num) { |
|
1088 CxJsonValue* v = cxJsonCreateNumber(obj->allocator, num); |
|
1089 if (v == NULL) return NULL; |
|
1090 if (cxJsonObjPut(obj, name, v)) { cxJsonValueFree(v); return NULL; } |
|
1091 return v; |
|
1092 } |
|
1093 |
|
1094 CxJsonValue* cxJsonObjPutInteger(CxJsonValue* obj, cxstring name, int64_t num) { |
|
1095 CxJsonValue* v = cxJsonCreateInteger(obj->allocator, num); |
|
1096 if (v == NULL) return NULL; |
|
1097 if (cxJsonObjPut(obj, name, v)) { cxJsonValueFree(v); return NULL; } |
|
1098 return v; |
|
1099 } |
|
1100 |
|
1101 CxJsonValue* cxJsonObjPutString(CxJsonValue* obj, cxstring name, const char* str) { |
|
1102 CxJsonValue* v = cxJsonCreateString(obj->allocator, str); |
|
1103 if (v == NULL) return NULL; |
|
1104 if (cxJsonObjPut(obj, name, v)) { cxJsonValueFree(v); return NULL; } |
|
1105 return v; |
|
1106 } |
|
1107 |
|
1108 CxJsonValue* cxJsonObjPutCxString(CxJsonValue* obj, cxstring name, cxstring str) { |
|
1109 CxJsonValue* v = cxJsonCreateCxString(obj->allocator, str); |
|
1110 if (v == NULL) return NULL; |
|
1111 if (cxJsonObjPut(obj, name, v)) { cxJsonValueFree(v); return NULL; } |
|
1112 return v; |
|
1113 } |
|
1114 |
|
1115 CxJsonValue* cxJsonObjPutLiteral(CxJsonValue* obj, cxstring name, CxJsonLiteral lit) { |
|
1116 CxJsonValue* v = cxJsonCreateLiteral(obj->allocator, lit); |
|
1117 if (v == NULL) return NULL; |
|
1118 if (cxJsonObjPut(obj, name, v)) { cxJsonValueFree(v); return NULL;} |
|
1119 return v; |
|
1120 } |
|
1121 |
|
1122 CxJsonValue *cxJsonArrGet(const CxJsonValue *value, size_t index) { |
|
1123 if (index >= value->value.array.array_size) { |
|
1124 return &cx_json_value_nothing; |
|
1125 } |
|
1126 return value->value.array.array[index]; |
|
1127 } |
|
1128 |
|
1129 CxIterator cxJsonArrIter(const CxJsonValue *value) { |
|
1130 return cxIteratorPtr( |
|
1131 value->value.array.array, |
|
1132 value->value.array.array_size |
|
1133 ); |
|
1134 } |
|
1135 |
|
1136 CxIterator cxJsonObjIter(const CxJsonValue *value) { |
|
1137 return cxIterator( |
|
1138 value->value.object.values, |
|
1139 sizeof(CxJsonObjValue), |
|
1140 value->value.object.values_size |
|
1141 ); |
|
1142 } |
|
1143 |
|
1144 CxJsonValue *cx_json_obj_get_cxstr(const CxJsonValue *value, cxstring name) { |
|
1145 CxJsonObjValue *member = json_find_objvalue(value, name); |
|
1146 if (member == NULL) { |
|
1147 return &cx_json_value_nothing; |
|
1148 } else { |
|
1149 return member->value; |
|
1150 } |
|
1151 } |
|
1152 |
|
1153 CxJsonWriter cxJsonWriterCompact(void) { |
|
1154 return (CxJsonWriter) { |
|
1155 false, |
|
1156 true, |
|
1157 6, |
|
1158 false, |
|
1159 4, |
|
1160 false |
|
1161 }; |
|
1162 } |
|
1163 |
|
1164 CxJsonWriter cxJsonWriterPretty(bool use_spaces) { |
|
1165 return (CxJsonWriter) { |
|
1166 true, |
|
1167 true, |
|
1168 6, |
|
1169 use_spaces, |
|
1170 4, |
|
1171 false |
|
1172 }; |
|
1173 } |
|
1174 |
|
1175 static int cx_json_writer_indent( |
|
1176 void *target, |
|
1177 cx_write_func wfunc, |
|
1178 const CxJsonWriter *settings, |
|
1179 unsigned int depth |
|
1180 ) { |
|
1181 if (depth == 0) return 0; |
|
1182 |
|
1183 // determine the width and characters to use |
|
1184 const char* indent; // for 32 prepared chars |
|
1185 size_t width = depth; |
|
1186 if (settings->indent_space) { |
|
1187 if (settings->indent == 0) return 0; |
|
1188 width *= settings->indent; |
|
1189 indent = " "; |
|
1190 } else { |
|
1191 indent = "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t"; |
|
1192 } |
|
1193 |
|
1194 // calculate the number of write calls and write |
|
1195 size_t full = width / 32; |
|
1196 size_t remaining = width % 32; |
|
1197 for (size_t i = 0; i < full; i++) { |
|
1198 if (32 != wfunc(indent, 1, 32, target)) return 1; |
|
1199 } |
|
1200 if (remaining != wfunc(indent, 1, remaining, target)) return 1; |
|
1201 |
|
1202 return 0; |
|
1203 } |
|
1204 |
|
1205 |
|
1206 int cx_json_write_rec( |
|
1207 void *target, |
|
1208 const CxJsonValue *value, |
|
1209 cx_write_func wfunc, |
|
1210 const CxJsonWriter *settings, |
|
1211 unsigned int depth |
|
1212 ) { |
|
1213 // keep track of written items |
|
1214 // the idea is to reduce the number of jumps for error checking |
|
1215 size_t actual = 0, expected = 0; |
|
1216 |
|
1217 // small buffer for number to string conversions |
|
1218 char numbuf[40]; |
|
1219 |
|
1220 // recursively write the values |
|
1221 switch (value->type) { |
|
1222 case CX_JSON_OBJECT: { |
|
1223 const char *begin_obj = "{\n"; |
|
1224 if (settings->pretty) { |
|
1225 actual += wfunc(begin_obj, 1, 2, target); |
|
1226 expected += 2; |
|
1227 } else { |
|
1228 actual += wfunc(begin_obj, 1, 1, target); |
|
1229 expected++; |
|
1230 } |
|
1231 depth++; |
|
1232 size_t elem_count = value->value.object.values_size; |
|
1233 for (size_t look_idx = 0; look_idx < elem_count; look_idx++) { |
|
1234 // get the member either via index array or directly |
|
1235 size_t elem_idx = settings->sort_members |
|
1236 ? look_idx |
|
1237 : value->value.object.indices[look_idx]; |
|
1238 CxJsonObjValue *member = &value->value.object.values[elem_idx]; |
|
1239 if (settings->sort_members) { |
|
1240 depth++;depth--; |
|
1241 } |
|
1242 |
|
1243 // possible indentation |
|
1244 if (settings->pretty) { |
|
1245 if (cx_json_writer_indent(target, wfunc, settings, depth)) { |
|
1246 return 1; // LCOV_EXCL_LINE |
|
1247 } |
|
1248 } |
|
1249 |
|
1250 // the name |
|
1251 actual += wfunc("\"", 1, 1, target); |
|
1252 cxmutstr name = escape_string(member->name, settings->escape_slash); |
|
1253 actual += wfunc(name.ptr, 1, name.length, target); |
|
1254 if (name.ptr != member->name.ptr) { |
|
1255 cx_strfree(&name); |
|
1256 } |
|
1257 actual += wfunc("\"", 1, 1, target); |
|
1258 const char *obj_name_sep = ": "; |
|
1259 if (settings->pretty) { |
|
1260 actual += wfunc(obj_name_sep, 1, 2, target); |
|
1261 expected += 4 + member->name.length; |
|
1262 } else { |
|
1263 actual += wfunc(obj_name_sep, 1, 1, target); |
|
1264 expected += 3 + member->name.length; |
|
1265 } |
|
1266 |
|
1267 // the value |
|
1268 if (cx_json_write_rec(target, member->value, wfunc, settings, depth)) return 1; |
|
1269 |
|
1270 // end of object-value |
|
1271 if (look_idx < elem_count - 1) { |
|
1272 const char *obj_value_sep = ",\n"; |
|
1273 if (settings->pretty) { |
|
1274 actual += wfunc(obj_value_sep, 1, 2, target); |
|
1275 expected += 2; |
|
1276 } else { |
|
1277 actual += wfunc(obj_value_sep, 1, 1, target); |
|
1278 expected++; |
|
1279 } |
|
1280 } else { |
|
1281 if (settings->pretty) { |
|
1282 actual += wfunc("\n", 1, 1, target); |
|
1283 expected ++; |
|
1284 } |
|
1285 } |
|
1286 } |
|
1287 depth--; |
|
1288 if (settings->pretty) { |
|
1289 if (cx_json_writer_indent(target, wfunc, settings, depth)) return 1; |
|
1290 } |
|
1291 actual += wfunc("}", 1, 1, target); |
|
1292 expected++; |
|
1293 break; |
|
1294 } |
|
1295 case CX_JSON_ARRAY: { |
|
1296 actual += wfunc("[", 1, 1, target); |
|
1297 expected++; |
|
1298 CxIterator iter = cxJsonArrIter(value); |
|
1299 cx_foreach(CxJsonValue*, element, iter) { |
|
1300 if (cx_json_write_rec( |
|
1301 target, element, |
|
1302 wfunc, settings, depth) |
|
1303 ) return 1; |
|
1304 |
|
1305 if (iter.index < iter.elem_count - 1) { |
|
1306 const char *arr_value_sep = ", "; |
|
1307 if (settings->pretty) { |
|
1308 actual += wfunc(arr_value_sep, 1, 2, target); |
|
1309 expected += 2; |
|
1310 } else { |
|
1311 actual += wfunc(arr_value_sep, 1, 1, target); |
|
1312 expected++; |
|
1313 } |
|
1314 } |
|
1315 } |
|
1316 actual += wfunc("]", 1, 1, target); |
|
1317 expected++; |
|
1318 break; |
|
1319 } |
|
1320 case CX_JSON_STRING: { |
|
1321 actual += wfunc("\"", 1, 1, target); |
|
1322 cxmutstr str = escape_string(value->value.string, settings->escape_slash); |
|
1323 actual += wfunc(str.ptr, 1, str.length, target); |
|
1324 if (str.ptr != value->value.string.ptr) { |
|
1325 cx_strfree(&str); |
|
1326 } |
|
1327 actual += wfunc("\"", 1, 1, target); |
|
1328 expected += 2 + value->value.string.length; |
|
1329 break; |
|
1330 } |
|
1331 case CX_JSON_NUMBER: { |
|
1332 int precision = settings->frac_max_digits; |
|
1333 // because of the way how %g is defined, we need to |
|
1334 // double the precision and truncate ourselves |
|
1335 precision = 1 + (precision > 15 ? 30 : 2 * precision); |
|
1336 snprintf(numbuf, 40, "%.*g", precision, value->value.number); |
|
1337 char *dot, *exp; |
|
1338 unsigned char max_digits; |
|
1339 // find the decimal separator and hope that it's one of . or , |
|
1340 dot = strchr(numbuf, '.'); |
|
1341 if (dot == NULL) { |
|
1342 dot = strchr(numbuf, ','); |
|
1343 } |
|
1344 if (dot == NULL) { |
|
1345 // no decimal separator found |
|
1346 // output everything until a possible exponent |
|
1347 max_digits = 30; |
|
1348 dot = numbuf; |
|
1349 } else { |
|
1350 // found a decimal separator |
|
1351 // output everything until the separator |
|
1352 // and set max digits to what the settings say |
|
1353 size_t len = dot - numbuf; |
|
1354 actual += wfunc(numbuf, 1, len, target); |
|
1355 expected += len; |
|
1356 max_digits = settings->frac_max_digits; |
|
1357 if (max_digits > 15) { |
|
1358 max_digits = 15; |
|
1359 } |
|
1360 // locale independent separator |
|
1361 if (max_digits > 0) { |
|
1362 actual += wfunc(".", 1, 1, target); |
|
1363 expected++; |
|
1364 } |
|
1365 dot++; |
|
1366 } |
|
1367 // find the exponent |
|
1368 exp = strchr(dot, 'e'); |
|
1369 if (exp == NULL) { |
|
1370 // no exponent - output the rest |
|
1371 if (max_digits > 0) { |
|
1372 size_t len = strlen(dot); |
|
1373 if (len > max_digits) { |
|
1374 len = max_digits; |
|
1375 } |
|
1376 actual += wfunc(dot, 1, len, target); |
|
1377 expected += len; |
|
1378 } |
|
1379 } else { |
|
1380 // exponent found - truncate the frac digits |
|
1381 // and then output the rest |
|
1382 if (max_digits > 0) { |
|
1383 size_t len = exp - dot - 1; |
|
1384 if (len > max_digits) { |
|
1385 len = max_digits; |
|
1386 } |
|
1387 actual += wfunc(dot, 1, len, target); |
|
1388 expected += len; |
|
1389 } |
|
1390 actual += wfunc("e", 1, 1, target); |
|
1391 expected++; |
|
1392 exp++; |
|
1393 size_t len = strlen(exp); |
|
1394 actual += wfunc(exp, 1, len, target); |
|
1395 expected += len; |
|
1396 } |
|
1397 break; |
|
1398 } |
|
1399 case CX_JSON_INTEGER: { |
|
1400 snprintf(numbuf, 32, "%" PRIi64, value->value.integer); |
|
1401 size_t len = strlen(numbuf); |
|
1402 actual += wfunc(numbuf, 1, len, target); |
|
1403 expected += len; |
|
1404 break; |
|
1405 } |
|
1406 case CX_JSON_LITERAL: { |
|
1407 if (value->value.literal == CX_JSON_TRUE) { |
|
1408 actual += wfunc("true", 1, 4, target); |
|
1409 expected += 4; |
|
1410 } else if (value->value.literal == CX_JSON_FALSE) { |
|
1411 actual += wfunc("false", 1, 5, target); |
|
1412 expected += 5; |
|
1413 } else { |
|
1414 actual += wfunc("null", 1, 4, target); |
|
1415 expected += 4; |
|
1416 } |
|
1417 break; |
|
1418 } |
|
1419 case CX_JSON_NOTHING: { |
|
1420 // deliberately supported as an empty string! |
|
1421 // users might want to just write the result |
|
1422 // of a get operation without testing the value |
|
1423 // and therefore this should not blow up |
|
1424 break; |
|
1425 } |
|
1426 default: assert(false); // LCOV_EXCL_LINE |
|
1427 } |
|
1428 |
|
1429 return expected != actual; |
|
1430 } |
|
1431 |
|
1432 int cxJsonWrite( |
|
1433 void *target, |
|
1434 const CxJsonValue *value, |
|
1435 cx_write_func wfunc, |
|
1436 const CxJsonWriter *settings |
|
1437 ) { |
|
1438 assert(target != NULL); |
|
1439 assert(value != NULL); |
|
1440 assert(wfunc != NULL); |
|
1441 |
|
1442 CxJsonWriter writer_default = cxJsonWriterCompact(); |
|
1443 if (settings == NULL) { |
|
1444 settings = &writer_default; |
|
1445 } |
|
1446 return cx_json_write_rec(target, value, wfunc, settings, 0); |
|
1447 } |