ucx/json.c

changeset 852
83fdf679df99
equal deleted inserted replaced
850:bbe2925eb590 852:83fdf679df99
1 /*
2 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER.
3 *
4 * Copyright 2024 Mike Becker, Olaf Wintermann All rights reserved.
5 *
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions are met:
8 *
9 * 1. Redistributions of source code must retain the above copyright
10 * notice, this list of conditions and the following disclaimer.
11 *
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 *
16 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
17 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
20 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
21 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
22 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
23 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
24 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
25 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
26 * POSSIBILITY OF SUCH DAMAGE.
27 */
28
29 #include "cx/json.h"
30 #include "cx/compare.h"
31
32 #include <string.h>
33 #include <ctype.h>
34 #include <assert.h>
35 #include <stdio.h>
36 #include <errno.h>
37 #include <inttypes.h>
38
39 /*
40 * RFC 8259
41 * https://tools.ietf.org/html/rfc8259
42 */
43
// Shared sentinel value of type CX_JSON_NOTHING.
// cxJsonNext() and the lookup functions in this file hand out its address
// instead of NULL when there is no value to return.
static CxJsonValue cx_json_value_nothing = {.type = CX_JSON_NOTHING};
45
46 static int json_cmp_objvalue(const void *l, const void *r) {
47 const CxJsonObjValue *left = l;
48 const CxJsonObjValue *right = r;
49 return cx_strcmp(cx_strcast(left->name), cx_strcast(right->name));
50 }
51
52 static CxJsonObjValue *json_find_objvalue(const CxJsonValue *obj, cxstring name) {
53 assert(obj->type == CX_JSON_OBJECT);
54 CxJsonObjValue kv_dummy;
55 kv_dummy.name = cx_mutstrn((char*) name.ptr, name.length);
56 size_t index = cx_array_binary_search(
57 obj->value.object.values,
58 obj->value.object.values_size,
59 sizeof(CxJsonObjValue),
60 &kv_dummy,
61 json_cmp_objvalue
62 );
63 if (index == obj->value.object.values_size) {
64 return NULL;
65 } else {
66 return &obj->value.object.values[index];
67 }
68 }
69
70 static int json_add_objvalue(CxJsonValue *objv, CxJsonObjValue member) {
71 assert(objv->type == CX_JSON_OBJECT);
72 const CxAllocator * const al = objv->allocator;
73 CxJsonObject *obj = &(objv->value.object);
74
75 // determine the index where we need to insert the new member
76 size_t index = cx_array_binary_search_sup(
77 obj->values,
78 obj->values_size,
79 sizeof(CxJsonObjValue),
80 &member, json_cmp_objvalue
81 );
82
83 // is the name already present?
84 if (index < obj->values_size && 0 == json_cmp_objvalue(&member, &obj->values[index])) {
85 // free the original value
86 cx_strfree_a(al, &obj->values[index].name);
87 cxJsonValueFree(obj->values[index].value);
88 // replace the item
89 obj->values[index] = member;
90
91 // nothing more to do
92 return 0;
93 }
94
95 // determine the old capacity and reserve for one more element
96 CxArrayReallocator arealloc = cx_array_reallocator(al, NULL);
97 size_t oldcap = obj->values_capacity;
98 if (cx_array_simple_reserve_a(&arealloc, obj->values, 1)) return 1;
99
100 // check the new capacity, if we need to realloc the index array
101 size_t newcap = obj->values_capacity;
102 if (newcap > oldcap) {
103 if (cxReallocateArray(al, &obj->indices, newcap, sizeof(size_t))) {
104 return 1;
105 }
106 }
107
108 // check if append or insert
109 if (index < obj->values_size) {
110 // move the other elements
111 memmove(
112 &obj->values[index+1],
113 &obj->values[index],
114 (obj->values_size - index) * sizeof(CxJsonObjValue)
115 );
116 // increase indices for the moved elements
117 for (size_t i = 0; i < obj->values_size ; i++) {
118 if (obj->indices[i] >= index) {
119 obj->indices[i]++;
120 }
121 }
122 }
123
124 // insert the element and set the index
125 obj->values[index] = member;
126 obj->indices[obj->values_size] = index;
127 obj->values_size++;
128
129 return 0;
130 }
131
132 static void token_destroy(CxJsonToken *token) {
133 if (token->allocated) {
134 cx_strfree(&token->content);
135 }
136 }
137
/**
 * Checks whether content[pos..length) is a valid exponent part of a number:
 * an optional leading '+' or '-' followed by at least one decimal digit
 * and nothing else.
 *
 * @param content the number text
 * @param length  the total length of the text
 * @param pos     index of the first character after the 'e' / 'E'
 * @return 1 when the exponent part is valid, 0 otherwise
 */
static int num_isexp(const char *content, size_t length, size_t pos) {
    if (pos >= length) {
        return 0;
    }

    int ok = 0;
    for (size_t i = pos; i < length; i++) {
        // <ctype.h> functions are only defined for unsigned char values (and EOF);
        // a plain char may be negative for non-ASCII bytes
        const unsigned char c = (unsigned char) content[i];
        if (isdigit(c)) {
            ok = 1;
        } else if (i == pos) {
            // a sign is only allowed as the very first character
            if (!(c == '+' || c == '-')) {
                return 0;
            }
        } else {
            return 0;
        }
    }

    return ok;
}
159
160 static CxJsonTokenType token_numbertype(const char *content, size_t length) {
161 if (length == 0) return CX_JSON_TOKEN_ERROR;
162
163 if (content[0] != '-' && !isdigit(content[0])) {
164 return CX_JSON_TOKEN_ERROR;
165 }
166
167 CxJsonTokenType type = CX_JSON_TOKEN_INTEGER;
168 for (size_t i = 1; i < length; i++) {
169 if (content[i] == '.') {
170 if (type == CX_JSON_TOKEN_NUMBER) {
171 return CX_JSON_TOKEN_ERROR; // more than one decimal separator
172 }
173 type = CX_JSON_TOKEN_NUMBER;
174 } else if (content[i] == 'e' || content[i] == 'E') {
175 return num_isexp(content, length, i + 1) ? CX_JSON_TOKEN_NUMBER : CX_JSON_TOKEN_ERROR;
176 } else if (!isdigit(content[i])) {
177 return CX_JSON_TOKEN_ERROR; // char is not a digit, decimal separator or exponent sep
178 }
179 }
180
181 return type;
182 }
183
184 static CxJsonToken token_create(CxJson *json, bool isstring, size_t start, size_t end) {
185 cxmutstr str = cx_mutstrn(json->buffer.space + start, end - start);
186 bool allocated = false;
187 if (json->uncompleted.tokentype != CX_JSON_NO_TOKEN) {
188 allocated = true;
189 str = cx_strcat_m(json->uncompleted.content, 1, str);
190 if (str.ptr == NULL) { // LCOV_EXCL_START
191 return (CxJsonToken){CX_JSON_NO_TOKEN, false, {NULL, 0}};
192 } // LCOV_EXCL_STOP
193 }
194 json->uncompleted = (CxJsonToken){0};
195 CxJsonTokenType ttype;
196 if (isstring) {
197 ttype = CX_JSON_TOKEN_STRING;
198 } else {
199 cxstring s = cx_strcast(str);
200 if (!cx_strcmp(s, CX_STR("true")) || !cx_strcmp(s, CX_STR("false"))
201 || !cx_strcmp(s, CX_STR("null"))) {
202 ttype = CX_JSON_TOKEN_LITERAL;
203 } else {
204 ttype = token_numbertype(str.ptr, str.length);
205 }
206 }
207 if (ttype == CX_JSON_TOKEN_ERROR) {
208 if (allocated) {
209 cx_strfree(&str);
210 }
211 return (CxJsonToken){CX_JSON_TOKEN_ERROR, false, {NULL, 0}};
212 }
213 return (CxJsonToken){ttype, allocated, str};
214 }
215
216 static CxJsonTokenType char2ttype(char c) {
217 switch (c) {
218 case '[': {
219 return CX_JSON_TOKEN_BEGIN_ARRAY;
220 }
221 case '{': {
222 return CX_JSON_TOKEN_BEGIN_OBJECT;
223 }
224 case ']': {
225 return CX_JSON_TOKEN_END_ARRAY;
226 }
227 case '}': {
228 return CX_JSON_TOKEN_END_OBJECT;
229 }
230 case ':': {
231 return CX_JSON_TOKEN_NAME_SEPARATOR;
232 }
233 case ',': {
234 return CX_JSON_TOKEN_VALUE_SEPARATOR;
235 }
236 case '"': {
237 return CX_JSON_TOKEN_STRING;
238 }
239 default: {
240 if (isspace(c)) {
241 return CX_JSON_TOKEN_SPACE;
242 }
243 }
244 }
245 return CX_JSON_NO_TOKEN;
246 }
247
248 static enum cx_json_status token_parse_next(CxJson *json, CxJsonToken *result) {
249 // check if there is data in the buffer
250 if (cxBufferEof(&json->buffer)) {
251 return json->uncompleted.tokentype == CX_JSON_NO_TOKEN ?
252 CX_JSON_NO_DATA : CX_JSON_INCOMPLETE_DATA;
253 }
254
255 // current token type and start index
256 CxJsonTokenType ttype = json->uncompleted.tokentype;
257 size_t token_start = json->buffer.pos;
258
259 for (size_t i = json->buffer.pos; i < json->buffer.size; i++) {
260 char c = json->buffer.space[i];
261 if (ttype != CX_JSON_TOKEN_STRING) {
262 // currently non-string token
263 CxJsonTokenType ctype = char2ttype(c); // start of new token?
264 if (ttype == CX_JSON_NO_TOKEN) {
265 if (ctype == CX_JSON_TOKEN_SPACE) {
266 json->buffer.pos++;
267 continue;
268 } else if (ctype == CX_JSON_TOKEN_STRING) {
269 // begin string
270 ttype = CX_JSON_TOKEN_STRING;
271 token_start = i;
272 } else if (ctype != CX_JSON_NO_TOKEN) {
273 // single-char token
274 json->buffer.pos = i + 1;
275 *result = (CxJsonToken){ctype, false, {NULL, 0}};
276 return CX_JSON_NO_ERROR;
277 } else {
278 ttype = CX_JSON_TOKEN_LITERAL; // number or literal
279 token_start = i;
280 }
281 } else {
282 // finish token
283 if (ctype != CX_JSON_NO_TOKEN) {
284 *result = token_create(json, false, token_start, i);
285 if (result->tokentype == CX_JSON_NO_TOKEN) {
286 return CX_JSON_BUFFER_ALLOC_FAILED; // LCOV_EXCL_LINE
287 }
288 if (result->tokentype == CX_JSON_TOKEN_ERROR) {
289 return CX_JSON_FORMAT_ERROR_NUMBER;
290 }
291 json->buffer.pos = i;
292 return CX_JSON_NO_ERROR;
293 }
294 }
295 } else {
296 // currently inside a string
297 if (json->tokenizer_escape) {
298 json->tokenizer_escape = false;
299 } else {
300 if (c == '"') {
301 *result = token_create(json, true, token_start, i + 1);
302 if (result->tokentype == CX_JSON_NO_TOKEN) {
303 return CX_JSON_BUFFER_ALLOC_FAILED; // LCOV_EXCL_LINE
304 }
305 json->buffer.pos = i + 1;
306 return CX_JSON_NO_ERROR;
307 } else if (c == '\\') {
308 json->tokenizer_escape = true;
309 }
310 }
311 }
312 }
313
314 if (ttype != CX_JSON_NO_TOKEN) {
315 // uncompleted token
316 size_t uncompleted_len = json->buffer.size - token_start;
317 if (json->uncompleted.tokentype == CX_JSON_NO_TOKEN) {
318 // current token is uncompleted
319 // save current token content
320 CxJsonToken uncompleted = {
321 ttype, true,
322 cx_strdup(cx_strn(json->buffer.space + token_start, uncompleted_len))
323 };
324 if (uncompleted.content.ptr == NULL) {
325 return CX_JSON_BUFFER_ALLOC_FAILED; // LCOV_EXCL_LINE
326 }
327 json->uncompleted = uncompleted;
328 } else {
329 // previously we also had an uncompleted token
330 // combine the uncompleted token with the current token
331 assert(json->uncompleted.allocated);
332 cxmutstr str = cx_strcat_m(json->uncompleted.content, 1,
333 cx_strn(json->buffer.space + token_start, uncompleted_len));
334 if (str.ptr == NULL) {
335 return CX_JSON_BUFFER_ALLOC_FAILED; // LCOV_EXCL_LINE
336 }
337 json->uncompleted.content = str;
338 }
339 // advance the buffer position - we saved the stuff in the uncompleted token
340 json->buffer.pos += uncompleted_len;
341 }
342
343 return CX_JSON_INCOMPLETE_DATA;
344 }
345
346 static cxmutstr unescape_string(const CxAllocator *a, cxmutstr str) {
347 // TODO: support more escape sequences
348 // we know that the unescaped string will be shorter by at least 2 chars
349 cxmutstr result;
350 result.length = 0;
351 result.ptr = cxMalloc(a, str.length - 1);
352 if (result.ptr == NULL) return result; // LCOV_EXCL_LINE
353
354 bool u = false;
355 for (size_t i = 1; i < str.length - 1; i++) {
356 char c = str.ptr[i];
357 if (u) {
358 u = false;
359 if (c == 'n') {
360 c = '\n';
361 } else if (c == 't') {
362 c = '\t';
363 }
364 result.ptr[result.length++] = c;
365 } else {
366 if (c == '\\') {
367 u = true;
368 } else {
369 result.ptr[result.length++] = c;
370 }
371 }
372 }
373 result.ptr[result.length] = 0;
374
375 return result;
376 }
377
378 static CxJsonValue* create_json_value(CxJson *json, CxJsonValueType type) {
379 CxJsonValue *v = cxCalloc(json->allocator, 1, sizeof(CxJsonValue));
380 if (v == NULL) return NULL; // LCOV_EXCL_LINE
381
382 // initialize the value
383 v->type = type;
384 v->allocator = json->allocator;
385 if (type == CX_JSON_ARRAY) {
386 cx_array_initialize_a(json->allocator, v->value.array.array, 16);
387 if (v->value.array.array == NULL) goto create_json_value_exit_error; // LCOV_EXCL_LINE
388 } else if (type == CX_JSON_OBJECT) {
389 cx_array_initialize_a(json->allocator, v->value.object.values, 16);
390 v->value.object.indices = cxCalloc(json->allocator, 16, sizeof(size_t));
391 if (v->value.object.values == NULL ||
392 v->value.object.indices == NULL)
393 goto create_json_value_exit_error; // LCOV_EXCL_LINE
394 }
395
396 // add the new value to a possible parent
397 if (json->vbuf_size > 0) {
398 CxJsonValue *parent = json->vbuf[json->vbuf_size - 1];
399 assert(parent != NULL);
400 if (parent->type == CX_JSON_ARRAY) {
401 CxArrayReallocator value_realloc = cx_array_reallocator(json->allocator, NULL);
402 if (cx_array_simple_add_a(&value_realloc, parent->value.array.array, v)) {
403 goto create_json_value_exit_error; // LCOV_EXCL_LINE
404 }
405 } else if (parent->type == CX_JSON_OBJECT) {
406 // the member was already created after parsing the name
407 assert(json->uncompleted_member.name.ptr != NULL);
408 json->uncompleted_member.value = v;
409 if (json_add_objvalue(parent, json->uncompleted_member)) {
410 goto create_json_value_exit_error; // LCOV_EXCL_LINE
411 }
412 json->uncompleted_member.name = (cxmutstr) {NULL, 0};
413 } else {
414 assert(false); // LCOV_EXCL_LINE
415 }
416 }
417
418 // add the new value to the stack, if it is an array or object
419 if (type == CX_JSON_ARRAY || type == CX_JSON_OBJECT) {
420 CxArrayReallocator vbuf_realloc = cx_array_reallocator(NULL, json->vbuf_internal);
421 if (cx_array_simple_add_a(&vbuf_realloc, json->vbuf, v)) {
422 goto create_json_value_exit_error; // LCOV_EXCL_LINE
423 }
424 }
425
426 // if currently no value is parsed, this is now the value of interest
427 if (json->parsed == NULL) {
428 json->parsed = v;
429 }
430
431 return v;
432 // LCOV_EXCL_START
433 create_json_value_exit_error:
434 cxJsonValueFree(v);
435 return NULL;
436 // LCOV_EXCL_STOP
437 }
438
// Parser states that are kept on the state stack of CxJson.
// json_parse() treats every state below 3 as a "value begin" state and pushes
// the matching "end" state as 10 + state, so the numeric values of the
// BEGIN / END pairs below must stay 10 apart.

// value begin (top level)
#define JP_STATE_VALUE_BEGIN 0
// expect value end (top level)
#define JP_STATE_VALUE_END 10
// value begin (inside object)
#define JP_STATE_VALUE_BEGIN_OBJ 1
// inside object: expect ',' or '}'
#define JP_STATE_OBJ_SEP_OR_CLOSE 11
// value begin (inside array)
#define JP_STATE_VALUE_BEGIN_AR 2
// inside array: expect ',' or ']'
#define JP_STATE_ARRAY_SEP_OR_CLOSE 12
// inside object: expect member name or '}'
#define JP_STATE_OBJ_NAME_OR_CLOSE 5
// inside object: expect member name
#define JP_STATE_OBJ_NAME 6
// inside object: expect ':'
#define JP_STATE_OBJ_COLON 7
448
449 void cxJsonInit(CxJson *json, const CxAllocator *allocator) {
450 if (allocator == NULL) {
451 allocator = cxDefaultAllocator;
452 }
453
454 memset(json, 0, sizeof(CxJson));
455 json->allocator = allocator;
456
457 json->states = json->states_internal;
458 json->states_capacity = cx_nmemb(json->states_internal);
459 json->states[0] = JP_STATE_VALUE_BEGIN;
460 json->states_size = 1;
461
462 json->vbuf = json->vbuf_internal;
463 json->vbuf_capacity = cx_nmemb(json->vbuf_internal);
464 }
465
466 void cxJsonDestroy(CxJson *json) {
467 cxBufferDestroy(&json->buffer);
468 if (json->states != json->states_internal) {
469 free(json->states);
470 }
471 if (json->vbuf != json->vbuf_internal) {
472 free(json->vbuf);
473 }
474 cxJsonValueFree(json->parsed);
475 json->parsed = NULL;
476 if (json->uncompleted_member.name.ptr != NULL) {
477 cx_strfree_a(json->allocator, &json->uncompleted_member.name);
478 json->uncompleted_member = (CxJsonObjValue){{NULL, 0}, NULL};
479 }
480 }
481
482 int cxJsonFilln(CxJson *json, const char *buf, size_t size) {
483 if (cxBufferEof(&json->buffer)) {
484 // reinitialize the buffer
485 cxBufferDestroy(&json->buffer);
486 cxBufferInit(&json->buffer, (char*) buf, size,
487 NULL, CX_BUFFER_AUTO_EXTEND | CX_BUFFER_COPY_ON_WRITE);
488 json->buffer.size = size;
489 return 0;
490 } else {
491 return size != cxBufferAppend(buf, 1, size, &json->buffer);
492 }
493 }
494
495 static void json_add_state(CxJson *json, int state) {
496 // we have guaranteed the necessary space with cx_array_simple_reserve()
497 // therefore, we can safely add the state in the simplest way possible
498 json->states[json->states_size++] = state;
499 }
500
501 #define return_rec(code) \
502 token_destroy(&token); \
503 return code
504
505 static enum cx_json_status json_parse(CxJson *json) {
506 // Reserve a pointer for a possibly read value
507 CxJsonValue *vbuf = NULL;
508
509 // grab the next token
510 CxJsonToken token;
511 {
512 enum cx_json_status ret = token_parse_next(json, &token);
513 if (ret != CX_JSON_NO_ERROR) {
514 return ret;
515 }
516 }
517
518 // pop the current state
519 assert(json->states_size > 0);
520 int state = json->states[--json->states_size];
521
522 // guarantee that at least two more states fit on the stack
523 CxArrayReallocator state_realloc = cx_array_reallocator(NULL, json->states_internal);
524 if (cx_array_simple_reserve_a(&state_realloc, json->states, 2)) {
525 return CX_JSON_BUFFER_ALLOC_FAILED; // LCOV_EXCL_LINE
526 }
527
528
529 // 0 JP_STATE_VALUE_BEGIN value begin
530 // 10 JP_STATE_VALUE_END expect value end
531 // 1 JP_STATE_VALUE_BEGIN_OBJ value begin (inside object)
532 // 11 JP_STATE_OBJ_SEP_OR_CLOSE object, expect separator, objclose
533 // 2 JP_STATE_VALUE_BEGIN_AR value begin (inside array)
534 // 12 JP_STATE_ARRAY_SEP_OR_CLOSE array, expect separator or arrayclose
535 // 5 JP_STATE_OBJ_NAME_OR_CLOSE object, expect name or objclose
536 // 6 JP_STATE_OBJ_NAME object, expect name
537 // 7 JP_STATE_OBJ_COLON object, expect ':'
538
539 if (state < 3) {
540 // push expected end state to the stack
541 json_add_state(json, 10 + state);
542 switch (token.tokentype) {
543 case CX_JSON_TOKEN_BEGIN_ARRAY: {
544 if (create_json_value(json, CX_JSON_ARRAY) == NULL) {
545 return_rec(CX_JSON_VALUE_ALLOC_FAILED); // LCOV_EXCL_LINE
546 }
547 json_add_state(json, JP_STATE_VALUE_BEGIN_AR);
548 return_rec(CX_JSON_NO_ERROR);
549 }
550 case CX_JSON_TOKEN_BEGIN_OBJECT: {
551 if (create_json_value(json, CX_JSON_OBJECT) == NULL) {
552 return_rec(CX_JSON_VALUE_ALLOC_FAILED); // LCOV_EXCL_LINE
553 }
554 json_add_state(json, JP_STATE_OBJ_NAME_OR_CLOSE);
555 return_rec(CX_JSON_NO_ERROR);
556 }
557 case CX_JSON_TOKEN_STRING: {
558 if ((vbuf = create_json_value(json, CX_JSON_STRING)) == NULL) {
559 return_rec(CX_JSON_VALUE_ALLOC_FAILED); // LCOV_EXCL_LINE
560 }
561 cxmutstr str = unescape_string(json->allocator, token.content);
562 if (str.ptr == NULL) {
563 return_rec(CX_JSON_VALUE_ALLOC_FAILED); // LCOV_EXCL_LINE
564 }
565 vbuf->value.string = str;
566 return_rec(CX_JSON_NO_ERROR);
567 }
568 case CX_JSON_TOKEN_INTEGER:
569 case CX_JSON_TOKEN_NUMBER: {
570 int type = token.tokentype == CX_JSON_TOKEN_INTEGER ? CX_JSON_INTEGER : CX_JSON_NUMBER;
571 if (NULL == (vbuf = create_json_value(json, type))) {
572 return_rec(CX_JSON_VALUE_ALLOC_FAILED); // LCOV_EXCL_LINE
573 }
574 if (type == CX_JSON_INTEGER) {
575 if (cx_strtoi64(token.content, &vbuf->value.integer, 10)) {
576 return_rec(CX_JSON_FORMAT_ERROR_NUMBER);
577 }
578 } else {
579 if (cx_strtod(token.content, &vbuf->value.number)) {
580 return_rec(CX_JSON_FORMAT_ERROR_NUMBER);
581 }
582 }
583 return_rec(CX_JSON_NO_ERROR);
584 }
585 case CX_JSON_TOKEN_LITERAL: {
586 if ((vbuf = create_json_value(json, CX_JSON_LITERAL)) == NULL) {
587 return_rec(CX_JSON_VALUE_ALLOC_FAILED); // LCOV_EXCL_LINE
588 }
589 if (0 == cx_strcmp(cx_strcast(token.content), cx_str("true"))) {
590 vbuf->value.literal = CX_JSON_TRUE;
591 } else if (0 == cx_strcmp(cx_strcast(token.content), cx_str("false"))) {
592 vbuf->value.literal = CX_JSON_FALSE;
593 } else {
594 vbuf->value.literal = CX_JSON_NULL;
595 }
596 return_rec(CX_JSON_NO_ERROR);
597 }
598 default: {
599 return_rec(CX_JSON_FORMAT_ERROR_UNEXPECTED_TOKEN);
600 }
601 }
602 } else if (state == JP_STATE_ARRAY_SEP_OR_CLOSE) {
603 // expect ',' or ']'
604 if (token.tokentype == CX_JSON_TOKEN_VALUE_SEPARATOR) {
605 json_add_state(json, JP_STATE_VALUE_BEGIN_AR);
606 return_rec(CX_JSON_NO_ERROR);
607 } else if (token.tokentype == CX_JSON_TOKEN_END_ARRAY) {
608 // discard the array from the value buffer
609 json->vbuf_size--;
610 return_rec(CX_JSON_NO_ERROR);
611 } else {
612 return_rec(CX_JSON_FORMAT_ERROR_UNEXPECTED_TOKEN);
613 }
614 } else if (state == JP_STATE_OBJ_NAME_OR_CLOSE || state == JP_STATE_OBJ_NAME) {
615 if (state == JP_STATE_OBJ_NAME_OR_CLOSE && token.tokentype == CX_JSON_TOKEN_END_OBJECT) {
616 // discard the obj from the value buffer
617 json->vbuf_size--;
618 return_rec(CX_JSON_NO_ERROR);
619 } else {
620 // expect string
621 if (token.tokentype != CX_JSON_TOKEN_STRING) {
622 return_rec(CX_JSON_FORMAT_ERROR_UNEXPECTED_TOKEN);
623 }
624
625 // add new entry
626 cxmutstr name = unescape_string(json->allocator, token.content);
627 if (name.ptr == NULL) {
628 return_rec(CX_JSON_VALUE_ALLOC_FAILED); // LCOV_EXCL_LINE
629 }
630 assert(json->uncompleted_member.name.ptr == NULL);
631 json->uncompleted_member.name = name;
632 assert(json->vbuf_size > 0);
633
634 // next state
635 json_add_state(json, JP_STATE_OBJ_COLON);
636 return_rec(CX_JSON_NO_ERROR);
637 }
638 } else if (state == JP_STATE_OBJ_COLON) {
639 // expect ':'
640 if (token.tokentype != CX_JSON_TOKEN_NAME_SEPARATOR) {
641 return_rec(CX_JSON_FORMAT_ERROR_UNEXPECTED_TOKEN);
642 }
643 // next state
644 json_add_state(json, JP_STATE_VALUE_BEGIN_OBJ);
645 return_rec(CX_JSON_NO_ERROR);
646 } else if (state == JP_STATE_OBJ_SEP_OR_CLOSE) {
647 // expect ',' or '}'
648 if (token.tokentype == CX_JSON_TOKEN_VALUE_SEPARATOR) {
649 json_add_state(json, JP_STATE_OBJ_NAME);
650 return_rec(CX_JSON_NO_ERROR);
651 } else if (token.tokentype == CX_JSON_TOKEN_END_OBJECT) {
652 // discard the obj from the value buffer
653 json->vbuf_size--;
654 return_rec(CX_JSON_NO_ERROR);
655 } else {
656 return_rec(CX_JSON_FORMAT_ERROR_UNEXPECTED_TOKEN);
657 }
658 } else {
659 // should be unreachable
660 assert(false);
661 return_rec(-1);
662 }
663 }
664
665 CxJsonStatus cxJsonNext(CxJson *json, CxJsonValue **value) {
666 // check if buffer has been filled
667 if (json->buffer.space == NULL) {
668 return CX_JSON_NULL_DATA;
669 }
670
671 // initialize output value
672 *value = &cx_json_value_nothing;
673
674 // parse data
675 CxJsonStatus result;
676 do {
677 result = json_parse(json);
678 if (result == CX_JSON_NO_ERROR && json->states_size == 1) {
679 // final state reached
680 assert(json->states[0] == JP_STATE_VALUE_END);
681 assert(json->vbuf_size == 0);
682
683 // write output value
684 *value = json->parsed;
685 json->parsed = NULL;
686
687 // re-initialize state machine
688 json->states[0] = JP_STATE_VALUE_BEGIN;
689
690 return CX_JSON_NO_ERROR;
691 }
692 } while (result == CX_JSON_NO_ERROR);
693
694 // the parser might think there is no data
695 // but when we did not reach the final state,
696 // we know that there must be more to come
697 if (result == CX_JSON_NO_DATA && json->states_size > 1) {
698 return CX_JSON_INCOMPLETE_DATA;
699 }
700
701 return result;
702 }
703
704 void cxJsonValueFree(CxJsonValue *value) {
705 if (value == NULL || value->type == CX_JSON_NOTHING) return;
706 switch (value->type) {
707 case CX_JSON_OBJECT: {
708 CxJsonObject obj = value->value.object;
709 for (size_t i = 0; i < obj.values_size; i++) {
710 cxJsonValueFree(obj.values[i].value);
711 cx_strfree_a(value->allocator, &obj.values[i].name);
712 }
713 cxFree(value->allocator, obj.values);
714 cxFree(value->allocator, obj.indices);
715 break;
716 }
717 case CX_JSON_ARRAY: {
718 CxJsonArray array = value->value.array;
719 for (size_t i = 0; i < array.array_size; i++) {
720 cxJsonValueFree(array.array[i]);
721 }
722 cxFree(value->allocator, array.array);
723 break;
724 }
725 case CX_JSON_STRING: {
726 cxFree(value->allocator, value->value.string.ptr);
727 break;
728 }
729 default: {
730 break;
731 }
732 }
733 cxFree(value->allocator, value);
734 }
735
736 CxJsonValue* cxJsonCreateObj(const CxAllocator* allocator) {
737 CxJsonValue* v = cxMalloc(allocator, sizeof(CxJsonValue));
738 if (v == NULL) return NULL;
739 v->allocator = allocator;
740 v->type = CX_JSON_OBJECT;
741 cx_array_initialize_a(allocator, v->value.object.values, 16);
742 if (v->value.object.values == NULL) { // LCOV_EXCL_START
743 cxFree(allocator, v);
744 return NULL;
745 // LCOV_EXCL_STOP
746 }
747 v->value.object.indices = cxCalloc(allocator, 16, sizeof(size_t));
748 if (v->value.object.indices == NULL) { // LCOV_EXCL_START
749 cxFree(allocator, v->value.object.values);
750 cxFree(allocator, v);
751 return NULL;
752 // LCOV_EXCL_STOP
753 }
754 return v;
755 }
756
757 CxJsonValue* cxJsonCreateArr(const CxAllocator* allocator) {
758 CxJsonValue* v = cxMalloc(allocator, sizeof(CxJsonValue));
759 if (v == NULL) return NULL;
760 v->allocator = allocator;
761 v->type = CX_JSON_ARRAY;
762 cx_array_initialize_a(allocator, v->value.array.array, 16);
763 if (v->value.array.array == NULL) { cxFree(allocator, v); return NULL; }
764 return v;
765 }
766
767 CxJsonValue* cxJsonCreateNumber(const CxAllocator* allocator, double num) {
768 CxJsonValue* v = cxMalloc(allocator, sizeof(CxJsonValue));
769 if (v == NULL) return NULL;
770 v->allocator = allocator;
771 v->type = CX_JSON_NUMBER;
772 v->value.number = num;
773 return v;
774 }
775
776 CxJsonValue* cxJsonCreateInteger(const CxAllocator* allocator, int64_t num) {
777 CxJsonValue* v = cxMalloc(allocator, sizeof(CxJsonValue));
778 if (v == NULL) return NULL;
779 v->allocator = allocator;
780 v->type = CX_JSON_INTEGER;
781 v->value.integer = num;
782 return v;
783 }
784
785 CxJsonValue* cxJsonCreateString(const CxAllocator* allocator, const char* str) {
786 return cxJsonCreateCxString(allocator, cx_str(str));
787 }
788
789 CxJsonValue* cxJsonCreateCxString(const CxAllocator* allocator, cxstring str) {
790 CxJsonValue* v = cxMalloc(allocator, sizeof(CxJsonValue));
791 if (v == NULL) return NULL;
792 v->allocator = allocator;
793 v->type = CX_JSON_STRING;
794 cxmutstr s = cx_strdup_a(allocator, str);
795 if (s.ptr == NULL) { cxFree(allocator, v); return NULL; }
796 v->value.string = s;
797 return v;
798 }
799
800 CxJsonValue* cxJsonCreateLiteral(const CxAllocator* allocator, CxJsonLiteral lit) {
801 CxJsonValue* v = cxMalloc(allocator, sizeof(CxJsonValue));
802 if (v == NULL) return NULL;
803 v->allocator = allocator;
804 v->type = CX_JSON_LITERAL;
805 v->value.literal = lit;
806 return v;
807 }
808
809 // LCOV_EXCL_START
810 // never called as long as malloc() does not return NULL
811 static void cx_json_arr_free_temp(CxJsonValue** values, size_t count) {
812 for (size_t i = 0; i < count; i++) {
813 if (values[i] == NULL) break;
814 cxJsonValueFree(values[i]);
815 }
816 free(values);
817 }
818 // LCOV_EXCL_STOP
819
820 int cxJsonArrAddNumbers(CxJsonValue* arr, const double* num, size_t count) {
821 CxJsonValue** values = calloc(count, sizeof(CxJsonValue*));
822 if (values == NULL) return -1;
823 for (size_t i = 0; i < count; i++) {
824 values[i] = cxJsonCreateNumber(arr->allocator, num[i]);
825 if (values[i] == NULL) { cx_json_arr_free_temp(values, count); return -1; }
826 }
827 int ret = cxJsonArrAddValues(arr, values, count);
828 free(values);
829 return ret;
830 }
831
832 int cxJsonArrAddIntegers(CxJsonValue* arr, const int64_t* num, size_t count) {
833 CxJsonValue** values = calloc(count, sizeof(CxJsonValue*));
834 if (values == NULL) return -1;
835 for (size_t i = 0; i < count; i++) {
836 values[i] = cxJsonCreateInteger(arr->allocator, num[i]);
837 if (values[i] == NULL) { cx_json_arr_free_temp(values, count); return -1; }
838 }
839 int ret = cxJsonArrAddValues(arr, values, count);
840 free(values);
841 return ret;
842 }
843
844 int cxJsonArrAddStrings(CxJsonValue* arr, const char* const* str, size_t count) {
845 CxJsonValue** values = calloc(count, sizeof(CxJsonValue*));
846 if (values == NULL) return -1;
847 for (size_t i = 0; i < count; i++) {
848 values[i] = cxJsonCreateString(arr->allocator, str[i]);
849 if (values[i] == NULL) { cx_json_arr_free_temp(values, count); return -1; }
850 }
851 int ret = cxJsonArrAddValues(arr, values, count);
852 free(values);
853 return ret;
854 }
855
856 int cxJsonArrAddCxStrings(CxJsonValue* arr, const cxstring* str, size_t count) {
857 CxJsonValue** values = calloc(count, sizeof(CxJsonValue*));
858 if (values == NULL) return -1;
859 for (size_t i = 0; i < count; i++) {
860 values[i] = cxJsonCreateCxString(arr->allocator, str[i]);
861 if (values[i] == NULL) { cx_json_arr_free_temp(values, count); return -1; }
862 }
863 int ret = cxJsonArrAddValues(arr, values, count);
864 free(values);
865 return ret;
866 }
867
868 int cxJsonArrAddLiterals(CxJsonValue* arr, const CxJsonLiteral* lit, size_t count) {
869 CxJsonValue** values = calloc(count, sizeof(CxJsonValue*));
870 if (values == NULL) return -1;
871 for (size_t i = 0; i < count; i++) {
872 values[i] = cxJsonCreateLiteral(arr->allocator, lit[i]);
873 if (values[i] == NULL) { cx_json_arr_free_temp(values, count); return -1; }
874 }
875 int ret = cxJsonArrAddValues(arr, values, count);
876 free(values);
877 return ret;
878 }
879
880 int cxJsonArrAddValues(CxJsonValue* arr, CxJsonValue* const* val, size_t count) {
881 CxArrayReallocator value_realloc = cx_array_reallocator(arr->allocator, NULL);
882 assert(arr->type == CX_JSON_ARRAY);
883 return cx_array_simple_copy_a(&value_realloc,
884 arr->value.array.array,
885 arr->value.array.array_size,
886 val, count
887 );
888 }
889
890 int cxJsonObjPut(CxJsonValue* obj, cxstring name, CxJsonValue* child) {
891 cxmutstr k = cx_strdup_a(obj->allocator, name);
892 if (k.ptr == NULL) return -1;
893 CxJsonObjValue kv = {k, child};
894 if (json_add_objvalue(obj, kv)) {
895 cx_strfree_a(obj->allocator, &k);
896 return 1;
897 } else {
898 return 0;
899 }
900 }
901
902 CxJsonValue* cxJsonObjPutObj(CxJsonValue* obj, cxstring name) {
903 CxJsonValue* v = cxJsonCreateObj(obj->allocator);
904 if (v == NULL) return NULL;
905 if (cxJsonObjPut(obj, name, v)) { cxJsonValueFree(v); return NULL; }
906 return v;
907 }
908
909 CxJsonValue* cxJsonObjPutArr(CxJsonValue* obj, cxstring name) {
910 CxJsonValue* v = cxJsonCreateArr(obj->allocator);
911 if (v == NULL) return NULL;
912 if (cxJsonObjPut(obj, name, v)) { cxJsonValueFree(v); return NULL; }
913 return v;
914 }
915
916 CxJsonValue* cxJsonObjPutNumber(CxJsonValue* obj, cxstring name, double num) {
917 CxJsonValue* v = cxJsonCreateNumber(obj->allocator, num);
918 if (v == NULL) return NULL;
919 if (cxJsonObjPut(obj, name, v)) { cxJsonValueFree(v); return NULL; }
920 return v;
921 }
922
923 CxJsonValue* cxJsonObjPutInteger(CxJsonValue* obj, cxstring name, int64_t num) {
924 CxJsonValue* v = cxJsonCreateInteger(obj->allocator, num);
925 if (v == NULL) return NULL;
926 if (cxJsonObjPut(obj, name, v)) { cxJsonValueFree(v); return NULL; }
927 return v;
928 }
929
930 CxJsonValue* cxJsonObjPutString(CxJsonValue* obj, cxstring name, const char* str) {
931 CxJsonValue* v = cxJsonCreateString(obj->allocator, str);
932 if (v == NULL) return NULL;
933 if (cxJsonObjPut(obj, name, v)) { cxJsonValueFree(v); return NULL; }
934 return v;
935 }
936
937 CxJsonValue* cxJsonObjPutCxString(CxJsonValue* obj, cxstring name, cxstring str) {
938 CxJsonValue* v = cxJsonCreateCxString(obj->allocator, str);
939 if (v == NULL) return NULL;
940 if (cxJsonObjPut(obj, name, v)) { cxJsonValueFree(v); return NULL; }
941 return v;
942 }
943
944 CxJsonValue* cxJsonObjPutLiteral(CxJsonValue* obj, cxstring name, CxJsonLiteral lit) {
945 CxJsonValue* v = cxJsonCreateLiteral(obj->allocator, lit);
946 if (v == NULL) return NULL;
947 if (cxJsonObjPut(obj, name, v)) { cxJsonValueFree(v); return NULL;}
948 return v;
949 }
950
951 CxJsonValue *cxJsonArrGet(const CxJsonValue *value, size_t index) {
952 if (index >= value->value.array.array_size) {
953 return &cx_json_value_nothing;
954 }
955 return value->value.array.array[index];
956 }
957
958 CxIterator cxJsonArrIter(const CxJsonValue *value) {
959 return cxIteratorPtr(
960 value->value.array.array,
961 value->value.array.array_size
962 );
963 }
964
965 CxIterator cxJsonObjIter(const CxJsonValue *value) {
966 return cxIterator(
967 value->value.object.values,
968 sizeof(CxJsonObjValue),
969 value->value.object.values_size
970 );
971 }
972
973 CxJsonValue *cx_json_obj_get_cxstr(const CxJsonValue *value, cxstring name) {
974 CxJsonObjValue *member = json_find_objvalue(value, name);
975 if (member == NULL) {
976 return &cx_json_value_nothing;
977 } else {
978 return member->value;
979 }
980 }
981
982 static const CxJsonWriter cx_json_writer_default = {
983 false,
984 true,
985 255,
986 false,
987 4
988 };
989
990 CxJsonWriter cxJsonWriterCompact(void) {
991 return cx_json_writer_default;
992 }
993
994 CxJsonWriter cxJsonWriterPretty(bool use_spaces) {
995 return (CxJsonWriter) {
996 true,
997 true,
998 255,
999 use_spaces,
1000 4
1001 };
1002 }
1003
1004 static int cx_json_writer_indent(
1005 void *target,
1006 cx_write_func wfunc,
1007 const CxJsonWriter *settings,
1008 unsigned int depth
1009 ) {
1010 if (depth == 0) return 0;
1011
1012 // determine the width and characters to use
1013 const char* indent; // for 32 prepared chars
1014 size_t width = depth;
1015 if (settings->indent_space) {
1016 if (settings->indent == 0) return 0;
1017 width *= settings->indent;
1018 indent = " ";
1019 } else {
1020 indent = "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t";
1021 }
1022
1023 // calculate the number of write calls and write
1024 size_t full = width / 32;
1025 size_t remaining = width % 32;
1026 for (size_t i = 0; i < full; i++) {
1027 if (32 != wfunc(indent, 1, 32, target)) return 1;
1028 }
1029 if (remaining != wfunc(indent, 1, remaining, target)) return 1;
1030
1031 return 0;
1032 }
1033
1034
1035 int cx_json_write_rec(
1036 void *target,
1037 const CxJsonValue *value,
1038 cx_write_func wfunc,
1039 const CxJsonWriter *settings,
1040 unsigned int depth
1041 ) {
1042 // keep track of written items
1043 // the idea is to reduce the number of jumps for error checking
1044 size_t actual = 0, expected = 0;
1045
1046 // small buffer for number to string conversions
1047 char numbuf[32];
1048
1049 // recursively write the values
1050 switch (value->type) {
1051 case CX_JSON_OBJECT: {
1052 const char *begin_obj = "{\n";
1053 if (settings->pretty) {
1054 actual += wfunc(begin_obj, 1, 2, target);
1055 expected += 2;
1056 } else {
1057 actual += wfunc(begin_obj, 1, 1, target);
1058 expected++;
1059 }
1060 depth++;
1061 size_t elem_count = value->value.object.values_size;
1062 for (size_t look_idx = 0; look_idx < elem_count; look_idx++) {
1063 // get the member either via index array or directly
1064 size_t elem_idx = settings->sort_members
1065 ? look_idx
1066 : value->value.object.indices[look_idx];
1067 CxJsonObjValue *member = &value->value.object.values[elem_idx];
1068 if (settings->sort_members) {
1069 depth++;depth--;
1070 }
1071
1072 // possible indentation
1073 if (settings->pretty) {
1074 if (cx_json_writer_indent(target, wfunc, settings, depth)) {
1075 return 1; // LCOV_EXCL_LINE
1076 }
1077 }
1078
1079 // the name
1080 actual += wfunc("\"", 1, 1, target);
1081 // TODO: escape the string
1082 actual += wfunc(member->name.ptr, 1,
1083 member->name.length, target);
1084 actual += wfunc("\"", 1, 1, target);
1085 const char *obj_name_sep = ": ";
1086 if (settings->pretty) {
1087 actual += wfunc(obj_name_sep, 1, 2, target);
1088 expected += 4 + member->name.length;
1089 } else {
1090 actual += wfunc(obj_name_sep, 1, 1, target);
1091 expected += 3 + member->name.length;
1092 }
1093
1094 // the value
1095 if (cx_json_write_rec(target, member->value, wfunc, settings, depth)) return 1;
1096
1097 // end of object-value
1098 if (look_idx < elem_count - 1) {
1099 const char *obj_value_sep = ",\n";
1100 if (settings->pretty) {
1101 actual += wfunc(obj_value_sep, 1, 2, target);
1102 expected += 2;
1103 } else {
1104 actual += wfunc(obj_value_sep, 1, 1, target);
1105 expected++;
1106 }
1107 } else {
1108 if (settings->pretty) {
1109 actual += wfunc("\n", 1, 1, target);
1110 expected ++;
1111 }
1112 }
1113 }
1114 depth--;
1115 if (settings->pretty) {
1116 if (cx_json_writer_indent(target, wfunc, settings, depth)) return 1;
1117 }
1118 actual += wfunc("}", 1, 1, target);
1119 expected++;
1120 break;
1121 }
1122 case CX_JSON_ARRAY: {
1123 actual += wfunc("[", 1, 1, target);
1124 expected++;
1125 CxIterator iter = cxJsonArrIter(value);
1126 cx_foreach(CxJsonValue*, element, iter) {
1127 if (cx_json_write_rec(
1128 target, element,
1129 wfunc, settings, depth)
1130 ) return 1;
1131
1132 if (iter.index < iter.elem_count - 1) {
1133 const char *arr_value_sep = ", ";
1134 if (settings->pretty) {
1135 actual += wfunc(arr_value_sep, 1, 2, target);
1136 expected += 2;
1137 } else {
1138 actual += wfunc(arr_value_sep, 1, 1, target);
1139 expected++;
1140 }
1141 }
1142 }
1143 actual += wfunc("]", 1, 1, target);
1144 expected++;
1145 break;
1146 }
1147 case CX_JSON_STRING: {
1148 actual += wfunc("\"", 1, 1, target);
1149 // TODO: escape the string
1150 actual += wfunc(value->value.string.ptr, 1,
1151 value->value.string.length, target);
1152 actual += wfunc("\"", 1, 1, target);
1153 expected += 2 + value->value.string.length;
1154 break;
1155 }
1156 case CX_JSON_NUMBER: {
1157 // TODO: locale bullshit
1158 // TODO: formatting settings
1159 snprintf(numbuf, 32, "%g", value->value.number);
1160 size_t len = strlen(numbuf);
1161 actual += wfunc(numbuf, 1, len, target);
1162 expected += len;
1163 break;
1164 }
1165 case CX_JSON_INTEGER: {
1166 snprintf(numbuf, 32, "%" PRIi64, value->value.integer);
1167 size_t len = strlen(numbuf);
1168 actual += wfunc(numbuf, 1, len, target);
1169 expected += len;
1170 break;
1171 }
1172 case CX_JSON_LITERAL: {
1173 if (value->value.literal == CX_JSON_TRUE) {
1174 actual += wfunc("true", 1, 4, target);
1175 expected += 4;
1176 } else if (value->value.literal == CX_JSON_FALSE) {
1177 actual += wfunc("false", 1, 5, target);
1178 expected += 5;
1179 } else {
1180 actual += wfunc("null", 1, 4, target);
1181 expected += 4;
1182 }
1183 break;
1184 }
1185 case CX_JSON_NOTHING: {
1186 // deliberately supported as an empty string!
1187 // users might want to just write the result
1188 // of a get operation without testing the value
1189 // and therefore this should not blow up
1190 break;
1191 }
1192 default: assert(false); // LCOV_EXCL_LINE
1193 }
1194
1195 return expected != actual;
1196 }
1197
1198 int cxJsonWrite(
1199 void *target,
1200 const CxJsonValue *value,
1201 cx_write_func wfunc,
1202 const CxJsonWriter *settings
1203 ) {
1204 if (settings == NULL) {
1205 settings = &cx_json_writer_default;
1206 }
1207 assert(target != NULL);
1208 assert(value != NULL);
1209 assert(wfunc != NULL);
1210
1211 return cx_json_write_rec(target, value, wfunc, settings, 0);
1212 }

mercurial