micetools/src/micetools/lib/json/json.c

819 lines
31 KiB
C

/* vim: set et ts=3 sw=3 sts=3 ft=c:
*
* Copyright (C) 2012-2021 the json-parser authors All rights reserved.
* https://github.com/json-parser/json-parser
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
*
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
*
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
#include "json.h"
#include <ctype.h>
#include <limits.h>
#include <math.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include "../util/hex.h"
#define JSON_INT_MAX 9223372036854775807LL
typedef unsigned int json_uchar;
const struct _json_value json_value_none = { 0 };
static int would_overflow(json_int_t value, json_char b) { return ((JSON_INT_MAX - (b - '0')) / 10) < value; }
typedef struct {
size_t used_memory;
json_settings settings;
int first_pass;
const json_char *ptr;
unsigned int cur_line, cur_col;
} json_state;
static void *default_alloc(size_t size, int zero) { return zero ? calloc(1, size) : malloc(size); }
static void *json_alloc(json_state *state, size_t size, int zero) {
if ((ULONG_MAX - 8 - state->used_memory) < size) return 0;
if (state->settings.max_memory && (state->used_memory += size) > state->settings.max_memory) {
return 0;
}
return default_alloc(size, zero);
}
static int new_value(json_state *state, json_value **top, json_value **root, json_value **alloc, json_type type) {
json_value *value;
size_t values_size;
if (!state->first_pass) {
value = *top = *alloc;
*alloc = (*alloc)->_reserved.next_alloc;
if (!*root) *root = value;
switch (value->type) {
case json_array:
if (value->u.array.length == 0) break;
if (!(value->u.array.values =
(json_value **)json_alloc(state, value->u.array.length * sizeof(json_value *), 0))) {
return 0;
}
value->u.array.length = 0;
break;
case json_object:
if (value->u.object.length == 0) break;
values_size = sizeof(*value->u.object.values) * value->u.object.length;
if (!(value->u.object.values = (json_object_entry *)json_alloc(
state, values_size + ((uintptr_t)value->u.object.values), 0))) {
return 0;
}
value->_reserved.object_mem = (void *)(((char *)value->u.object.values) + values_size);
value->u.object.length = 0;
break;
case json_string:
if (!(value->u.string.ptr =
(json_char *)json_alloc(state, (value->u.string.length + 1) * sizeof(json_char), 0))) {
return 0;
}
value->u.string.length = 0;
break;
default:
break;
};
return 1;
}
if (!(value = (json_value *)json_alloc(state, sizeof(json_value) + state->settings.value_extra, 1))) {
return 0;
}
if (!*root) *root = value;
value->type = type;
value->parent = *top;
#ifdef JSON_TRACK_SOURCE
value->line = state->cur_line;
value->col = state->cur_col;
#endif
if (*alloc) (*alloc)->_reserved.next_alloc = value;
*alloc = *top = value;
return 1;
}
#define whitespace \
case '\n': \
++state.cur_line; \
state.cur_col = 0; /* FALLTHRU */ \
case ' ': /* FALLTHRU */ \
case '\t': /* FALLTHRU */ \
case '\r'
#define string_add(b) \
do { \
if (!state.first_pass) string[string_length] = b; \
++string_length; \
} while (0);
#define line_and_col state.cur_line, state.cur_col
static const long flag_next = 1 << 0, flag_reproc = 1 << 1, flag_need_comma = 1 << 2, flag_seek_value = 1 << 3,
flag_escaped = 1 << 4, flag_string = 1 << 5, flag_need_colon = 1 << 6, flag_done = 1 << 7,
flag_num_negative = 1 << 8, flag_num_zero = 1 << 9, flag_num_e = 1 << 10,
flag_num_e_got_sign = 1 << 11, flag_num_e_negative = 1 << 12, flag_line_comment = 1 << 13,
flag_block_comment = 1 << 14, flag_num_got_decimal = 1 << 15;
json_value *json_parse_ex(json_settings *settings, const json_char *json, size_t length, char *error_buf) {
char error[json_error_max];
const json_char *end;
json_value *top, *root, *alloc = 0;
json_state state = {0};
long flags = 0;
int num_digits = 0;
double num_e = 0, num_fraction = 0;
/* Skip UTF-8 BOM
*/
if (length >= 3 && ((unsigned char)json[0]) == 0xEF && ((unsigned char)json[1]) == 0xBB &&
((unsigned char)json[2]) == 0xBF) {
json += 3;
length -= 3;
}
error[0] = '\0';
end = (json + length);
memcpy(&state.settings, settings, sizeof(json_settings));
for (state.first_pass = 1; state.first_pass >= 0; --state.first_pass) {
json_uchar uchar;
unsigned char uc_b1, uc_b2, uc_b3, uc_b4;
json_char *string = 0;
unsigned int string_length = 0;
top = root = 0;
flags = flag_seek_value;
state.cur_line = 1;
for (state.ptr = json;; ++state.ptr) {
json_char b = (state.ptr == end ? 0 : *state.ptr);
if (flags & flag_string) {
if (!b) {
snprintf(error, json_error_max, "%u:%u: Unexpected EOF in string", line_and_col);
goto e_failed;
}
if (string_length > UINT_MAX - 8) goto e_overflow;
if (flags & flag_escaped) {
flags &= ~flag_escaped;
switch (b) {
case 'b':
string_add('\b');
break;
case 'f':
string_add('\f');
break;
case 'n':
string_add('\n');
break;
case 'r':
string_add('\r');
break;
case 't':
string_add('\t');
break;
case 'u':
if (end - state.ptr <= 4 || (uc_b1 = hex_value(*++state.ptr)) == 0xFF ||
(uc_b2 = hex_value(*++state.ptr)) == 0xFF ||
(uc_b3 = hex_value(*++state.ptr)) == 0xFF ||
(uc_b4 = hex_value(*++state.ptr)) == 0xFF) {
snprintf(error, json_error_max, "%u:%u: Invalid character value `%c`", line_and_col, b);
goto e_failed;
}
uc_b1 = (uc_b1 << 4) | uc_b2;
uc_b2 = (uc_b3 << 4) | uc_b4;
uchar = (uc_b1 << 8) | uc_b2;
if ((uchar & 0xF800) == 0xD800) {
json_uchar uchar2;
if (end - state.ptr <= 6 || (*++state.ptr) != '\\' || (*++state.ptr) != 'u' ||
(uc_b1 = hex_value(*++state.ptr)) == 0xFF ||
(uc_b2 = hex_value(*++state.ptr)) == 0xFF ||
(uc_b3 = hex_value(*++state.ptr)) == 0xFF ||
(uc_b4 = hex_value(*++state.ptr)) == 0xFF) {
snprintf(error, json_error_max, "%u:%u: Invalid character value `%c`", line_and_col,
b);
goto e_failed;
}
uc_b1 = (uc_b1 << 4) | uc_b2;
uc_b2 = (uc_b3 << 4) | uc_b4;
uchar2 = (uc_b1 << 8) | uc_b2;
uchar = 0x010000 | ((uchar & 0x3FF) << 10) | (uchar2 & 0x3FF);
}
if (sizeof(json_char) >= sizeof(json_uchar) || (uchar <= 0x7F)) {
string_add((json_char)uchar);
break;
}
if (uchar <= 0x7FF) {
if (state.first_pass)
string_length += 2;
else {
string[string_length++] = (char)(0xC0 | (uchar >> 6));
string[string_length++] = (char)(0x80 | (uchar & 0x3F));
}
break;
}
if (uchar <= 0xFFFF) {
if (state.first_pass)
string_length += 3;
else {
string[string_length++] = 0xE0 | (char)((uchar >> 12));
string[string_length++] = 0x80 | (char)(((uchar >> 6) & 0x3F));
string[string_length++] = 0x80 | (char)((uchar & 0x3F));
}
break;
}
if (state.first_pass)
string_length += 4;
else {
string[string_length++] = 0xF0 | (char)((uchar >> 18));
string[string_length++] = 0x80 | (char)(((uchar >> 12) & 0x3F));
string[string_length++] = 0x80 | (char)(((uchar >> 6) & 0x3F));
string[string_length++] = 0x80 | (char)((uchar & 0x3F));
}
break;
default:
string_add(b);
};
continue;
}
if (b == '\\') {
flags |= flag_escaped;
continue;
}
if (b == '"') {
if (!state.first_pass) string[string_length] = 0;
flags &= ~flag_string;
string = 0;
switch (top->type) {
case json_string:
top->u.string.length = string_length;
flags |= flag_next;
break;
case json_object:
if (state.first_pass) {
json_char **chars = (json_char **)&top->u.object.values;
chars[0] += string_length + 1;
} else {
top->u.object.values[top->u.object.length].name =
(json_char *)top->_reserved.object_mem;
top->u.object.values[top->u.object.length].name_length = string_length;
(*(json_char **)&top->_reserved.object_mem) += string_length + 1;
}
flags |= flag_seek_value | flag_need_colon;
continue;
default:
break;
};
} else {
string_add(b);
continue;
}
}
if (state.settings.settings & json_enable_comments) {
if (flags & (flag_line_comment | flag_block_comment)) {
if (flags & flag_line_comment) {
if (b == '\r' || b == '\n' || !b) {
flags &= ~flag_line_comment;
--state.ptr; /* so null can be reproc'd */
}
continue;
}
if (flags & flag_block_comment) {
if (!b) {
snprintf(error, json_error_max, "%u:%u: Unexpected EOF in block comment", line_and_col);
goto e_failed;
}
if (b == '*' && state.ptr < (end - 1) && state.ptr[1] == '/') {
flags &= ~flag_block_comment;
++state.ptr; /* skip closing sequence */
}
continue;
}
} else if (b == '/') {
if (!(flags & (flag_seek_value | flag_done)) && top->type != json_object) {
snprintf(error, json_error_max, "%u:%u: Comment not allowed here", line_and_col);
goto e_failed;
}
if (++state.ptr == end) {
snprintf(error, json_error_max, "%u:%u: EOF unexpected", line_and_col);
goto e_failed;
}
switch (b = *state.ptr) {
case '/':
flags |= flag_line_comment;
continue;
case '*':
flags |= flag_block_comment;
continue;
default:
snprintf(error, json_error_max, "%u:%u: Unexpected `%c` in comment opening sequence",
line_and_col, b);
goto e_failed;
};
}
}
if (flags & flag_done) {
if (!b) break;
switch (b) {
whitespace:
continue;
default:
snprintf(error, json_error_max, "%u:%u: Trailing garbage: `%c`", line_and_col, b);
goto e_failed;
};
}
if (flags & flag_seek_value) {
switch (b) {
whitespace:
continue;
case ']':
if (top && top->type == json_array)
flags = (flags & ~(flag_need_comma | flag_seek_value)) | flag_next;
else {
snprintf(error, json_error_max, "%u:%u: Unexpected `]`", line_and_col);
goto e_failed;
}
break;
default:
if (flags & flag_need_comma) {
if (b == ',') {
flags &= ~flag_need_comma;
continue;
} else {
snprintf(error, json_error_max, "%u:%u: Expected `,` before `%c`", line_and_col, b);
goto e_failed;
}
}
if (flags & flag_need_colon) {
if (b == ':') {
flags &= ~flag_need_colon;
continue;
} else {
snprintf(error, json_error_max, "%u:%u: Expected `:` before `%c`", line_and_col, b);
goto e_failed;
}
}
flags &= ~flag_seek_value;
switch (b) {
case '{':
if (!new_value(&state, &top, &root, &alloc, json_object)) goto e_alloc_failure;
continue;
case '[':
if (!new_value(&state, &top, &root, &alloc, json_array)) goto e_alloc_failure;
flags |= flag_seek_value;
continue;
case '"':
if (!new_value(&state, &top, &root, &alloc, json_string)) goto e_alloc_failure;
flags |= flag_string;
string = top->u.string.ptr;
string_length = 0;
continue;
case 't':
if ((end - state.ptr) <= 3 || *(++state.ptr) != 'r' || *(++state.ptr) != 'u' ||
*(++state.ptr) != 'e') {
goto e_unknown_value;
}
if (!new_value(&state, &top, &root, &alloc, json_boolean)) goto e_alloc_failure;
top->u.boolean = 1;
flags |= flag_next;
break;
case 'f':
if ((end - state.ptr) <= 4 || *(++state.ptr) != 'a' || *(++state.ptr) != 'l' ||
*(++state.ptr) != 's' || *(++state.ptr) != 'e') {
goto e_unknown_value;
}
if (!new_value(&state, &top, &root, &alloc, json_boolean)) goto e_alloc_failure;
flags |= flag_next;
break;
case 'n':
if ((end - state.ptr) <= 3 || *(++state.ptr) != 'u' || *(++state.ptr) != 'l' ||
*(++state.ptr) != 'l') {
goto e_unknown_value;
}
if (!new_value(&state, &top, &root, &alloc, json_null)) goto e_alloc_failure;
flags |= flag_next;
break;
default:
if (isdigit((unsigned char)b) || b == '-') {
if (!new_value(&state, &top, &root, &alloc, json_integer)) goto e_alloc_failure;
if (!state.first_pass) {
while (isdigit((unsigned char)b) || b == '+' || b == '-' || b == 'e' ||
b == 'E' || b == '.') {
if ((++state.ptr) == end) {
b = 0;
break;
}
b = *state.ptr;
}
flags |= flag_next | flag_reproc;
break;
}
flags &= ~(flag_num_negative | flag_num_e | flag_num_e_got_sign |
flag_num_e_negative | flag_num_zero);
num_digits = 0;
num_fraction = 0;
num_e = 0;
if (b != '-') {
flags |= flag_reproc;
break;
}
flags |= flag_num_negative;
continue;
} else {
snprintf(error, json_error_max, "%u:%u: Unexpected `%c` when seeking value",
line_and_col, b);
goto e_failed;
}
};
};
} else {
switch (top->type) {
case json_object:
switch (b) {
whitespace:
continue;
case '"':
if (flags & flag_need_comma) {
snprintf(error, json_error_max, "%u:%u: Expected `,` before `\"`", line_and_col);
goto e_failed;
}
flags |= flag_string;
string = (json_char *)top->_reserved.object_mem;
string_length = 0;
break;
case '}':
flags = (flags & ~flag_need_comma) | flag_next;
break;
case ',':
if (flags & flag_need_comma) {
flags &= ~flag_need_comma;
break;
} /* FALLTHRU */
default:
snprintf(error, json_error_max, "%u:%u: Unexpected `%c` in object", line_and_col, b);
goto e_failed;
};
break;
case json_integer:
case json_double:
if (isdigit((unsigned char)b)) {
++num_digits;
if (top->type == json_integer || flags & flag_num_e) {
if (!(flags & flag_num_e)) {
if (flags & flag_num_zero) {
snprintf(error, json_error_max, "%u:%u: Unexpected `0` before `%c`",
line_and_col, b);
goto e_failed;
}
if (num_digits == 1 && b == '0') flags |= flag_num_zero;
} else {
flags |= flag_num_e_got_sign;
num_e = (num_e * 10) + (b - '0');
continue;
}
if (would_overflow(top->u.integer, b)) {
json_int_t integer = top->u.integer;
--num_digits;
--state.ptr;
top->type = json_double;
top->u.dbl = (double)integer;
continue;
}
top->u.integer = (top->u.integer * 10) + (b - '0');
continue;
}
if (flags & flag_num_got_decimal)
num_fraction = (num_fraction * 10) + (b - '0');
else
top->u.dbl = (top->u.dbl * 10) + (b - '0');
continue;
}
if (b == '+' || b == '-') {
if ((flags & flag_num_e) && !(flags & flag_num_e_got_sign)) {
flags |= flag_num_e_got_sign;
if (b == '-') flags |= flag_num_e_negative;
continue;
}
} else if (b == '.' && top->type == json_integer) {
json_int_t integer = top->u.integer;
if (!num_digits) {
snprintf(error, json_error_max, "%u:%u: Expected digit before `.`", line_and_col);
goto e_failed;
}
top->type = json_double;
top->u.dbl = (double)integer;
flags |= flag_num_got_decimal;
num_digits = 0;
continue;
}
if (!(flags & flag_num_e)) {
if (top->type == json_double) {
if (!num_digits) {
snprintf(error, json_error_max, "%u:%u: Expected digit after `.`", line_and_col);
goto e_failed;
}
top->u.dbl += num_fraction / pow(10.0, num_digits);
}
if (b == 'e' || b == 'E') {
flags |= flag_num_e;
if (top->type == json_integer) {
json_int_t integer = top->u.integer;
top->type = json_double;
top->u.dbl = (double)integer;
}
num_digits = 0;
flags &= ~flag_num_zero;
continue;
}
} else {
if (!num_digits) {
snprintf(error, json_error_max, "%u:%u: Expected digit after `e`", line_and_col);
goto e_failed;
}
top->u.dbl *= pow(10.0, (flags & flag_num_e_negative ? -num_e : num_e));
}
if (flags & flag_num_negative) {
if (top->type == json_integer)
top->u.integer = -top->u.integer;
else
top->u.dbl = -top->u.dbl;
}
flags |= flag_next | flag_reproc;
break;
default:
break;
};
}
if (flags & flag_reproc) {
flags &= ~flag_reproc;
--state.ptr;
}
if (flags & flag_next) {
flags = (flags & ~flag_next) | flag_need_comma;
if (!top->parent) {
/* root value done */
flags |= flag_done;
continue;
}
if (top->parent->type == json_array) flags |= flag_seek_value;
if (!state.first_pass) {
json_value *parent = top->parent;
switch (parent->type) {
case json_object:
parent->u.object.values[parent->u.object.length].value = top;
break;
case json_array:
parent->u.array.values[parent->u.array.length] = top;
break;
default:
break;
};
}
if ((++top->parent->u.array.length) > UINT_MAX - 8) goto e_overflow;
top = top->parent;
continue;
}
}
alloc = root;
}
return root;
e_unknown_value:
snprintf(error, json_error_max, "%u:%u: Unknown value", line_and_col);
goto e_failed;
e_alloc_failure:
snprintf(error, json_error_max, "Memory allocation failure");
goto e_failed;
e_overflow:
snprintf(error, json_error_max, "%u:%u: Too long (caught overflow)", line_and_col);
goto e_failed;
e_failed:
if (error_buf) {
if (*error)
memcpy(error_buf, error, json_error_max);
else
snprintf(error_buf, json_error_max, "Unknown error");
}
if (state.first_pass) alloc = root;
while (alloc) {
top = alloc->_reserved.next_alloc;
free(alloc);
alloc = top;
}
if (!state.first_pass) json_value_free(root);
return 0;
}
json_value *json_parse(const json_char *json, size_t length) {
json_settings settings = {0};
return json_parse_ex(&settings, json, length, 0);
}
void json_value_free(json_value *value) {
json_value *cur_value;
if (!value) return;
value->parent = 0;
while (value) {
switch (value->type) {
case json_array:
if (!value->u.array.length) {
free(value->u.array.values);
break;
}
value = value->u.array.values[--value->u.array.length];
continue;
case json_object:
if (!value->u.object.length) {
free(value->u.object.values);
break;
}
value = value->u.object.values[--value->u.object.length].value;
continue;
case json_string:
free(value->u.string.ptr);
break;
default:
break;
};
cur_value = value;
value = value->parent;
free(cur_value);
}
}