Merge remote-tracking branch 'remotes/agraf/tags/signed-s390-for-upstream' into staging
[qemu.git] / qobject / json-parser.c
blob717cb8fde7e9dcd5aecb16a38a36cdd88c4cc541
1 /*
2 * JSON Parser
4 * Copyright IBM, Corp. 2009
6 * Authors:
7 * Anthony Liguori <aliguori@us.ibm.com>
9 * This work is licensed under the terms of the GNU LGPL, version 2.1 or later.
10 * See the COPYING.LIB file in the top-level directory.
14 #include <stdarg.h>
16 #include "qemu-common.h"
17 #include "qapi/qmp/qstring.h"
18 #include "qapi/qmp/qint.h"
19 #include "qapi/qmp/qdict.h"
20 #include "qapi/qmp/qlist.h"
21 #include "qapi/qmp/qfloat.h"
22 #include "qapi/qmp/qbool.h"
23 #include "qapi/qmp/json-parser.h"
24 #include "qapi/qmp/json-lexer.h"
25 #include "qapi/qmp/qerror.h"
27 typedef struct JSONParserContext
29 Error *err;
30 struct {
31 QObject **buf;
32 size_t pos;
33 size_t count;
34 } tokens;
35 } JSONParserContext;
37 #define BUG_ON(cond) assert(!(cond))
39 /**
40 * TODO
42 * 0) make errors meaningful again
43 * 1) add geometry information to tokens
44 * 3) should we return a parsed size?
45 * 4) deal with premature EOI
48 static QObject *parse_value(JSONParserContext *ctxt, va_list *ap);
50 /**
51 * Token manipulators
53 * tokens are dictionaries that contain a type, a string value, and geometry information
54 * about a token identified by the lexer. These are routines that make working with
55 * these objects a bit easier.
57 static const char *token_get_value(QObject *obj)
59 return qdict_get_str(qobject_to_qdict(obj), "token");
62 static JSONTokenType token_get_type(QObject *obj)
64 return qdict_get_int(qobject_to_qdict(obj), "type");
67 static int token_is_operator(QObject *obj, char op)
69 const char *val;
71 if (token_get_type(obj) != JSON_OPERATOR) {
72 return 0;
75 val = token_get_value(obj);
77 return (val[0] == op) && (val[1] == 0);
80 static int token_is_keyword(QObject *obj, const char *value)
82 if (token_get_type(obj) != JSON_KEYWORD) {
83 return 0;
86 return strcmp(token_get_value(obj), value) == 0;
89 static int token_is_escape(QObject *obj, const char *value)
91 if (token_get_type(obj) != JSON_ESCAPE) {
92 return 0;
95 return (strcmp(token_get_value(obj), value) == 0);
98 /**
99 * Error handler
101 static void GCC_FMT_ATTR(3, 4) parse_error(JSONParserContext *ctxt,
102 QObject *token, const char *msg, ...)
104 va_list ap;
105 char message[1024];
106 va_start(ap, msg);
107 vsnprintf(message, sizeof(message), msg, ap);
108 va_end(ap);
109 if (ctxt->err) {
110 error_free(ctxt->err);
111 ctxt->err = NULL;
113 error_setg(&ctxt->err, "JSON parse error, %s", message);
117 * String helpers
119 * These helpers are used to unescape strings.
121 static void wchar_to_utf8(uint16_t wchar, char *buffer, size_t buffer_length)
123 if (wchar <= 0x007F) {
124 BUG_ON(buffer_length < 2);
126 buffer[0] = wchar & 0x7F;
127 buffer[1] = 0;
128 } else if (wchar <= 0x07FF) {
129 BUG_ON(buffer_length < 3);
131 buffer[0] = 0xC0 | ((wchar >> 6) & 0x1F);
132 buffer[1] = 0x80 | (wchar & 0x3F);
133 buffer[2] = 0;
134 } else {
135 BUG_ON(buffer_length < 4);
137 buffer[0] = 0xE0 | ((wchar >> 12) & 0x0F);
138 buffer[1] = 0x80 | ((wchar >> 6) & 0x3F);
139 buffer[2] = 0x80 | (wchar & 0x3F);
140 buffer[3] = 0;
144 static int hex2decimal(char ch)
146 if (ch >= '0' && ch <= '9') {
147 return (ch - '0');
148 } else if (ch >= 'a' && ch <= 'f') {
149 return 10 + (ch - 'a');
150 } else if (ch >= 'A' && ch <= 'F') {
151 return 10 + (ch - 'A');
154 return -1;
158 * parse_string(): Parse a json string and return a QObject
160 * string
161 * ""
162 * " chars "
163 * chars
164 * char
165 * char chars
166 * char
167 * any-Unicode-character-
168 * except-"-or-\-or-
169 * control-character
170 * \"
171 * \\
172 * \/
173 * \b
174 * \f
175 * \n
176 * \r
177 * \t
178 * \u four-hex-digits
180 static QString *qstring_from_escaped_str(JSONParserContext *ctxt, QObject *token)
182 const char *ptr = token_get_value(token);
183 QString *str;
184 int double_quote = 1;
186 if (*ptr == '"') {
187 double_quote = 1;
188 } else {
189 double_quote = 0;
191 ptr++;
193 str = qstring_new();
194 while (*ptr &&
195 ((double_quote && *ptr != '"') || (!double_quote && *ptr != '\''))) {
196 if (*ptr == '\\') {
197 ptr++;
199 switch (*ptr) {
200 case '"':
201 qstring_append(str, "\"");
202 ptr++;
203 break;
204 case '\'':
205 qstring_append(str, "'");
206 ptr++;
207 break;
208 case '\\':
209 qstring_append(str, "\\");
210 ptr++;
211 break;
212 case '/':
213 qstring_append(str, "/");
214 ptr++;
215 break;
216 case 'b':
217 qstring_append(str, "\b");
218 ptr++;
219 break;
220 case 'f':
221 qstring_append(str, "\f");
222 ptr++;
223 break;
224 case 'n':
225 qstring_append(str, "\n");
226 ptr++;
227 break;
228 case 'r':
229 qstring_append(str, "\r");
230 ptr++;
231 break;
232 case 't':
233 qstring_append(str, "\t");
234 ptr++;
235 break;
236 case 'u': {
237 uint16_t unicode_char = 0;
238 char utf8_char[4];
239 int i = 0;
241 ptr++;
243 for (i = 0; i < 4; i++) {
244 if (qemu_isxdigit(*ptr)) {
245 unicode_char |= hex2decimal(*ptr) << ((3 - i) * 4);
246 } else {
247 parse_error(ctxt, token,
248 "invalid hex escape sequence in string");
249 goto out;
251 ptr++;
254 wchar_to_utf8(unicode_char, utf8_char, sizeof(utf8_char));
255 qstring_append(str, utf8_char);
256 } break;
257 default:
258 parse_error(ctxt, token, "invalid escape sequence in string");
259 goto out;
261 } else {
262 char dummy[2];
264 dummy[0] = *ptr++;
265 dummy[1] = 0;
267 qstring_append(str, dummy);
271 return str;
273 out:
274 QDECREF(str);
275 return NULL;
278 static QObject *parser_context_pop_token(JSONParserContext *ctxt)
280 QObject *token;
281 g_assert(ctxt->tokens.pos < ctxt->tokens.count);
282 token = ctxt->tokens.buf[ctxt->tokens.pos];
283 ctxt->tokens.pos++;
284 return token;
287 /* Note: parser_context_{peek|pop}_token do not increment the
288 * token object's refcount. In both cases the references will continue
289 * to be tracked and cleaned up in parser_context_free(), so do not
290 * attempt to free the token object.
292 static QObject *parser_context_peek_token(JSONParserContext *ctxt)
294 QObject *token;
295 g_assert(ctxt->tokens.pos < ctxt->tokens.count);
296 token = ctxt->tokens.buf[ctxt->tokens.pos];
297 return token;
300 static JSONParserContext parser_context_save(JSONParserContext *ctxt)
302 JSONParserContext saved_ctxt = {0};
303 saved_ctxt.tokens.pos = ctxt->tokens.pos;
304 saved_ctxt.tokens.count = ctxt->tokens.count;
305 saved_ctxt.tokens.buf = ctxt->tokens.buf;
306 return saved_ctxt;
309 static void parser_context_restore(JSONParserContext *ctxt,
310 JSONParserContext saved_ctxt)
312 ctxt->tokens.pos = saved_ctxt.tokens.pos;
313 ctxt->tokens.count = saved_ctxt.tokens.count;
314 ctxt->tokens.buf = saved_ctxt.tokens.buf;
317 static void tokens_append_from_iter(QObject *obj, void *opaque)
319 JSONParserContext *ctxt = opaque;
320 g_assert(ctxt->tokens.pos < ctxt->tokens.count);
321 ctxt->tokens.buf[ctxt->tokens.pos++] = obj;
322 qobject_incref(obj);
325 static JSONParserContext *parser_context_new(QList *tokens)
327 JSONParserContext *ctxt;
328 size_t count;
330 if (!tokens) {
331 return NULL;
334 count = qlist_size(tokens);
335 if (count == 0) {
336 return NULL;
339 ctxt = g_malloc0(sizeof(JSONParserContext));
340 ctxt->tokens.pos = 0;
341 ctxt->tokens.count = count;
342 ctxt->tokens.buf = g_malloc(count * sizeof(QObject *));
343 qlist_iter(tokens, tokens_append_from_iter, ctxt);
344 ctxt->tokens.pos = 0;
346 return ctxt;
349 /* to support error propagation, ctxt->err must be freed separately */
350 static void parser_context_free(JSONParserContext *ctxt)
352 int i;
353 if (ctxt) {
354 for (i = 0; i < ctxt->tokens.count; i++) {
355 qobject_decref(ctxt->tokens.buf[i]);
357 g_free(ctxt->tokens.buf);
358 g_free(ctxt);
363 * Parsing rules
365 static int parse_pair(JSONParserContext *ctxt, QDict *dict, va_list *ap)
367 QObject *key = NULL, *token = NULL, *value, *peek;
368 JSONParserContext saved_ctxt = parser_context_save(ctxt);
370 peek = parser_context_peek_token(ctxt);
371 if (peek == NULL) {
372 parse_error(ctxt, NULL, "premature EOI");
373 goto out;
376 key = parse_value(ctxt, ap);
377 if (!key || qobject_type(key) != QTYPE_QSTRING) {
378 parse_error(ctxt, peek, "key is not a string in object");
379 goto out;
382 token = parser_context_pop_token(ctxt);
383 if (token == NULL) {
384 parse_error(ctxt, NULL, "premature EOI");
385 goto out;
388 if (!token_is_operator(token, ':')) {
389 parse_error(ctxt, token, "missing : in object pair");
390 goto out;
393 value = parse_value(ctxt, ap);
394 if (value == NULL) {
395 parse_error(ctxt, token, "Missing value in dict");
396 goto out;
399 qdict_put_obj(dict, qstring_get_str(qobject_to_qstring(key)), value);
401 qobject_decref(key);
403 return 0;
405 out:
406 parser_context_restore(ctxt, saved_ctxt);
407 qobject_decref(key);
409 return -1;
412 static QObject *parse_object(JSONParserContext *ctxt, va_list *ap)
414 QDict *dict = NULL;
415 QObject *token, *peek;
416 JSONParserContext saved_ctxt = parser_context_save(ctxt);
418 token = parser_context_pop_token(ctxt);
419 if (token == NULL) {
420 goto out;
423 if (!token_is_operator(token, '{')) {
424 goto out;
427 dict = qdict_new();
429 peek = parser_context_peek_token(ctxt);
430 if (peek == NULL) {
431 parse_error(ctxt, NULL, "premature EOI");
432 goto out;
435 if (!token_is_operator(peek, '}')) {
436 if (parse_pair(ctxt, dict, ap) == -1) {
437 goto out;
440 token = parser_context_pop_token(ctxt);
441 if (token == NULL) {
442 parse_error(ctxt, NULL, "premature EOI");
443 goto out;
446 while (!token_is_operator(token, '}')) {
447 if (!token_is_operator(token, ',')) {
448 parse_error(ctxt, token, "expected separator in dict");
449 goto out;
452 if (parse_pair(ctxt, dict, ap) == -1) {
453 goto out;
456 token = parser_context_pop_token(ctxt);
457 if (token == NULL) {
458 parse_error(ctxt, NULL, "premature EOI");
459 goto out;
462 } else {
463 (void)parser_context_pop_token(ctxt);
466 return QOBJECT(dict);
468 out:
469 parser_context_restore(ctxt, saved_ctxt);
470 QDECREF(dict);
471 return NULL;
474 static QObject *parse_array(JSONParserContext *ctxt, va_list *ap)
476 QList *list = NULL;
477 QObject *token, *peek;
478 JSONParserContext saved_ctxt = parser_context_save(ctxt);
480 token = parser_context_pop_token(ctxt);
481 if (token == NULL) {
482 goto out;
485 if (!token_is_operator(token, '[')) {
486 goto out;
489 list = qlist_new();
491 peek = parser_context_peek_token(ctxt);
492 if (peek == NULL) {
493 parse_error(ctxt, NULL, "premature EOI");
494 goto out;
497 if (!token_is_operator(peek, ']')) {
498 QObject *obj;
500 obj = parse_value(ctxt, ap);
501 if (obj == NULL) {
502 parse_error(ctxt, token, "expecting value");
503 goto out;
506 qlist_append_obj(list, obj);
508 token = parser_context_pop_token(ctxt);
509 if (token == NULL) {
510 parse_error(ctxt, NULL, "premature EOI");
511 goto out;
514 while (!token_is_operator(token, ']')) {
515 if (!token_is_operator(token, ',')) {
516 parse_error(ctxt, token, "expected separator in list");
517 goto out;
520 obj = parse_value(ctxt, ap);
521 if (obj == NULL) {
522 parse_error(ctxt, token, "expecting value");
523 goto out;
526 qlist_append_obj(list, obj);
528 token = parser_context_pop_token(ctxt);
529 if (token == NULL) {
530 parse_error(ctxt, NULL, "premature EOI");
531 goto out;
534 } else {
535 (void)parser_context_pop_token(ctxt);
538 return QOBJECT(list);
540 out:
541 parser_context_restore(ctxt, saved_ctxt);
542 QDECREF(list);
543 return NULL;
546 static QObject *parse_keyword(JSONParserContext *ctxt)
548 QObject *token, *ret;
549 JSONParserContext saved_ctxt = parser_context_save(ctxt);
551 token = parser_context_pop_token(ctxt);
552 if (token == NULL) {
553 goto out;
556 if (token_get_type(token) != JSON_KEYWORD) {
557 goto out;
560 if (token_is_keyword(token, "true")) {
561 ret = QOBJECT(qbool_from_int(true));
562 } else if (token_is_keyword(token, "false")) {
563 ret = QOBJECT(qbool_from_int(false));
564 } else if (token_is_keyword(token, "null")) {
565 ret = qnull();
566 } else {
567 parse_error(ctxt, token, "invalid keyword `%s'", token_get_value(token));
568 goto out;
571 return ret;
573 out:
574 parser_context_restore(ctxt, saved_ctxt);
576 return NULL;
579 static QObject *parse_escape(JSONParserContext *ctxt, va_list *ap)
581 QObject *token = NULL, *obj;
582 JSONParserContext saved_ctxt = parser_context_save(ctxt);
584 if (ap == NULL) {
585 goto out;
588 token = parser_context_pop_token(ctxt);
589 if (token == NULL) {
590 goto out;
593 if (token_is_escape(token, "%p")) {
594 obj = va_arg(*ap, QObject *);
595 } else if (token_is_escape(token, "%i")) {
596 obj = QOBJECT(qbool_from_int(va_arg(*ap, int)));
597 } else if (token_is_escape(token, "%d")) {
598 obj = QOBJECT(qint_from_int(va_arg(*ap, int)));
599 } else if (token_is_escape(token, "%ld")) {
600 obj = QOBJECT(qint_from_int(va_arg(*ap, long)));
601 } else if (token_is_escape(token, "%lld") ||
602 token_is_escape(token, "%I64d")) {
603 obj = QOBJECT(qint_from_int(va_arg(*ap, long long)));
604 } else if (token_is_escape(token, "%s")) {
605 obj = QOBJECT(qstring_from_str(va_arg(*ap, const char *)));
606 } else if (token_is_escape(token, "%f")) {
607 obj = QOBJECT(qfloat_from_double(va_arg(*ap, double)));
608 } else {
609 goto out;
612 return obj;
614 out:
615 parser_context_restore(ctxt, saved_ctxt);
617 return NULL;
620 static QObject *parse_literal(JSONParserContext *ctxt)
622 QObject *token, *obj;
623 JSONParserContext saved_ctxt = parser_context_save(ctxt);
625 token = parser_context_pop_token(ctxt);
626 if (token == NULL) {
627 goto out;
630 switch (token_get_type(token)) {
631 case JSON_STRING:
632 obj = QOBJECT(qstring_from_escaped_str(ctxt, token));
633 break;
634 case JSON_INTEGER: {
635 /* A possibility exists that this is a whole-valued float where the
636 * fractional part was left out due to being 0 (.0). It's not a big
637 * deal to treat these as ints in the parser, so long as users of the
638 * resulting QObject know to expect a QInt in place of a QFloat in
639 * cases like these.
641 * However, in some cases these values will overflow/underflow a
642 * QInt/int64 container, thus we should assume these are to be handled
643 * as QFloats/doubles rather than silently changing their values.
645 * strtoll() indicates these instances by setting errno to ERANGE
647 int64_t value;
649 errno = 0; /* strtoll doesn't set errno on success */
650 value = strtoll(token_get_value(token), NULL, 10);
651 if (errno != ERANGE) {
652 obj = QOBJECT(qint_from_int(value));
653 break;
655 /* fall through to JSON_FLOAT */
657 case JSON_FLOAT:
658 /* FIXME dependent on locale */
659 obj = QOBJECT(qfloat_from_double(strtod(token_get_value(token), NULL)));
660 break;
661 default:
662 goto out;
665 return obj;
667 out:
668 parser_context_restore(ctxt, saved_ctxt);
670 return NULL;
673 static QObject *parse_value(JSONParserContext *ctxt, va_list *ap)
675 QObject *obj;
677 obj = parse_object(ctxt, ap);
678 if (obj == NULL) {
679 obj = parse_array(ctxt, ap);
681 if (obj == NULL) {
682 obj = parse_escape(ctxt, ap);
684 if (obj == NULL) {
685 obj = parse_keyword(ctxt);
687 if (obj == NULL) {
688 obj = parse_literal(ctxt);
691 return obj;
694 QObject *json_parser_parse(QList *tokens, va_list *ap)
696 return json_parser_parse_err(tokens, ap, NULL);
699 QObject *json_parser_parse_err(QList *tokens, va_list *ap, Error **errp)
701 JSONParserContext *ctxt = parser_context_new(tokens);
702 QObject *result;
704 if (!ctxt) {
705 return NULL;
708 result = parse_value(ctxt, ap);
710 error_propagate(errp, ctxt->err);
712 parser_context_free(ctxt);
714 return result;