4 * Copyright IBM, Corp. 2009
7 * Anthony Liguori <aliguori@us.ibm.com>
9 * This work is licensed under the terms of the GNU LGPL, version 2.1 or later.
10 * See the COPYING.LIB file in the top-level directory.
14 #include "qemu/osdep.h"
15 #include "qemu/cutils.h"
16 #include "qapi/error.h"
17 #include "qemu-common.h"
18 #include "qapi/qmp/qbool.h"
19 #include "qapi/qmp/qdict.h"
20 #include "qapi/qmp/qlist.h"
21 #include "qapi/qmp/qnull.h"
22 #include "qapi/qmp/qnum.h"
23 #include "qapi/qmp/qstring.h"
24 #include "qapi/qmp/json-parser.h"
25 #include "qapi/qmp/json-lexer.h"
26 #include "qapi/qmp/json-streamer.h"
28 typedef struct JSONParserContext
/* Abort (via assert) when @cond holds; used for internal invariants. */
#define BUG_ON(cond) assert(!(cond))
40 * 0) make errors meaningful again
41 * 1) add geometry information to tokens
42 * 3) should we return a parsed size?
43 * 4) deal with premature EOI
46 static QObject
*parse_value(JSONParserContext
*ctxt
, va_list *ap
);
51 static void GCC_FMT_ATTR(3, 4) parse_error(JSONParserContext
*ctxt
,
52 JSONToken
*token
, const char *msg
, ...)
57 vsnprintf(message
, sizeof(message
), msg
, ap
);
60 error_free(ctxt
->err
);
63 error_setg(&ctxt
->err
, "JSON parse error, %s", message
);
69 * These helpers are used to unescape strings.
/*
 * Encode the 16-bit code unit @wchar as a NUL-terminated UTF-8 sequence.
 *
 * @wchar:         value to encode
 * @buffer:        destination; receives one to three encoded bytes plus
 *                 a terminating NUL
 * @buffer_length: size of @buffer in bytes; must be at least 2, 3 or 4
 *                 depending on the encoded length (checked by assertion)
 *
 * NOTE(review): values in the surrogate range are encoded like any other
 * three-byte value, and 0 produces an empty string.
 */
static void wchar_to_utf8(uint16_t wchar, char *buffer, size_t buffer_length)
{
    if (wchar <= 0x007F) {
        /* one byte: 0xxxxxxx */
        assert(buffer_length >= 2);

        buffer[0] = wchar & 0x7F;
        buffer[1] = 0;
    } else if (wchar <= 0x07FF) {
        /* two bytes: 110xxxxx 10xxxxxx */
        assert(buffer_length >= 3);

        buffer[0] = 0xC0 | ((wchar >> 6) & 0x1F);
        buffer[1] = 0x80 | (wchar & 0x3F);
        buffer[2] = 0;
    } else {
        /* three bytes: 1110xxxx 10xxxxxx 10xxxxxx */
        assert(buffer_length >= 4);

        buffer[0] = 0xE0 | ((wchar >> 12) & 0x0F);
        buffer[1] = 0x80 | ((wchar >> 6) & 0x3F);
        buffer[2] = 0x80 | (wchar & 0x3F);
        buffer[3] = 0;
    }
}
/*
 * Convert one hexadecimal digit to its numeric value.
 *
 * @ch: character to convert; '0'-'9', 'a'-'f' and 'A'-'F' are accepted
 *
 * Returns the value 0..15, or -1 when @ch is not a hexadecimal digit.
 */
static int hex2decimal(char ch)
{
    if (ch >= '0' && ch <= '9') {
        return ch - '0';
    }
    if (ch >= 'a' && ch <= 'f') {
        return 10 + (ch - 'a');
    }
    if (ch >= 'A' && ch <= 'F') {
        return 10 + (ch - 'A');
    }

    return -1;
}
108 * qstring_from_escaped_str(): Parse a JSON string token and return a QString
117 * any-Unicode-character-
/*
 * qstring_from_escaped_str(): build a QString from the text of a string
 * token (token->str), unescaping it on the way.
 *
 * What the visible code shows:
 *  - scanning continues until the closing quote is reached: '"' when
 *    double_quote is set, '\'' otherwise;
 *  - the simple escapes append one of: double quote, single quote,
 *    backslash, slash, backspace, form feed, newline, carriage return
 *    or tab;
 *  - the unicode escape reads four hexadecimal digits, most significant
 *    first, into a 16-bit value with hex2decimal(), converts it with
 *    wchar_to_utf8() and appends the resulting string; a character that
 *    is not a hex digit reports "invalid hex escape sequence in string";
 *  - an unrecognised escape reports "invalid escape sequence in string";
 *  - any other character is appended through the `dummy` buffer.
 *
 * NOTE(review): this listing omits lines of the function (the second
 * parameter, the case labels, the pointer advances and the error exit),
 * so which escape letter maps to which appended string, and how the
 * partially built string is released on error, cannot be confirmed here.
 * NOTE(review): a unicode escape with value 0 makes wchar_to_utf8()
 * produce an empty string, so presumably nothing is appended for it;
 * confirm whether that is intended.
 */
130 static QString
*qstring_from_escaped_str(JSONParserContext
*ctxt
,
133 const char *ptr
= token
->str
;
135 int double_quote
= 1;
146 ((double_quote
&& *ptr
!= '"') || (!double_quote
&& *ptr
!= '\''))) {
152 qstring_append(str
, "\"");
156 qstring_append(str
, "'");
160 qstring_append(str
, "\\");
164 qstring_append(str
, "/");
168 qstring_append(str
, "\b");
172 qstring_append(str
, "\f");
176 qstring_append(str
, "\n");
180 qstring_append(str
, "\r");
184 qstring_append(str
, "\t");
188 uint16_t unicode_char
= 0;
194 for (i
= 0; i
< 4; i
++) {
195 if (qemu_isxdigit(*ptr
)) {
196 unicode_char
|= hex2decimal(*ptr
) << ((3 - i
) * 4);
198 parse_error(ctxt
, token
,
199 "invalid hex escape sequence in string");
205 wchar_to_utf8(unicode_char
, utf8_char
, sizeof(utf8_char
));
206 qstring_append(str
, utf8_char
);
209 parse_error(ctxt
, token
, "invalid escape sequence in string");
218 qstring_append(str
, dummy
);
229 /* Note: the token object returned by parser_context_peek_token or
230 * parser_context_pop_token is deleted as soon as parser_context_pop_token
233 static JSONToken
*parser_context_pop_token(JSONParserContext
*ctxt
)
235 g_free(ctxt
->current
);
236 assert(!g_queue_is_empty(ctxt
->buf
));
237 ctxt
->current
= g_queue_pop_head(ctxt
->buf
);
238 return ctxt
->current
;
241 static JSONToken
*parser_context_peek_token(JSONParserContext
*ctxt
)
243 assert(!g_queue_is_empty(ctxt
->buf
));
244 return g_queue_peek_head(ctxt
->buf
);
247 static JSONParserContext
*parser_context_new(GQueue
*tokens
)
249 JSONParserContext
*ctxt
;
255 ctxt
= g_malloc0(sizeof(JSONParserContext
));
261 /* to support error propagation, ctxt->err must be freed separately */
262 static void parser_context_free(JSONParserContext
*ctxt
)
265 while (!g_queue_is_empty(ctxt
->buf
)) {
266 parser_context_pop_token(ctxt
);
268 g_free(ctxt
->current
);
269 g_queue_free(ctxt
->buf
);
/*
 * parse_pair(): parse one "key : value" member and store it in @dict.
 *
 * The key is produced by parse_value() and must convert to a QString;
 * it must be followed by a JSON_COLON token and then by a value, which
 * is stored under the key with qdict_put_obj().  Failures are reported
 * through parse_error(); the callers in this file treat a return value
 * of -1 as failure.
 *
 * NOTE(review): this listing omits lines of the function (local
 * declarations, the conditions guarding each parse_error() call, the
 * return statements and the cleanup path).
 * NOTE(review): when parse_value() yields an object that is not a
 * QString, no visible variable still refers to that object; possible
 * leak, confirm against the cleanup code that is not shown.
 * NOTE(review): `peek` and `token` are handed to parse_error() after
 * parse_value() may have popped further tokens; this is harmless only
 * as long as parse_error() does not dereference its token argument.
 */
277 static int parse_pair(JSONParserContext
*ctxt
, QDict
*dict
, va_list *ap
)
281 JSONToken
*peek
, *token
;
283 peek
= parser_context_peek_token(ctxt
);
285 parse_error(ctxt
, NULL
, "premature EOI");
289 key
= qobject_to(QString
, parse_value(ctxt
, ap
));
291 parse_error(ctxt
, peek
, "key is not a string in object");
295 token
= parser_context_pop_token(ctxt
);
297 parse_error(ctxt
, NULL
, "premature EOI");
301 if (token
->type
!= JSON_COLON
) {
302 parse_error(ctxt
, token
, "missing : in object pair");
306 value
= parse_value(ctxt
, ap
);
308 parse_error(ctxt
, token
, "Missing value in dict");
312 qdict_put_obj(dict
, qstring_get_str(key
), value
);
/*
 * parse_object(): parse a JSON object into a dictionary.
 *
 * The opening JSON_LCURLY token is consumed first (asserted).  Unless
 * the next token is JSON_RCURLY, members are read with parse_pair();
 * after each member the next token must be JSON_COMMA to continue or
 * JSON_RCURLY to finish, otherwise "expected separator in dict" is
 * reported.  On success the dictionary is returned as a QObject.
 *
 * NOTE(review): this listing omits lines of the function (creation of
 * `dict`, the conditions guarding the "premature EOI" reports, the
 * branch that presumably pops the closing brace of an empty object, and
 * the error exit), so the failure return value and cleanup are not
 * visible here.
 * NOTE(review): parser_context_pop_token() and
 * parser_context_peek_token() assert that the queue is not empty, so
 * the "premature EOI" reports look unreachable unless a NULL token can
 * be queued; confirm against the token producer.
 */
324 static QObject
*parse_object(JSONParserContext
*ctxt
, va_list *ap
)
327 JSONToken
*token
, *peek
;
329 token
= parser_context_pop_token(ctxt
);
330 assert(token
&& token
->type
== JSON_LCURLY
);
334 peek
= parser_context_peek_token(ctxt
);
336 parse_error(ctxt
, NULL
, "premature EOI");
340 if (peek
->type
!= JSON_RCURLY
) {
341 if (parse_pair(ctxt
, dict
, ap
) == -1) {
345 token
= parser_context_pop_token(ctxt
);
347 parse_error(ctxt
, NULL
, "premature EOI");
351 while (token
->type
!= JSON_RCURLY
) {
352 if (token
->type
!= JSON_COMMA
) {
353 parse_error(ctxt
, token
, "expected separator in dict");
357 if (parse_pair(ctxt
, dict
, ap
) == -1) {
361 token
= parser_context_pop_token(ctxt
);
363 parse_error(ctxt
, NULL
, "premature EOI");
368 (void)parser_context_pop_token(ctxt
);
371 return QOBJECT(dict
);
/*
 * parse_array(): parse a JSON array into a list.
 *
 * The opening JSON_LSQUARE token is consumed first (asserted).  Unless
 * the next token is JSON_RSQUARE, elements are read with parse_value()
 * and appended with qlist_append_obj(); after each element the next
 * token must be JSON_COMMA to continue or JSON_RSQUARE to finish,
 * otherwise "expected separator in list" is reported.  A missing
 * element is reported as "expecting value".  On success the list is
 * returned as a QObject.
 *
 * NOTE(review): this listing omits lines of the function (creation of
 * `list`, the declaration of `obj`, the conditions guarding the error
 * reports, the branch that presumably pops the closing bracket of an
 * empty array, and the error exit), so the failure return value and
 * cleanup are not visible here.
 * NOTE(review): `token` is handed to parse_error() after parse_value()
 * may have popped further tokens; this is harmless only as long as
 * parse_error() does not dereference its token argument.
 */
378 static QObject
*parse_array(JSONParserContext
*ctxt
, va_list *ap
)
381 JSONToken
*token
, *peek
;
383 token
= parser_context_pop_token(ctxt
);
384 assert(token
&& token
->type
== JSON_LSQUARE
);
388 peek
= parser_context_peek_token(ctxt
);
390 parse_error(ctxt
, NULL
, "premature EOI");
394 if (peek
->type
!= JSON_RSQUARE
) {
397 obj
= parse_value(ctxt
, ap
);
399 parse_error(ctxt
, token
, "expecting value");
403 qlist_append_obj(list
, obj
);
405 token
= parser_context_pop_token(ctxt
);
407 parse_error(ctxt
, NULL
, "premature EOI");
411 while (token
->type
!= JSON_RSQUARE
) {
412 if (token
->type
!= JSON_COMMA
) {
413 parse_error(ctxt
, token
, "expected separator in list");
417 obj
= parse_value(ctxt
, ap
);
419 parse_error(ctxt
, token
, "expecting value");
423 qlist_append_obj(list
, obj
);
425 token
= parser_context_pop_token(ctxt
);
427 parse_error(ctxt
, NULL
, "premature EOI");
432 (void)parser_context_pop_token(ctxt
);
435 return QOBJECT(list
);
442 static QObject
*parse_keyword(JSONParserContext
*ctxt
)
446 token
= parser_context_pop_token(ctxt
);
447 assert(token
&& token
->type
== JSON_KEYWORD
);
449 if (!strcmp(token
->str
, "true")) {
450 return QOBJECT(qbool_from_bool(true));
451 } else if (!strcmp(token
->str
, "false")) {
452 return QOBJECT(qbool_from_bool(false));
453 } else if (!strcmp(token
->str
, "null")) {
454 return QOBJECT(qnull());
456 parse_error(ctxt
, token
, "invalid keyword '%s'", token
->str
);
460 static QObject
*parse_escape(JSONParserContext
*ctxt
, va_list *ap
)
468 token
= parser_context_pop_token(ctxt
);
469 assert(token
&& token
->type
== JSON_ESCAPE
);
471 if (!strcmp(token
->str
, "%p")) {
472 return va_arg(*ap
, QObject
*);
473 } else if (!strcmp(token
->str
, "%i")) {
474 return QOBJECT(qbool_from_bool(va_arg(*ap
, int)));
475 } else if (!strcmp(token
->str
, "%d")) {
476 return QOBJECT(qnum_from_int(va_arg(*ap
, int)));
477 } else if (!strcmp(token
->str
, "%ld")) {
478 return QOBJECT(qnum_from_int(va_arg(*ap
, long)));
479 } else if (!strcmp(token
->str
, "%lld") ||
480 !strcmp(token
->str
, "%I64d")) {
481 return QOBJECT(qnum_from_int(va_arg(*ap
, long long)));
482 } else if (!strcmp(token
->str
, "%u")) {
483 return QOBJECT(qnum_from_uint(va_arg(*ap
, unsigned int)));
484 } else if (!strcmp(token
->str
, "%lu")) {
485 return QOBJECT(qnum_from_uint(va_arg(*ap
, unsigned long)));
486 } else if (!strcmp(token
->str
, "%llu") ||
487 !strcmp(token
->str
, "%I64u")) {
488 return QOBJECT(qnum_from_uint(va_arg(*ap
, unsigned long long)));
489 } else if (!strcmp(token
->str
, "%s")) {
490 return QOBJECT(qstring_from_str(va_arg(*ap
, const char *)));
491 } else if (!strcmp(token
->str
, "%f")) {
492 return QOBJECT(qnum_from_double(va_arg(*ap
, double)));
497 static QObject
*parse_literal(JSONParserContext
*ctxt
)
501 token
= parser_context_pop_token(ctxt
);
504 switch (token
->type
) {
506 return QOBJECT(qstring_from_escaped_str(ctxt
, token
));
509 * Represent JSON_INTEGER as QNUM_I64 if possible, else as
510 * QNUM_U64, else as QNUM_DOUBLE. Note that qemu_strtoi64()
511 * and qemu_strtou64() fail with ERANGE when it's not
514 * qnum_get_int() will then work for any signed 64-bit
515 * JSON_INTEGER, qnum_get_uint() for any unsigned 64-bit
516 * integer, and qnum_get_double() both for any JSON_INTEGER
517 * and any JSON_FLOAT (with precision loss for integers beyond
524 ret
= qemu_strtoi64(token
->str
, NULL
, 10, &value
);
526 return QOBJECT(qnum_from_int(value
));
528 assert(ret
== -ERANGE
);
530 if (token
->str
[0] != '-') {
531 ret
= qemu_strtou64(token
->str
, NULL
, 10, &uvalue
);
533 return QOBJECT(qnum_from_uint(uvalue
));
535 assert(ret
== -ERANGE
);
537 /* fall through to JSON_FLOAT */
540 /* FIXME dependent on locale; a pervasive issue in QEMU */
541 /* FIXME our lexer matches RFC 7159 in forbidding Inf or NaN,
542 * but those might be useful extensions beyond JSON */
543 return QOBJECT(qnum_from_double(strtod(token
->str
, NULL
)));
549 static QObject
*parse_value(JSONParserContext
*ctxt
, va_list *ap
)
553 token
= parser_context_peek_token(ctxt
);
555 parse_error(ctxt
, NULL
, "premature EOI");
559 switch (token
->type
) {
561 return parse_object(ctxt
, ap
);
563 return parse_array(ctxt
, ap
);
565 return parse_escape(ctxt
, ap
);
569 return parse_literal(ctxt
);
571 return parse_keyword(ctxt
);
573 parse_error(ctxt
, token
, "expecting value");
578 QObject
*json_parser_parse(GQueue
*tokens
, va_list *ap
)
580 return json_parser_parse_err(tokens
, ap
, NULL
);
583 QObject
*json_parser_parse_err(GQueue
*tokens
, va_list *ap
, Error
**errp
)
585 JSONParserContext
*ctxt
= parser_context_new(tokens
);
592 result
= parse_value(ctxt
, ap
);
594 error_propagate(errp
, ctxt
->err
);
596 parser_context_free(ctxt
);