4 * Copyright IBM, Corp. 2009
7 * Anthony Liguori <aliguori@us.ibm.com>
9 * This work is licensed under the terms of the GNU LGPL, version 2.1 or later.
10 * See the COPYING.LIB file in the top-level directory.
16 #include "qemu-common.h"
23 #include "json-parser.h"
24 #include "json-lexer.h"
26 typedef struct JSONParserContext
30 #define BUG_ON(cond) assert(!(cond))
35 * 0) make errors meaningful again
36 * 1) add geometry information to tokens
37 * 3) should we return a parsed size?
38 * 4) deal with premature EOI
41 static QObject
*parse_value(JSONParserContext
*ctxt
, QList
**tokens
, va_list *ap
);
46 * tokens are dictionaries that contain a type, a string value, and geometry information
47 * about a token identified by the lexer. These are routines that make working with
48 * these objects a bit easier.
50 static const char *token_get_value(QObject
*obj
)
52 return qdict_get_str(qobject_to_qdict(obj
), "token");
55 static JSONTokenType
token_get_type(QObject
*obj
)
57 return qdict_get_int(qobject_to_qdict(obj
), "type");
60 static int token_is_operator(QObject
*obj
, char op
)
64 if (token_get_type(obj
) != JSON_OPERATOR
) {
68 val
= token_get_value(obj
);
70 return (val
[0] == op
) && (val
[1] == 0);
73 static int token_is_keyword(QObject
*obj
, const char *value
)
75 if (token_get_type(obj
) != JSON_KEYWORD
) {
79 return strcmp(token_get_value(obj
), value
) == 0;
82 static int token_is_escape(QObject
*obj
, const char *value
)
84 if (token_get_type(obj
) != JSON_ESCAPE
) {
88 return (strcmp(token_get_value(obj
), value
) == 0);
94 static void parse_error(JSONParserContext
*ctxt
, QObject
*token
, const char *msg
, ...)
96 fprintf(stderr
, "parse error: %s\n", msg
);
102 * These helpers are used to unescape strings.
104 static void wchar_to_utf8(uint16_t wchar
, char *buffer
, size_t buffer_length
)
106 if (wchar
<= 0x007F) {
107 BUG_ON(buffer_length
< 2);
109 buffer
[0] = wchar
& 0x7F;
111 } else if (wchar
<= 0x07FF) {
112 BUG_ON(buffer_length
< 3);
114 buffer
[0] = 0xC0 | ((wchar
>> 6) & 0x1F);
115 buffer
[1] = 0x80 | (wchar
& 0x3F);
118 BUG_ON(buffer_length
< 4);
120 buffer
[0] = 0xE0 | ((wchar
>> 12) & 0x0F);
121 buffer
[1] = 0x80 | ((wchar
>> 6) & 0x3F);
122 buffer
[2] = 0x80 | (wchar
& 0x3F);
127 static int hex2decimal(char ch
)
129 if (ch
>= '0' && ch
<= '9') {
131 } else if (ch
>= 'a' && ch
<= 'f') {
132 return 10 + (ch
- 'a');
133 } else if (ch
>= 'A' && ch
<= 'F') {
134 return 10 + (ch
- 'A');
141 * parse_string(): Parse a json string and return a QObject
150 * any-Unicode-character-
163 static QString
*qstring_from_escaped_str(JSONParserContext
*ctxt
, QObject
*token
)
165 const char *ptr
= token_get_value(token
);
167 int double_quote
= 1;
178 ((double_quote
&& *ptr
!= '"') || (!double_quote
&& *ptr
!= '\''))) {
184 qstring_append(str
, "\"");
188 qstring_append(str
, "'");
192 qstring_append(str
, "\\");
196 qstring_append(str
, "/");
200 qstring_append(str
, "\b");
204 qstring_append(str
, "\n");
208 qstring_append(str
, "\r");
212 qstring_append(str
, "\t");
216 uint16_t unicode_char
= 0;
222 for (i
= 0; i
< 4; i
++) {
223 if (qemu_isxdigit(*ptr
)) {
224 unicode_char
|= hex2decimal(*ptr
) << ((3 - i
) * 4);
226 parse_error(ctxt
, token
,
227 "invalid hex escape sequence in string");
233 wchar_to_utf8(unicode_char
, utf8_char
, sizeof(utf8_char
));
234 qstring_append(str
, utf8_char
);
237 parse_error(ctxt
, token
, "invalid escape sequence in string");
246 qstring_append(str
, dummy
);
262 static int parse_pair(JSONParserContext
*ctxt
, QDict
*dict
, QList
**tokens
, va_list *ap
)
264 QObject
*key
, *token
= NULL
, *value
, *peek
;
265 QList
*working
= qlist_copy(*tokens
);
267 peek
= qlist_peek(working
);
268 key
= parse_value(ctxt
, &working
, ap
);
269 if (qobject_type(key
) != QTYPE_QSTRING
) {
270 parse_error(ctxt
, peek
, "key is not a string in object");
274 token
= qlist_pop(working
);
275 if (!token_is_operator(token
, ':')) {
276 parse_error(ctxt
, token
, "missing : in object pair");
280 value
= parse_value(ctxt
, &working
, ap
);
282 parse_error(ctxt
, token
, "Missing value in dict");
286 qdict_put_obj(dict
, qstring_get_str(qobject_to_qstring(key
)), value
);
288 qobject_decref(token
);
296 qobject_decref(token
);
303 static QObject
*parse_object(JSONParserContext
*ctxt
, QList
**tokens
, va_list *ap
)
306 QObject
*token
, *peek
;
307 QList
*working
= qlist_copy(*tokens
);
309 token
= qlist_pop(working
);
310 if (!token_is_operator(token
, '{')) {
313 qobject_decref(token
);
318 peek
= qlist_peek(working
);
319 if (!token_is_operator(peek
, '}')) {
320 if (parse_pair(ctxt
, dict
, &working
, ap
) == -1) {
324 token
= qlist_pop(working
);
325 while (!token_is_operator(token
, '}')) {
326 if (!token_is_operator(token
, ',')) {
327 parse_error(ctxt
, token
, "expected separator in dict");
330 qobject_decref(token
);
333 if (parse_pair(ctxt
, dict
, &working
, ap
) == -1) {
337 token
= qlist_pop(working
);
339 qobject_decref(token
);
342 token
= qlist_pop(working
);
343 qobject_decref(token
);
350 return QOBJECT(dict
);
353 qobject_decref(token
);
359 static QObject
*parse_array(JSONParserContext
*ctxt
, QList
**tokens
, va_list *ap
)
362 QObject
*token
, *peek
;
363 QList
*working
= qlist_copy(*tokens
);
365 token
= qlist_pop(working
);
366 if (!token_is_operator(token
, '[')) {
369 qobject_decref(token
);
374 peek
= qlist_peek(working
);
375 if (!token_is_operator(peek
, ']')) {
378 obj
= parse_value(ctxt
, &working
, ap
);
380 parse_error(ctxt
, token
, "expecting value");
384 qlist_append_obj(list
, obj
);
386 token
= qlist_pop(working
);
387 while (!token_is_operator(token
, ']')) {
388 if (!token_is_operator(token
, ',')) {
389 parse_error(ctxt
, token
, "expected separator in list");
393 qobject_decref(token
);
396 obj
= parse_value(ctxt
, &working
, ap
);
398 parse_error(ctxt
, token
, "expecting value");
402 qlist_append_obj(list
, obj
);
404 token
= qlist_pop(working
);
407 qobject_decref(token
);
410 token
= qlist_pop(working
);
411 qobject_decref(token
);
418 return QOBJECT(list
);
421 qobject_decref(token
);
427 static QObject
*parse_keyword(JSONParserContext
*ctxt
, QList
**tokens
)
429 QObject
*token
, *ret
;
430 QList
*working
= qlist_copy(*tokens
);
432 token
= qlist_pop(working
);
434 if (token_get_type(token
) != JSON_KEYWORD
) {
438 if (token_is_keyword(token
, "true")) {
439 ret
= QOBJECT(qbool_from_int(true));
440 } else if (token_is_keyword(token
, "false")) {
441 ret
= QOBJECT(qbool_from_int(false));
443 parse_error(ctxt
, token
, "invalid keyword `%s'", token_get_value(token
));
447 qobject_decref(token
);
454 qobject_decref(token
);
460 static QObject
*parse_escape(JSONParserContext
*ctxt
, QList
**tokens
, va_list *ap
)
462 QObject
*token
= NULL
, *obj
;
463 QList
*working
= qlist_copy(*tokens
);
469 token
= qlist_pop(working
);
471 if (token_is_escape(token
, "%p")) {
472 obj
= va_arg(*ap
, QObject
*);
473 } else if (token_is_escape(token
, "%i")) {
474 obj
= QOBJECT(qbool_from_int(va_arg(*ap
, int)));
475 } else if (token_is_escape(token
, "%d")) {
476 obj
= QOBJECT(qint_from_int(va_arg(*ap
, int)));
477 } else if (token_is_escape(token
, "%ld")) {
478 obj
= QOBJECT(qint_from_int(va_arg(*ap
, long)));
479 } else if (token_is_escape(token
, "%lld")) {
480 obj
= QOBJECT(qint_from_int(va_arg(*ap
, long long)));
481 } else if (token_is_escape(token
, "%s")) {
482 obj
= QOBJECT(qstring_from_str(va_arg(*ap
, const char *)));
483 } else if (token_is_escape(token
, "%f")) {
484 obj
= QOBJECT(qfloat_from_double(va_arg(*ap
, double)));
489 qobject_decref(token
);
496 qobject_decref(token
);
502 static QObject
*parse_literal(JSONParserContext
*ctxt
, QList
**tokens
)
504 QObject
*token
, *obj
;
505 QList
*working
= qlist_copy(*tokens
);
507 token
= qlist_pop(working
);
508 switch (token_get_type(token
)) {
510 obj
= QOBJECT(qstring_from_escaped_str(ctxt
, token
));
513 obj
= QOBJECT(qint_from_int(strtoll(token_get_value(token
), NULL
, 10)));
516 /* FIXME dependent on locale */
517 obj
= QOBJECT(qfloat_from_double(strtod(token_get_value(token
), NULL
)));
523 qobject_decref(token
);
530 qobject_decref(token
);
536 static QObject
*parse_value(JSONParserContext
*ctxt
, QList
**tokens
, va_list *ap
)
540 obj
= parse_object(ctxt
, tokens
, ap
);
542 obj
= parse_array(ctxt
, tokens
, ap
);
545 obj
= parse_escape(ctxt
, tokens
, ap
);
548 obj
= parse_keyword(ctxt
, tokens
);
551 obj
= parse_literal(ctxt
, tokens
);
557 QObject
*json_parser_parse(QList
*tokens
, va_list *ap
)
559 JSONParserContext ctxt
= {};
560 QList
*working
= qlist_copy(tokens
);
563 result
= parse_value(&ctxt
, &working
, ap
);