4 * Copyright IBM, Corp. 2009
7 * Anthony Liguori <aliguori@us.ibm.com>
9 * This work is licensed under the terms of the GNU LGPL, version 2.1 or later.
10 * See the COPYING.LIB file in the top-level directory.
17 #include "qemu-common.h"
24 #include "json-parser.h"
25 #include "json-lexer.h"
27 typedef struct JSONParserContext
31 #define BUG_ON(cond) assert(!(cond))
36 * 0) make errors meaningful again
37 * 1) add geometry information to tokens
38 * 3) should we return a parsed size?
39 * 4) deal with premature EOI
42 static QObject
*parse_value(JSONParserContext
*ctxt
, QList
**tokens
, va_list *ap
);
47 * tokens are dictionaries that contain a type, a string value, and geometry information
48 * about a token identified by the lexer. These are routines that make working with
49 * these objects a bit easier.
51 static const char *token_get_value(QObject
*obj
)
53 return qdict_get_str(qobject_to_qdict(obj
), "token");
56 static JSONTokenType
token_get_type(QObject
*obj
)
58 return qdict_get_int(qobject_to_qdict(obj
), "type");
61 static int token_is_operator(QObject
*obj
, char op
)
65 if (token_get_type(obj
) != JSON_OPERATOR
) {
69 val
= token_get_value(obj
);
71 return (val
[0] == op
) && (val
[1] == 0);
74 static int token_is_keyword(QObject
*obj
, const char *value
)
76 if (token_get_type(obj
) != JSON_KEYWORD
) {
80 return strcmp(token_get_value(obj
), value
) == 0;
83 static int token_is_escape(QObject
*obj
, const char *value
)
85 if (token_get_type(obj
) != JSON_ESCAPE
) {
89 return (strcmp(token_get_value(obj
), value
) == 0);
95 static void parse_error(JSONParserContext
*ctxt
, QObject
*token
, const char *msg
, ...)
99 fprintf(stderr
, "parse error: ");
100 vfprintf(stderr
, msg
, ap
);
101 fprintf(stderr
, "\n");
108 * These helpers are used to unescape strings.
110 static void wchar_to_utf8(uint16_t wchar
, char *buffer
, size_t buffer_length
)
112 if (wchar
<= 0x007F) {
113 BUG_ON(buffer_length
< 2);
115 buffer
[0] = wchar
& 0x7F;
117 } else if (wchar
<= 0x07FF) {
118 BUG_ON(buffer_length
< 3);
120 buffer
[0] = 0xC0 | ((wchar
>> 6) & 0x1F);
121 buffer
[1] = 0x80 | (wchar
& 0x3F);
124 BUG_ON(buffer_length
< 4);
126 buffer
[0] = 0xE0 | ((wchar
>> 12) & 0x0F);
127 buffer
[1] = 0x80 | ((wchar
>> 6) & 0x3F);
128 buffer
[2] = 0x80 | (wchar
& 0x3F);
133 static int hex2decimal(char ch
)
135 if (ch
>= '0' && ch
<= '9') {
137 } else if (ch
>= 'a' && ch
<= 'f') {
138 return 10 + (ch
- 'a');
139 } else if (ch
>= 'A' && ch
<= 'F') {
140 return 10 + (ch
- 'A');
147 * parse_string(): Parse a json string and return a QObject
156 * any-Unicode-character-
169 static QString
*qstring_from_escaped_str(JSONParserContext
*ctxt
, QObject
*token
)
171 const char *ptr
= token_get_value(token
);
173 int double_quote
= 1;
184 ((double_quote
&& *ptr
!= '"') || (!double_quote
&& *ptr
!= '\''))) {
190 qstring_append(str
, "\"");
194 qstring_append(str
, "'");
198 qstring_append(str
, "\\");
202 qstring_append(str
, "/");
206 qstring_append(str
, "\b");
210 qstring_append(str
, "\n");
214 qstring_append(str
, "\r");
218 qstring_append(str
, "\t");
222 uint16_t unicode_char
= 0;
228 for (i
= 0; i
< 4; i
++) {
229 if (qemu_isxdigit(*ptr
)) {
230 unicode_char
|= hex2decimal(*ptr
) << ((3 - i
) * 4);
232 parse_error(ctxt
, token
,
233 "invalid hex escape sequence in string");
239 wchar_to_utf8(unicode_char
, utf8_char
, sizeof(utf8_char
));
240 qstring_append(str
, utf8_char
);
243 parse_error(ctxt
, token
, "invalid escape sequence in string");
252 qstring_append(str
, dummy
);
266 static int parse_pair(JSONParserContext
*ctxt
, QDict
*dict
, QList
**tokens
, va_list *ap
)
268 QObject
*key
, *token
= NULL
, *value
, *peek
;
269 QList
*working
= qlist_copy(*tokens
);
271 peek
= qlist_peek(working
);
272 key
= parse_value(ctxt
, &working
, ap
);
273 if (!key
|| qobject_type(key
) != QTYPE_QSTRING
) {
274 parse_error(ctxt
, peek
, "key is not a string in object");
278 token
= qlist_pop(working
);
279 if (!token_is_operator(token
, ':')) {
280 parse_error(ctxt
, token
, "missing : in object pair");
284 value
= parse_value(ctxt
, &working
, ap
);
286 parse_error(ctxt
, token
, "Missing value in dict");
290 qdict_put_obj(dict
, qstring_get_str(qobject_to_qstring(key
)), value
);
292 qobject_decref(token
);
300 qobject_decref(token
);
307 static QObject
*parse_object(JSONParserContext
*ctxt
, QList
**tokens
, va_list *ap
)
310 QObject
*token
, *peek
;
311 QList
*working
= qlist_copy(*tokens
);
313 token
= qlist_pop(working
);
314 if (!token_is_operator(token
, '{')) {
317 qobject_decref(token
);
322 peek
= qlist_peek(working
);
323 if (!token_is_operator(peek
, '}')) {
324 if (parse_pair(ctxt
, dict
, &working
, ap
) == -1) {
328 token
= qlist_pop(working
);
329 while (!token_is_operator(token
, '}')) {
330 if (!token_is_operator(token
, ',')) {
331 parse_error(ctxt
, token
, "expected separator in dict");
334 qobject_decref(token
);
337 if (parse_pair(ctxt
, dict
, &working
, ap
) == -1) {
341 token
= qlist_pop(working
);
343 qobject_decref(token
);
346 token
= qlist_pop(working
);
347 qobject_decref(token
);
354 return QOBJECT(dict
);
357 qobject_decref(token
);
363 static QObject
*parse_array(JSONParserContext
*ctxt
, QList
**tokens
, va_list *ap
)
366 QObject
*token
, *peek
;
367 QList
*working
= qlist_copy(*tokens
);
369 token
= qlist_pop(working
);
370 if (!token_is_operator(token
, '[')) {
373 qobject_decref(token
);
378 peek
= qlist_peek(working
);
379 if (!token_is_operator(peek
, ']')) {
382 obj
= parse_value(ctxt
, &working
, ap
);
384 parse_error(ctxt
, token
, "expecting value");
388 qlist_append_obj(list
, obj
);
390 token
= qlist_pop(working
);
391 while (!token_is_operator(token
, ']')) {
392 if (!token_is_operator(token
, ',')) {
393 parse_error(ctxt
, token
, "expected separator in list");
397 qobject_decref(token
);
400 obj
= parse_value(ctxt
, &working
, ap
);
402 parse_error(ctxt
, token
, "expecting value");
406 qlist_append_obj(list
, obj
);
408 token
= qlist_pop(working
);
411 qobject_decref(token
);
414 token
= qlist_pop(working
);
415 qobject_decref(token
);
422 return QOBJECT(list
);
425 qobject_decref(token
);
431 static QObject
*parse_keyword(JSONParserContext
*ctxt
, QList
**tokens
)
433 QObject
*token
, *ret
;
434 QList
*working
= qlist_copy(*tokens
);
436 token
= qlist_pop(working
);
438 if (token_get_type(token
) != JSON_KEYWORD
) {
442 if (token_is_keyword(token
, "true")) {
443 ret
= QOBJECT(qbool_from_int(true));
444 } else if (token_is_keyword(token
, "false")) {
445 ret
= QOBJECT(qbool_from_int(false));
447 parse_error(ctxt
, token
, "invalid keyword `%s'", token_get_value(token
));
451 qobject_decref(token
);
458 qobject_decref(token
);
464 static QObject
*parse_escape(JSONParserContext
*ctxt
, QList
**tokens
, va_list *ap
)
466 QObject
*token
= NULL
, *obj
;
467 QList
*working
= qlist_copy(*tokens
);
473 token
= qlist_pop(working
);
475 if (token_is_escape(token
, "%p")) {
476 obj
= va_arg(*ap
, QObject
*);
477 } else if (token_is_escape(token
, "%i")) {
478 obj
= QOBJECT(qbool_from_int(va_arg(*ap
, int)));
479 } else if (token_is_escape(token
, "%d")) {
480 obj
= QOBJECT(qint_from_int(va_arg(*ap
, int)));
481 } else if (token_is_escape(token
, "%ld")) {
482 obj
= QOBJECT(qint_from_int(va_arg(*ap
, long)));
483 } else if (token_is_escape(token
, "%lld") ||
484 token_is_escape(token
, "%I64d")) {
485 obj
= QOBJECT(qint_from_int(va_arg(*ap
, long long)));
486 } else if (token_is_escape(token
, "%s")) {
487 obj
= QOBJECT(qstring_from_str(va_arg(*ap
, const char *)));
488 } else if (token_is_escape(token
, "%f")) {
489 obj
= QOBJECT(qfloat_from_double(va_arg(*ap
, double)));
494 qobject_decref(token
);
501 qobject_decref(token
);
507 static QObject
*parse_literal(JSONParserContext
*ctxt
, QList
**tokens
)
509 QObject
*token
, *obj
;
510 QList
*working
= qlist_copy(*tokens
);
512 token
= qlist_pop(working
);
513 switch (token_get_type(token
)) {
515 obj
= QOBJECT(qstring_from_escaped_str(ctxt
, token
));
518 obj
= QOBJECT(qint_from_int(strtoll(token_get_value(token
), NULL
, 10)));
521 /* FIXME dependent on locale */
522 obj
= QOBJECT(qfloat_from_double(strtod(token_get_value(token
), NULL
)));
528 qobject_decref(token
);
535 qobject_decref(token
);
541 static QObject
*parse_value(JSONParserContext
*ctxt
, QList
**tokens
, va_list *ap
)
545 obj
= parse_object(ctxt
, tokens
, ap
);
547 obj
= parse_array(ctxt
, tokens
, ap
);
550 obj
= parse_escape(ctxt
, tokens
, ap
);
553 obj
= parse_keyword(ctxt
, tokens
);
556 obj
= parse_literal(ctxt
, tokens
);
562 QObject
*json_parser_parse(QList
*tokens
, va_list *ap
)
564 JSONParserContext ctxt
= {};
565 QList
*working
= qlist_copy(tokens
);
568 result
= parse_value(&ctxt
, &working
, ap
);