4 * Copyright IBM, Corp. 2009
7 * Anthony Liguori <aliguori@us.ibm.com>
9 * This work is licensed under the terms of the GNU LGPL, version 2.1 or later.
10 * See the COPYING.LIB file in the top-level directory.
16 #include "qemu-common.h"
23 #include "json-parser.h"
24 #include "json-lexer.h"
26 typedef struct JSONParserContext
/* BUG_ON(cond): assert() that cond is false; a true cond marks a programming error. */
30 #define BUG_ON(cond) assert(!(cond))
35 * 0) make errors meaningful again
36 * 1) add geometry information to tokens
37 * 3) should we return a parsed size?
38 * 4) deal with premature EOI
/*
 * Forward declaration: parse_value() is called by parse_pair() and
 * parse_array() before its definition further down in this file.
 */
41 static QObject
*parse_value(JSONParserContext
*ctxt
, QList
**tokens
, va_list *ap
);
46 * tokens are dictionaries that contain a type, a string value, and geometry information
47 * about a token identified by the lexer. These are routines that make working with
48 * these objects a bit easier.
/*
 * token_get_value(): return the string stored under the "token" key of the
 * token dictionary @obj (read with qdict_get_str()).
 */
50 static const char *token_get_value(QObject
*obj
)
52 return qdict_get_str(qobject_to_qdict(obj
), "token");
/*
 * token_get_type(): return the integer stored under the "type" key of the
 * token dictionary @obj, as a JSONTokenType.
 */
55 static JSONTokenType
token_get_type(QObject
*obj
)
57 return qdict_get_int(qobject_to_qdict(obj
), "type");
/*
 * token_is_operator(): test whether @obj is a JSON_OPERATOR token whose text
 * is exactly the single character @op.
 *
 * The final return is non-zero only when the first character of the token
 * text equals @op and the second one is the terminating NUL.
 *
 * NOTE(review): the body of the "type != JSON_OPERATOR" branch is not visible
 * in this listing; presumably it returns 0 - TODO confirm.
 */
60 static int token_is_operator(QObject
*obj
, char op
)
64 if (token_get_type(obj
) != JSON_OPERATOR
) {
68 val
= token_get_value(obj
);
/* one-character string check: val[0] matches and val[1] terminates */
70 return (val
[0] == op
) && (val
[1] == 0);
/*
 * token_is_keyword(): test whether @obj is a JSON_KEYWORD token whose text
 * compares equal (strcmp) to @value.
 *
 * NOTE(review): the body of the "type != JSON_KEYWORD" branch is not visible
 * in this listing; presumably it returns 0 - TODO confirm.
 */
73 static int token_is_keyword(QObject
*obj
, const char *value
)
75 if (token_get_type(obj
) != JSON_KEYWORD
) {
79 return strcmp(token_get_value(obj
), value
) == 0;
/*
 * token_is_escape(): test whether @obj is a JSON_ESCAPE token whose text
 * compares equal (strcmp) to @value, e.g. "%d".
 *
 * NOTE(review): the body of the "type != JSON_ESCAPE" branch is not visible
 * in this listing; presumably it returns 0 - TODO confirm.
 */
82 static int token_is_escape(QObject
*obj
, const char *value
)
84 if (token_get_type(obj
) != JSON_ESCAPE
) {
88 return (strcmp(token_get_value(obj
), value
) == 0);
94 static void parse_error(JSONParserContext
*ctxt
, QObject
*token
, const char *msg
, ...)
96 fprintf(stderr
, "parse error: %s\n", msg
);
102 * These helpers are used to unescape strings.
/*
 * wchar_to_utf8(): encode the 16-bit value @wchar as UTF-8 into @buffer.
 *
 *   wchar <= 0x007F  -> one byte
 *   wchar <= 0x07FF  -> two bytes  (110xxxxx 10xxxxxx)
 *   otherwise        -> three bytes (1110xxxx 10xxxxxx 10xxxxxx)
 *
 * @buffer_length is checked with BUG_ON() to be at least one larger than the
 * number of encoded bytes (2, 3 and 4 respectively).
 *
 * NOTE(review): the extra byte is presumably for a NUL terminator, since the
 * caller passes the buffer to qstring_append(); the terminating store itself
 * is not visible in this listing - TODO confirm.
 */
104 static void wchar_to_utf8(uint16_t wchar
, char *buffer
, size_t buffer_length
)
106 if (wchar
<= 0x007F) {
107 BUG_ON(buffer_length
< 2);
109 buffer
[0] = wchar
& 0x7F;
111 } else if (wchar
<= 0x07FF) {
112 BUG_ON(buffer_length
< 3);
/* lead byte carries the top 5 bits, continuation byte the low 6 bits */
114 buffer
[0] = 0xC0 | ((wchar
>> 6) & 0x1F);
115 buffer
[1] = 0x80 | (wchar
& 0x3F);
118 BUG_ON(buffer_length
< 4);
/* lead byte carries the top 4 bits, two continuation bytes carry 6 bits each */
120 buffer
[0] = 0xE0 | ((wchar
>> 12) & 0x0F);
121 buffer
[1] = 0x80 | ((wchar
>> 6) & 0x3F);
122 buffer
[2] = 0x80 | (wchar
& 0x3F);
/*
 * hex2decimal(): convert one hexadecimal digit character to its value.
 *
 * 'a'..'f' and 'A'..'F' both map to 10..15.
 *
 * NOTE(review): the return statement of the '0'..'9' branch and the result
 * for a non-hex character are not visible in this listing - TODO confirm.
 */
127 static int hex2decimal(char ch
)
129 if (ch
>= '0' && ch
<= '9') {
131 } else if (ch
>= 'a' && ch
<= 'f') {
132 return 10 + (ch
- 'a');
133 } else if (ch
>= 'A' && ch
<= 'F') {
134 return 10 + (ch
- 'A');
141 * qstring_from_escaped_str(): Parse a json string token and return a QString
150 * any-Unicode-character-
/*
 * qstring_from_escaped_str(): build a QString from the text of a string
 * token, resolving backslash escapes.
 *
 * What the visible code shows:
 *  - the text is scanned until the closing quote, which is '"' when
 *    double_quote is set and '\'' otherwise;
 *  - simple escapes append one of: double quote, single quote, backslash,
 *    slash, backspace, newline, carriage return, tab;
 *  - a hex escape reads exactly four hex digits, most significant first, and
 *    appends the UTF-8 encoding produced by wchar_to_utf8();
 *  - a non-hex character inside the hex escape, or an unrecognised escape,
 *    is reported through parse_error();
 *  - any other character is appended through the small `dummy` string.
 *
 * NOTE(review): case labels, the quote-detection code, the declarations of
 * `str`, `utf8_char`, `dummy` and `i`, and the return/cleanup paths are not
 * visible in this listing. No append of "\f" is visible either; confirm
 * whether the form-feed escape is handled.
 */
163 static QString
*qstring_from_escaped_str(JSONParserContext
*ctxt
, QObject
*token
)
165 const char *ptr
= token_get_value(token
);
167 int double_quote
= 1;
/* keep scanning until the quote character matching the opening one */
178 ((double_quote
&& *ptr
!= '"') || (!double_quote
&& *ptr
!= '\''))) {
184 qstring_append(str
, "\"");
188 qstring_append(str
, "'");
192 qstring_append(str
, "\\");
196 qstring_append(str
, "/");
200 qstring_append(str
, "\b");
204 qstring_append(str
, "\n");
208 qstring_append(str
, "\r");
212 qstring_append(str
, "\t");
216 uint16_t unicode_char
= 0;
/* four hex digits, most significant nibble first */
222 for (i
= 0; i
< 4; i
++) {
223 if (qemu_isxdigit(*ptr
)) {
224 unicode_char
|= hex2decimal(*ptr
) << ((3 - i
) * 4);
226 parse_error(ctxt
, token
,
227 "invalid hex escape sequence in string");
233 wchar_to_utf8(unicode_char
, utf8_char
, sizeof(utf8_char
));
234 qstring_append(str
, utf8_char
);
237 parse_error(ctxt
, token
, "invalid escape sequence in string");
246 qstring_append(str
, dummy
);
/*
 * parse_pair(): parse one `key : value` member and store it in @dict.
 *
 * Works on a copy of *@tokens (`working`):
 *  1. parse the key with parse_value(); it must exist and be a QTYPE_QSTRING,
 *     otherwise "key is not a string in object" is reported against the token
 *     that was at the head of the list;
 *  2. pop the next token, which must be the ':' operator;
 *  3. parse the value with parse_value(); "Missing value in dict" is reported
 *     on failure;
 *  4. insert the value into @dict under the key's string.
 *
 * parse_object() treats a return of -1 as failure.
 *
 * NOTE(review): the return statements, the condition guarding the
 * "Missing value in dict" report, and how `working` is committed back to
 * *@tokens or released are not visible in this listing.
 */
260 static int parse_pair(JSONParserContext
*ctxt
, QDict
*dict
, QList
**tokens
, va_list *ap
)
262 QObject
*key
, *token
= NULL
, *value
, *peek
;
263 QList
*working
= qlist_copy(*tokens
);
/* remember the first token so a bad key can be reported against it */
265 peek
= qlist_peek(working
);
266 key
= parse_value(ctxt
, &working
, ap
);
267 if (!key
|| qobject_type(key
) != QTYPE_QSTRING
) {
268 parse_error(ctxt
, peek
, "key is not a string in object");
272 token
= qlist_pop(working
);
273 if (!token_is_operator(token
, ':')) {
274 parse_error(ctxt
, token
, "missing : in object pair");
278 value
= parse_value(ctxt
, &working
, ap
);
280 parse_error(ctxt
, token
, "Missing value in dict");
284 qdict_put_obj(dict
, qstring_get_str(qobject_to_qstring(key
)), value
);
286 qobject_decref(token
);
294 qobject_decref(token
);
/*
 * parse_object(): parse a `{ ... }` object and return it as a QObject
 * wrapping a QDict.
 *
 * Works on a copy of *@tokens (`working`):
 *  - the first popped token must be the '{' operator;
 *  - if the next token is not '}', one member is parsed with parse_pair(),
 *    then tokens are popped in a loop until '}' is seen; each token in
 *    between must be ',' (otherwise "expected separator in dict" is
 *    reported) and is followed by another parse_pair();
 *  - otherwise a token is popped and released (presumably the '}' of an
 *    empty object).
 *
 * NOTE(review): creation of `dict`, the error/cleanup paths and how `working`
 * is committed back to *@tokens are not visible in this listing.
 */
301 static QObject
*parse_object(JSONParserContext
*ctxt
, QList
**tokens
, va_list *ap
)
304 QObject
*token
, *peek
;
305 QList
*working
= qlist_copy(*tokens
);
307 token
= qlist_pop(working
);
308 if (!token_is_operator(token
, '{')) {
311 qobject_decref(token
);
316 peek
= qlist_peek(working
);
317 if (!token_is_operator(peek
, '}')) {
318 if (parse_pair(ctxt
, dict
, &working
, ap
) == -1) {
322 token
= qlist_pop(working
);
/* remaining members: each must be introduced by a ',' separator */
323 while (!token_is_operator(token
, '}')) {
324 if (!token_is_operator(token
, ',')) {
325 parse_error(ctxt
, token
, "expected separator in dict");
328 qobject_decref(token
);
331 if (parse_pair(ctxt
, dict
, &working
, ap
) == -1) {
335 token
= qlist_pop(working
);
337 qobject_decref(token
);
340 token
= qlist_pop(working
);
341 qobject_decref(token
);
348 return QOBJECT(dict
);
351 qobject_decref(token
);
/*
 * parse_array(): parse a `[ ... ]` array and return it as a QObject wrapping
 * a QList.
 *
 * Works on a copy of *@tokens (`working`):
 *  - the first popped token must be the '[' operator;
 *  - if the next token is not ']', one element is parsed with parse_value()
 *    and appended, then tokens are popped in a loop until ']' is seen; each
 *    token in between must be ',' (otherwise "expected separator in list" is
 *    reported) and is followed by another parse_value() whose result is
 *    appended;
 *  - otherwise a token is popped and released (presumably the ']' of an
 *    empty array).
 *
 * NOTE(review): creation of `list`, the declaration of `obj`, the conditions
 * guarding the "expecting value" reports, the error/cleanup paths and how
 * `working` is committed back to *@tokens are not visible in this listing.
 */
357 static QObject
*parse_array(JSONParserContext
*ctxt
, QList
**tokens
, va_list *ap
)
360 QObject
*token
, *peek
;
361 QList
*working
= qlist_copy(*tokens
);
363 token
= qlist_pop(working
);
364 if (!token_is_operator(token
, '[')) {
367 qobject_decref(token
);
372 peek
= qlist_peek(working
);
373 if (!token_is_operator(peek
, ']')) {
376 obj
= parse_value(ctxt
, &working
, ap
);
378 parse_error(ctxt
, token
, "expecting value");
382 qlist_append_obj(list
, obj
);
384 token
= qlist_pop(working
);
/* remaining elements: each must be introduced by a ',' separator */
385 while (!token_is_operator(token
, ']')) {
386 if (!token_is_operator(token
, ',')) {
387 parse_error(ctxt
, token
, "expected separator in list");
391 qobject_decref(token
);
394 obj
= parse_value(ctxt
, &working
, ap
);
396 parse_error(ctxt
, token
, "expecting value");
400 qlist_append_obj(list
, obj
);
402 token
= qlist_pop(working
);
405 qobject_decref(token
);
408 token
= qlist_pop(working
);
409 qobject_decref(token
);
416 return QOBJECT(list
);
419 qobject_decref(token
);
/*
 * parse_keyword(): parse a keyword token into a QObject.
 *
 * Pops one token from a copy of *@tokens. A JSON_KEYWORD token with text
 * "true" or "false" becomes a QBool built with qbool_from_int(); any other
 * keyword is reported with parse_error() using the format
 * "invalid keyword `%s'" and the token text as argument.
 *
 * NOTE(review): the body of the "type != JSON_KEYWORD" branch, the
 * return/cleanup paths and how `working` is committed back to *@tokens are
 * not visible in this listing.
 */
425 static QObject
*parse_keyword(JSONParserContext
*ctxt
, QList
**tokens
)
427 QObject
*token
, *ret
;
428 QList
*working
= qlist_copy(*tokens
);
430 token
= qlist_pop(working
);
432 if (token_get_type(token
) != JSON_KEYWORD
) {
436 if (token_is_keyword(token
, "true")) {
437 ret
= QOBJECT(qbool_from_int(true));
438 } else if (token_is_keyword(token
, "false")) {
439 ret
= QOBJECT(qbool_from_int(false));
441 parse_error(ctxt
, token
, "invalid keyword `%s'", token_get_value(token
));
445 qobject_decref(token
);
452 qobject_decref(token
);
/*
 * parse_escape(): turn a printf-like escape token into a QObject taken from
 * the variadic argument list @ap.
 *
 * Pops one token from a copy of *@tokens and maps it as follows:
 *   %p            -> the QObject pointer argument itself
 *   %i            -> QBool from an int argument
 *   %d            -> QInt from an int argument
 *   %ld           -> QInt from a long argument
 *   %lld, %I64d   -> QInt from a long long argument
 *   %s            -> QString from a const char * argument
 *   %f            -> QFloat from a double argument
 *
 * NOTE(review): handling of an unrecognised escape, any guard preceding the
 * pop, the return/cleanup paths and how `working` is committed back to
 * *@tokens are not visible in this listing.
 */
458 static QObject
*parse_escape(JSONParserContext
*ctxt
, QList
**tokens
, va_list *ap
)
460 QObject
*token
= NULL
, *obj
;
461 QList
*working
= qlist_copy(*tokens
);
467 token
= qlist_pop(working
);
469 if (token_is_escape(token
, "%p")) {
470 obj
= va_arg(*ap
, QObject
*);
471 } else if (token_is_escape(token
, "%i")) {
472 obj
= QOBJECT(qbool_from_int(va_arg(*ap
, int)));
473 } else if (token_is_escape(token
, "%d")) {
474 obj
= QOBJECT(qint_from_int(va_arg(*ap
, int)));
475 } else if (token_is_escape(token
, "%ld")) {
476 obj
= QOBJECT(qint_from_int(va_arg(*ap
, long)));
477 } else if (token_is_escape(token
, "%lld") ||
478 token_is_escape(token
, "%I64d")) {
479 obj
= QOBJECT(qint_from_int(va_arg(*ap
, long long)));
480 } else if (token_is_escape(token
, "%s")) {
481 obj
= QOBJECT(qstring_from_str(va_arg(*ap
, const char *)));
482 } else if (token_is_escape(token
, "%f")) {
483 obj
= QOBJECT(qfloat_from_double(va_arg(*ap
, double)));
488 qobject_decref(token
);
495 qobject_decref(token
);
/*
 * parse_literal(): parse a literal token (string or number) into a QObject.
 *
 * Pops one token from a copy of *@tokens and switches on its type. The
 * visible branches build:
 *  - a QString via qstring_from_escaped_str();
 *  - a QInt from strtoll(text, NULL, 10);
 *  - a QFloat from strtod(text, NULL).
 *
 * Both numeric conversions pass a NULL end pointer and feed the result
 * straight into the constructor, so malformed or out-of-range text is not
 * detected at this point.
 *
 * NOTE(review): the case labels, the default branch, the return/cleanup paths
 * and how `working` is committed back to *@tokens are not visible in this
 * listing.
 */
501 static QObject
*parse_literal(JSONParserContext
*ctxt
, QList
**tokens
)
503 QObject
*token
, *obj
;
504 QList
*working
= qlist_copy(*tokens
);
506 token
= qlist_pop(working
);
507 switch (token_get_type(token
)) {
509 obj
= QOBJECT(qstring_from_escaped_str(ctxt
, token
));
512 obj
= QOBJECT(qint_from_int(strtoll(token_get_value(token
), NULL
, 10)));
515 /* FIXME dependent on locale */
516 obj
= QOBJECT(qfloat_from_double(strtod(token_get_value(token
), NULL
)));
522 qobject_decref(token
);
529 qobject_decref(token
);
/*
 * parse_value(): parse any JSON value at the head of *@tokens.
 *
 * The sub-parsers appear in this order: parse_object(), parse_array(),
 * parse_escape(), parse_keyword(), parse_literal().
 *
 * NOTE(review): the conditions between the calls are not visible in this
 * listing; presumably each later parser is tried only when the previous one
 * produced no object - TODO confirm. The declaration of `obj` and the return
 * statement are not visible either.
 */
535 static QObject
*parse_value(JSONParserContext
*ctxt
, QList
**tokens
, va_list *ap
)
539 obj
= parse_object(ctxt
, tokens
, ap
);
541 obj
= parse_array(ctxt
, tokens
, ap
);
544 obj
= parse_escape(ctxt
, tokens
, ap
);
547 obj
= parse_keyword(ctxt
, tokens
);
550 obj
= parse_literal(ctxt
, tokens
);
/*
 * json_parser_parse(): non-static entry point of the parser.
 *
 * Sets up an empty-initialised JSONParserContext, copies @tokens into a
 * working list and runs parse_value() on that copy, passing @ap through for
 * escape tokens.
 *
 * NOTE(review): the declaration of `result`, the release of `working` and the
 * return statement are not visible in this listing.
 */
556 QObject
*json_parser_parse(QList
*tokens
, va_list *ap
)
558 JSONParserContext ctxt
= {};
559 QList
*working
= qlist_copy(tokens
);
562 result
= parse_value(&ctxt
, &working
, ap
);