Merge remote-tracking branch 'remotes/kraxel/tags/pull-input-20160928-1' into staging
[qemu/kevin.git] / qobject / json-parser.c
blobc18e48ab945e9573b044f35181ae59465b262158
/*
 * JSON Parser
 *
 * Copyright IBM, Corp. 2009
 *
 * Authors:
 *  Anthony Liguori   <aliguori@us.ibm.com>
 *
 * This work is licensed under the terms of the GNU LGPL, version 2.1 or later.
 * See the COPYING.LIB file in the top-level directory.
 *
 */
14 #include "qemu/osdep.h"
15 #include "qapi/error.h"
16 #include "qemu-common.h"
17 #include "qapi/qmp/types.h"
18 #include "qapi/qmp/json-parser.h"
19 #include "qapi/qmp/json-lexer.h"
20 #include "qapi/qmp/json-streamer.h"
22 typedef struct JSONParserContext
24 Error *err;
25 JSONToken *current;
26 GQueue *buf;
27 } JSONParserContext;
29 #define BUG_ON(cond) assert(!(cond))
31 /**
32 * TODO
34 * 0) make errors meaningful again
35 * 1) add geometry information to tokens
36 * 3) should we return a parsed size?
37 * 4) deal with premature EOI
40 static QObject *parse_value(JSONParserContext *ctxt, va_list *ap);
42 /**
43 * Error handler
45 static void GCC_FMT_ATTR(3, 4) parse_error(JSONParserContext *ctxt,
46 JSONToken *token, const char *msg, ...)
48 va_list ap;
49 char message[1024];
50 va_start(ap, msg);
51 vsnprintf(message, sizeof(message), msg, ap);
52 va_end(ap);
53 if (ctxt->err) {
54 error_free(ctxt->err);
55 ctxt->err = NULL;
57 error_setg(&ctxt->err, "JSON parse error, %s", message);
/**
 * String helpers
 *
 * These helpers are used to unescape strings.
 */

/*
 * Encode the 16-bit value @wchar as UTF-8 into @buffer and NUL-terminate it.
 *
 * Values up to 0x7F take one byte, values up to 0x7FF two bytes, anything
 * else three bytes.  @buffer_length must have room for the encoded bytes
 * plus the terminator; this is asserted, not reported.
 */
static void wchar_to_utf8(uint16_t wchar, char *buffer, size_t buffer_length)
{
    char *out = buffer;

    if (wchar < 0x0080) {
        assert(buffer_length >= 2);

        *out++ = wchar & 0x7F;
    } else if (wchar < 0x0800) {
        assert(buffer_length >= 3);

        *out++ = 0xC0 | ((wchar >> 6) & 0x1F);
        *out++ = 0x80 | (wchar & 0x3F);
    } else {
        assert(buffer_length >= 4);

        *out++ = 0xE0 | ((wchar >> 12) & 0x0F);
        *out++ = 0x80 | ((wchar >> 6) & 0x3F);
        *out++ = 0x80 | (wchar & 0x3F);
    }

    *out = 0;
}
/*
 * Return the numeric value (0..15) of the hexadecimal digit @ch, accepting
 * both lower-case and upper-case letters, or -1 if @ch is not a hex digit.
 */
static int hex2decimal(char ch)
{
    if ('a' <= ch && ch <= 'f') {
        return (ch - 'a') + 10;
    }

    if ('A' <= ch && ch <= 'F') {
        return (ch - 'A') + 10;
    }

    if ('0' <= ch && ch <= '9') {
        return ch - '0';
    }

    return -1;
}
102 * parse_string(): Parse a json string and return a QObject
104 * string
105 * ""
106 * " chars "
107 * chars
108 * char
109 * char chars
110 * char
111 * any-Unicode-character-
112 * except-"-or-\-or-
113 * control-character
114 * \"
115 * \\
116 * \/
117 * \b
118 * \f
119 * \n
120 * \r
121 * \t
122 * \u four-hex-digits
124 static QString *qstring_from_escaped_str(JSONParserContext *ctxt,
125 JSONToken *token)
127 const char *ptr = token->str;
128 QString *str;
129 int double_quote = 1;
131 if (*ptr == '"') {
132 double_quote = 1;
133 } else {
134 double_quote = 0;
136 ptr++;
138 str = qstring_new();
139 while (*ptr &&
140 ((double_quote && *ptr != '"') || (!double_quote && *ptr != '\''))) {
141 if (*ptr == '\\') {
142 ptr++;
144 switch (*ptr) {
145 case '"':
146 qstring_append(str, "\"");
147 ptr++;
148 break;
149 case '\'':
150 qstring_append(str, "'");
151 ptr++;
152 break;
153 case '\\':
154 qstring_append(str, "\\");
155 ptr++;
156 break;
157 case '/':
158 qstring_append(str, "/");
159 ptr++;
160 break;
161 case 'b':
162 qstring_append(str, "\b");
163 ptr++;
164 break;
165 case 'f':
166 qstring_append(str, "\f");
167 ptr++;
168 break;
169 case 'n':
170 qstring_append(str, "\n");
171 ptr++;
172 break;
173 case 'r':
174 qstring_append(str, "\r");
175 ptr++;
176 break;
177 case 't':
178 qstring_append(str, "\t");
179 ptr++;
180 break;
181 case 'u': {
182 uint16_t unicode_char = 0;
183 char utf8_char[4];
184 int i = 0;
186 ptr++;
188 for (i = 0; i < 4; i++) {
189 if (qemu_isxdigit(*ptr)) {
190 unicode_char |= hex2decimal(*ptr) << ((3 - i) * 4);
191 } else {
192 parse_error(ctxt, token,
193 "invalid hex escape sequence in string");
194 goto out;
196 ptr++;
199 wchar_to_utf8(unicode_char, utf8_char, sizeof(utf8_char));
200 qstring_append(str, utf8_char);
201 } break;
202 default:
203 parse_error(ctxt, token, "invalid escape sequence in string");
204 goto out;
206 } else {
207 char dummy[2];
209 dummy[0] = *ptr++;
210 dummy[1] = 0;
212 qstring_append(str, dummy);
216 return str;
218 out:
219 QDECREF(str);
220 return NULL;
223 /* Note: the token object returned by parser_context_peek_token or
224 * parser_context_pop_token is deleted as soon as parser_context_pop_token
225 * is called again.
227 static JSONToken *parser_context_pop_token(JSONParserContext *ctxt)
229 g_free(ctxt->current);
230 assert(!g_queue_is_empty(ctxt->buf));
231 ctxt->current = g_queue_pop_head(ctxt->buf);
232 return ctxt->current;
235 static JSONToken *parser_context_peek_token(JSONParserContext *ctxt)
237 assert(!g_queue_is_empty(ctxt->buf));
238 return g_queue_peek_head(ctxt->buf);
241 static JSONParserContext *parser_context_new(GQueue *tokens)
243 JSONParserContext *ctxt;
245 if (!tokens) {
246 return NULL;
249 ctxt = g_malloc0(sizeof(JSONParserContext));
250 ctxt->buf = tokens;
252 return ctxt;
255 /* to support error propagation, ctxt->err must be freed separately */
256 static void parser_context_free(JSONParserContext *ctxt)
258 if (ctxt) {
259 while (!g_queue_is_empty(ctxt->buf)) {
260 parser_context_pop_token(ctxt);
262 g_free(ctxt->current);
263 g_queue_free(ctxt->buf);
264 g_free(ctxt);
269 * Parsing rules
271 static int parse_pair(JSONParserContext *ctxt, QDict *dict, va_list *ap)
273 QObject *key = NULL, *value;
274 JSONToken *peek, *token;
276 peek = parser_context_peek_token(ctxt);
277 if (peek == NULL) {
278 parse_error(ctxt, NULL, "premature EOI");
279 goto out;
282 key = parse_value(ctxt, ap);
283 if (!key || qobject_type(key) != QTYPE_QSTRING) {
284 parse_error(ctxt, peek, "key is not a string in object");
285 goto out;
288 token = parser_context_pop_token(ctxt);
289 if (token == NULL) {
290 parse_error(ctxt, NULL, "premature EOI");
291 goto out;
294 if (token->type != JSON_COLON) {
295 parse_error(ctxt, token, "missing : in object pair");
296 goto out;
299 value = parse_value(ctxt, ap);
300 if (value == NULL) {
301 parse_error(ctxt, token, "Missing value in dict");
302 goto out;
305 qdict_put_obj(dict, qstring_get_str(qobject_to_qstring(key)), value);
307 qobject_decref(key);
309 return 0;
311 out:
312 qobject_decref(key);
314 return -1;
317 static QObject *parse_object(JSONParserContext *ctxt, va_list *ap)
319 QDict *dict = NULL;
320 JSONToken *token, *peek;
322 token = parser_context_pop_token(ctxt);
323 assert(token && token->type == JSON_LCURLY);
325 dict = qdict_new();
327 peek = parser_context_peek_token(ctxt);
328 if (peek == NULL) {
329 parse_error(ctxt, NULL, "premature EOI");
330 goto out;
333 if (peek->type != JSON_RCURLY) {
334 if (parse_pair(ctxt, dict, ap) == -1) {
335 goto out;
338 token = parser_context_pop_token(ctxt);
339 if (token == NULL) {
340 parse_error(ctxt, NULL, "premature EOI");
341 goto out;
344 while (token->type != JSON_RCURLY) {
345 if (token->type != JSON_COMMA) {
346 parse_error(ctxt, token, "expected separator in dict");
347 goto out;
350 if (parse_pair(ctxt, dict, ap) == -1) {
351 goto out;
354 token = parser_context_pop_token(ctxt);
355 if (token == NULL) {
356 parse_error(ctxt, NULL, "premature EOI");
357 goto out;
360 } else {
361 (void)parser_context_pop_token(ctxt);
364 return QOBJECT(dict);
366 out:
367 QDECREF(dict);
368 return NULL;
371 static QObject *parse_array(JSONParserContext *ctxt, va_list *ap)
373 QList *list = NULL;
374 JSONToken *token, *peek;
376 token = parser_context_pop_token(ctxt);
377 assert(token && token->type == JSON_LSQUARE);
379 list = qlist_new();
381 peek = parser_context_peek_token(ctxt);
382 if (peek == NULL) {
383 parse_error(ctxt, NULL, "premature EOI");
384 goto out;
387 if (peek->type != JSON_RSQUARE) {
388 QObject *obj;
390 obj = parse_value(ctxt, ap);
391 if (obj == NULL) {
392 parse_error(ctxt, token, "expecting value");
393 goto out;
396 qlist_append_obj(list, obj);
398 token = parser_context_pop_token(ctxt);
399 if (token == NULL) {
400 parse_error(ctxt, NULL, "premature EOI");
401 goto out;
404 while (token->type != JSON_RSQUARE) {
405 if (token->type != JSON_COMMA) {
406 parse_error(ctxt, token, "expected separator in list");
407 goto out;
410 obj = parse_value(ctxt, ap);
411 if (obj == NULL) {
412 parse_error(ctxt, token, "expecting value");
413 goto out;
416 qlist_append_obj(list, obj);
418 token = parser_context_pop_token(ctxt);
419 if (token == NULL) {
420 parse_error(ctxt, NULL, "premature EOI");
421 goto out;
424 } else {
425 (void)parser_context_pop_token(ctxt);
428 return QOBJECT(list);
430 out:
431 QDECREF(list);
432 return NULL;
435 static QObject *parse_keyword(JSONParserContext *ctxt)
437 JSONToken *token;
439 token = parser_context_pop_token(ctxt);
440 assert(token && token->type == JSON_KEYWORD);
442 if (!strcmp(token->str, "true")) {
443 return QOBJECT(qbool_from_bool(true));
444 } else if (!strcmp(token->str, "false")) {
445 return QOBJECT(qbool_from_bool(false));
446 } else if (!strcmp(token->str, "null")) {
447 return qnull();
449 parse_error(ctxt, token, "invalid keyword '%s'", token->str);
450 return NULL;
453 static QObject *parse_escape(JSONParserContext *ctxt, va_list *ap)
455 JSONToken *token;
457 if (ap == NULL) {
458 return NULL;
461 token = parser_context_pop_token(ctxt);
462 assert(token && token->type == JSON_ESCAPE);
464 if (!strcmp(token->str, "%p")) {
465 return va_arg(*ap, QObject *);
466 } else if (!strcmp(token->str, "%i")) {
467 return QOBJECT(qbool_from_bool(va_arg(*ap, int)));
468 } else if (!strcmp(token->str, "%d")) {
469 return QOBJECT(qint_from_int(va_arg(*ap, int)));
470 } else if (!strcmp(token->str, "%ld")) {
471 return QOBJECT(qint_from_int(va_arg(*ap, long)));
472 } else if (!strcmp(token->str, "%lld") ||
473 !strcmp(token->str, "%I64d")) {
474 return QOBJECT(qint_from_int(va_arg(*ap, long long)));
475 } else if (!strcmp(token->str, "%s")) {
476 return QOBJECT(qstring_from_str(va_arg(*ap, const char *)));
477 } else if (!strcmp(token->str, "%f")) {
478 return QOBJECT(qfloat_from_double(va_arg(*ap, double)));
480 return NULL;
483 static QObject *parse_literal(JSONParserContext *ctxt)
485 JSONToken *token;
487 token = parser_context_pop_token(ctxt);
488 assert(token);
490 switch (token->type) {
491 case JSON_STRING:
492 return QOBJECT(qstring_from_escaped_str(ctxt, token));
493 case JSON_INTEGER: {
494 /* A possibility exists that this is a whole-valued float where the
495 * fractional part was left out due to being 0 (.0). It's not a big
496 * deal to treat these as ints in the parser, so long as users of the
497 * resulting QObject know to expect a QInt in place of a QFloat in
498 * cases like these.
500 * However, in some cases these values will overflow/underflow a
501 * QInt/int64 container, thus we should assume these are to be handled
502 * as QFloats/doubles rather than silently changing their values.
504 * strtoll() indicates these instances by setting errno to ERANGE
506 int64_t value;
508 errno = 0; /* strtoll doesn't set errno on success */
509 value = strtoll(token->str, NULL, 10);
510 if (errno != ERANGE) {
511 return QOBJECT(qint_from_int(value));
513 /* fall through to JSON_FLOAT */
515 case JSON_FLOAT:
516 /* FIXME dependent on locale; a pervasive issue in QEMU */
517 /* FIXME our lexer matches RFC 7159 in forbidding Inf or NaN,
518 * but those might be useful extensions beyond JSON */
519 return QOBJECT(qfloat_from_double(strtod(token->str, NULL)));
520 default:
521 abort();
525 static QObject *parse_value(JSONParserContext *ctxt, va_list *ap)
527 JSONToken *token;
529 token = parser_context_peek_token(ctxt);
530 if (token == NULL) {
531 parse_error(ctxt, NULL, "premature EOI");
532 return NULL;
535 switch (token->type) {
536 case JSON_LCURLY:
537 return parse_object(ctxt, ap);
538 case JSON_LSQUARE:
539 return parse_array(ctxt, ap);
540 case JSON_ESCAPE:
541 return parse_escape(ctxt, ap);
542 case JSON_INTEGER:
543 case JSON_FLOAT:
544 case JSON_STRING:
545 return parse_literal(ctxt);
546 case JSON_KEYWORD:
547 return parse_keyword(ctxt);
548 default:
549 parse_error(ctxt, token, "expecting value");
550 return NULL;
554 QObject *json_parser_parse(GQueue *tokens, va_list *ap)
556 return json_parser_parse_err(tokens, ap, NULL);
559 QObject *json_parser_parse_err(GQueue *tokens, va_list *ap, Error **errp)
561 JSONParserContext *ctxt = parser_context_new(tokens);
562 QObject *result;
564 if (!ctxt) {
565 return NULL;
568 result = parse_value(ctxt, ap);
570 error_propagate(errp, ctxt->err);
572 parser_context_free(ctxt);
574 return result;