]> Git Repo - qemu.git/blame - qobject/json-parser.c
Merge remote-tracking branch 'remotes/ericb/tags/pull-nbd-2017-07-10-v2' into staging
[qemu.git] / qobject / json-parser.c
CommitLineData
4a5fcab7 1/*
6e8e5cb9 2 * JSON Parser
4a5fcab7
AL
3 *
4 * Copyright IBM, Corp. 2009
5 *
6 * Authors:
7 * Anthony Liguori <[email protected]>
8 *
9 * This work is licensed under the terms of the GNU LGPL, version 2.1 or later.
10 * See the COPYING.LIB file in the top-level directory.
11 *
12 */
13
f2ad72b3 14#include "qemu/osdep.h"
2bc7cfea 15#include "qemu/cutils.h"
da34e65c 16#include "qapi/error.h"
4a5fcab7 17#include "qemu-common.h"
c7eb39cb 18#include "qapi/qmp/types.h"
7b1b5d19
PB
19#include "qapi/qmp/json-parser.h"
20#include "qapi/qmp/json-lexer.h"
9bada897 21#include "qapi/qmp/json-streamer.h"
4a5fcab7
AL
22
23typedef struct JSONParserContext
24{
ef749d07 25 Error *err;
9bada897 26 JSONToken *current;
95385fe9 27 GQueue *buf;
4a5fcab7
AL
28} JSONParserContext;
29
/* Abort (via assert) when @cond holds. */
#define BUG_ON(cond) assert(!(cond))
31
32/**
33 * TODO
34 *
35 * 0) make errors meaningful again
36 * 1) add geometry information to tokens
37 * 3) should we return a parsed size?
38 * 4) deal with premature EOI
39 */
40
65c0f1e9 41static QObject *parse_value(JSONParserContext *ctxt, va_list *ap);
4a5fcab7 42
4a5fcab7
AL
43/**
44 * Error handler
45 */
8b7968f7 46static void GCC_FMT_ATTR(3, 4) parse_error(JSONParserContext *ctxt,
9bada897 47 JSONToken *token, const char *msg, ...)
4a5fcab7 48{
c96c84a9 49 va_list ap;
ef749d07 50 char message[1024];
c96c84a9 51 va_start(ap, msg);
ef749d07 52 vsnprintf(message, sizeof(message), msg, ap);
c96c84a9 53 va_end(ap);
ef749d07
AL
54 if (ctxt->err) {
55 error_free(ctxt->err);
56 ctxt->err = NULL;
57 }
f231b88d 58 error_setg(&ctxt->err, "JSON parse error, %s", message);
4a5fcab7
AL
59}
60
61/**
62 * String helpers
63 *
64 * These helpers are used to unescape strings.
65 */
/*
 * Encode the 16-bit code unit @wchar as a NUL-terminated UTF-8 sequence
 * in @buffer.  One, two or three bytes are produced depending on the
 * value, followed by the terminator; @buffer_length must be large enough
 * for that, otherwise the assertion fails.
 */
static void wchar_to_utf8(uint16_t wchar, char *buffer, size_t buffer_length)
{
    size_t used = 0;

    if (wchar <= 0x007F) {
        /* one byte plus terminator */
        assert(!(buffer_length < 2));

        buffer[used++] = wchar & 0x7F;
    } else if (wchar <= 0x07FF) {
        /* two bytes plus terminator */
        assert(!(buffer_length < 3));

        buffer[used++] = 0xC0 | ((wchar >> 6) & 0x1F);
        buffer[used++] = 0x80 | (wchar & 0x3F);
    } else {
        /* three bytes plus terminator */
        assert(!(buffer_length < 4));

        buffer[used++] = 0xE0 | ((wchar >> 12) & 0x0F);
        buffer[used++] = 0x80 | ((wchar >> 6) & 0x3F);
        buffer[used++] = 0x80 | (wchar & 0x3F);
    }

    buffer[used] = 0;
}
88
/*
 * Return the numeric value (0..15) of the hexadecimal digit @ch,
 * accepting both upper and lower case letters, or -1 when @ch is not a
 * hexadecimal digit.
 */
static int hex2decimal(char ch)
{
    int value = -1;

    if ('0' <= ch && ch <= '9') {
        value = ch - '0';
    } else if ('a' <= ch && ch <= 'f') {
        value = (ch - 'a') + 10;
    } else if ('A' <= ch && ch <= 'F') {
        value = (ch - 'A') + 10;
    }

    return value;
}
101
/**
 * qstring_from_escaped_str(): Unescape a JSON string token and return it
 * as a QString
 *
 *  string
 *      ""
 *      " chars "
 *  chars
 *      char
 *      char chars
 *  char
 *      any-Unicode-character-
 *          except-"-or-\-or-
 *          control-character
 *      \"
 *      \\
 *      \/
 *      \b
 *      \f
 *      \n
 *      \r
 *      \t
 *      \u four-hex-digits
 */
9bada897
PB
125static QString *qstring_from_escaped_str(JSONParserContext *ctxt,
126 JSONToken *token)
4a5fcab7 127{
9bada897 128 const char *ptr = token->str;
4a5fcab7
AL
129 QString *str;
130 int double_quote = 1;
131
132 if (*ptr == '"') {
133 double_quote = 1;
134 } else {
135 double_quote = 0;
136 }
137 ptr++;
138
139 str = qstring_new();
140 while (*ptr &&
141 ((double_quote && *ptr != '"') || (!double_quote && *ptr != '\''))) {
142 if (*ptr == '\\') {
143 ptr++;
144
145 switch (*ptr) {
146 case '"':
147 qstring_append(str, "\"");
148 ptr++;
149 break;
150 case '\'':
151 qstring_append(str, "'");
152 ptr++;
153 break;
154 case '\\':
155 qstring_append(str, "\\");
156 ptr++;
157 break;
158 case '/':
159 qstring_append(str, "/");
160 ptr++;
161 break;
162 case 'b':
163 qstring_append(str, "\b");
164 ptr++;
165 break;
bd032695
LC
166 case 'f':
167 qstring_append(str, "\f");
168 ptr++;
169 break;
4a5fcab7
AL
170 case 'n':
171 qstring_append(str, "\n");
172 ptr++;
173 break;
174 case 'r':
175 qstring_append(str, "\r");
176 ptr++;
177 break;
178 case 't':
179 qstring_append(str, "\t");
180 ptr++;
181 break;
182 case 'u': {
183 uint16_t unicode_char = 0;
184 char utf8_char[4];
185 int i = 0;
186
187 ptr++;
188
189 for (i = 0; i < 4; i++) {
190 if (qemu_isxdigit(*ptr)) {
191 unicode_char |= hex2decimal(*ptr) << ((3 - i) * 4);
192 } else {
193 parse_error(ctxt, token,
194 "invalid hex escape sequence in string");
195 goto out;
196 }
197 ptr++;
198 }
199
200 wchar_to_utf8(unicode_char, utf8_char, sizeof(utf8_char));
201 qstring_append(str, utf8_char);
202 } break;
203 default:
204 parse_error(ctxt, token, "invalid escape sequence in string");
205 goto out;
206 }
207 } else {
208 char dummy[2];
209
210 dummy[0] = *ptr++;
211 dummy[1] = 0;
212
213 qstring_append(str, dummy);
214 }
215 }
216
4a5fcab7
AL
217 return str;
218
219out:
220 QDECREF(str);
221 return NULL;
222}
223
9bada897
PB
224/* Note: the token object returned by parser_context_peek_token or
225 * parser_context_pop_token is deleted as soon as parser_context_pop_token
226 * is called again.
95385fe9 227 */
9bada897 228static JSONToken *parser_context_pop_token(JSONParserContext *ctxt)
65c0f1e9 229{
9bada897 230 g_free(ctxt->current);
95385fe9
PB
231 assert(!g_queue_is_empty(ctxt->buf));
232 ctxt->current = g_queue_pop_head(ctxt->buf);
233 return ctxt->current;
65c0f1e9
MR
234}
235
9bada897 236static JSONToken *parser_context_peek_token(JSONParserContext *ctxt)
65c0f1e9 237{
95385fe9
PB
238 assert(!g_queue_is_empty(ctxt->buf));
239 return g_queue_peek_head(ctxt->buf);
65c0f1e9
MR
240}
241
95385fe9 242static JSONParserContext *parser_context_new(GQueue *tokens)
65c0f1e9
MR
243{
244 JSONParserContext *ctxt;
65c0f1e9
MR
245
246 if (!tokens) {
247 return NULL;
248 }
249
65c0f1e9 250 ctxt = g_malloc0(sizeof(JSONParserContext));
95385fe9 251 ctxt->buf = tokens;
65c0f1e9
MR
252
253 return ctxt;
254}
255
256/* to support error propagation, ctxt->err must be freed separately */
257static void parser_context_free(JSONParserContext *ctxt)
258{
65c0f1e9 259 if (ctxt) {
95385fe9
PB
260 while (!g_queue_is_empty(ctxt->buf)) {
261 parser_context_pop_token(ctxt);
65c0f1e9 262 }
9bada897 263 g_free(ctxt->current);
95385fe9 264 g_queue_free(ctxt->buf);
65c0f1e9
MR
265 g_free(ctxt);
266 }
267}
268
4a5fcab7
AL
269/**
270 * Parsing rules
271 */
65c0f1e9 272static int parse_pair(JSONParserContext *ctxt, QDict *dict, va_list *ap)
4a5fcab7 273{
9bada897
PB
274 QObject *key = NULL, *value;
275 JSONToken *peek, *token;
4a5fcab7 276
65c0f1e9 277 peek = parser_context_peek_token(ctxt);
11e8a46c
AL
278 if (peek == NULL) {
279 parse_error(ctxt, NULL, "premature EOI");
280 goto out;
281 }
282
65c0f1e9 283 key = parse_value(ctxt, ap);
d758d90f 284 if (!key || qobject_type(key) != QTYPE_QSTRING) {
4a5fcab7
AL
285 parse_error(ctxt, peek, "key is not a string in object");
286 goto out;
287 }
288
65c0f1e9 289 token = parser_context_pop_token(ctxt);
11e8a46c
AL
290 if (token == NULL) {
291 parse_error(ctxt, NULL, "premature EOI");
292 goto out;
293 }
294
9bada897 295 if (token->type != JSON_COLON) {
4a5fcab7
AL
296 parse_error(ctxt, token, "missing : in object pair");
297 goto out;
298 }
299
65c0f1e9 300 value = parse_value(ctxt, ap);
4a5fcab7
AL
301 if (value == NULL) {
302 parse_error(ctxt, token, "Missing value in dict");
303 goto out;
304 }
305
306 qdict_put_obj(dict, qstring_get_str(qobject_to_qstring(key)), value);
307
4a5fcab7 308 qobject_decref(key);
4a5fcab7
AL
309
310 return 0;
311
312out:
4a5fcab7 313 qobject_decref(key);
4a5fcab7
AL
314
315 return -1;
316}
317
65c0f1e9 318static QObject *parse_object(JSONParserContext *ctxt, va_list *ap)
4a5fcab7
AL
319{
320 QDict *dict = NULL;
9bada897 321 JSONToken *token, *peek;
4a5fcab7 322
65c0f1e9 323 token = parser_context_pop_token(ctxt);
9bada897 324 assert(token && token->type == JSON_LCURLY);
4a5fcab7
AL
325
326 dict = qdict_new();
327
65c0f1e9 328 peek = parser_context_peek_token(ctxt);
11e8a46c
AL
329 if (peek == NULL) {
330 parse_error(ctxt, NULL, "premature EOI");
331 goto out;
332 }
333
9bada897 334 if (peek->type != JSON_RCURLY) {
65c0f1e9 335 if (parse_pair(ctxt, dict, ap) == -1) {
4a5fcab7
AL
336 goto out;
337 }
338
65c0f1e9 339 token = parser_context_pop_token(ctxt);
11e8a46c
AL
340 if (token == NULL) {
341 parse_error(ctxt, NULL, "premature EOI");
342 goto out;
343 }
344
9bada897
PB
345 while (token->type != JSON_RCURLY) {
346 if (token->type != JSON_COMMA) {
4a5fcab7
AL
347 parse_error(ctxt, token, "expected separator in dict");
348 goto out;
349 }
4a5fcab7 350
65c0f1e9 351 if (parse_pair(ctxt, dict, ap) == -1) {
4a5fcab7
AL
352 goto out;
353 }
354
65c0f1e9 355 token = parser_context_pop_token(ctxt);
11e8a46c
AL
356 if (token == NULL) {
357 parse_error(ctxt, NULL, "premature EOI");
358 goto out;
359 }
4a5fcab7 360 }
4a5fcab7 361 } else {
a491af47 362 (void)parser_context_pop_token(ctxt);
4a5fcab7
AL
363 }
364
4a5fcab7
AL
365 return QOBJECT(dict);
366
367out:
4a5fcab7
AL
368 QDECREF(dict);
369 return NULL;
370}
371
65c0f1e9 372static QObject *parse_array(JSONParserContext *ctxt, va_list *ap)
4a5fcab7
AL
373{
374 QList *list = NULL;
9bada897 375 JSONToken *token, *peek;
4a5fcab7 376
65c0f1e9 377 token = parser_context_pop_token(ctxt);
9bada897 378 assert(token && token->type == JSON_LSQUARE);
4a5fcab7
AL
379
380 list = qlist_new();
381
65c0f1e9 382 peek = parser_context_peek_token(ctxt);
11e8a46c
AL
383 if (peek == NULL) {
384 parse_error(ctxt, NULL, "premature EOI");
385 goto out;
386 }
387
9bada897 388 if (peek->type != JSON_RSQUARE) {
4a5fcab7
AL
389 QObject *obj;
390
65c0f1e9 391 obj = parse_value(ctxt, ap);
4a5fcab7
AL
392 if (obj == NULL) {
393 parse_error(ctxt, token, "expecting value");
394 goto out;
395 }
396
397 qlist_append_obj(list, obj);
398
65c0f1e9 399 token = parser_context_pop_token(ctxt);
11e8a46c
AL
400 if (token == NULL) {
401 parse_error(ctxt, NULL, "premature EOI");
402 goto out;
403 }
404
9bada897
PB
405 while (token->type != JSON_RSQUARE) {
406 if (token->type != JSON_COMMA) {
4a5fcab7
AL
407 parse_error(ctxt, token, "expected separator in list");
408 goto out;
409 }
410
65c0f1e9 411 obj = parse_value(ctxt, ap);
4a5fcab7
AL
412 if (obj == NULL) {
413 parse_error(ctxt, token, "expecting value");
414 goto out;
415 }
416
417 qlist_append_obj(list, obj);
418
65c0f1e9 419 token = parser_context_pop_token(ctxt);
11e8a46c
AL
420 if (token == NULL) {
421 parse_error(ctxt, NULL, "premature EOI");
422 goto out;
423 }
4a5fcab7 424 }
4a5fcab7 425 } else {
a491af47 426 (void)parser_context_pop_token(ctxt);
4a5fcab7
AL
427 }
428
4a5fcab7
AL
429 return QOBJECT(list);
430
431out:
4a5fcab7
AL
432 QDECREF(list);
433 return NULL;
434}
435
65c0f1e9 436static QObject *parse_keyword(JSONParserContext *ctxt)
4a5fcab7 437{
9bada897 438 JSONToken *token;
4a5fcab7 439
65c0f1e9 440 token = parser_context_pop_token(ctxt);
9bada897 441 assert(token && token->type == JSON_KEYWORD);
50e2a467 442
9bada897 443 if (!strcmp(token->str, "true")) {
d538b255 444 return QOBJECT(qbool_from_bool(true));
9bada897 445 } else if (!strcmp(token->str, "false")) {
d538b255 446 return QOBJECT(qbool_from_bool(false));
9bada897 447 } else if (!strcmp(token->str, "null")) {
d538b255 448 return qnull();
4a5fcab7 449 }
9bada897 450 parse_error(ctxt, token, "invalid keyword '%s'", token->str);
4a5fcab7
AL
451 return NULL;
452}
453
65c0f1e9 454static QObject *parse_escape(JSONParserContext *ctxt, va_list *ap)
4a5fcab7 455{
9bada897 456 JSONToken *token;
4a5fcab7
AL
457
458 if (ap == NULL) {
d538b255 459 return NULL;
4a5fcab7
AL
460 }
461
65c0f1e9 462 token = parser_context_pop_token(ctxt);
9bada897 463 assert(token && token->type == JSON_ESCAPE);
6b9606f6 464
9bada897 465 if (!strcmp(token->str, "%p")) {
d538b255 466 return va_arg(*ap, QObject *);
9bada897 467 } else if (!strcmp(token->str, "%i")) {
d538b255 468 return QOBJECT(qbool_from_bool(va_arg(*ap, int)));
9bada897 469 } else if (!strcmp(token->str, "%d")) {
01b2ffce 470 return QOBJECT(qnum_from_int(va_arg(*ap, int)));
9bada897 471 } else if (!strcmp(token->str, "%ld")) {
01b2ffce 472 return QOBJECT(qnum_from_int(va_arg(*ap, long)));
9bada897
PB
473 } else if (!strcmp(token->str, "%lld") ||
474 !strcmp(token->str, "%I64d")) {
01b2ffce 475 return QOBJECT(qnum_from_int(va_arg(*ap, long long)));
2bc7cfea
MAL
476 } else if (!strcmp(token->str, "%u")) {
477 return QOBJECT(qnum_from_uint(va_arg(*ap, unsigned int)));
478 } else if (!strcmp(token->str, "%lu")) {
479 return QOBJECT(qnum_from_uint(va_arg(*ap, unsigned long)));
480 } else if (!strcmp(token->str, "%llu") ||
481 !strcmp(token->str, "%I64u")) {
482 return QOBJECT(qnum_from_uint(va_arg(*ap, unsigned long long)));
9bada897 483 } else if (!strcmp(token->str, "%s")) {
d538b255 484 return QOBJECT(qstring_from_str(va_arg(*ap, const char *)));
9bada897 485 } else if (!strcmp(token->str, "%f")) {
01b2ffce 486 return QOBJECT(qnum_from_double(va_arg(*ap, double)));
4a5fcab7 487 }
4a5fcab7
AL
488 return NULL;
489}
490
65c0f1e9 491static QObject *parse_literal(JSONParserContext *ctxt)
4a5fcab7 492{
9bada897 493 JSONToken *token;
4a5fcab7 494
65c0f1e9 495 token = parser_context_pop_token(ctxt);
d538b255 496 assert(token);
11e8a46c 497
9bada897 498 switch (token->type) {
4a5fcab7 499 case JSON_STRING:
d538b255 500 return QOBJECT(qstring_from_escaped_str(ctxt, token));
3d5b3ec6 501 case JSON_INTEGER: {
01b2ffce
MAL
502 /*
503 * Represent JSON_INTEGER as QNUM_I64 if possible, else as
2bc7cfea
MAL
504 * QNUM_U64, else as QNUM_DOUBLE. Note that qemu_strtoi64()
505 * and qemu_strtou64() fail with ERANGE when it's not
506 * possible.
3d5b3ec6 507 *
01b2ffce 508 * qnum_get_int() will then work for any signed 64-bit
2bc7cfea
MAL
509 * JSON_INTEGER, qnum_get_uint() for any unsigned 64-bit
510 * integer, and qnum_get_double() both for any JSON_INTEGER
511 * and any JSON_FLOAT (with precision loss for integers beyond
512 * 53 bits)
3d5b3ec6 513 */
2bc7cfea 514 int ret;
3d5b3ec6 515 int64_t value;
2bc7cfea 516 uint64_t uvalue;
3d5b3ec6 517
2bc7cfea
MAL
518 ret = qemu_strtoi64(token->str, NULL, 10, &value);
519 if (!ret) {
01b2ffce 520 return QOBJECT(qnum_from_int(value));
3d5b3ec6 521 }
2bc7cfea
MAL
522 assert(ret == -ERANGE);
523
524 if (token->str[0] != '-') {
525 ret = qemu_strtou64(token->str, NULL, 10, &uvalue);
526 if (!ret) {
527 return QOBJECT(qnum_from_uint(uvalue));
528 }
529 assert(ret == -ERANGE);
530 }
3d5b3ec6
MR
531 /* fall through to JSON_FLOAT */
532 }
4a5fcab7 533 case JSON_FLOAT:
6e8e5cb9
EB
534 /* FIXME dependent on locale; a pervasive issue in QEMU */
535 /* FIXME our lexer matches RFC 7159 in forbidding Inf or NaN,
536 * but those might be useful extensions beyond JSON */
01b2ffce 537 return QOBJECT(qnum_from_double(strtod(token->str, NULL)));
4a5fcab7 538 default:
d538b255 539 abort();
4a5fcab7 540 }
4a5fcab7
AL
541}
542
65c0f1e9 543static QObject *parse_value(JSONParserContext *ctxt, va_list *ap)
4a5fcab7 544{
9bada897 545 JSONToken *token;
4a5fcab7 546
d538b255
MA
547 token = parser_context_peek_token(ctxt);
548 if (token == NULL) {
549 parse_error(ctxt, NULL, "premature EOI");
550 return NULL;
4a5fcab7
AL
551 }
552
9bada897 553 switch (token->type) {
d538b255
MA
554 case JSON_LCURLY:
555 return parse_object(ctxt, ap);
556 case JSON_LSQUARE:
557 return parse_array(ctxt, ap);
558 case JSON_ESCAPE:
559 return parse_escape(ctxt, ap);
560 case JSON_INTEGER:
561 case JSON_FLOAT:
562 case JSON_STRING:
563 return parse_literal(ctxt);
564 case JSON_KEYWORD:
565 return parse_keyword(ctxt);
566 default:
567 parse_error(ctxt, token, "expecting value");
568 return NULL;
569 }
4a5fcab7
AL
570}
571
95385fe9 572QObject *json_parser_parse(GQueue *tokens, va_list *ap)
ef749d07
AL
573{
574 return json_parser_parse_err(tokens, ap, NULL);
575}
576
95385fe9 577QObject *json_parser_parse_err(GQueue *tokens, va_list *ap, Error **errp)
4a5fcab7 578{
65c0f1e9 579 JSONParserContext *ctxt = parser_context_new(tokens);
4a5fcab7
AL
580 QObject *result;
581
65c0f1e9 582 if (!ctxt) {
c1990ebf
MR
583 return NULL;
584 }
4a5fcab7 585
65c0f1e9
MR
586 result = parse_value(ctxt, ap);
587
588 error_propagate(errp, ctxt->err);
4a5fcab7 589
65c0f1e9 590 parser_context_free(ctxt);
ef749d07 591
4a5fcab7
AL
592 return result;
593}
This page took 0.566958 seconds and 4 git commands to generate.