linux-user: Merge pread/pwrite into pread64/pwrite64
[qemu/pbrook.git] / json-parser.c
blob457291b161ad464416833f25c6e2ce51b3252cec
1 /*
2 * JSON Parser
4 * Copyright IBM, Corp. 2009
6 * Authors:
7 * Anthony Liguori <aliguori@us.ibm.com>
9 * This work is licensed under the terms of the GNU LGPL, version 2.1 or later.
10 * See the COPYING.LIB file in the top-level directory.
#include <errno.h>
#include <stdarg.h>

#include "qemu-common.h"
#include "qstring.h"
#include "qint.h"
#include "qdict.h"
#include "qlist.h"
#include "qfloat.h"
#include "qbool.h"
#include "json-parser.h"
#include "json-lexer.h"
#include "qerror.h"
27 typedef struct JSONParserContext
29 Error *err;
30 struct {
31 QObject **buf;
32 size_t pos;
33 size_t count;
34 } tokens;
35 } JSONParserContext;
/* Assert that a condition which indicates a programming error is false. */
#define BUG_ON(cond) assert(!(cond))
/**
 * TODO
 *
 * 0) make errors meaningful again
 * 1) add geometry information to tokens
 * 3) should we return a parsed size?
 * 4) deal with premature EOI
 */
48 static QObject *parse_value(JSONParserContext *ctxt, va_list *ap);
/**
 * Token manipulators
 *
 * Tokens are dictionaries that contain a type, a string value, and geometry
 * information about a token identified by the lexer.  These are routines that
 * make working with these objects a bit easier.
 */
57 static const char *token_get_value(QObject *obj)
59 return qdict_get_str(qobject_to_qdict(obj), "token");
62 static JSONTokenType token_get_type(QObject *obj)
64 return qdict_get_int(qobject_to_qdict(obj), "type");
67 static int token_is_operator(QObject *obj, char op)
69 const char *val;
71 if (token_get_type(obj) != JSON_OPERATOR) {
72 return 0;
75 val = token_get_value(obj);
77 return (val[0] == op) && (val[1] == 0);
80 static int token_is_keyword(QObject *obj, const char *value)
82 if (token_get_type(obj) != JSON_KEYWORD) {
83 return 0;
86 return strcmp(token_get_value(obj), value) == 0;
89 static int token_is_escape(QObject *obj, const char *value)
91 if (token_get_type(obj) != JSON_ESCAPE) {
92 return 0;
95 return (strcmp(token_get_value(obj), value) == 0);
98 /**
99 * Error handler
101 static void GCC_FMT_ATTR(3, 4) parse_error(JSONParserContext *ctxt,
102 QObject *token, const char *msg, ...)
104 va_list ap;
105 char message[1024];
106 va_start(ap, msg);
107 vsnprintf(message, sizeof(message), msg, ap);
108 va_end(ap);
109 if (ctxt->err) {
110 error_free(ctxt->err);
111 ctxt->err = NULL;
113 error_set(&ctxt->err, QERR_JSON_PARSE_ERROR, message);
/**
 * String helpers
 *
 * These helpers are used to unescape strings.
 */

/**
 * wchar_to_utf8(): Encode one 16-bit code unit as a NUL-terminated
 * UTF-8 sequence.
 *
 * @wchar is written to @buffer as one, two or three bytes followed by a
 * terminating 0.  @buffer_length must be large enough for the sequence and
 * its terminator; this is enforced with BUG_ON().
 */
static void wchar_to_utf8(uint16_t wchar, char *buffer, size_t buffer_length)
{
    char *out = buffer;

    if (wchar > 0x07FF) {
        /* three-byte sequence: 1110xxxx 10xxxxxx 10xxxxxx */
        BUG_ON(buffer_length < 4);

        *out++ = 0xE0 | ((wchar >> 12) & 0x0F);
        *out++ = 0x80 | ((wchar >> 6) & 0x3F);
        *out++ = 0x80 | (wchar & 0x3F);
    } else if (wchar > 0x007F) {
        /* two-byte sequence: 110xxxxx 10xxxxxx */
        BUG_ON(buffer_length < 3);

        *out++ = 0xC0 | ((wchar >> 6) & 0x1F);
        *out++ = 0x80 | (wchar & 0x3F);
    } else {
        /* plain ASCII */
        BUG_ON(buffer_length < 2);

        *out++ = wchar & 0x7F;
    }

    *out = 0;
}
/**
 * hex2decimal(): Convert one hexadecimal digit to its numeric value.
 *
 * Accepts '0'-'9', 'a'-'f' and 'A'-'F'.  Returns the value 0..15, or -1
 * when @ch is not a hexadecimal digit.
 */
static int hex2decimal(char ch)
{
    int value = -1;

    if ('0' <= ch && ch <= '9') {
        value = ch - '0';
    } else if ('a' <= ch && ch <= 'f') {
        value = (ch - 'a') + 10;
    } else if ('A' <= ch && ch <= 'F') {
        value = (ch - 'A') + 10;
    }

    return value;
}
158 * parse_string(): Parse a json string and return a QObject
160 * string
161 * ""
162 * " chars "
163 * chars
164 * char
165 * char chars
166 * char
167 * any-Unicode-character-
168 * except-"-or-\-or-
169 * control-character
170 * \"
171 * \\
172 * \/
173 * \b
174 * \f
175 * \n
176 * \r
177 * \t
178 * \u four-hex-digits
180 static QString *qstring_from_escaped_str(JSONParserContext *ctxt, QObject *token)
182 const char *ptr = token_get_value(token);
183 QString *str;
184 int double_quote = 1;
186 if (*ptr == '"') {
187 double_quote = 1;
188 } else {
189 double_quote = 0;
191 ptr++;
193 str = qstring_new();
194 while (*ptr &&
195 ((double_quote && *ptr != '"') || (!double_quote && *ptr != '\''))) {
196 if (*ptr == '\\') {
197 ptr++;
199 switch (*ptr) {
200 case '"':
201 qstring_append(str, "\"");
202 ptr++;
203 break;
204 case '\'':
205 qstring_append(str, "'");
206 ptr++;
207 break;
208 case '\\':
209 qstring_append(str, "\\");
210 ptr++;
211 break;
212 case '/':
213 qstring_append(str, "/");
214 ptr++;
215 break;
216 case 'b':
217 qstring_append(str, "\b");
218 ptr++;
219 break;
220 case 'f':
221 qstring_append(str, "\f");
222 ptr++;
223 break;
224 case 'n':
225 qstring_append(str, "\n");
226 ptr++;
227 break;
228 case 'r':
229 qstring_append(str, "\r");
230 ptr++;
231 break;
232 case 't':
233 qstring_append(str, "\t");
234 ptr++;
235 break;
236 case 'u': {
237 uint16_t unicode_char = 0;
238 char utf8_char[4];
239 int i = 0;
241 ptr++;
243 for (i = 0; i < 4; i++) {
244 if (qemu_isxdigit(*ptr)) {
245 unicode_char |= hex2decimal(*ptr) << ((3 - i) * 4);
246 } else {
247 parse_error(ctxt, token,
248 "invalid hex escape sequence in string");
249 goto out;
251 ptr++;
254 wchar_to_utf8(unicode_char, utf8_char, sizeof(utf8_char));
255 qstring_append(str, utf8_char);
256 } break;
257 default:
258 parse_error(ctxt, token, "invalid escape sequence in string");
259 goto out;
261 } else {
262 char dummy[2];
264 dummy[0] = *ptr++;
265 dummy[1] = 0;
267 qstring_append(str, dummy);
271 return str;
273 out:
274 QDECREF(str);
275 return NULL;
278 static QObject *parser_context_pop_token(JSONParserContext *ctxt)
280 QObject *token;
281 g_assert(ctxt->tokens.pos < ctxt->tokens.count);
282 token = ctxt->tokens.buf[ctxt->tokens.pos];
283 ctxt->tokens.pos++;
284 return token;
287 /* Note: parser_context_{peek|pop}_token do not increment the
288 * token object's refcount. In both cases the references will continue
289 * to be tracked and cleaned up in parser_context_free(), so do not
290 * attempt to free the token object.
292 static QObject *parser_context_peek_token(JSONParserContext *ctxt)
294 QObject *token;
295 g_assert(ctxt->tokens.pos < ctxt->tokens.count);
296 token = ctxt->tokens.buf[ctxt->tokens.pos];
297 return token;
300 static JSONParserContext parser_context_save(JSONParserContext *ctxt)
302 JSONParserContext saved_ctxt = {0};
303 saved_ctxt.tokens.pos = ctxt->tokens.pos;
304 saved_ctxt.tokens.count = ctxt->tokens.count;
305 saved_ctxt.tokens.buf = ctxt->tokens.buf;
306 return saved_ctxt;
309 static void parser_context_restore(JSONParserContext *ctxt,
310 JSONParserContext saved_ctxt)
312 ctxt->tokens.pos = saved_ctxt.tokens.pos;
313 ctxt->tokens.count = saved_ctxt.tokens.count;
314 ctxt->tokens.buf = saved_ctxt.tokens.buf;
317 static void tokens_append_from_iter(QObject *obj, void *opaque)
319 JSONParserContext *ctxt = opaque;
320 g_assert(ctxt->tokens.pos < ctxt->tokens.count);
321 ctxt->tokens.buf[ctxt->tokens.pos++] = obj;
322 qobject_incref(obj);
325 static JSONParserContext *parser_context_new(QList *tokens)
327 JSONParserContext *ctxt;
328 size_t count;
330 if (!tokens) {
331 return NULL;
334 count = qlist_size(tokens);
335 if (count == 0) {
336 return NULL;
339 ctxt = g_malloc0(sizeof(JSONParserContext));
340 ctxt->tokens.pos = 0;
341 ctxt->tokens.count = count;
342 ctxt->tokens.buf = g_malloc(count * sizeof(QObject *));
343 qlist_iter(tokens, tokens_append_from_iter, ctxt);
344 ctxt->tokens.pos = 0;
346 return ctxt;
349 /* to support error propagation, ctxt->err must be freed separately */
350 static void parser_context_free(JSONParserContext *ctxt)
352 int i;
353 if (ctxt) {
354 for (i = 0; i < ctxt->tokens.count; i++) {
355 qobject_decref(ctxt->tokens.buf[i]);
357 g_free(ctxt->tokens.buf);
358 g_free(ctxt);
363 * Parsing rules
365 static int parse_pair(JSONParserContext *ctxt, QDict *dict, va_list *ap)
367 QObject *key = NULL, *token = NULL, *value, *peek;
368 JSONParserContext saved_ctxt = parser_context_save(ctxt);
370 peek = parser_context_peek_token(ctxt);
371 if (peek == NULL) {
372 parse_error(ctxt, NULL, "premature EOI");
373 goto out;
376 key = parse_value(ctxt, ap);
377 if (!key || qobject_type(key) != QTYPE_QSTRING) {
378 parse_error(ctxt, peek, "key is not a string in object");
379 goto out;
382 token = parser_context_pop_token(ctxt);
383 if (token == NULL) {
384 parse_error(ctxt, NULL, "premature EOI");
385 goto out;
388 if (!token_is_operator(token, ':')) {
389 parse_error(ctxt, token, "missing : in object pair");
390 goto out;
393 value = parse_value(ctxt, ap);
394 if (value == NULL) {
395 parse_error(ctxt, token, "Missing value in dict");
396 goto out;
399 qdict_put_obj(dict, qstring_get_str(qobject_to_qstring(key)), value);
401 qobject_decref(key);
403 return 0;
405 out:
406 parser_context_restore(ctxt, saved_ctxt);
407 qobject_decref(key);
409 return -1;
412 static QObject *parse_object(JSONParserContext *ctxt, va_list *ap)
414 QDict *dict = NULL;
415 QObject *token, *peek;
416 JSONParserContext saved_ctxt = parser_context_save(ctxt);
418 token = parser_context_pop_token(ctxt);
419 if (token == NULL) {
420 goto out;
423 if (!token_is_operator(token, '{')) {
424 goto out;
426 token = NULL;
428 dict = qdict_new();
430 peek = parser_context_peek_token(ctxt);
431 if (peek == NULL) {
432 parse_error(ctxt, NULL, "premature EOI");
433 goto out;
436 if (!token_is_operator(peek, '}')) {
437 if (parse_pair(ctxt, dict, ap) == -1) {
438 goto out;
441 token = parser_context_pop_token(ctxt);
442 if (token == NULL) {
443 parse_error(ctxt, NULL, "premature EOI");
444 goto out;
447 while (!token_is_operator(token, '}')) {
448 if (!token_is_operator(token, ',')) {
449 parse_error(ctxt, token, "expected separator in dict");
450 goto out;
452 token = NULL;
454 if (parse_pair(ctxt, dict, ap) == -1) {
455 goto out;
458 token = parser_context_pop_token(ctxt);
459 if (token == NULL) {
460 parse_error(ctxt, NULL, "premature EOI");
461 goto out;
464 token = NULL;
465 } else {
466 token = parser_context_pop_token(ctxt);
467 token = NULL;
470 return QOBJECT(dict);
472 out:
473 parser_context_restore(ctxt, saved_ctxt);
474 QDECREF(dict);
475 return NULL;
478 static QObject *parse_array(JSONParserContext *ctxt, va_list *ap)
480 QList *list = NULL;
481 QObject *token, *peek;
482 JSONParserContext saved_ctxt = parser_context_save(ctxt);
484 token = parser_context_pop_token(ctxt);
485 if (token == NULL) {
486 goto out;
489 if (!token_is_operator(token, '[')) {
490 token = NULL;
491 goto out;
493 token = NULL;
495 list = qlist_new();
497 peek = parser_context_peek_token(ctxt);
498 if (peek == NULL) {
499 parse_error(ctxt, NULL, "premature EOI");
500 goto out;
503 if (!token_is_operator(peek, ']')) {
504 QObject *obj;
506 obj = parse_value(ctxt, ap);
507 if (obj == NULL) {
508 parse_error(ctxt, token, "expecting value");
509 goto out;
512 qlist_append_obj(list, obj);
514 token = parser_context_pop_token(ctxt);
515 if (token == NULL) {
516 parse_error(ctxt, NULL, "premature EOI");
517 goto out;
520 while (!token_is_operator(token, ']')) {
521 if (!token_is_operator(token, ',')) {
522 parse_error(ctxt, token, "expected separator in list");
523 goto out;
526 token = NULL;
528 obj = parse_value(ctxt, ap);
529 if (obj == NULL) {
530 parse_error(ctxt, token, "expecting value");
531 goto out;
534 qlist_append_obj(list, obj);
536 token = parser_context_pop_token(ctxt);
537 if (token == NULL) {
538 parse_error(ctxt, NULL, "premature EOI");
539 goto out;
543 token = NULL;
544 } else {
545 token = parser_context_pop_token(ctxt);
546 token = NULL;
549 return QOBJECT(list);
551 out:
552 parser_context_restore(ctxt, saved_ctxt);
553 QDECREF(list);
554 return NULL;
557 static QObject *parse_keyword(JSONParserContext *ctxt)
559 QObject *token, *ret;
560 JSONParserContext saved_ctxt = parser_context_save(ctxt);
562 token = parser_context_pop_token(ctxt);
563 if (token == NULL) {
564 goto out;
567 if (token_get_type(token) != JSON_KEYWORD) {
568 goto out;
571 if (token_is_keyword(token, "true")) {
572 ret = QOBJECT(qbool_from_int(true));
573 } else if (token_is_keyword(token, "false")) {
574 ret = QOBJECT(qbool_from_int(false));
575 } else {
576 parse_error(ctxt, token, "invalid keyword `%s'", token_get_value(token));
577 goto out;
580 return ret;
582 out:
583 parser_context_restore(ctxt, saved_ctxt);
585 return NULL;
588 static QObject *parse_escape(JSONParserContext *ctxt, va_list *ap)
590 QObject *token = NULL, *obj;
591 JSONParserContext saved_ctxt = parser_context_save(ctxt);
593 if (ap == NULL) {
594 goto out;
597 token = parser_context_pop_token(ctxt);
598 if (token == NULL) {
599 goto out;
602 if (token_is_escape(token, "%p")) {
603 obj = va_arg(*ap, QObject *);
604 } else if (token_is_escape(token, "%i")) {
605 obj = QOBJECT(qbool_from_int(va_arg(*ap, int)));
606 } else if (token_is_escape(token, "%d")) {
607 obj = QOBJECT(qint_from_int(va_arg(*ap, int)));
608 } else if (token_is_escape(token, "%ld")) {
609 obj = QOBJECT(qint_from_int(va_arg(*ap, long)));
610 } else if (token_is_escape(token, "%lld") ||
611 token_is_escape(token, "%I64d")) {
612 obj = QOBJECT(qint_from_int(va_arg(*ap, long long)));
613 } else if (token_is_escape(token, "%s")) {
614 obj = QOBJECT(qstring_from_str(va_arg(*ap, const char *)));
615 } else if (token_is_escape(token, "%f")) {
616 obj = QOBJECT(qfloat_from_double(va_arg(*ap, double)));
617 } else {
618 goto out;
621 return obj;
623 out:
624 parser_context_restore(ctxt, saved_ctxt);
626 return NULL;
629 static QObject *parse_literal(JSONParserContext *ctxt)
631 QObject *token, *obj;
632 JSONParserContext saved_ctxt = parser_context_save(ctxt);
634 token = parser_context_pop_token(ctxt);
635 if (token == NULL) {
636 goto out;
639 switch (token_get_type(token)) {
640 case JSON_STRING:
641 obj = QOBJECT(qstring_from_escaped_str(ctxt, token));
642 break;
643 case JSON_INTEGER:
644 obj = QOBJECT(qint_from_int(strtoll(token_get_value(token), NULL, 10)));
645 break;
646 case JSON_FLOAT:
647 /* FIXME dependent on locale */
648 obj = QOBJECT(qfloat_from_double(strtod(token_get_value(token), NULL)));
649 break;
650 default:
651 goto out;
654 return obj;
656 out:
657 parser_context_restore(ctxt, saved_ctxt);
659 return NULL;
662 static QObject *parse_value(JSONParserContext *ctxt, va_list *ap)
664 QObject *obj;
666 obj = parse_object(ctxt, ap);
667 if (obj == NULL) {
668 obj = parse_array(ctxt, ap);
670 if (obj == NULL) {
671 obj = parse_escape(ctxt, ap);
673 if (obj == NULL) {
674 obj = parse_keyword(ctxt);
676 if (obj == NULL) {
677 obj = parse_literal(ctxt);
680 return obj;
683 QObject *json_parser_parse(QList *tokens, va_list *ap)
685 return json_parser_parse_err(tokens, ap, NULL);
688 QObject *json_parser_parse_err(QList *tokens, va_list *ap, Error **errp)
690 JSONParserContext *ctxt = parser_context_new(tokens);
691 QObject *result;
693 if (!ctxt) {
694 return NULL;
697 result = parse_value(ctxt, ap);
699 error_propagate(errp, ctxt->err);
701 parser_context_free(ctxt);
703 return result;