2 * Copyright (c) 2009, 2010 Nicira Networks.
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at:
8 * http://www.apache.org/licenses/LICENSE-2.0
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
29 #include "dynamic-string.h"
35 /* The type of a JSON token. */
36 enum json_token_type
{
42 T_NAME_SEPARATOR
= ':',
43 T_VALUE_SEPARATOR
= ',',
44 T_FALSE
= UCHAR_MAX
+ 1,
54 * RFC 4627 doesn't define a lexical structure for JSON but I believe this to
55 * be compliant with the standard.
58 enum json_token_type type
;
61 long long int integer
;
67 JSON_LEX_START
, /* Not inside a token. */
68 JSON_LEX_NUMBER
, /* Reading a number. */
69 JSON_LEX_KEYWORD
, /* Reading a keyword. */
70 JSON_LEX_STRING
, /* Reading a quoted string. */
71 JSON_LEX_ESCAPE
/* In a quoted string just after a "\". */
74 enum json_parse_state
{
75 JSON_PARSE_START
, /* Beginning of input. */
76 JSON_PARSE_END
, /* End of input. */
79 JSON_PARSE_OBJECT_INIT
, /* Expecting '}' or an object name. */
80 JSON_PARSE_OBJECT_NAME
, /* Expecting an object name. */
81 JSON_PARSE_OBJECT_COLON
, /* Expecting ':'. */
82 JSON_PARSE_OBJECT_VALUE
, /* Expecting an object value. */
83 JSON_PARSE_OBJECT_NEXT
, /* Expecting ',' or '}'. */
86 JSON_PARSE_ARRAY_INIT
, /* Expecting ']' or a value. */
87 JSON_PARSE_ARRAY_VALUE
, /* Expecting a value. */
88 JSON_PARSE_ARRAY_NEXT
/* Expecting ',' or ']'. */
91 struct json_parser_node
{
99 /* Lexical analysis. */
100 enum json_lex_state lex_state
;
101 struct ds buffer
; /* Buffer for accumulating token text. */
107 enum json_parse_state parse_state
;
108 #define JSON_MAX_HEIGHT 1000
109 struct json_parser_node
*stack
;
110 size_t height
, allocated_height
;
115 char *error
; /* Error message, if any, null if none yet. */
118 static struct json
*json_create(enum json_type type
);
119 static void json_parser_input(struct json_parser
*, struct json_token
*);
121 static void json_error(struct json_parser
*p
, const char *format
, ...)
125 json_type_to_string(enum json_type type
)
156 /* Functions for manipulating struct json. */
159 json_null_create(void)
161 return json_create(JSON_NULL
);
165 json_boolean_create(bool b
)
167 return json_create(b
? JSON_TRUE
: JSON_FALSE
);
171 json_string_create_nocopy(char *s
)
173 struct json
*json
= json_create(JSON_STRING
);
179 json_string_create(const char *s
)
181 return json_string_create_nocopy(xstrdup(s
));
185 json_array_create_empty(void)
187 struct json
*json
= json_create(JSON_ARRAY
);
188 json
->u
.array
.elems
= NULL
;
190 json
->u
.array
.n_allocated
= 0;
195 json_array_add(struct json
*array_
, struct json
*element
)
197 struct json_array
*array
= json_array(array_
);
198 if (array
->n
>= array
->n_allocated
) {
199 array
->elems
= x2nrealloc(array
->elems
, &array
->n_allocated
,
200 sizeof *array
->elems
);
202 array
->elems
[array
->n
++] = element
;
206 json_array_trim(struct json
*array_
)
208 struct json_array
*array
= json_array(array_
);
209 if (array
->n
< array
->n_allocated
){
210 array
->n_allocated
= array
->n
;
211 array
->elems
= xrealloc(array
->elems
, array
->n
* sizeof *array
->elems
);
216 json_array_create(struct json
**elements
, size_t n
)
218 struct json
*json
= json_create(JSON_ARRAY
);
219 json
->u
.array
.elems
= elements
;
221 json
->u
.array
.n_allocated
= n
;
226 json_array_create_1(struct json
*elem0
)
228 struct json
**elems
= xmalloc(sizeof *elems
);
230 return json_array_create(elems
, 1);
234 json_array_create_2(struct json
*elem0
, struct json
*elem1
)
236 struct json
**elems
= xmalloc(2 * sizeof *elems
);
239 return json_array_create(elems
, 2);
243 json_array_create_3(struct json
*elem0
, struct json
*elem1
, struct json
*elem2
)
245 struct json
**elems
= xmalloc(3 * sizeof *elems
);
249 return json_array_create(elems
, 3);
253 json_object_create(void)
255 struct json
*json
= json_create(JSON_OBJECT
);
256 json
->u
.object
= xmalloc(sizeof *json
->u
.object
);
257 shash_init(json
->u
.object
);
262 json_integer_create(long long int integer
)
264 struct json
*json
= json_create(JSON_INTEGER
);
265 json
->u
.integer
= integer
;
270 json_real_create(double real
)
272 struct json
*json
= json_create(JSON_REAL
);
278 json_object_put(struct json
*json
, const char *name
, struct json
*value
)
280 json_destroy(shash_replace(json
->u
.object
, name
, value
));
284 json_object_put_string(struct json
*json
, const char *name
, const char *value
)
286 json_object_put(json
, name
, json_string_create(value
));
290 json_string(const struct json
*json
)
292 assert(json
->type
== JSON_STRING
);
293 return json
->u
.string
;
297 json_array(const struct json
*json
)
299 assert(json
->type
== JSON_ARRAY
);
300 return (struct json_array
*) &json
->u
.array
;
304 json_object(const struct json
*json
)
306 assert(json
->type
== JSON_OBJECT
);
307 return (struct shash
*) json
->u
.object
;
311 json_boolean(const struct json
*json
)
313 assert(json
->type
== JSON_TRUE
|| json
->type
== JSON_FALSE
);
314 return json
->type
== JSON_TRUE
;
318 json_real(const struct json
*json
)
320 assert(json
->type
== JSON_REAL
|| json
->type
== JSON_INTEGER
);
321 return json
->type
== JSON_REAL
? json
->u
.real
: json
->u
.integer
;
325 json_integer(const struct json
*json
)
327 assert(json
->type
== JSON_INTEGER
);
328 return json
->u
.integer
;
331 static void json_destroy_object(struct shash
*object
);
332 static void json_destroy_array(struct json_array
*array
);
334 /* Frees 'json' and everything it points to, recursively. */
336 json_destroy(struct json
*json
)
339 switch (json
->type
) {
341 json_destroy_object(json
->u
.object
);
345 json_destroy_array(&json
->u
.array
);
349 free(json
->u
.string
);
367 json_destroy_object(struct shash
*object
)
369 struct shash_node
*node
, *next
;
371 SHASH_FOR_EACH_SAFE (node
, next
, object
) {
372 struct json
*value
= node
->data
;
375 shash_delete(object
, node
);
377 shash_destroy(object
);
382 json_destroy_array(struct json_array
*array
)
386 for (i
= 0; i
< array
->n
; i
++) {
387 json_destroy(array
->elems
[i
]);
392 static struct json
*json_clone_object(const struct shash
*object
);
393 static struct json
*json_clone_array(const struct json_array
*array
);
395 /* Returns a deep copy of 'json'. */
397 json_clone(const struct json
*json
)
399 switch (json
->type
) {
401 return json_clone_object(json
->u
.object
);
404 return json_clone_array(&json
->u
.array
);
407 return json_string_create(json
->u
.string
);
412 return json_create(json
->type
);
415 return json_integer_create(json
->u
.integer
);
418 return json_real_create(json
->u
.real
);
427 json_clone_object(const struct shash
*object
)
429 struct shash_node
*node
;
432 json
= json_object_create();
433 SHASH_FOR_EACH (node
, object
) {
434 struct json
*value
= node
->data
;
435 json_object_put(json
, node
->name
, json_clone(value
));
441 json_clone_array(const struct json_array
*array
)
446 elems
= xmalloc(array
->n
* sizeof *elems
);
447 for (i
= 0; i
< array
->n
; i
++) {
448 elems
[i
] = json_clone(array
->elems
[i
]);
450 return json_array_create(elems
, array
->n
);
454 json_hash_object(const struct shash
*object
, size_t basis
)
456 const struct shash_node
**nodes
;
459 nodes
= shash_sort(object
);
460 n
= shash_count(object
);
461 for (i
= 0; i
< n
; i
++) {
462 const struct shash_node
*node
= nodes
[i
];
463 basis
= hash_string(node
->name
, basis
);
464 basis
= json_hash(node
->data
, basis
);
470 json_hash_array(const struct json_array
*array
, size_t basis
)
474 basis
= hash_int(array
->n
, basis
);
475 for (i
= 0; i
< array
->n
; i
++) {
476 basis
= json_hash(array
->elems
[i
], basis
);
482 json_hash(const struct json
*json
, size_t basis
)
484 switch (json
->type
) {
486 return json_hash_object(json
->u
.object
, basis
);
489 return json_hash_array(&json
->u
.array
, basis
);
492 return hash_string(json
->u
.string
, basis
);
497 return hash_int(json
->type
<< 8, basis
);
500 return hash_int(json
->u
.integer
, basis
);
503 return hash_double(json
->u
.real
, basis
);
512 json_equal_object(const struct shash
*a
, const struct shash
*b
)
514 struct shash_node
*a_node
;
516 if (shash_count(a
) != shash_count(b
)) {
520 SHASH_FOR_EACH (a_node
, a
) {
521 struct shash_node
*b_node
= shash_find(b
, a_node
->name
);
522 if (!b_node
|| !json_equal(a_node
->data
, b_node
->data
)) {
531 json_equal_array(const struct json_array
*a
, const struct json_array
*b
)
539 for (i
= 0; i
< a
->n
; i
++) {
540 if (!json_equal(a
->elems
[i
], b
->elems
[i
])) {
549 json_equal(const struct json
*a
, const struct json
*b
)
551 if (a
->type
!= b
->type
) {
557 return json_equal_object(a
->u
.object
, b
->u
.object
);
560 return json_equal_array(&a
->u
.array
, &b
->u
.array
);
563 return !strcmp(a
->u
.string
, b
->u
.string
);
571 return a
->u
.integer
== b
->u
.integer
;
574 return a
->u
.real
== b
->u
.real
;
582 /* Lexical analysis. */
585 json_lex_keyword(struct json_parser
*p
)
587 struct json_token token
;
590 s
= ds_cstr(&p
->buffer
);
591 if (!strcmp(s
, "false")) {
592 token
.type
= T_FALSE
;
593 } else if (!strcmp(s
, "true")) {
595 } else if (!strcmp(s
, "null")) {
598 json_error(p
, "invalid keyword '%s'", s
);
601 json_parser_input(p
, &token
);
605 json_lex_number(struct json_parser
*p
)
607 const char *cp
= ds_cstr(&p
->buffer
);
608 unsigned long long int significand
= 0;
609 struct json_token token
;
610 bool imprecise
= false;
611 bool negative
= false;
614 /* Leading minus sign. */
620 /* At least one integer digit, but 0 may not be used as a leading digit for
621 * a longer number. */
626 json_error(p
, "leading zeros not allowed");
629 } else if (isdigit(*cp
)) {
631 if (significand
<= ULLONG_MAX
/ 10) {
632 significand
= significand
* 10 + (*cp
- '0');
640 } while (isdigit(*cp
));
642 json_error(p
, "'-' must be followed by digit");
646 /* Optional fraction. */
650 json_error(p
, "decimal point must be followed by digit");
654 if (significand
<= ULLONG_MAX
/ 10) {
655 significand
= significand
* 10 + (*cp
- '0');
657 } else if (*cp
!= '0') {
661 } while (isdigit(*cp
));
664 /* Optional exponent. */
665 if (*cp
== 'e' || *cp
== 'E') {
666 bool negative_exponent
= false;
672 } else if (*cp
== '-') {
673 negative_exponent
= true;
678 json_error(p
, "exponent must contain at least one digit");
684 if (exponent
>= INT_MAX
/ 10) {
685 json_error(p
, "exponent outside valid range");
688 exponent
= exponent
* 10 + (*cp
- '0');
690 } while (isdigit(*cp
));
692 if (negative_exponent
) {
700 json_error(p
, "syntax error in number");
704 /* Figure out number.
706 * We suppress negative zeros as a matter of policy. */
708 struct json_token token
;
709 token
.type
= T_INTEGER
;
711 json_parser_input(p
, &token
);
716 while (pow10
> 0 && significand
< ULLONG_MAX
/ 10) {
720 while (pow10
< 0 && significand
% 10 == 0) {
725 && significand
<= (negative
726 ? (unsigned long long int) LLONG_MAX
+ 1
728 token
.type
= T_INTEGER
;
729 token
.u
.integer
= negative
? -significand
: significand
;
730 json_parser_input(p
, &token
);
736 if (!str_to_double(ds_cstr(&p
->buffer
), &token
.u
.real
)) {
737 json_error(p
, "number outside valid range");
740 /* Suppress negative zero. */
741 if (token
.u
.real
== 0) {
744 json_parser_input(p
, &token
);
748 json_lex_4hex(const char *cp
, const char *end
, int *valuep
)
753 return "quoted string ends within \\u escape";
757 for (i
= 0; i
< 4; i
++) {
758 unsigned char c
= *cp
++;
760 return "malformed \\u escape";
762 value
= (value
<< 4) | hexit_value(c
);
765 return "null bytes not supported in quoted strings";
772 json_lex_unicode(const char *cp
, const char *end
, struct ds
*out
)
777 error
= json_lex_4hex(cp
, end
, &c0
);
780 ds_put_cstr(out
, error
);
784 if (!uc_is_leading_surrogate(c0
)) {
785 ds_put_utf8(out
, c0
);
789 if (cp
+ 2 > end
|| *cp
++ != '\\' || *cp
++ != 'u') {
791 ds_put_cstr(out
, "malformed escaped surrogate pair");
795 error
= json_lex_4hex(cp
, end
, &c1
);
798 ds_put_cstr(out
, error
);
802 if (!uc_is_trailing_surrogate(c1
)) {
804 ds_put_cstr(out
, "second half of escaped surrogate pair is not "
805 "trailing surrogate");
809 ds_put_utf8(out
, utf16_decode_surrogate_pair(c0
, c1
));
814 json_string_unescape(const char *in
, size_t in_len
, char **outp
)
816 const char *end
= in
+ in_len
;
821 ds_reserve(&out
, in_len
);
822 if (in_len
> 0 && in
[in_len
- 1] == '\\') {
823 ds_put_cstr(&out
, "quoted string may not end with backslash");
829 ds_put_cstr(&out
, "quoted string may not include unescaped \"");
833 ds_put_char(&out
, *in
++);
839 case '"': case '\\': case '/':
840 ds_put_char(&out
, in
[-1]);
844 ds_put_char(&out
, '\b');
848 ds_put_char(&out
, '\f');
852 ds_put_char(&out
, '\n');
856 ds_put_char(&out
, '\r');
860 ds_put_char(&out
, '\t');
864 in
= json_lex_unicode(in
, end
, &out
);
872 ds_put_format(&out
, "bad escape \\%c", in
[-1]);
879 *outp
= ds_cstr(&out
);
884 json_parser_input_string(struct json_parser
*p
, const char *s
)
886 struct json_token token
;
888 token
.type
= T_STRING
;
890 json_parser_input(p
, &token
);
894 json_lex_string(struct json_parser
*p
)
896 const char *raw
= ds_cstr(&p
->buffer
);
897 if (!strchr(raw
, '\\')) {
898 json_parser_input_string(p
, raw
);
902 if (json_string_unescape(raw
, strlen(raw
), &cooked
)) {
903 json_parser_input_string(p
, cooked
);
905 json_error(p
, "%s", cooked
);
913 json_lex_input(struct json_parser
*p
, unsigned char c
)
915 struct json_token token
;
919 p
->column_number
= 0;
925 switch (p
->lex_state
) {
928 case ' ': case '\t': case '\n': case '\r':
932 case 'a': case 'b': case 'c': case 'd': case 'e':
933 case 'f': case 'g': case 'h': case 'i': case 'j':
934 case 'k': case 'l': case 'm': case 'n': case 'o':
935 case 'p': case 'q': case 'r': case 's': case 't':
936 case 'u': case 'v': case 'w': case 'x': case 'y':
938 p
->lex_state
= JSON_LEX_KEYWORD
;
941 case '[': case '{': case ']': case '}': case ':': case ',':
943 json_parser_input(p
, &token
);
947 case '0': case '1': case '2': case '3': case '4':
948 case '5': case '6': case '7': case '8': case '9':
949 p
->lex_state
= JSON_LEX_NUMBER
;
953 p
->lex_state
= JSON_LEX_STRING
;
958 json_error(p
, "invalid character '%c'", c
);
960 json_error(p
, "invalid character U+%04x", c
);
966 case JSON_LEX_KEYWORD
:
967 if (!isalpha((unsigned char) c
)) {
973 case JSON_LEX_NUMBER
:
974 if (!strchr(".0123456789eE-+", c
)) {
980 case JSON_LEX_STRING
:
982 p
->lex_state
= JSON_LEX_ESCAPE
;
983 } else if (c
== '"') {
986 } else if (c
< 0x20) {
987 json_error(p
, "U+%04X must be escaped in quoted string", c
);
992 case JSON_LEX_ESCAPE
:
993 p
->lex_state
= JSON_LEX_STRING
;
999 ds_put_char(&p
->buffer
, c
);
1005 /* Parses 'string' as a JSON object or array and returns a newly allocated
1006 * 'struct json'. The caller must free the returned structure with
1007 * json_destroy() when it is no longer needed.
1009 * 'string' must be encoded in UTF-8.
1011 * If 'string' is valid JSON, then the returned 'struct json' will be either an
1012 * object (JSON_OBJECT) or an array (JSON_ARRAY).
1014 * If 'string' is not valid JSON, then the returned 'struct json' will be a
1015 * string (JSON_STRING) that describes the particular error encountered during
1016 * parsing. (This is an acceptable means of error reporting because at its top
1017 * level JSON must be either an object or an array; a bare string is not
1020 json_from_string(const char *string
)
1022 struct json_parser
*p
= json_parser_create(JSPF_TRAILER
);
1023 json_parser_feed(p
, string
, strlen(string
));
1024 return json_parser_finish(p
);
1027 /* Reads the file named 'file_name', parses its contents as a JSON object or
1028 * array, and returns a newly allocated 'struct json'. The caller must free
1029 * the returned structure with json_destroy() when it is no longer needed.
1031 * The file must be encoded in UTF-8.
1033 * See json_from_string() for return value semantics.
1036 json_from_file(const char *file_name
)
1041 stream
= fopen(file_name
, "r");
1043 return json_string_create_nocopy(
1044 xasprintf("error opening \"%s\": %s", file_name
, strerror(errno
)));
1046 json
= json_from_stream(stream
);
1052 /* Parses the contents of 'stream' as a JSON object or array, and returns a
1053 * newly allocated 'struct json'. The caller must free the returned structure
1054 * with json_destroy() when it is no longer needed.
1056 * The file must be encoded in UTF-8.
1058 * See json_from_string() for return value semantics.
1061 json_from_stream(FILE *stream
)
1063 struct json_parser
*p
;
1066 p
= json_parser_create(JSPF_TRAILER
);
1068 char buffer
[BUFSIZ
];
1071 n
= fread(buffer
, 1, sizeof buffer
, stream
);
1072 if (!n
|| json_parser_feed(p
, buffer
, n
) != n
) {
1076 json
= json_parser_finish(p
);
1078 if (ferror(stream
)) {
1080 json
= json_string_create_nocopy(
1081 xasprintf("error reading JSON stream: %s", strerror(errno
)));
1087 struct json_parser
*
1088 json_parser_create(int flags
)
1090 struct json_parser
*p
= xzalloc(sizeof *p
);
1096 json_parser_feed(struct json_parser
*p
, const char *input
, size_t n
)
1099 for (i
= 0; !p
->done
&& i
< n
; ) {
1100 if (json_lex_input(p
, input
[i
])) {
1108 json_parser_is_done(const struct json_parser
*p
)
1114 json_parser_finish(struct json_parser
*p
)
1118 switch (p
->lex_state
) {
1119 case JSON_LEX_START
:
1122 case JSON_LEX_STRING
:
1123 case JSON_LEX_ESCAPE
:
1124 json_error(p
, "unexpected end of input in quoted string");
1127 case JSON_LEX_NUMBER
:
1128 case JSON_LEX_KEYWORD
:
1129 json_lex_input(p
, ' ');
1133 if (p
->parse_state
== JSON_PARSE_START
) {
1134 json_error(p
, "empty input stream");
1135 } else if (p
->parse_state
!= JSON_PARSE_END
) {
1136 json_error(p
, "unexpected end of input");
1140 assert(p
->height
== 1);
1141 assert(p
->stack
[0].json
!= NULL
);
1142 json
= p
->stack
[--p
->height
].json
;
1144 json
= json_string_create_nocopy(p
->error
);
1148 json_parser_abort(p
);
1154 json_parser_abort(struct json_parser
*p
)
1157 ds_destroy(&p
->buffer
);
1159 json_destroy(p
->stack
[0].json
);
1162 free(p
->member_name
);
1168 static struct json_parser_node
*
1169 json_parser_top(struct json_parser
*p
)
1171 return &p
->stack
[p
->height
- 1];
1175 json_parser_put_value(struct json_parser
*p
, struct json
*value
)
1177 struct json_parser_node
*node
= json_parser_top(p
);
1178 if (node
->json
->type
== JSON_OBJECT
) {
1179 json_object_put(node
->json
, p
->member_name
, value
);
1180 free(p
->member_name
);
1181 p
->member_name
= NULL
;
1182 } else if (node
->json
->type
== JSON_ARRAY
) {
1183 json_array_add(node
->json
, value
);
1189 static struct json_parser_node
*
1190 json_parser_push(struct json_parser
*p
,
1191 struct json
*new_json
, enum json_parse_state new_state
)
1193 if (p
->height
< JSON_MAX_HEIGHT
) {
1194 struct json_parser_node
*node
;
1196 if (p
->height
>= p
->allocated_height
) {
1197 p
->stack
= x2nrealloc(p
->stack
, &p
->allocated_height
,
1201 if (p
->height
> 0) {
1202 json_parser_put_value(p
, new_json
);
1205 node
= &p
->stack
[p
->height
++];
1206 node
->json
= new_json
;
1207 p
->parse_state
= new_state
;
1210 json_destroy(new_json
);
1211 json_error(p
, "input exceeds maximum nesting depth %d",
1218 json_parser_push_object(struct json_parser
*p
)
1220 json_parser_push(p
, json_object_create(), JSON_PARSE_OBJECT_INIT
);
1224 json_parser_push_array(struct json_parser
*p
)
1226 json_parser_push(p
, json_array_create_empty(), JSON_PARSE_ARRAY_INIT
);
1230 json_parse_value(struct json_parser
*p
, struct json_token
*token
,
1231 enum json_parse_state next_state
)
1235 switch (token
->type
) {
1237 value
= json_boolean_create(false);
1241 value
= json_null_create();
1245 value
= json_boolean_create(true);
1249 json_parser_push_object(p
);
1253 json_parser_push_array(p
);
1257 value
= json_integer_create(token
->u
.integer
);
1261 value
= json_real_create(token
->u
.real
);
1265 value
= json_string_create(token
->u
.string
);
1274 json_error(p
, "syntax error expecting value");
1278 json_parser_put_value(p
, value
);
1279 p
->parse_state
= next_state
;
1283 json_parser_pop(struct json_parser
*p
)
1285 struct json_parser_node
*node
;
1287 /* Conserve memory. */
1288 node
= json_parser_top(p
);
1289 if (node
->json
->type
== JSON_ARRAY
) {
1290 json_array_trim(node
->json
);
1293 /* Pop off the top-of-stack. */
1294 if (p
->height
== 1) {
1295 p
->parse_state
= JSON_PARSE_END
;
1296 if (!(p
->flags
& JSPF_TRAILER
)) {
1301 node
= json_parser_top(p
);
1302 if (node
->json
->type
== JSON_ARRAY
) {
1303 p
->parse_state
= JSON_PARSE_ARRAY_NEXT
;
1304 } else if (node
->json
->type
== JSON_OBJECT
) {
1305 p
->parse_state
= JSON_PARSE_OBJECT_NEXT
;
1313 json_parser_input(struct json_parser
*p
, struct json_token
*token
)
1315 switch (p
->parse_state
) {
1316 case JSON_PARSE_START
:
1317 if (token
->type
== '{') {
1318 json_parser_push_object(p
);
1319 } else if (token
->type
== '[') {
1320 json_parser_push_array(p
);
1322 json_error(p
, "syntax error at beginning of input");
1326 case JSON_PARSE_END
:
1327 json_error(p
, "trailing garbage at end of input");
1330 case JSON_PARSE_OBJECT_INIT
:
1331 if (token
->type
== '}') {
1336 case JSON_PARSE_OBJECT_NAME
:
1337 if (token
->type
== T_STRING
) {
1338 p
->member_name
= xstrdup(token
->u
.string
);
1339 p
->parse_state
= JSON_PARSE_OBJECT_COLON
;
1341 json_error(p
, "syntax error parsing object expecting string");
1345 case JSON_PARSE_OBJECT_COLON
:
1346 if (token
->type
== ':') {
1347 p
->parse_state
= JSON_PARSE_OBJECT_VALUE
;
1349 json_error(p
, "syntax error parsing object expecting ':'");
1353 case JSON_PARSE_OBJECT_VALUE
:
1354 json_parse_value(p
, token
, JSON_PARSE_OBJECT_NEXT
);
1357 case JSON_PARSE_OBJECT_NEXT
:
1358 if (token
->type
== ',') {
1359 p
->parse_state
= JSON_PARSE_OBJECT_NAME
;
1360 } else if (token
->type
== '}') {
1363 json_error(p
, "syntax error expecting '}' or ','");
1367 case JSON_PARSE_ARRAY_INIT
:
1368 if (token
->type
== ']') {
1373 case JSON_PARSE_ARRAY_VALUE
:
1374 json_parse_value(p
, token
, JSON_PARSE_ARRAY_NEXT
);
1377 case JSON_PARSE_ARRAY_NEXT
:
1378 if (token
->type
== ',') {
1379 p
->parse_state
= JSON_PARSE_ARRAY_VALUE
;
1380 } else if (token
->type
== ']') {
1383 json_error(p
, "syntax error expecting ']' or ','");
1391 p
->lex_state
= JSON_LEX_START
;
1392 ds_clear(&p
->buffer
);
1395 static struct json
*
1396 json_create(enum json_type type
)
1398 struct json
*json
= xmalloc(sizeof *json
);
1404 json_error(struct json_parser
*p
, const char *format
, ...)
1411 ds_put_format(&msg
, "line %d, column %d, byte %d: ",
1412 p
->line_number
, p
->column_number
, p
->byte_number
);
1413 va_start(args
, format
);
1414 ds_put_format_valist(&msg
, format
, args
);
1417 p
->error
= ds_steal_cstr(&msg
);
1423 #define SPACES_PER_LEVEL 2
1425 struct json_serializer
{
1431 static void json_serialize(const struct json
*, struct json_serializer
*);
1432 static void json_serialize_object(const struct shash
*object
,
1433 struct json_serializer
*);
1434 static void json_serialize_array(const struct json_array
*,
1435 struct json_serializer
*);
1436 static void json_serialize_string(const char *, struct ds
*);
1438 /* Converts 'json' to a string in JSON format, encoded in UTF-8, and returns
1439 * that string. The caller is responsible for freeing the returned string,
1440 * with free(), when it is no longer needed.
1442 * If 'flags' contains JSSF_PRETTY, the output is pretty-printed with each
1443 * nesting level introducing an additional indentation. Otherwise, the
1444 * returned string does not contain any new-line characters.
1446 * If 'flags' contains JSSF_SORT, members of objects in the output are sorted
1447 * in bytewise lexicographic order for reproducibility. Otherwise, members of
1448 * objects are output in an indeterminate order.
1450 * The returned string is valid JSON only if 'json' represents an array or an
1451 * object, since a bare literal does not satisfy the JSON grammar. */
1453 json_to_string(const struct json
*json
, int flags
)
1458 json_to_ds(json
, flags
, &ds
);
1459 return ds_steal_cstr(&ds
);
1462 /* Same as json_to_string(), but the output is appended to 'ds'. */
1464 json_to_ds(const struct json
*json
, int flags
, struct ds
*ds
)
1466 struct json_serializer s
;
1471 json_serialize(json
, &s
);
1475 json_serialize(const struct json
*json
, struct json_serializer
*s
)
1477 struct ds
*ds
= s
->ds
;
1479 switch (json
->type
) {
1481 ds_put_cstr(ds
, "null");
1485 ds_put_cstr(ds
, "false");
1489 ds_put_cstr(ds
, "true");
1493 json_serialize_object(json
->u
.object
, s
);
1497 json_serialize_array(&json
->u
.array
, s
);
1501 ds_put_format(ds
, "%lld", json
->u
.integer
);
1505 ds_put_format(ds
, "%.*g", DBL_DIG
, json
->u
.real
);
1509 json_serialize_string(json
->u
.string
, ds
);
1519 indent_line(struct json_serializer
*s
)
1521 if (s
->flags
& JSSF_PRETTY
) {
1522 ds_put_char(s
->ds
, '\n');
1523 ds_put_char_multiple(s
->ds
, ' ', SPACES_PER_LEVEL
* s
->depth
);
1528 json_serialize_object_member(size_t i
, const struct shash_node
*node
,
1529 struct json_serializer
*s
)
1531 struct ds
*ds
= s
->ds
;
1534 ds_put_char(ds
, ',');
1538 json_serialize_string(node
->name
, ds
);
1539 ds_put_char(ds
, ':');
1540 if (s
->flags
& JSSF_PRETTY
) {
1541 ds_put_char(ds
, ' ');
1543 json_serialize(node
->data
, s
);
1547 json_serialize_object(const struct shash
*object
, struct json_serializer
*s
)
1549 struct ds
*ds
= s
->ds
;
1551 ds_put_char(ds
, '{');
1556 if (s
->flags
& JSSF_SORT
) {
1557 const struct shash_node
**nodes
;
1560 nodes
= shash_sort(object
);
1561 n
= shash_count(object
);
1562 for (i
= 0; i
< n
; i
++) {
1563 json_serialize_object_member(i
, nodes
[i
], s
);
1567 struct shash_node
*node
;
1571 SHASH_FOR_EACH (node
, object
) {
1572 json_serialize_object_member(i
++, node
, s
);
1576 ds_put_char(ds
, '}');
1581 json_serialize_array(const struct json_array
*array
, struct json_serializer
*s
)
1583 struct ds
*ds
= s
->ds
;
1586 ds_put_char(ds
, '[');
1592 for (i
= 0; i
< array
->n
; i
++) {
1594 ds_put_char(ds
, ',');
1597 json_serialize(array
->elems
[i
], s
);
1602 ds_put_char(ds
, ']');
1606 json_serialize_string(const char *string
, struct ds
*ds
)
1610 ds_put_char(ds
, '"');
1611 while ((c
= *string
++) != '\0') {
1614 ds_put_cstr(ds
, "\\\"");
1618 ds_put_cstr(ds
, "\\\\");
1622 ds_put_cstr(ds
, "\\b");
1626 ds_put_cstr(ds
, "\\f");
1630 ds_put_cstr(ds
, "\\n");
1634 ds_put_cstr(ds
, "\\r");
1638 ds_put_cstr(ds
, "\\t");
1645 ds_put_format(ds
, "\\u%04x", c
);
1650 ds_put_char(ds
, '"');