load.c 24 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054
  1. /*
  2. * Copyright (c) 2009-2012 Petri Lehtinen <petri@digip.org>
  3. *
  4. * Jansson is free software; you can redistribute it and/or modify
  5. * it under the terms of the MIT license. See LICENSE for details.
  6. */
  7. #define _GNU_SOURCE
  8. #include <errno.h>
  9. #include <limits.h>
  10. #include <stdio.h>
  11. #include <stdlib.h>
  12. #include <string.h>
  13. #include <assert.h>
  14. #include "jansson.h"
  15. #include "jansson_private.h"
  16. #include "strbuffer.h"
  17. #include "utf.h"
  18. #define STREAM_STATE_OK 0
  19. #define STREAM_STATE_EOF -1
  20. #define STREAM_STATE_ERROR -2
  21. #define TOKEN_INVALID -1
  22. #define TOKEN_EOF 0
  23. #define TOKEN_STRING 256
  24. #define TOKEN_INTEGER 257
  25. #define TOKEN_REAL 258
  26. #define TOKEN_TRUE 259
  27. #define TOKEN_FALSE 260
  28. #define TOKEN_NULL 261
  29. /* Locale independent versions of isxxx() functions */
  30. #define l_isupper(c) ('A' <= (c) && (c) <= 'Z')
  31. #define l_islower(c) ('a' <= (c) && (c) <= 'z')
  32. #define l_isalpha(c) (l_isupper(c) || l_islower(c))
  33. #define l_isdigit(c) ('0' <= (c) && (c) <= '9')
  34. #define l_isxdigit(c) \
  35. (l_isdigit(c) || 'A' <= (c) || (c) <= 'F' || 'a' <= (c) || (c) <= 'f')
  36. /* Read one byte from stream, convert to unsigned char, then int, and
  37. return. return EOF on end of file. This corresponds to the
  38. behaviour of fgetc(). */
  39. typedef int (*get_func)(void *data);
  40. typedef struct {
  41. get_func get;
  42. void *data;
  43. char buffer[5];
  44. size_t buffer_pos;
  45. int state;
  46. int line;
  47. int column, last_column;
  48. size_t position;
  49. } stream_t;
  50. typedef struct {
  51. stream_t stream;
  52. strbuffer_t saved_text;
  53. int token;
  54. union {
  55. char *string;
  56. json_int_t integer;
  57. double real;
  58. } value;
  59. } lex_t;
  60. #define stream_to_lex(stream) container_of(stream, lex_t, stream)
  61. /*** error reporting ***/
  62. static void error_set(json_error_t *error, const lex_t *lex,
  63. const char *msg, ...)
  64. {
  65. va_list ap;
  66. char msg_text[JSON_ERROR_TEXT_LENGTH];
  67. char msg_with_context[JSON_ERROR_TEXT_LENGTH];
  68. int line = -1, col = -1;
  69. size_t pos = 0;
  70. const char *result = msg_text;
  71. if(!error)
  72. return;
  73. va_start(ap, msg);
  74. vsnprintf(msg_text, JSON_ERROR_TEXT_LENGTH, msg, ap);
  75. msg_text[JSON_ERROR_TEXT_LENGTH - 1] = '\0';
  76. va_end(ap);
  77. if(lex)
  78. {
  79. const char *saved_text = strbuffer_value(&lex->saved_text);
  80. line = lex->stream.line;
  81. col = lex->stream.column;
  82. pos = lex->stream.position;
  83. if(saved_text && saved_text[0])
  84. {
  85. if(lex->saved_text.length <= 20) {
  86. snprintf(msg_with_context, JSON_ERROR_TEXT_LENGTH,
  87. "%s near '%s'", msg_text, saved_text);
  88. msg_with_context[JSON_ERROR_TEXT_LENGTH - 1] = '\0';
  89. result = msg_with_context;
  90. }
  91. }
  92. else
  93. {
  94. if(lex->stream.state == STREAM_STATE_ERROR) {
  95. /* No context for UTF-8 decoding errors */
  96. result = msg_text;
  97. }
  98. else {
  99. snprintf(msg_with_context, JSON_ERROR_TEXT_LENGTH,
  100. "%s near end of file", msg_text);
  101. msg_with_context[JSON_ERROR_TEXT_LENGTH - 1] = '\0';
  102. result = msg_with_context;
  103. }
  104. }
  105. }
  106. jsonp_error_set(error, line, col, pos, "%s", result);
  107. }
  108. /*** lexical analyzer ***/
  109. static void
  110. stream_init(stream_t *stream, get_func get, void *data)
  111. {
  112. stream->get = get;
  113. stream->data = data;
  114. stream->buffer[0] = '\0';
  115. stream->buffer_pos = 0;
  116. stream->state = STREAM_STATE_OK;
  117. stream->line = 1;
  118. stream->column = 0;
  119. stream->position = 0;
  120. }
  121. static int stream_get(stream_t *stream, json_error_t *error)
  122. {
  123. int c;
  124. if(stream->state != STREAM_STATE_OK)
  125. return stream->state;
  126. if(!stream->buffer[stream->buffer_pos])
  127. {
  128. c = stream->get(stream->data);
  129. if(c == EOF) {
  130. stream->state = STREAM_STATE_EOF;
  131. return STREAM_STATE_EOF;
  132. }
  133. stream->buffer[0] = c;
  134. stream->buffer_pos = 0;
  135. if(0x80 <= c && c <= 0xFF)
  136. {
  137. /* multi-byte UTF-8 sequence */
  138. int i, count;
  139. count = utf8_check_first(c);
  140. if(!count)
  141. goto out;
  142. assert(count >= 2);
  143. for(i = 1; i < count; i++)
  144. stream->buffer[i] = stream->get(stream->data);
  145. if(!utf8_check_full(stream->buffer, count, NULL))
  146. goto out;
  147. stream->buffer[count] = '\0';
  148. }
  149. else
  150. stream->buffer[1] = '\0';
  151. }
  152. c = stream->buffer[stream->buffer_pos++];
  153. stream->position++;
  154. if(c == '\n') {
  155. stream->line++;
  156. stream->last_column = stream->column;
  157. stream->column = 0;
  158. }
  159. else if(utf8_check_first(c)) {
  160. /* track the Unicode character column, so increment only if
  161. this is the first character of a UTF-8 sequence */
  162. stream->column++;
  163. }
  164. return c;
  165. out:
  166. stream->state = STREAM_STATE_ERROR;
  167. error_set(error, stream_to_lex(stream), "unable to decode byte 0x%x", c);
  168. return STREAM_STATE_ERROR;
  169. }
  170. static void stream_unget(stream_t *stream, int c)
  171. {
  172. if(c == STREAM_STATE_EOF || c == STREAM_STATE_ERROR)
  173. return;
  174. stream->position--;
  175. if(c == '\n') {
  176. stream->line--;
  177. stream->column = stream->last_column;
  178. }
  179. else if(utf8_check_first(c))
  180. stream->column--;
  181. assert(stream->buffer_pos > 0);
  182. stream->buffer_pos--;
  183. assert(stream->buffer[stream->buffer_pos] == c);
  184. }
  185. static int lex_get(lex_t *lex, json_error_t *error)
  186. {
  187. return stream_get(&lex->stream, error);
  188. }
  189. static void lex_save(lex_t *lex, int c)
  190. {
  191. strbuffer_append_byte(&lex->saved_text, c);
  192. }
  193. static int lex_get_save(lex_t *lex, json_error_t *error)
  194. {
  195. int c = stream_get(&lex->stream, error);
  196. if(c != STREAM_STATE_EOF && c != STREAM_STATE_ERROR)
  197. lex_save(lex, c);
  198. return c;
  199. }
  200. static void lex_unget(lex_t *lex, int c)
  201. {
  202. stream_unget(&lex->stream, c);
  203. }
  204. static void lex_unget_unsave(lex_t *lex, int c)
  205. {
  206. if(c != STREAM_STATE_EOF && c != STREAM_STATE_ERROR) {
  207. char d;
  208. stream_unget(&lex->stream, c);
  209. d = strbuffer_pop(&lex->saved_text);
  210. assert(c == d);
  211. }
  212. }
  213. static void lex_save_cached(lex_t *lex)
  214. {
  215. while(lex->stream.buffer[lex->stream.buffer_pos] != '\0')
  216. {
  217. lex_save(lex, lex->stream.buffer[lex->stream.buffer_pos]);
  218. lex->stream.buffer_pos++;
  219. lex->stream.position++;
  220. }
  221. }
  222. /* assumes that str points to 'u' plus at least 4 valid hex digits */
  223. static int32_t decode_unicode_escape(const char *str)
  224. {
  225. int i;
  226. int32_t value = 0;
  227. assert(str[0] == 'u');
  228. for(i = 1; i <= 4; i++) {
  229. char c = str[i];
  230. value <<= 4;
  231. if(l_isdigit(c))
  232. value += c - '0';
  233. else if(l_islower(c))
  234. value += c - 'a' + 10;
  235. else if(l_isupper(c))
  236. value += c - 'A' + 10;
  237. else
  238. assert(0);
  239. }
  240. return value;
  241. }
  242. static void lex_scan_string(lex_t *lex, json_error_t *error)
  243. {
  244. int c;
  245. const char *p;
  246. char *t;
  247. int i;
  248. lex->value.string = NULL;
  249. lex->token = TOKEN_INVALID;
  250. c = lex_get_save(lex, error);
  251. while(c != '"') {
  252. if(c == STREAM_STATE_ERROR)
  253. goto out;
  254. else if(c == STREAM_STATE_EOF) {
  255. error_set(error, lex, "premature end of input");
  256. goto out;
  257. }
  258. else if(0 <= c && c <= 0x1F) {
  259. /* control character */
  260. lex_unget_unsave(lex, c);
  261. if(c == '\n')
  262. error_set(error, lex, "unexpected newline", c);
  263. else
  264. error_set(error, lex, "control character 0x%x", c);
  265. goto out;
  266. }
  267. else if(c == '\\') {
  268. c = lex_get_save(lex, error);
  269. if(c == 'u') {
  270. c = lex_get_save(lex, error);
  271. for(i = 0; i < 4; i++) {
  272. if(!l_isxdigit(c)) {
  273. error_set(error, lex, "invalid escape");
  274. goto out;
  275. }
  276. c = lex_get_save(lex, error);
  277. }
  278. }
  279. else if(c == '"' || c == '\\' || c == '/' || c == 'b' ||
  280. c == 'f' || c == 'n' || c == 'r' || c == 't')
  281. c = lex_get_save(lex, error);
  282. else {
  283. error_set(error, lex, "invalid escape");
  284. goto out;
  285. }
  286. }
  287. else
  288. c = lex_get_save(lex, error);
  289. }
  290. /* the actual value is at most of the same length as the source
  291. string, because:
  292. - shortcut escapes (e.g. "\t") (length 2) are converted to 1 byte
  293. - a single \uXXXX escape (length 6) is converted to at most 3 bytes
  294. - two \uXXXX escapes (length 12) forming an UTF-16 surrogate pair
  295. are converted to 4 bytes
  296. */
  297. lex->value.string = jsonp_malloc(lex->saved_text.length + 1);
  298. if(!lex->value.string) {
  299. /* this is not very nice, since TOKEN_INVALID is returned */
  300. goto out;
  301. }
  302. /* the target */
  303. t = lex->value.string;
  304. /* + 1 to skip the " */
  305. p = strbuffer_value(&lex->saved_text) + 1;
  306. while(*p != '"') {
  307. if(*p == '\\') {
  308. p++;
  309. if(*p == 'u') {
  310. char buffer[4];
  311. int length;
  312. int32_t value;
  313. value = decode_unicode_escape(p);
  314. p += 5;
  315. if(0xD800 <= value && value <= 0xDBFF) {
  316. /* surrogate pair */
  317. if(*p == '\\' && *(p + 1) == 'u') {
  318. int32_t value2 = decode_unicode_escape(++p);
  319. p += 5;
  320. if(0xDC00 <= value2 && value2 <= 0xDFFF) {
  321. /* valid second surrogate */
  322. value =
  323. ((value - 0xD800) << 10) +
  324. (value2 - 0xDC00) +
  325. 0x10000;
  326. }
  327. else {
  328. /* invalid second surrogate */
  329. error_set(error, lex,
  330. "invalid Unicode '\\u%04X\\u%04X'",
  331. value, value2);
  332. goto out;
  333. }
  334. }
  335. else {
  336. /* no second surrogate */
  337. error_set(error, lex, "invalid Unicode '\\u%04X'",
  338. value);
  339. goto out;
  340. }
  341. }
  342. else if(0xDC00 <= value && value <= 0xDFFF) {
  343. error_set(error, lex, "invalid Unicode '\\u%04X'", value);
  344. goto out;
  345. }
  346. else if(value == 0)
  347. {
  348. error_set(error, lex, "\\u0000 is not allowed");
  349. goto out;
  350. }
  351. if(utf8_encode(value, buffer, &length))
  352. assert(0);
  353. memcpy(t, buffer, length);
  354. t += length;
  355. }
  356. else {
  357. switch(*p) {
  358. case '"': case '\\': case '/':
  359. *t = *p; break;
  360. case 'b': *t = '\b'; break;
  361. case 'f': *t = '\f'; break;
  362. case 'n': *t = '\n'; break;
  363. case 'r': *t = '\r'; break;
  364. case 't': *t = '\t'; break;
  365. default: assert(0);
  366. }
  367. t++;
  368. p++;
  369. }
  370. }
  371. else
  372. *(t++) = *(p++);
  373. }
  374. *t = '\0';
  375. lex->token = TOKEN_STRING;
  376. return;
  377. out:
  378. jsonp_free(lex->value.string);
  379. }
  380. #if JSON_INTEGER_IS_LONG_LONG
  381. #ifdef _MSC_VER // Microsoft Visual Studio
  382. #define json_strtoint _strtoi64
  383. #else
  384. #define json_strtoint strtoll
  385. #endif
  386. #else
  387. #define json_strtoint strtol
  388. #endif
  389. static int lex_scan_number(lex_t *lex, int c, json_error_t *error)
  390. {
  391. const char *saved_text;
  392. char *end;
  393. double value;
  394. lex->token = TOKEN_INVALID;
  395. if(c == '-')
  396. c = lex_get_save(lex, error);
  397. if(c == '0') {
  398. c = lex_get_save(lex, error);
  399. if(l_isdigit(c)) {
  400. lex_unget_unsave(lex, c);
  401. goto out;
  402. }
  403. }
  404. else if(l_isdigit(c)) {
  405. c = lex_get_save(lex, error);
  406. while(l_isdigit(c))
  407. c = lex_get_save(lex, error);
  408. }
  409. else {
  410. lex_unget_unsave(lex, c);
  411. goto out;
  412. }
  413. if(c != '.' && c != 'E' && c != 'e') {
  414. json_int_t value;
  415. lex_unget_unsave(lex, c);
  416. saved_text = strbuffer_value(&lex->saved_text);
  417. errno = 0;
  418. value = json_strtoint(saved_text, &end, 10);
  419. if(errno == ERANGE) {
  420. if(value < 0)
  421. error_set(error, lex, "too big negative integer");
  422. else
  423. error_set(error, lex, "too big integer");
  424. goto out;
  425. }
  426. assert(end == saved_text + lex->saved_text.length);
  427. lex->token = TOKEN_INTEGER;
  428. lex->value.integer = value;
  429. return 0;
  430. }
  431. if(c == '.') {
  432. c = lex_get(lex, error);
  433. if(!l_isdigit(c)) {
  434. lex_unget(lex, c);
  435. goto out;
  436. }
  437. lex_save(lex, c);
  438. c = lex_get_save(lex, error);
  439. while(l_isdigit(c))
  440. c = lex_get_save(lex, error);
  441. }
  442. if(c == 'E' || c == 'e') {
  443. c = lex_get_save(lex, error);
  444. if(c == '+' || c == '-')
  445. c = lex_get_save(lex, error);
  446. if(!l_isdigit(c)) {
  447. lex_unget_unsave(lex, c);
  448. goto out;
  449. }
  450. c = lex_get_save(lex, error);
  451. while(l_isdigit(c))
  452. c = lex_get_save(lex, error);
  453. }
  454. lex_unget_unsave(lex, c);
  455. if(jsonp_strtod(&lex->saved_text, &value)) {
  456. error_set(error, lex, "real number overflow");
  457. goto out;
  458. }
  459. lex->token = TOKEN_REAL;
  460. lex->value.real = value;
  461. return 0;
  462. out:
  463. return -1;
  464. }
  465. static int lex_scan(lex_t *lex, json_error_t *error)
  466. {
  467. int c;
  468. strbuffer_clear(&lex->saved_text);
  469. if(lex->token == TOKEN_STRING) {
  470. jsonp_free(lex->value.string);
  471. lex->value.string = NULL;
  472. }
  473. c = lex_get(lex, error);
  474. while(c == ' ' || c == '\t' || c == '\n' || c == '\r')
  475. c = lex_get(lex, error);
  476. if(c == STREAM_STATE_EOF) {
  477. lex->token = TOKEN_EOF;
  478. goto out;
  479. }
  480. if(c == STREAM_STATE_ERROR) {
  481. lex->token = TOKEN_INVALID;
  482. goto out;
  483. }
  484. lex_save(lex, c);
  485. if(c == '{' || c == '}' || c == '[' || c == ']' || c == ':' || c == ',')
  486. lex->token = c;
  487. else if(c == '"')
  488. lex_scan_string(lex, error);
  489. else if(l_isdigit(c) || c == '-') {
  490. if(lex_scan_number(lex, c, error))
  491. goto out;
  492. }
  493. else if(l_isalpha(c)) {
  494. /* eat up the whole identifier for clearer error messages */
  495. const char *saved_text;
  496. c = lex_get_save(lex, error);
  497. while(l_isalpha(c))
  498. c = lex_get_save(lex, error);
  499. lex_unget_unsave(lex, c);
  500. saved_text = strbuffer_value(&lex->saved_text);
  501. if(strcmp(saved_text, "true") == 0)
  502. lex->token = TOKEN_TRUE;
  503. else if(strcmp(saved_text, "false") == 0)
  504. lex->token = TOKEN_FALSE;
  505. else if(strcmp(saved_text, "null") == 0)
  506. lex->token = TOKEN_NULL;
  507. else
  508. lex->token = TOKEN_INVALID;
  509. }
  510. else {
  511. /* save the rest of the input UTF-8 sequence to get an error
  512. message of valid UTF-8 */
  513. lex_save_cached(lex);
  514. lex->token = TOKEN_INVALID;
  515. }
  516. out:
  517. return lex->token;
  518. }
  519. static char *lex_steal_string(lex_t *lex)
  520. {
  521. char *result = NULL;
  522. if(lex->token == TOKEN_STRING)
  523. {
  524. result = lex->value.string;
  525. lex->value.string = NULL;
  526. }
  527. return result;
  528. }
  529. static int lex_init(lex_t *lex, get_func get, void *data)
  530. {
  531. stream_init(&lex->stream, get, data);
  532. if(strbuffer_init(&lex->saved_text))
  533. return -1;
  534. lex->token = TOKEN_INVALID;
  535. return 0;
  536. }
  537. static void lex_close(lex_t *lex)
  538. {
  539. if(lex->token == TOKEN_STRING)
  540. jsonp_free(lex->value.string);
  541. strbuffer_close(&lex->saved_text);
  542. }
  543. /*** parser ***/
  544. static json_t *parse_value(lex_t *lex, size_t flags, json_error_t *error);
  545. static json_t *parse_object(lex_t *lex, size_t flags, json_error_t *error)
  546. {
  547. json_t *object = json_object();
  548. if(!object)
  549. return NULL;
  550. lex_scan(lex, error);
  551. if(lex->token == '}')
  552. return object;
  553. while(1) {
  554. char *key;
  555. json_t *value;
  556. if(lex->token != TOKEN_STRING) {
  557. error_set(error, lex, "string or '}' expected");
  558. goto error;
  559. }
  560. key = lex_steal_string(lex);
  561. if(!key)
  562. return NULL;
  563. if(flags & JSON_REJECT_DUPLICATES) {
  564. if(json_object_get(object, key)) {
  565. jsonp_free(key);
  566. error_set(error, lex, "duplicate object key");
  567. goto error;
  568. }
  569. }
  570. lex_scan(lex, error);
  571. if(lex->token != ':') {
  572. jsonp_free(key);
  573. error_set(error, lex, "':' expected");
  574. goto error;
  575. }
  576. lex_scan(lex, error);
  577. value = parse_value(lex, flags, error);
  578. if(!value) {
  579. jsonp_free(key);
  580. goto error;
  581. }
  582. if(json_object_set_nocheck(object, key, value)) {
  583. jsonp_free(key);
  584. json_decref(value);
  585. goto error;
  586. }
  587. json_decref(value);
  588. jsonp_free(key);
  589. lex_scan(lex, error);
  590. if(lex->token != ',')
  591. break;
  592. lex_scan(lex, error);
  593. }
  594. if(lex->token != '}') {
  595. error_set(error, lex, "'}' expected");
  596. goto error;
  597. }
  598. return object;
  599. error:
  600. json_decref(object);
  601. return NULL;
  602. }
  603. static json_t *parse_array(lex_t *lex, size_t flags, json_error_t *error)
  604. {
  605. json_t *array = json_array();
  606. if(!array)
  607. return NULL;
  608. lex_scan(lex, error);
  609. if(lex->token == ']')
  610. return array;
  611. while(lex->token) {
  612. json_t *elem = parse_value(lex, flags, error);
  613. if(!elem)
  614. goto error;
  615. if(json_array_append(array, elem)) {
  616. json_decref(elem);
  617. goto error;
  618. }
  619. json_decref(elem);
  620. lex_scan(lex, error);
  621. if(lex->token != ',')
  622. break;
  623. lex_scan(lex, error);
  624. }
  625. if(lex->token != ']') {
  626. error_set(error, lex, "']' expected");
  627. goto error;
  628. }
  629. return array;
  630. error:
  631. json_decref(array);
  632. return NULL;
  633. }
  634. static json_t *parse_value(lex_t *lex, size_t flags, json_error_t *error)
  635. {
  636. json_t *json;
  637. switch(lex->token) {
  638. case TOKEN_STRING: {
  639. json = json_string_nocheck(lex->value.string);
  640. break;
  641. }
  642. case TOKEN_INTEGER: {
  643. json = json_integer(lex->value.integer);
  644. break;
  645. }
  646. case TOKEN_REAL: {
  647. json = json_real(lex->value.real);
  648. break;
  649. }
  650. case TOKEN_TRUE:
  651. json = json_true();
  652. break;
  653. case TOKEN_FALSE:
  654. json = json_false();
  655. break;
  656. case TOKEN_NULL:
  657. json = json_null();
  658. break;
  659. case '{':
  660. json = parse_object(lex, flags, error);
  661. break;
  662. case '[':
  663. json = parse_array(lex, flags, error);
  664. break;
  665. case TOKEN_INVALID:
  666. error_set(error, lex, "invalid token");
  667. return NULL;
  668. default:
  669. error_set(error, lex, "unexpected token");
  670. return NULL;
  671. }
  672. if(!json)
  673. return NULL;
  674. return json;
  675. }
  676. static json_t *parse_json(lex_t *lex, size_t flags, json_error_t *error)
  677. {
  678. json_t *result;
  679. lex_scan(lex, error);
  680. if(!(flags & JSON_DECODE_ANY)) {
  681. if(lex->token != '[' && lex->token != '{') {
  682. error_set(error, lex, "'[' or '{' expected");
  683. return NULL;
  684. }
  685. }
  686. result = parse_value(lex, flags, error);
  687. if(!result)
  688. return NULL;
  689. if(!(flags & JSON_DISABLE_EOF_CHECK)) {
  690. lex_scan(lex, error);
  691. if(lex->token != TOKEN_EOF) {
  692. error_set(error, lex, "end of file expected");
  693. json_decref(result);
  694. return NULL;
  695. }
  696. }
  697. if(error) {
  698. /* Save the position even though there was no error */
  699. error->position = lex->stream.position;
  700. }
  701. return result;
  702. }
  703. typedef struct
  704. {
  705. const char *data;
  706. int pos;
  707. } string_data_t;
  708. static int string_get(void *data)
  709. {
  710. char c;
  711. string_data_t *stream = (string_data_t *)data;
  712. c = stream->data[stream->pos];
  713. if(c == '\0')
  714. return EOF;
  715. else
  716. {
  717. stream->pos++;
  718. return (unsigned char)c;
  719. }
  720. }
  721. json_t *json_loads(const char *string, size_t flags, json_error_t *error)
  722. {
  723. lex_t lex;
  724. json_t *result;
  725. string_data_t stream_data;
  726. jsonp_error_init(error, "<string>");
  727. if (string == NULL) {
  728. error_set(error, NULL, "wrong arguments");
  729. return NULL;
  730. }
  731. stream_data.data = string;
  732. stream_data.pos = 0;
  733. if(lex_init(&lex, string_get, (void *)&stream_data))
  734. return NULL;
  735. result = parse_json(&lex, flags, error);
  736. lex_close(&lex);
  737. return result;
  738. }
  739. typedef struct
  740. {
  741. const char *data;
  742. size_t len;
  743. size_t pos;
  744. } buffer_data_t;
  745. static int buffer_get(void *data)
  746. {
  747. char c;
  748. buffer_data_t *stream = data;
  749. if(stream->pos >= stream->len)
  750. return EOF;
  751. c = stream->data[stream->pos];
  752. stream->pos++;
  753. return (unsigned char)c;
  754. }
  755. json_t *json_loadb(const char *buffer, size_t buflen, size_t flags, json_error_t *error)
  756. {
  757. lex_t lex;
  758. json_t *result;
  759. buffer_data_t stream_data;
  760. jsonp_error_init(error, "<buffer>");
  761. if (buffer == NULL) {
  762. error_set(error, NULL, "wrong arguments");
  763. return NULL;
  764. }
  765. stream_data.data = buffer;
  766. stream_data.pos = 0;
  767. stream_data.len = buflen;
  768. if(lex_init(&lex, buffer_get, (void *)&stream_data))
  769. return NULL;
  770. result = parse_json(&lex, flags, error);
  771. lex_close(&lex);
  772. return result;
  773. }
  774. json_t *json_loadf(FILE *input, size_t flags, json_error_t *error)
  775. {
  776. lex_t lex;
  777. const char *source;
  778. json_t *result;
  779. if(input == stdin)
  780. source = "<stdin>";
  781. else
  782. source = "<stream>";
  783. jsonp_error_init(error, source);
  784. if (input == NULL) {
  785. error_set(error, NULL, "wrong arguments");
  786. return NULL;
  787. }
  788. if(lex_init(&lex, (get_func)fgetc, input))
  789. return NULL;
  790. result = parse_json(&lex, flags, error);
  791. lex_close(&lex);
  792. return result;
  793. }
  794. json_t *json_load_file(const char *path, size_t flags, json_error_t *error)
  795. {
  796. json_t *result;
  797. FILE *fp;
  798. jsonp_error_init(error, path);
  799. if (path == NULL) {
  800. error_set(error, NULL, "wrong arguments");
  801. return NULL;
  802. }
  803. fp = fopen(path, "rb");
  804. if(!fp)
  805. {
  806. error_set(error, NULL, "unable to open %s: %s",
  807. path, strerror(errno));
  808. return NULL;
  809. }
  810. result = json_loadf(fp, flags, error);
  811. fclose(fp);
  812. return result;
  813. }
  814. #define MAX_BUF_LEN 1024
  815. typedef struct
  816. {
  817. char data[MAX_BUF_LEN];
  818. size_t len;
  819. size_t pos;
  820. json_load_callback_t callback;
  821. void *arg;
  822. } callback_data_t;
  823. static int callback_get(void *data)
  824. {
  825. char c;
  826. callback_data_t *stream = data;
  827. if(stream->pos >= stream->len) {
  828. stream->pos = 0;
  829. stream->len = stream->callback(stream->data, MAX_BUF_LEN, stream->arg);
  830. if(stream->len == 0 || stream->len == (size_t)-1)
  831. return EOF;
  832. }
  833. c = stream->data[stream->pos];
  834. stream->pos++;
  835. return (unsigned char)c;
  836. }
  837. json_t *json_load_callback(json_load_callback_t callback, void *arg, size_t flags, json_error_t *error)
  838. {
  839. lex_t lex;
  840. json_t *result;
  841. callback_data_t stream_data;
  842. memset(&stream_data, 0, sizeof(stream_data));
  843. stream_data.callback = callback;
  844. stream_data.arg = arg;
  845. jsonp_error_init(error, "<callback>");
  846. if (callback == NULL) {
  847. error_set(error, NULL, "wrong arguments");
  848. return NULL;
  849. }
  850. if(lex_init(&lex, (get_func)callback_get, &stream_data))
  851. return NULL;
  852. result = parse_json(&lex, flags, error);
  853. lex_close(&lex);
  854. return result;
  855. }