xs_json.h 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513
  1. /* copyright (c) 2022 grunfink - MIT license */
  2. #ifndef _XS_JSON_H
  3. #define _XS_JSON_H
/* serializes data as JSON; only a list or a dict is accepted as the
   top-level value, any other type returns NULL. A non-zero indent
   pretty-prints with that many spaces per nesting level, 0 gives a
   compact single-line output */
d_char *xs_json_dumps_pp(char *data, int indent);
/* compact (non-indented) form of xs_json_dumps_pp() */
#define xs_json_dumps(data) xs_json_dumps_pp(data, 0)
/* parses a JSON text whose top-level value is an array or an object;
   returns NULL for anything else or if the array/object fails to parse */
d_char *xs_json_loads(const char *json);
  7. #ifdef XS_IMPLEMENTATION
  8. /** IMPLEMENTATION **/
  9. /** JSON dumps **/
  10. d_char *_xs_json_dumps_str(d_char *s, char *data)
  11. /* dumps a string in JSON format */
  12. {
  13. unsigned char c;
  14. s = xs_str_cat(s, "\"");
  15. while ((c = *data)) {
  16. if (c == '\n')
  17. s = xs_str_cat(s, "\\n");
  18. else
  19. if (c == '\r')
  20. s = xs_str_cat(s, "\\r");
  21. else
  22. if (c == '\t')
  23. s = xs_str_cat(s, "\\t");
  24. else
  25. if (c == '\\')
  26. s = xs_str_cat(s, "\\\\");
  27. else
  28. if (c == '"')
  29. s = xs_str_cat(s, "\\\"");
  30. else
  31. if (c < 32) {
  32. char tmp[10];
  33. sprintf(tmp, "\\u%04x", (unsigned int) c);
  34. s = xs_str_cat(s, tmp);
  35. }
  36. else
  37. s = xs_append_m(s, data, 1);
  38. data++;
  39. }
  40. s = xs_str_cat(s, "\"");
  41. return s;
  42. }
  43. d_char *_xs_json_indent(d_char *s, int level, int indent)
  44. /* adds indentation */
  45. {
  46. if (indent) {
  47. int n;
  48. s = xs_str_cat(s, "\n");
  49. for (n = 0; n < level * indent; n++)
  50. s = xs_str_cat(s, " ");
  51. }
  52. return s;
  53. }
  54. d_char *_xs_json_dumps(d_char *s, char *data, int level, int indent)
  55. /* dumps partial data as JSON */
  56. {
  57. char *k, *v;
  58. int c = 0;
  59. switch (xs_type(data)) {
  60. case XSTYPE_NULL:
  61. s = xs_str_cat(s, "null");
  62. break;
  63. case XSTYPE_TRUE:
  64. s = xs_str_cat(s, "true");
  65. break;
  66. case XSTYPE_FALSE:
  67. s = xs_str_cat(s, "false");
  68. break;
  69. case XSTYPE_NUMBER:
  70. {
  71. char tmp[32];
  72. snprintf(tmp, sizeof(tmp), "%g", xs_number_get(data));
  73. s = xs_str_cat(s, tmp);
  74. }
  75. break;
  76. case XSTYPE_SOL:
  77. s = xs_str_cat(s, "[");
  78. while (xs_list_iter(&data, &v)) {
  79. if (c != 0)
  80. s = xs_str_cat(s, ",");
  81. s = _xs_json_indent(s, level + 1, indent);
  82. s = _xs_json_dumps(s, v, level + 1, indent);
  83. c++;
  84. }
  85. s = _xs_json_indent(s, level, indent);
  86. s = xs_str_cat(s, "]");
  87. break;
  88. case XSTYPE_SOD:
  89. s = xs_str_cat(s, "{");
  90. while (xs_dict_iter(&data, &k, &v)) {
  91. if (c != 0)
  92. s = xs_str_cat(s, ",");
  93. s = _xs_json_indent(s, level + 1, indent);
  94. s = _xs_json_dumps_str(s, k);
  95. s = xs_str_cat(s, ":");
  96. if (indent)
  97. s = xs_str_cat(s, " ");
  98. s = _xs_json_dumps(s, v, level + 1, indent);
  99. c++;
  100. }
  101. s = _xs_json_indent(s, level, indent);
  102. s = xs_str_cat(s, "}");
  103. break;
  104. case XSTYPE_STRING:
  105. s = _xs_json_dumps_str(s, data);
  106. break;
  107. default:
  108. break;
  109. }
  110. return s;
  111. }
  112. d_char *xs_json_dumps_pp(char *data, int indent)
  113. /* dumps a piece of data as JSON */
  114. {
  115. xstype t = xs_type(data);
  116. d_char *s = NULL;
  117. if (t == XSTYPE_SOL || t == XSTYPE_SOD) {
  118. s = xs_str_new(NULL);
  119. s = _xs_json_dumps(s, data, 0, indent);
  120. }
  121. return s;
  122. }
  123. /** JSON loads **/
  124. /* this code comes mostly from the Minimum Profit Text Editor (MPDM) */
  125. typedef enum {
  126. JS_ERROR = -1,
  127. JS_INCOMPLETE,
  128. JS_OCURLY,
  129. JS_OBRACK,
  130. JS_CCURLY,
  131. JS_CBRACK,
  132. JS_COMMA,
  133. JS_COLON,
  134. JS_VALUE,
  135. JS_STRING,
  136. JS_INTEGER,
  137. JS_REAL,
  138. JS_TRUE,
  139. JS_FALSE,
  140. JS_NULL,
  141. JS_ARRAY,
  142. JS_OBJECT
  143. } js_type;
  144. d_char *_xs_json_loads_lexer(const char **json, js_type *t)
  145. {
  146. char c;
  147. const char *s = *json;
  148. d_char *v = NULL;
  149. /* skip blanks */
  150. while (*s == L' ' || *s == L'\t' || *s == L'\n' || *s == L'\r')
  151. s++;
  152. c = *s++;
  153. if (c == '{')
  154. *t = JS_OCURLY;
  155. else
  156. if (c == '}')
  157. *t = JS_CCURLY;
  158. else
  159. if (c == '[')
  160. *t = JS_OBRACK;
  161. else
  162. if (c == ']')
  163. *t = JS_CBRACK;
  164. else
  165. if (c == ',')
  166. *t = JS_COMMA;
  167. else
  168. if (c == ':')
  169. *t = JS_COLON;
  170. else
  171. if (c == '"') {
  172. *t = JS_STRING;
  173. v = xs_str_new(NULL);
  174. while ((c = *s) != '"' && c != '\0') {
  175. char tmp[5];
  176. int cp, i;
  177. if (c == '\\') {
  178. s++;
  179. c = *s;
  180. switch (c) {
  181. case 'n': c = '\n'; break;
  182. case 'r': c = '\r'; break;
  183. case 't': c = '\t'; break;
  184. case 'u': /* Unicode codepoint as an hex char */
  185. s++;
  186. memcpy(tmp, s, 4);
  187. s += 3;
  188. tmp[4] = '\0';
  189. sscanf(tmp, "%04x", &i);
  190. if (i >= 0xd800 && i <= 0xdfff) {
  191. /* it's a surrogate pair */
  192. cp = (i & 0x3ff) << 10;
  193. /* skip to the next value */
  194. s += 3;
  195. memcpy(tmp, s, 4);
  196. s += 3;
  197. sscanf(tmp, "%04x", &i);
  198. cp |= (i & 0x3ff);
  199. cp += 0x10000;
  200. }
  201. else
  202. cp = i;
  203. v = xs_utf8_enc(v, cp);
  204. c = '\0';
  205. break;
  206. }
  207. }
  208. if (c)
  209. v = xs_append_m(v, &c, 1);
  210. s++;
  211. }
  212. if (c != '\0')
  213. s++;
  214. }
  215. else
  216. if (c == '-' || (c >= '0' && c <= '9') || c == '.') {
  217. xs *vn = NULL;
  218. *t = JS_INTEGER;
  219. vn = xs_str_new(NULL);
  220. vn = xs_append_m(vn, &c, 1);
  221. while (((c = *s) >= '0' && c <= '9') || c == '.') {
  222. if (c == '.')
  223. *t = JS_REAL;
  224. vn = xs_append_m(vn, &c, 1);
  225. s++;
  226. }
  227. /* convert to XSTYPE_NUMBER */
  228. v = xs_number_new(atof(vn));
  229. }
  230. else
  231. if (c == 't' && strncmp(s, "rue", 3) == 0) {
  232. s += 3;
  233. *t = JS_TRUE;
  234. v = xs_val_new(XSTYPE_TRUE);
  235. }
  236. else
  237. if (c == 'f' && strncmp(s, "alse", 4) == 0) {
  238. s += 4;
  239. *t = JS_FALSE;
  240. v = xs_val_new(XSTYPE_FALSE);
  241. }
  242. else
  243. if (c == 'n' && strncmp(s, "ull", 3) == 0) {
  244. s += 3;
  245. *t = JS_NULL;
  246. v = xs_val_new(XSTYPE_NULL);
  247. }
  248. else
  249. *t = JS_ERROR;
  250. *json = s;
  251. return v;
  252. }
  253. d_char *_xs_json_loads_array(const char **json, js_type *t);
  254. d_char *_xs_json_loads_object(const char **json, js_type *t);
  255. d_char *_xs_json_loads_value(const char **json, js_type *t, d_char *v)
  256. /* parses a JSON value */
  257. {
  258. if (*t == JS_OBRACK)
  259. v = _xs_json_loads_array(json, t);
  260. else
  261. if (*t == JS_OCURLY)
  262. v = _xs_json_loads_object(json, t);
  263. if (*t >= JS_VALUE)
  264. *t = JS_VALUE;
  265. else
  266. *t = JS_ERROR;
  267. return v;
  268. }
  269. d_char *_xs_json_loads_array(const char **json, js_type *t)
  270. /* parses a JSON array */
  271. {
  272. const char *s = *json;
  273. xs *v;
  274. d_char *l;
  275. js_type tt;
  276. l = xs_list_new();
  277. *t = JS_INCOMPLETE;
  278. v = _xs_json_loads_lexer(&s, &tt);
  279. if (tt == JS_CBRACK)
  280. *t = JS_ARRAY;
  281. else {
  282. v = _xs_json_loads_value(&s, &tt, v);
  283. if (tt == JS_VALUE) {
  284. l = xs_list_append(l, v);
  285. while (*t == JS_INCOMPLETE) {
  286. free(_xs_json_loads_lexer(&s, &tt));
  287. if (tt == JS_CBRACK)
  288. *t = JS_ARRAY;
  289. else
  290. if (tt == JS_COMMA) {
  291. xs *v2;
  292. v2 = _xs_json_loads_lexer(&s, &tt);
  293. v2 = _xs_json_loads_value(&s, &tt, v2);
  294. if (tt == JS_VALUE)
  295. l = xs_list_append(l, v2);
  296. else
  297. *t = JS_ERROR;
  298. }
  299. else
  300. *t = JS_ERROR;
  301. }
  302. }
  303. else
  304. *t = JS_ERROR;
  305. }
  306. if (*t == JS_ERROR) {
  307. free(l);
  308. l = NULL;
  309. }
  310. *json = s;
  311. return l;
  312. }
  313. d_char *_xs_json_loads_object(const char **json, js_type *t)
  314. /* parses a JSON object */
  315. {
  316. const char *s = *json;
  317. xs *k1;
  318. d_char *d;
  319. js_type tt;
  320. d = xs_dict_new();
  321. *t = JS_INCOMPLETE;
  322. k1 = _xs_json_loads_lexer(&s, &tt);
  323. if (tt == JS_CCURLY)
  324. *t = JS_OBJECT;
  325. else
  326. if (tt == JS_STRING) {
  327. free(_xs_json_loads_lexer(&s, &tt));
  328. if (tt == JS_COLON) {
  329. xs *v1;
  330. v1 = _xs_json_loads_lexer(&s, &tt);
  331. v1 = _xs_json_loads_value(&s, &tt, v1);
  332. if (tt == JS_VALUE) {
  333. d = xs_dict_append(d, k1, v1);
  334. while (*t == JS_INCOMPLETE) {
  335. free(_xs_json_loads_lexer(&s, &tt));
  336. if (tt == JS_CCURLY)
  337. *t = JS_OBJECT;
  338. else
  339. if (tt == JS_COMMA) {
  340. xs *k = _xs_json_loads_lexer(&s, &tt);
  341. if (tt == JS_STRING) {
  342. free(_xs_json_loads_lexer(&s, &tt));
  343. if (tt == JS_COLON) {
  344. xs *v;
  345. v = _xs_json_loads_lexer(&s, &tt);
  346. v = _xs_json_loads_value(&s, &tt, v);
  347. if (tt == JS_VALUE)
  348. d = xs_dict_append(d, k, v);
  349. else
  350. *t = JS_ERROR;
  351. }
  352. else
  353. *t = JS_ERROR;
  354. }
  355. else
  356. *t = JS_ERROR;
  357. }
  358. else
  359. *t = JS_ERROR;
  360. }
  361. }
  362. else
  363. *t = JS_ERROR;
  364. }
  365. else
  366. *t = JS_ERROR;
  367. }
  368. else
  369. *t = JS_ERROR;
  370. if (*t == JS_ERROR) {
  371. free(d);
  372. d = NULL;
  373. }
  374. *json = s;
  375. return d;
  376. }
  377. d_char *xs_json_loads(const char *json)
  378. /* loads a string in JSON format and converts to a multiple data */
  379. {
  380. d_char *v = NULL;
  381. js_type t;
  382. _xs_json_loads_lexer(&json, &t);
  383. if (t == JS_OBRACK)
  384. v = _xs_json_loads_array(&json, &t);
  385. else
  386. if (t == JS_OCURLY)
  387. v = _xs_json_loads_object(&json, &t);
  388. else
  389. t = JS_ERROR;
  390. return v;
  391. }
  392. #endif /* XS_IMPLEMENTATION */
  393. #endif /* _XS_JSON_H */