xs_json.h 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505
  1. /* copyright (c) 2022 grunfink - MIT license */
  2. #ifndef _XS_JSON_H
  3. #define _XS_JSON_H
  4. d_char *xs_json_dumps_pp(char *data, int indent);
  5. #define xs_json_dumps(data) xs_json_dumps_pp(data, 0)
  6. d_char *xs_json_loads(const char *json);
  7. #ifdef XS_IMPLEMENTATION
  8. /** IMPLEMENTATION **/
  9. /** JSON dumps **/
  10. d_char *_xs_json_dumps_str(d_char *s, char *data)
  11. /* dumps a string in JSON format */
  12. {
  13. unsigned char c;
  14. s = xs_str_cat(s, "\"");
  15. while ((c = *data)) {
  16. if (c == '\n')
  17. s = xs_str_cat(s, "\\n");
  18. else
  19. if (c == '\r')
  20. s = xs_str_cat(s, "\\r");
  21. else
  22. if (c == '\t')
  23. s = xs_str_cat(s, "\\t");
  24. else
  25. if (c == '\\')
  26. s = xs_str_cat(s, "\\\\");
  27. else
  28. if (c == '"')
  29. s = xs_str_cat(s, "\\\"");
  30. else
  31. if (c < 32) {
  32. char tmp[10];
  33. sprintf(tmp, "\\u%04x", (unsigned int) c);
  34. s = xs_str_cat(s, tmp);
  35. }
  36. else
  37. s = xs_append_m(s, data, 1);
  38. data++;
  39. }
  40. s = xs_str_cat(s, "\"");
  41. return s;
  42. }
  43. d_char *_xs_json_indent(d_char *s, int level, int indent)
  44. /* adds indentation */
  45. {
  46. if (indent) {
  47. int n;
  48. s = xs_str_cat(s, "\n");
  49. for (n = 0; n < level * indent; n++)
  50. s = xs_str_cat(s, " ");
  51. }
  52. return s;
  53. }
  54. d_char *_xs_json_dumps(d_char *s, char *data, int level, int indent)
  55. /* dumps partial data as JSON */
  56. {
  57. char *k, *v;
  58. int c = 0;
  59. switch (xs_type(data)) {
  60. case XSTYPE_NULL:
  61. s = xs_str_cat(s, "null");
  62. break;
  63. case XSTYPE_TRUE:
  64. s = xs_str_cat(s, "true");
  65. break;
  66. case XSTYPE_FALSE:
  67. s = xs_str_cat(s, "false");
  68. break;
  69. case XSTYPE_NUMBER:
  70. s = xs_str_cat(s, xs_number_str(data));
  71. break;
  72. case XSTYPE_LIST:
  73. s = xs_str_cat(s, "[");
  74. while (xs_list_iter(&data, &v)) {
  75. if (c != 0)
  76. s = xs_str_cat(s, ",");
  77. s = _xs_json_indent(s, level + 1, indent);
  78. s = _xs_json_dumps(s, v, level + 1, indent);
  79. c++;
  80. }
  81. s = _xs_json_indent(s, level, indent);
  82. s = xs_str_cat(s, "]");
  83. break;
  84. case XSTYPE_DICT:
  85. s = xs_str_cat(s, "{");
  86. while (xs_dict_iter(&data, &k, &v)) {
  87. if (c != 0)
  88. s = xs_str_cat(s, ",");
  89. s = _xs_json_indent(s, level + 1, indent);
  90. s = _xs_json_dumps_str(s, k);
  91. s = xs_str_cat(s, ":");
  92. if (indent)
  93. s = xs_str_cat(s, " ");
  94. s = _xs_json_dumps(s, v, level + 1, indent);
  95. c++;
  96. }
  97. s = _xs_json_indent(s, level, indent);
  98. s = xs_str_cat(s, "}");
  99. break;
  100. case XSTYPE_STRING:
  101. s = _xs_json_dumps_str(s, data);
  102. break;
  103. default:
  104. break;
  105. }
  106. return s;
  107. }
  108. d_char *xs_json_dumps_pp(char *data, int indent)
  109. /* dumps a piece of data as JSON */
  110. {
  111. xstype t = xs_type(data);
  112. d_char *s = NULL;
  113. if (t == XSTYPE_LIST || t == XSTYPE_DICT) {
  114. s = xs_str_new(NULL);
  115. s = _xs_json_dumps(s, data, 0, indent);
  116. }
  117. return s;
  118. }
  119. /** JSON loads **/
  120. /* this code comes mostly from the Minimum Profit Text Editor (MPDM) */
  /* token / parser state codes used by the JSON loader.
     The numeric order matters: _xs_json_loads_value() treats every
     code >= JS_VALUE as "a value was read", so all value-like codes
     must stay after JS_VALUE and all punctuation before it */
  typedef enum {
      JS_ERROR      = -1,   /* invalid token or parse failure */
      JS_INCOMPLETE = 0,    /* array / object still being read */
      JS_OCURLY     = 1,    /* { */
      JS_OBRACK     = 2,    /* [ */
      JS_CCURLY     = 3,    /* } */
      JS_CBRACK     = 4,    /* ] */
      JS_COMMA      = 5,    /* , */
      JS_COLON      = 6,    /* : */
      JS_VALUE      = 7,    /* generic "value" marker (threshold) */
      JS_STRING     = 8,    /* "..." */
      JS_INTEGER    = 9,    /* number without a decimal point */
      JS_REAL       = 10,   /* number with a decimal point */
      JS_TRUE       = 11,   /* true */
      JS_FALSE      = 12,   /* false */
      JS_NULL       = 13,   /* null */
      JS_ARRAY      = 14,   /* a complete [...] was parsed */
      JS_OBJECT     = 15    /* a complete {...} was parsed */
  } js_type;
  140. d_char *_xs_json_loads_lexer(const char **json, js_type *t)
  141. {
  142. char c;
  143. const char *s = *json;
  144. d_char *v = NULL;
  145. /* skip blanks */
  146. while (*s == L' ' || *s == L'\t' || *s == L'\n' || *s == L'\r')
  147. s++;
  148. c = *s++;
  149. if (c == '{')
  150. *t = JS_OCURLY;
  151. else
  152. if (c == '}')
  153. *t = JS_CCURLY;
  154. else
  155. if (c == '[')
  156. *t = JS_OBRACK;
  157. else
  158. if (c == ']')
  159. *t = JS_CBRACK;
  160. else
  161. if (c == ',')
  162. *t = JS_COMMA;
  163. else
  164. if (c == ':')
  165. *t = JS_COLON;
  166. else
  167. if (c == '"') {
  168. *t = JS_STRING;
  169. v = xs_str_new(NULL);
  170. while ((c = *s) != '"' && c != '\0') {
  171. char tmp[5];
  172. int cp, i;
  173. if (c == '\\') {
  174. s++;
  175. c = *s;
  176. switch (c) {
  177. case 'n': c = '\n'; break;
  178. case 'r': c = '\r'; break;
  179. case 't': c = '\t'; break;
  180. case 'u': /* Unicode codepoint as an hex char */
  181. s++;
  182. memcpy(tmp, s, 4);
  183. s += 3;
  184. tmp[4] = '\0';
  185. sscanf(tmp, "%04x", &i);
  186. if (i >= 0xd800 && i <= 0xdfff) {
  187. /* it's a surrogate pair */
  188. cp = (i & 0x3ff) << 10;
  189. /* skip to the next value */
  190. s += 3;
  191. memcpy(tmp, s, 4);
  192. s += 3;
  193. sscanf(tmp, "%04x", &i);
  194. cp |= (i & 0x3ff);
  195. cp += 0x10000;
  196. }
  197. else
  198. cp = i;
  199. v = xs_utf8_enc(v, cp);
  200. c = '\0';
  201. break;
  202. }
  203. }
  204. if (c)
  205. v = xs_append_m(v, &c, 1);
  206. s++;
  207. }
  208. if (c != '\0')
  209. s++;
  210. }
  211. else
  212. if (c == '-' || (c >= '0' && c <= '9') || c == '.') {
  213. xs *vn = NULL;
  214. *t = JS_INTEGER;
  215. vn = xs_str_new(NULL);
  216. vn = xs_append_m(vn, &c, 1);
  217. while (((c = *s) >= '0' && c <= '9') || c == '.') {
  218. if (c == '.')
  219. *t = JS_REAL;
  220. vn = xs_append_m(vn, &c, 1);
  221. s++;
  222. }
  223. /* convert to XSTYPE_NUMBER */
  224. v = xs_number_new(atof(vn));
  225. }
  226. else
  227. if (c == 't' && strncmp(s, "rue", 3) == 0) {
  228. s += 3;
  229. *t = JS_TRUE;
  230. v = xs_val_new(XSTYPE_TRUE);
  231. }
  232. else
  233. if (c == 'f' && strncmp(s, "alse", 4) == 0) {
  234. s += 4;
  235. *t = JS_FALSE;
  236. v = xs_val_new(XSTYPE_FALSE);
  237. }
  238. else
  239. if (c == 'n' && strncmp(s, "ull", 3) == 0) {
  240. s += 3;
  241. *t = JS_NULL;
  242. v = xs_val_new(XSTYPE_NULL);
  243. }
  244. else
  245. *t = JS_ERROR;
  246. *json = s;
  247. return v;
  248. }
  249. d_char *_xs_json_loads_array(const char **json, js_type *t);
  250. d_char *_xs_json_loads_object(const char **json, js_type *t);
  251. d_char *_xs_json_loads_value(const char **json, js_type *t, d_char *v)
  252. /* parses a JSON value */
  253. {
  254. if (*t == JS_OBRACK)
  255. v = _xs_json_loads_array(json, t);
  256. else
  257. if (*t == JS_OCURLY)
  258. v = _xs_json_loads_object(json, t);
  259. if (*t >= JS_VALUE)
  260. *t = JS_VALUE;
  261. else
  262. *t = JS_ERROR;
  263. return v;
  264. }
  265. d_char *_xs_json_loads_array(const char **json, js_type *t)
  266. /* parses a JSON array */
  267. {
  268. const char *s = *json;
  269. xs *v;
  270. d_char *l;
  271. js_type tt;
  272. l = xs_list_new();
  273. *t = JS_INCOMPLETE;
  274. v = _xs_json_loads_lexer(&s, &tt);
  275. if (tt == JS_CBRACK)
  276. *t = JS_ARRAY;
  277. else {
  278. v = _xs_json_loads_value(&s, &tt, v);
  279. if (tt == JS_VALUE) {
  280. l = xs_list_append(l, v);
  281. while (*t == JS_INCOMPLETE) {
  282. xs_free(_xs_json_loads_lexer(&s, &tt));
  283. if (tt == JS_CBRACK)
  284. *t = JS_ARRAY;
  285. else
  286. if (tt == JS_COMMA) {
  287. xs *v2;
  288. v2 = _xs_json_loads_lexer(&s, &tt);
  289. v2 = _xs_json_loads_value(&s, &tt, v2);
  290. if (tt == JS_VALUE)
  291. l = xs_list_append(l, v2);
  292. else
  293. *t = JS_ERROR;
  294. }
  295. else
  296. *t = JS_ERROR;
  297. }
  298. }
  299. else
  300. *t = JS_ERROR;
  301. }
  302. if (*t == JS_ERROR)
  303. l = xs_free(l);
  304. *json = s;
  305. return l;
  306. }
  307. d_char *_xs_json_loads_object(const char **json, js_type *t)
  308. /* parses a JSON object */
  309. {
  310. const char *s = *json;
  311. xs *k1;
  312. d_char *d;
  313. js_type tt;
  314. d = xs_dict_new();
  315. *t = JS_INCOMPLETE;
  316. k1 = _xs_json_loads_lexer(&s, &tt);
  317. if (tt == JS_CCURLY)
  318. *t = JS_OBJECT;
  319. else
  320. if (tt == JS_STRING) {
  321. xs_free(_xs_json_loads_lexer(&s, &tt));
  322. if (tt == JS_COLON) {
  323. xs *v1;
  324. v1 = _xs_json_loads_lexer(&s, &tt);
  325. v1 = _xs_json_loads_value(&s, &tt, v1);
  326. if (tt == JS_VALUE) {
  327. d = xs_dict_append(d, k1, v1);
  328. while (*t == JS_INCOMPLETE) {
  329. xs_free(_xs_json_loads_lexer(&s, &tt));
  330. if (tt == JS_CCURLY)
  331. *t = JS_OBJECT;
  332. else
  333. if (tt == JS_COMMA) {
  334. xs *k = _xs_json_loads_lexer(&s, &tt);
  335. if (tt == JS_STRING) {
  336. xs_free(_xs_json_loads_lexer(&s, &tt));
  337. if (tt == JS_COLON) {
  338. xs *v;
  339. v = _xs_json_loads_lexer(&s, &tt);
  340. v = _xs_json_loads_value(&s, &tt, v);
  341. if (tt == JS_VALUE)
  342. d = xs_dict_append(d, k, v);
  343. else
  344. *t = JS_ERROR;
  345. }
  346. else
  347. *t = JS_ERROR;
  348. }
  349. else
  350. *t = JS_ERROR;
  351. }
  352. else
  353. *t = JS_ERROR;
  354. }
  355. }
  356. else
  357. *t = JS_ERROR;
  358. }
  359. else
  360. *t = JS_ERROR;
  361. }
  362. else
  363. *t = JS_ERROR;
  364. if (*t == JS_ERROR)
  365. d = xs_free(d);
  366. *json = s;
  367. return d;
  368. }
  369. d_char *xs_json_loads(const char *json)
  370. /* loads a string in JSON format and converts to a multiple data */
  371. {
  372. d_char *v = NULL;
  373. js_type t;
  374. xs_free(_xs_json_loads_lexer(&json, &t));
  375. if (t == JS_OBRACK)
  376. v = _xs_json_loads_array(&json, &t);
  377. else
  378. if (t == JS_OCURLY)
  379. v = _xs_json_loads_object(&json, &t);
  380. else
  381. t = JS_ERROR;
  382. return v;
  383. }
  384. #endif /* XS_IMPLEMENTATION */
  385. #endif /* _XS_JSON_H */