xs_url.h 6.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228
  1. /* copyright (c) 2022 - 2024 grunfink et al. / MIT license */
  2. #ifndef _XS_URL_H
  3. #define _XS_URL_H
  /* Decodes a URL-encoded string: '%' escapes written as hexadecimal
     digits become the corresponding byte and '+' becomes a space.
     Returns the decoded text as a newly built xs_str. */
  4. xs_str *xs_url_dec(const char *str);
  /* Parses a "key=value&key=value" string into a dict. Arguments without
     an '=' are ignored. A key that appears more than once, or that ends
     in "[]", is stored as a list of values. A NULL str yields an empty
     dict. This function does not call xs_url_dec() on keys or values. */
  5. xs_dict *xs_url_vars(const char *str);
  /* Parses a multipart/form-data body of p_size bytes; header is the text
     carrying the "boundary=" parameter. Returns NULL if header does not
     split into exactly two pieces around '='. In the returned dict a file
     part maps to the list [ file name, offset into payload, size ] and any
     other part maps to a string holding a copy of its content. */
  6. xs_dict *xs_multipart_form_data(const char *payload, int p_size, const char *header);
  7. #ifdef XS_IMPLEMENTATION
  8. xs_str *xs_url_dec(const char *str)
  9. /* decodes an URL */
  10. {
  11. xs_str *s = xs_str_new(NULL);
  12. while (*str) {
  13. if (*str == '%') {
  14. int i;
  15. if (sscanf(str + 1, "%02x", &i) == 1) {
  16. unsigned char uc = i;
  17. s = xs_append_m(s, (char *)&uc, 1);
  18. str += 2;
  19. }
  20. }
  21. else
  22. if (*str == '+')
  23. s = xs_append_m(s, " ", 1);
  24. else
  25. s = xs_append_m(s, str, 1);
  26. str++;
  27. }
  28. return s;
  29. }
  30. xs_dict *xs_url_vars(const char *str)
  31. /* parse url variables */
  32. {
  33. xs_dict *vars;
  34. vars = xs_dict_new();
  35. if (str != NULL) {
  36. /* split by arguments */
  37. xs *args = xs_split(str, "&");
  38. const xs_val *v;
  39. xs_list_foreach(args, v) {
  40. xs *kv = xs_split_n(v, "=", 1);
  41. if (xs_list_len(kv) == 2) {
  42. const char *key = xs_list_get(kv, 0);
  43. const char *pv = xs_dict_get(vars, key);
  44. if (!xs_is_null(pv)) {
  45. /* there is a previous value: convert to a list and append */
  46. xs *vlist = NULL;
  47. if (xs_type(pv) == XSTYPE_LIST)
  48. vlist = xs_dup(pv);
  49. else {
  50. vlist = xs_list_new();
  51. vlist = xs_list_append(vlist, pv);
  52. }
  53. vlist = xs_list_append(vlist, xs_list_get(kv, 1));
  54. vars = xs_dict_set(vars, key, vlist);
  55. }
  56. else {
  57. /* ends with []? force to always be a list */
  58. if (xs_endswith(key, "[]")) {
  59. xs *vlist = xs_list_new();
  60. vlist = xs_list_append(vlist, xs_list_get(kv, 1));
  61. vars = xs_dict_append(vars, key, vlist);
  62. }
  63. else
  64. vars = xs_dict_append(vars, key, xs_list_get(kv, 1));
  65. }
  66. }
  67. }
  68. }
  69. return vars;
  70. }
  71. xs_dict *xs_multipart_form_data(const char *payload, int p_size, const char *header)
  72. /* parses a multipart/form-data payload */
  73. {
  74. xs *boundary = NULL;
  75. int offset = 0;
  76. int bsz;
  77. char *p;
  78. /* build the boundary string */
  79. {
  80. xs *l1 = xs_split(header, "=");
  81. if (xs_list_len(l1) != 2)
  82. return NULL;
  83. boundary = xs_dup(xs_list_get(l1, 1));
  84. /* Tokodon sends the boundary header with double quotes surrounded */
  85. if (xs_between("\"", boundary, "\"") != 0)
  86. boundary = xs_strip_chars_i(boundary, "\"");
  87. boundary = xs_fmt("--%s", boundary);
  88. }
  89. bsz = strlen(boundary);
  90. xs_dict *p_vars = xs_dict_new();
  91. /* iterate searching the boundaries */
  92. while ((p = xs_memmem(payload + offset, p_size - offset, boundary, bsz)) != NULL) {
  93. xs *s1 = NULL;
  94. xs *l1 = NULL;
  95. const char *vn = NULL;
  96. const char *fn = NULL;
  97. const char *ct = NULL;
  98. char *q;
  99. int po, ps;
  100. /* final boundary? */
  101. p += bsz;
  102. if (p[0] == '-' && p[1] == '-')
  103. break;
  104. /* skip the \r\n */
  105. p += 2;
  106. /* Tokodon sends also a Content-Type headers,
  107. let's use it to determine the file type */
  108. do {
  109. if (p[0] == 13 && p[1] == 10)
  110. break;
  111. q = strchr(p, '\r');
  112. s1 = xs_realloc(NULL, q - p + 1);
  113. memcpy(s1, p, q - p);
  114. s1[q - p] = '\0';
  115. if (xs_startswith(s1, "Content-Disposition")) {
  116. /* split by " like a primitive man */
  117. l1 = xs_split(s1, "\"");
  118. /* get the variable name */
  119. vn = xs_list_get(l1, 1);
  120. /* is it an attached file? */
  121. if (xs_list_len(l1) >= 4 && strcmp(xs_list_get(l1, 2), "; filename=") == 0) {
  122. /* get the file name */
  123. fn = xs_list_get(l1, 3);
  124. }
  125. }
  126. else
  127. if (xs_startswith(s1, "Content-Type")) {
  128. l1 = xs_split(s1, ":");
  129. if (xs_list_len(l1) >= 2) {
  130. ct = xs_lstrip_chars_i(xs_dup(xs_list_get(l1, 1)), " ");
  131. }
  132. }
  133. p += (q - p);
  134. p += 2; // Skip /r/n
  135. } while (1);
  136. /* find the start of the part content */
  137. if ((p = xs_memmem(p, p_size - (p - payload), "\r\n", 2)) == NULL)
  138. break;
  139. p += 2; // Skip empty line
  140. /* find the next boundary */
  141. if ((q = xs_memmem(p, p_size - (p - payload), boundary, bsz)) == NULL)
  142. break;
  143. po = p - payload;
  144. ps = q - p - 2; /* - 2 because the final \r\n */
  145. /* is it a filename? */
  146. if (fn != NULL) {
  147. /* p_var value is a list */
  148. /* if filename has no extension and content-type is image, attach extension to the filename */
  149. if (strchr(fn, '.') == NULL && xs_startswith(ct, "image/")) {
  150. char *ext = strchr(ct, '/');
  151. ext++;
  152. fn = xs_str_cat(xs_str_new(""), fn, ".", ext);
  153. }
  154. xs *l1 = xs_list_new();
  155. xs *vpo = xs_number_new(po);
  156. xs *vps = xs_number_new(ps);
  157. l1 = xs_list_append(l1, fn);
  158. l1 = xs_list_append(l1, vpo);
  159. l1 = xs_list_append(l1, vps);
  160. p_vars = xs_dict_append(p_vars, vn, l1);
  161. }
  162. else {
  163. /* regular variable; just copy */
  164. xs *vc = xs_realloc(NULL, ps + 1);
  165. memcpy(vc, payload + po, ps);
  166. vc[ps] = '\0';
  167. p_vars = xs_dict_append(p_vars, vn, vc);
  168. }
  169. /* move on */
  170. offset = q - payload;
  171. }
  172. return p_vars;
  173. }
  174. #endif /* XS_IMPLEMENTATION */
  175. #endif /* XS_URL_H */