/* snac - A simple, minimalistic ActivityPub instance */
/* copyright (c) 2022 - 2024 grunfink et al. / MIT license */
#include "xs.h"
#include "xs_regex.h"
#include "xs_mime.h"
#include "xs_html.h"
#include "xs_json.h"
#include "xs_time.h"
#include "snac.h"
/* emoticons, people laughing and such */
const char *smileys[] = {
":-)", "🙂",
":-D", "😀",
"X-D", "😆",
";-)", "😉",
"B-)", "😎",
">:-(", "😡",
":-(", "😞",
":-*", "😘",
":-/", "😕",
"8-o", "😲",
"%-)", "🤪",
":_(", "😢",
":-|", "😐",
"<3", "❤️",
":facepalm:", "🤦",
":shrug:", "🤷",
":shrug2:", "¯\\_(ツ)_/¯",
":eyeroll:", "🙄",
":beer:", "🍺",
":beers:", "🍻",
":munch:", "😱",
":thumb:", "👍",
NULL, NULL
};
xs_dict *emojis(void)
/* returns a dict with the emojis */
{
xs *fn = xs_fmt("%s/emojis.json", srv_basedir);
FILE *f;
if (mtime(fn) == 0) {
/* file does not exist; create it with the defaults */
xs *d = xs_dict_new();
const char **emo = smileys;
while (*emo) {
d = xs_dict_append(d, emo[0], emo[1]);
emo += 2;
}
if ((f = fopen(fn, "w")) != NULL) {
xs_json_dump(d, 4, f);
fclose(f);
}
else
srv_log(xs_fmt("Error creating '%s'", fn));
}
xs_dict *d = NULL;
if ((f = fopen(fn, "r")) != NULL) {
d = xs_json_load(f);
fclose(f);
if (d == NULL)
srv_log(xs_fmt("JSON parse error in '%s'", fn));
}
else
srv_log(xs_fmt("Error opening '%s'", fn));
return d;
}
static xs_str *format_line(const char *line, xs_list **attach)
/* formats a line */
{
xs_str *s = xs_str_new(NULL);
char *p;
const char *v;
/* split by markup */
xs *sm = xs_regex_split(line,
"("
"`[^`]+`" "|"
"~~[^~]+~~" "|"
"\\*\\*?\\*?[^\\*]+\\*?\\*?\\*" "|"
"!\\[[^]]+\\]\\([^\\)]+\\)" "|"
"\\[[^]]+\\]\\([^\\)]+\\)" "|"
"[a-z]+:/" "/[^[:space:]]+"
")");
int n = 0;
p = sm;
while (xs_list_iter(&p, &v)) {
if ((n & 0x1)) {
/* markup */
if (xs_startswith(v, "`")) {
xs *s1 = xs_strip_chars_i(xs_dup(v), "`");
xs *e1 = encode_html(s1);
xs *s2 = xs_fmt("%s
", e1);
s = xs_str_cat(s, s2);
}
else
if (xs_startswith(v, "***")) {
xs *s1 = xs_strip_chars_i(xs_dup(v), "*");
xs *s2 = xs_fmt("%s", s1);
s = xs_str_cat(s, s2);
}
else
if (xs_startswith(v, "**")) {
xs *s1 = xs_strip_chars_i(xs_dup(v), "*");
xs *s2 = xs_fmt("%s", s1);
s = xs_str_cat(s, s2);
}
else
if (xs_startswith(v, "*")) {
xs *s1 = xs_strip_chars_i(xs_dup(v), "*");
xs *s2 = xs_fmt("%s", s1);
s = xs_str_cat(s, s2);
}
else
if (xs_startswith(v, "~~")) {
xs *s1 = xs_strip_chars_i(xs_dup(v), "~");
xs *e1 = encode_html(s1);
xs *s2 = xs_fmt("%s", e1);
s = xs_str_cat(s, s2);
}
else
if (*v == '[') {
/* markdown-like links [label](url) */
xs *w = xs_strip_chars_i(
xs_replace_i(xs_replace(v, "#", "#"), "@", "@"),
"![)");
xs *l = xs_split_n(w, "](", 1);
if (xs_list_len(l) == 2) {
xs *link = xs_fmt("%s",
xs_list_get(l, 1), xs_list_get(l, 0));
s = xs_str_cat(s, link);
}
else
s = xs_str_cat(s, v);
}
else
if (*v == '!') {
/* markdown-like images ![alt text](url to image) */
xs *w = xs_strip_chars_i(
xs_replace_i(xs_replace(v, "#", "#"), "@", "@"),
"![)");
xs *l = xs_split_n(w, "](", 1);
if (xs_list_len(l) == 2) {
const char *alt_text = xs_list_get(l, 0);
const char *img_url = xs_list_get(l, 1);
const char *mime = xs_mime_by_ext(img_url);
if (attach != NULL && xs_startswith(mime, "image/")) {
const xs_dict *ad;
int add = 1;
xs_list_foreach(*attach, ad) {
if (strcmp(xs_dict_get_def(ad, "url", ""), img_url) == 0) {
add = 0;
break;
}
}
if (add) {
xs *d = xs_dict_new();
d = xs_dict_append(d, "mediaType", mime);
d = xs_dict_append(d, "url", img_url);
d = xs_dict_append(d, "name", alt_text);
d = xs_dict_append(d, "type", "Image");
*attach = xs_list_append(*attach, d);
}
}
else {
xs *link = xs_fmt("%s", img_url, alt_text);
s = xs_str_cat(s, link);
}
}
else
s = xs_str_cat(s, v);
}
else
if (xs_str_in(v, ":/" "/") != -1) {
xs *u = xs_replace_i(xs_replace(v, "#", "#"), "@", "@");
xs *v2 = xs_strip_chars_i(xs_dup(u), ".,)");
const char *mime = xs_mime_by_ext(v2);
if (attach != NULL && xs_startswith(mime, "image/")) {
/* if it's a link to an image, insert it as an attachment */
const xs_dict *ad;
int add = 1;
xs_list_foreach(*attach, ad) {
if (strcmp(xs_dict_get_def(ad, "url", ""), v2) == 0) {
add = 0;
break;
}
}
if (add) {
xs *d = xs_dict_new();
d = xs_dict_append(d, "mediaType", mime);
d = xs_dict_append(d, "url", v2);
d = xs_dict_append(d, "name", "");
d = xs_dict_append(d, "type", "Image");
*attach = xs_list_append(*attach, d);
}
}
else {
xs *s1 = xs_fmt("%s", v2, u);
s = xs_str_cat(s, s1);
}
}
else
s = xs_str_cat(s, v);
}
else
/* surrounded text, copy directly */
s = xs_str_cat(s, v);
n++;
}
return s;
}
xs_str *not_really_markdown(const char *content, xs_list **attach, xs_list **tag)
/* formats a content using some Markdown rules */
{
xs_str *s = xs_str_new(NULL);
int in_pre = 0;
int in_blq = 0;
xs *list;
char *p;
const char *v;
/* work by lines */
list = xs_split(content, "\n");
p = list;
while (xs_list_iter(&p, &v)) {
xs *ss = NULL;
if (strcmp(v, "```") == 0) {
if (!in_pre)
s = xs_str_cat(s, "
"); else s = xs_str_cat(s, ""); in_pre = !in_pre; continue; } if (in_pre) { // Encode all HTML characters when we're in pre element until we are out. ss = encode_html(v); s = xs_str_cat(s, ss); s = xs_str_cat(s, "
"); in_blq = 1; } s = xs_str_cat(s, ss); s = xs_str_cat(s, ""); in_blq = 0; } s = xs_str_cat(s, ss); s = xs_str_cat(s, "
"); continue; } if (in_blq) { s = xs_str_cat(s, "
", ""); s = xs_replace_i(s, ""); s = xs_replace_i(s, "
", "
");
}
}
else {
/* non-tag */
s = xs_str_cat(s, v);
}
n++;
}
return s;
}
xs_str *encode_html(const char *str)
/* escapes html characters */
{
xs_str *encoded = xs_html_encode((char *)str);
/* Restore only
. Probably safe. Let's hope nothing goes wrong with this. */
encoded = xs_replace_i(encoded, "<br>", "
");
return encoded;
}