Convert 'Link' attachments that have a media extension to something more useful.

This commit is contained in:
default 2023-08-17 17:38:39 +02:00
parent b3b4a4ef61
commit 6ede6497ad
5 changed files with 112 additions and 51 deletions

10
html.c
View file

@ -1313,6 +1313,16 @@ xs_str *html_entry(snac *user, xs_str *os, const xs_dict *msg, int local,
if (xs_is_null(url)) if (xs_is_null(url))
continue; continue;
/* if it's a plain Link, check if it can be "rewritten" */
if (strcmp(t, "Link") == 0) {
const char *mt = xs_mime_by_ext(url);
if (xs_startswith(mt, "image/") ||
xs_startswith(mt, "audio/") ||
xs_startswith(mt, "video/"))
t = mt;
}
const char *name = xs_dict_get(v, "name"); const char *name = xs_dict_get(v, "name");
if (xs_is_null(name)) if (xs_is_null(name))
name = xs_dict_get(msg, "name"); name = xs_dict_get(msg, "name");

View file

@ -6,57 +6,67 @@
const char *xs_mime_by_ext(const char *file); const char *xs_mime_by_ext(const char *file);
extern const char *xs_mime_types[];
#ifdef XS_IMPLEMENTATION #ifdef XS_IMPLEMENTATION
/* intentionally brain-dead simple */ /* intentionally brain-dead simple */
struct _mime_info { /* CAUTION: sorted */
const char *type;
const char *ext; const char *xs_mime_types[] = {
} mime_info[] = { "3gp", "video/3gpp",
{ "application/json", ".json" }, "aac", "audio/aac",
{ "image/gif", ".gif" }, "css", "text/css",
{ "image/jpeg", ".jpeg" }, "flac", "audio/flac",
{ "image/jpeg", ".jpg" }, "flv", "video/flv",
{ "image/png", ".png" }, "gif", "image/gif",
{ "image/webp", ".webp" }, "gmi", "text/gemini",
{ "video/mp4", ".mp4" }, "html", "text/html",
{ "video/mp4", ".mpg4" }, "jpeg", "image/jpeg",
{ "video/mp4", ".m4v" }, "jpg", "image/jpeg",
{ "video/webm", ".webm" }, "json", "application/json",
{ "video/quicktime", ".mov" }, "m4a", "audio/aac",
{ "video/3gpp", ".3gp" }, "m4v", "video/mp4",
{ "video/ogg", ".ogv" }, "md", "text/markdown",
{ "video/flv", ".flv" }, "mov", "video/quicktime",
{ "audio/mp3", ".mp3" }, "mp3", "audio/mp3",
{ "audio/ogg", ".ogg" }, "mp4", "video/mp4",
{ "audio/ogg", ".oga" }, "mpg4", "video/mp4",
{ "audio/ogg", ".opus" }, "oga", "audio/ogg",
{ "audio/flac", ".flac" }, "ogg", "audio/ogg",
{ "audio/wav", ".wav" }, "ogv", "video/ogg",
{ "audio/wma", ".wma" }, "opus", "audio/ogg",
{ "audio/aac", ".aac" }, "png", "image/png",
{ "audio/aac", ".m4a" }, "txt", "text/plain",
{ "text/css", ".css" }, "wav", "audio/wav",
{ "text/html", ".html" }, "webm", "video/webm",
{ "text/plain", ".txt" }, "webp", "image/webp",
{ "text/xml", ".xml" }, "wma", "audio/wma",
{ "text/markdown", ".md" }, "xml", "text/xml",
{ "text/gemini", ".gmi" }, NULL, NULL,
{ NULL, NULL }
}; };
const char *xs_mime_by_ext(const char *file) const char *xs_mime_by_ext(const char *file)
/* returns the MIME type by file extension */ /* returns the MIME type by file extension */
{ {
struct _mime_info *mi = mime_info; const char *ext = strrchr(file, '.');
xs *lfile = xs_tolower_i(xs_dup(file));
while (mi->type != NULL) { if (ext) {
if (xs_endswith(lfile, mi->ext)) const char **p = xs_mime_types;
return mi->type; xs *uext = xs_tolower_i(xs_dup(ext + 1));
mi++; while (**p) {
int c;
if ((c = strcmp(*p, uext)) == 0)
return p[1];
else
if (c > 0)
break;
p += 2;
}
} }
return "application/octet-stream"; return "application/octet-stream";

View file

@ -8,8 +8,10 @@ xs_list *xs_regex_split_n(const char *str, const char *rx, int count);
#define xs_regex_split(str, rx) xs_regex_split_n(str, rx, XS_ALL) #define xs_regex_split(str, rx) xs_regex_split_n(str, rx, XS_ALL)
xs_list *xs_regex_match_n(const char *str, const char *rx, int count); xs_list *xs_regex_match_n(const char *str, const char *rx, int count);
#define xs_regex_match(str, rx) xs_regex_match_n(str, rx, XS_ALL) #define xs_regex_match(str, rx) xs_regex_match_n(str, rx, XS_ALL)
xs_list *xs_regex_replace_n(const char *str, const char *rx, const char *rep, int count); xs_list *xs_regex_replace_in(xs_str *str, const char *rx, const char *rep, int count);
#define xs_regex_replace(str, rx, rep) xs_regex_replace_n(str, rx, rep, XS_ALL) #define xs_regex_replace_i(str, rx, rep) xs_regex_replace_in(str, rx, rep, XS_ALL)
#define xs_regex_replace_n(str, rx, rep, count) xs_regex_replace_in(xs_dup(str), rx, rep, count)
#define xs_regex_replace(str, rx, rep) xs_regex_replace_in(xs_dup(str), rx, rep, XS_ALL)
#ifdef XS_IMPLEMENTATION #ifdef XS_IMPLEMENTATION
@ -78,7 +80,7 @@ xs_list *xs_regex_match_n(const char *str, const char *rx, int count)
} }
xs_list *xs_regex_replace_n(const char *str, const char *rx, const char *rep, int count) xs_list *xs_regex_replace_in(xs_str *str, const char *rx, const char *rep, int count)
/* replaces all matches with the rep string. If it contains unescaped &, /* replaces all matches with the rep string. If it contains unescaped &,
they are replaced with the match */ they are replaced with the match */
{ {
@ -121,6 +123,8 @@ xs_list *xs_regex_replace_n(const char *str, const char *rx, const char *rep, in
n++; n++;
} }
xs_free(str);
return s; return s;
} }

View file

@ -4,8 +4,10 @@
#define _XS_UNICODE_H #define _XS_UNICODE_H
int _xs_utf8_enc(char buf[4], unsigned int cpoint);
xs_str *xs_utf8_enc(xs_str *str, unsigned int cpoint); xs_str *xs_utf8_enc(xs_str *str, unsigned int cpoint);
unsigned int xs_utf8_dec(char **str); unsigned int xs_utf8_dec(char **str);
int xs_unicode_width(unsigned int cpoint);
unsigned int *_xs_unicode_upper_search(unsigned int cpoint); unsigned int *_xs_unicode_upper_search(unsigned int cpoint);
unsigned int *_xs_unicode_lower_search(unsigned int cpoint); unsigned int *_xs_unicode_lower_search(unsigned int cpoint);
#define xs_unicode_is_upper(cpoint) (!!_xs_unicode_upper_search(cpoint)) #define xs_unicode_is_upper(cpoint) (!!_xs_unicode_upper_search(cpoint))
@ -18,8 +20,8 @@
#ifdef XS_IMPLEMENTATION #ifdef XS_IMPLEMENTATION
char *_xs_utf8_enc(char buf[4], unsigned int cpoint) int _xs_utf8_enc(char buf[4], unsigned int cpoint)
/* encodes an Unicode codepoint to utf-8 into buf and returns the new position */ /* encodes an Unicode codepoint to utf-8 into buf and returns the size in bytes */
{ {
unsigned char *p = (unsigned char *)buf; unsigned char *p = (unsigned char *)buf;
@ -42,18 +44,18 @@ char *_xs_utf8_enc(char buf[4], unsigned int cpoint)
*p++ = 0x80 | (cpoint & 0x3f); *p++ = 0x80 | (cpoint & 0x3f);
} }
return (char *)p; return p - (unsigned char *)buf;
} }
xs_str *xs_utf8_enc(xs_str *str, unsigned int cpoint) xs_str *xs_utf8_enc(xs_str *str, unsigned int cpoint)
/* encodes an Unicode codepoint to utf-8 into str */ /* encodes an Unicode codepoint to utf-8 into str */
{ {
char tmp[4], *p; char tmp[4];
p = _xs_utf8_enc(tmp, cpoint); int c = _xs_utf8_enc(tmp, cpoint);
return xs_append_m(str, tmp, p - tmp); return xs_append_m(str, tmp, c);
} }
@ -99,9 +101,44 @@ unsigned int xs_utf8_dec(char **str)
} }
/* intentionally dead simple */
static unsigned int xs_unicode_width_table[] = {
0x300, 0x36f, 0, /* diacritics */
0x1100, 0x11ff, 2, /* Hangul */
0x2e80, 0xa4cf, 2, /* CJK */
0xac00, 0xd7a3, 2, /* more Hangul */
0xe000, 0xf8ff, 0, /* private use */
0xf900, 0xfaff, 2, /* CJK compatibility */
0xff00, 0xff60, 2, /* full width things */
0xffdf, 0xffe6, 2, /* full width things */
0x1f200, 0x1ffff, 2, /* emojis */
0x20000, 0x2fffd, 2 /* more CJK */
};
int xs_unicode_width(unsigned int cpoint)
/* returns the width in columns of a Unicode codepoint (somewhat simplified) */
{
unsigned int *p = xs_unicode_width_table;
unsigned int *e = p + sizeof(xs_unicode_width_table) / sizeof(unsigned int);
while (p < e) {
if (cpoint < p[0])
return 1;
if (cpoint >= p[0] && cpoint <= p[1])
return p[2];
p += 3;
}
return 0;
}
#ifdef _XS_UNICODE_TBL_H #ifdef _XS_UNICODE_TBL_H
/* include xs_unicode_tbl.h before to use these functions */ /* include xs_unicode_tbl.h before this one to use these functions */
static int int_cmp(const void *p1, const void *p2) static int int_cmp(const void *p1, const void *p2)
{ {

View file

@ -1 +1 @@
/* b7e9713d90382d8da0b58023f4c78416e6ca1bc5 */ /* e85f257dd8fcb2980fd21aa37c1594c1461ddf48 */