2022-09-27 08:03:41 +00:00
|
|
|
/* copyright (c) 2022 grunfink - MIT license */
|
|
|
|
|
|
|
|
#ifndef _XS_REGEX_H
|
|
|
|
|
|
|
|
#define _XS_REGEX_H
|
|
|
|
|
2022-09-27 15:19:59 +00:00
|
|
|
d_char *xs_regex_split_n(const char *str, const char *rx, int count);
|
2022-11-24 07:47:02 +00:00
|
|
|
#define xs_regex_split(str, rx) xs_regex_split_n(str, rx, XS_ALL)
|
2022-09-27 15:19:59 +00:00
|
|
|
d_char *xs_regex_match_n(const char *str, const char *rx, int count);
|
2022-11-24 07:47:02 +00:00
|
|
|
#define xs_regex_match(str, rx) xs_regex_match_n(str, rx, XS_ALL)
|
2022-09-27 08:03:41 +00:00
|
|
|
|
|
|
|
#ifdef XS_IMPLEMENTATION
|
|
|
|
|
|
|
|
#include <regex.h>
|
|
|
|
|
2022-09-27 15:19:59 +00:00
|
|
|
d_char *xs_regex_split_n(const char *str, const char *rx, int count)
|
|
|
|
/* splits str by regex */
|
2022-09-27 08:03:41 +00:00
|
|
|
{
|
|
|
|
regex_t re;
|
|
|
|
regmatch_t rm;
|
|
|
|
int offset = 0;
|
2022-09-27 15:19:59 +00:00
|
|
|
d_char *list = NULL;
|
|
|
|
const char *p;
|
2022-09-27 08:03:41 +00:00
|
|
|
|
|
|
|
if (regcomp(&re, rx, REG_EXTENDED))
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
list = xs_list_new();
|
|
|
|
|
|
|
|
while (count > 0 && !regexec(&re, (p = str + offset), 1, &rm, offset > 0 ? REG_NOTBOL : 0)) {
|
2022-09-27 15:19:59 +00:00
|
|
|
/* add first the leading part of the string */
|
|
|
|
list = xs_list_append_m(list, p, rm.rm_so);
|
|
|
|
list = xs_str_cat(list, "");
|
2022-09-27 08:03:41 +00:00
|
|
|
|
2022-09-27 15:19:59 +00:00
|
|
|
/* add now the matched text as the separator */
|
|
|
|
list = xs_list_append_m(list, p + rm.rm_so, rm.rm_eo - rm.rm_so);
|
2022-09-27 08:03:41 +00:00
|
|
|
list = xs_str_cat(list, "");
|
|
|
|
|
2022-09-27 15:19:59 +00:00
|
|
|
/* move forward */
|
2022-09-27 08:03:41 +00:00
|
|
|
offset += rm.rm_eo;
|
|
|
|
|
|
|
|
count--;
|
|
|
|
}
|
|
|
|
|
2022-09-27 15:19:59 +00:00
|
|
|
/* add the rest of the string */
|
|
|
|
list = xs_list_append(list, p);
|
|
|
|
|
2022-09-27 08:03:41 +00:00
|
|
|
regfree(&re);
|
|
|
|
|
|
|
|
return list;
|
|
|
|
}
|
|
|
|
|
2022-09-27 15:19:59 +00:00
|
|
|
|
|
|
|
d_char *xs_regex_match_n(const char *str, const char *rx, int count)
|
|
|
|
/* returns a list with upto count matches */
|
|
|
|
{
|
|
|
|
d_char *list = xs_list_new();
|
|
|
|
xs *split = NULL;
|
|
|
|
char *p, *v;
|
|
|
|
int n = 0;
|
|
|
|
|
|
|
|
/* split */
|
2022-10-07 11:48:53 +00:00
|
|
|
split = xs_regex_split_n(str, rx, count);
|
2022-09-27 15:19:59 +00:00
|
|
|
|
|
|
|
/* now iterate to get only the 'separators' (odd ones) */
|
2022-10-07 11:48:53 +00:00
|
|
|
p = split;
|
2022-09-27 15:19:59 +00:00
|
|
|
while (xs_list_iter(&p, &v)) {
|
|
|
|
if (n & 0x1)
|
|
|
|
list = xs_list_append(list, v);
|
|
|
|
|
|
|
|
n++;
|
|
|
|
}
|
|
|
|
|
|
|
|
return list;
|
|
|
|
}
|
|
|
|
|
2022-09-27 08:03:41 +00:00
|
|
|
#endif /* XS_IMPLEMENTATION */
|
|
|
|
|
|
|
|
#endif /* XS_REGEX_H */
|