2020-12-05 19:26:32 +08:00
|
|
|
#include "str.h"
|
|
|
|
#include <stdlib.h>
|
|
|
|
|
2021-07-15 09:18:32 +08:00
|
|
|
struct mg_str mg_str_s(const char *s) {
|
2020-12-05 19:26:32 +08:00
|
|
|
struct mg_str str = {s, s == NULL ? 0 : strlen(s)};
|
|
|
|
return str;
|
|
|
|
}
|
|
|
|
|
2020-12-07 11:47:37 +08:00
|
|
|
struct mg_str mg_str_n(const char *s, size_t n) {
|
2020-12-05 19:26:32 +08:00
|
|
|
struct mg_str str = {s, n};
|
|
|
|
return str;
|
|
|
|
}
|
|
|
|
|
|
|
|
int mg_lower(const char *s) {
|
2022-02-23 04:20:56 +08:00
|
|
|
int c = *s;
|
|
|
|
if (c >= 'A' && c <= 'Z') c += 'a' - 'A';
|
|
|
|
return c;
|
2020-12-05 19:26:32 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
int mg_ncasecmp(const char *s1, const char *s2, size_t len) {
|
|
|
|
int diff = 0;
|
|
|
|
if (len > 0) do {
|
|
|
|
diff = mg_lower(s1++) - mg_lower(s2++);
|
|
|
|
} while (diff == 0 && s1[-1] != '\0' && --len > 0);
|
|
|
|
return diff;
|
|
|
|
}
|
|
|
|
|
|
|
|
int mg_casecmp(const char *s1, const char *s2) {
|
|
|
|
return mg_ncasecmp(s1, s2, (size_t) ~0);
|
|
|
|
}
|
|
|
|
|
|
|
|
int mg_vcmp(const struct mg_str *s1, const char *s2) {
|
|
|
|
size_t n2 = strlen(s2), n1 = s1->len;
|
|
|
|
int r = strncmp(s1->ptr, s2, (n1 < n2) ? n1 : n2);
|
|
|
|
if (r == 0) return (int) (n1 - n2);
|
|
|
|
return r;
|
|
|
|
}
|
|
|
|
|
|
|
|
int mg_vcasecmp(const struct mg_str *str1, const char *str2) {
|
|
|
|
size_t n2 = strlen(str2), n1 = str1->len;
|
|
|
|
int r = mg_ncasecmp(str1->ptr, str2, (n1 < n2) ? n1 : n2);
|
|
|
|
if (r == 0) return (int) (n1 - n2);
|
|
|
|
return r;
|
|
|
|
}
|
|
|
|
|
|
|
|
struct mg_str mg_strdup(const struct mg_str s) {
|
|
|
|
struct mg_str r = {NULL, 0};
|
|
|
|
if (s.len > 0 && s.ptr != NULL) {
|
2021-05-18 00:36:57 +08:00
|
|
|
char *sc = (char *) calloc(1, s.len + 1);
|
2020-12-05 19:26:32 +08:00
|
|
|
if (sc != NULL) {
|
|
|
|
memcpy(sc, s.ptr, s.len);
|
|
|
|
sc[s.len] = '\0';
|
|
|
|
r.ptr = sc;
|
|
|
|
r.len = s.len;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return r;
|
|
|
|
}
|
|
|
|
|
|
|
|
int mg_strcmp(const struct mg_str str1, const struct mg_str str2) {
|
|
|
|
size_t i = 0;
|
|
|
|
while (i < str1.len && i < str2.len) {
|
|
|
|
int c1 = str1.ptr[i];
|
|
|
|
int c2 = str2.ptr[i];
|
|
|
|
if (c1 < c2) return -1;
|
|
|
|
if (c1 > c2) return 1;
|
|
|
|
i++;
|
|
|
|
}
|
|
|
|
if (i < str1.len) return 1;
|
|
|
|
if (i < str2.len) return -1;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
const char *mg_strstr(const struct mg_str haystack,
|
|
|
|
const struct mg_str needle) {
|
|
|
|
size_t i;
|
|
|
|
if (needle.len > haystack.len) return NULL;
|
|
|
|
for (i = 0; i <= haystack.len - needle.len; i++) {
|
|
|
|
if (memcmp(haystack.ptr + i, needle.ptr, needle.len) == 0) {
|
|
|
|
return haystack.ptr + i;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2022-02-14 19:19:24 +08:00
|
|
|
static bool is_space(int c) {
|
|
|
|
return c == ' ' || c == '\r' || c == '\n' || c == '\t';
|
|
|
|
}
|
|
|
|
|
2020-12-05 19:26:32 +08:00
|
|
|
struct mg_str mg_strstrip(struct mg_str s) {
|
2022-02-14 19:19:24 +08:00
|
|
|
while (s.len > 0 && is_space((int) *s.ptr)) s.ptr++, s.len--;
|
|
|
|
while (s.len > 0 && is_space((int) *(s.ptr + s.len - 1))) s.len--;
|
2020-12-05 19:26:32 +08:00
|
|
|
return s;
|
|
|
|
}
|
2022-01-29 19:03:54 +08:00
|
|
|
|
|
|
|
bool mg_match(struct mg_str s, struct mg_str p, struct mg_str *caps) {
|
|
|
|
size_t i = 0, j = 0, ni = 0, nj = 0;
|
|
|
|
if (caps) caps->ptr = NULL, caps->len = 0;
|
|
|
|
while (i < p.len || j < s.len) {
|
|
|
|
if (i < p.len && j < s.len && (p.ptr[i] == '?' || s.ptr[j] == p.ptr[i])) {
|
|
|
|
if (caps == NULL) {
|
|
|
|
} else if (p.ptr[i] == '?') {
|
|
|
|
caps->ptr = &s.ptr[j], caps->len = 1; // Finalize `?` cap
|
|
|
|
caps++, caps->ptr = NULL, caps->len = 0; // Init next cap
|
|
|
|
} else if (caps->ptr != NULL && caps->len == 0) {
|
|
|
|
caps->len = (size_t) (&s.ptr[j] - caps->ptr); // Finalize current cap
|
|
|
|
caps++, caps->len = 0, caps->ptr = NULL; // Init next cap
|
|
|
|
}
|
|
|
|
i++, j++;
|
|
|
|
} else if (i < p.len && (p.ptr[i] == '*' || p.ptr[i] == '#')) {
|
|
|
|
if (caps && !caps->ptr) caps->len = 0, caps->ptr = &s.ptr[j]; // Init cap
|
|
|
|
ni = i++, nj = j + 1;
|
|
|
|
} else if (nj > 0 && nj <= s.len && (p.ptr[ni] == '#' || s.ptr[j] != '/')) {
|
|
|
|
i = ni, j = nj;
|
|
|
|
if (caps && caps->ptr == NULL && caps->len == 0) {
|
|
|
|
caps--, caps->len = 0; // Restart previous cap
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (caps && caps->ptr && caps->len == 0) {
|
|
|
|
caps->len = (size_t) (&s.ptr[j] - caps->ptr);
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool mg_globmatch(const char *s1, size_t n1, const char *s2, size_t n2) {
|
|
|
|
return mg_match(mg_str_n(s2, n2), mg_str_n(s1, n1), NULL);
|
|
|
|
}
|
|
|
|
|
|
|
|
static size_t mg_nce(const char *s, size_t n, size_t ofs, size_t *koff,
|
2022-05-31 17:41:14 +08:00
|
|
|
size_t *klen, size_t *voff, size_t *vlen, char delim) {
|
2022-01-29 19:03:54 +08:00
|
|
|
size_t kvlen, kl;
|
2022-05-31 17:41:14 +08:00
|
|
|
for (kvlen = 0; ofs + kvlen < n && s[ofs + kvlen] != delim;) kvlen++;
|
2022-01-29 19:03:54 +08:00
|
|
|
for (kl = 0; kl < kvlen && s[ofs + kl] != '=';) kl++;
|
|
|
|
if (koff != NULL) *koff = ofs;
|
|
|
|
if (klen != NULL) *klen = kl;
|
|
|
|
if (voff != NULL) *voff = kl < kvlen ? ofs + kl + 1 : 0;
|
|
|
|
if (vlen != NULL) *vlen = kl < kvlen ? kvlen - kl - 1 : 0;
|
|
|
|
ofs += kvlen + 1;
|
|
|
|
return ofs > n ? n : ofs;
|
|
|
|
}
|
|
|
|
|
2022-06-09 04:44:01 +08:00
|
|
|
bool mg_split(struct mg_str *s, struct mg_str *k, struct mg_str *v, char sep) {
|
2022-01-29 19:03:54 +08:00
|
|
|
size_t koff = 0, klen = 0, voff = 0, vlen = 0, off = 0;
|
|
|
|
if (s->ptr == NULL || s->len == 0) return 0;
|
2022-06-09 04:44:01 +08:00
|
|
|
off = mg_nce(s->ptr, s->len, 0, &koff, &klen, &voff, &vlen, sep);
|
2022-01-29 19:03:54 +08:00
|
|
|
if (k != NULL) *k = mg_str_n(s->ptr + koff, klen);
|
|
|
|
if (v != NULL) *v = mg_str_n(s->ptr + voff, vlen);
|
|
|
|
*s = mg_str_n(s->ptr + off, s->len - off);
|
|
|
|
return off > 0;
|
|
|
|
}
|
2022-02-10 19:56:55 +08:00
|
|
|
|
2022-05-31 17:41:14 +08:00
|
|
|
bool mg_commalist(struct mg_str *s, struct mg_str *k, struct mg_str *v) {
|
|
|
|
return mg_split(s, k, v, ',');
|
|
|
|
}
|
|
|
|
|
2022-02-10 19:56:55 +08:00
|
|
|
size_t mg_snprintf(char *buf, size_t len, const char *fmt, ...) {
|
|
|
|
va_list ap;
|
|
|
|
size_t n;
|
|
|
|
va_start(ap, fmt);
|
2022-06-10 16:38:36 +08:00
|
|
|
n = mg_vsnprintf(buf, len, fmt, &ap);
|
2022-02-10 19:56:55 +08:00
|
|
|
va_end(ap);
|
|
|
|
return n;
|
|
|
|
}
|
|
|
|
|
|
|
|
char *mg_hex(const void *buf, size_t len, char *to) {
|
|
|
|
const unsigned char *p = (const unsigned char *) buf;
|
2022-04-12 21:14:55 +08:00
|
|
|
const char *hex = "0123456789abcdef";
|
2022-02-10 19:56:55 +08:00
|
|
|
size_t i = 0;
|
|
|
|
for (; len--; p++) {
|
|
|
|
to[i++] = hex[p[0] >> 4];
|
|
|
|
to[i++] = hex[p[0] & 0x0f];
|
|
|
|
}
|
|
|
|
to[i] = '\0';
|
|
|
|
return to;
|
|
|
|
}
|
|
|
|
|
|
|
|
static unsigned char mg_unhex_nimble(unsigned char c) {
|
|
|
|
return (c >= '0' && c <= '9') ? (unsigned char) (c - '0')
|
|
|
|
: (c >= 'A' && c <= 'F') ? (unsigned char) (c - '7')
|
|
|
|
: (unsigned char) (c - 'W');
|
|
|
|
}
|
|
|
|
|
|
|
|
unsigned long mg_unhexn(const char *s, size_t len) {
|
|
|
|
unsigned long i = 0, v = 0;
|
|
|
|
for (i = 0; i < len; i++) v <<= 4, v |= mg_unhex_nimble(((uint8_t *) s)[i]);
|
|
|
|
return v;
|
|
|
|
}
|
|
|
|
|
|
|
|
void mg_unhex(const char *buf, size_t len, unsigned char *to) {
|
|
|
|
size_t i;
|
|
|
|
for (i = 0; i < len; i += 2) {
|
|
|
|
to[i >> 1] = (unsigned char) mg_unhexn(&buf[i], 2);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-04-12 17:20:43 +08:00
|
|
|
uint64_t mg_tou64(struct mg_str str) {
|
|
|
|
uint64_t result = 0;
|
|
|
|
size_t i = 0;
|
|
|
|
while (i < str.len && (str.ptr[i] == ' ' || str.ptr[i] == '\t')) i++;
|
|
|
|
while (i < str.len && str.ptr[i] >= '0' && str.ptr[i] <= '9') {
|
|
|
|
result *= 10;
|
|
|
|
result += (unsigned) (str.ptr[i] - '0');
|
|
|
|
i++;
|
|
|
|
}
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2022-02-10 19:56:55 +08:00
|
|
|
int64_t mg_to64(struct mg_str str) {
|
|
|
|
int64_t result = 0, neg = 1, max = 922337203685477570 /* INT64_MAX/10-10 */;
|
|
|
|
size_t i = 0;
|
|
|
|
while (i < str.len && (str.ptr[i] == ' ' || str.ptr[i] == '\t')) i++;
|
|
|
|
if (i < str.len && str.ptr[i] == '-') neg = -1, i++;
|
|
|
|
while (i < str.len && str.ptr[i] >= '0' && str.ptr[i] <= '9') {
|
|
|
|
if (result > max) return 0;
|
|
|
|
result *= 10;
|
|
|
|
result += (str.ptr[i] - '0');
|
|
|
|
i++;
|
|
|
|
}
|
|
|
|
return result * neg;
|
|
|
|
}
|
2022-07-01 03:27:43 +08:00
|
|
|
|
|
|
|
char *mg_remove_double_dots(char *s) {
|
|
|
|
char *p = s;
|
|
|
|
while (*s != '\0') {
|
|
|
|
*p++ = *s++;
|
|
|
|
if (s[-1] == '/' || s[-1] == '\\') {
|
|
|
|
while (s[0] != '\0') {
|
|
|
|
if (s[0] == '/' || s[0] == '\\') {
|
|
|
|
s++;
|
|
|
|
} else if (s[0] == '.' && s[1] == '.' &&
|
|
|
|
(s[2] == '/' || s[2] == '\\')) {
|
|
|
|
s += 2;
|
|
|
|
} else {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
*p = '\0';
|
|
|
|
return s;
|
|
|
|
}
|