mirror of
https://github.com/rkd77/elinks.git
synced 2025-01-03 14:57:44 -05:00
657 lines
14 KiB
C
657 lines
14 KiB
C
/** String handling functions
|
|
* @file */
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
#include "config.h"
|
|
#endif
|
|
|
|
#ifndef _GNU_SOURCE
|
|
#define _GNU_SOURCE /* XXX: fseeko, ftello */
|
|
#endif
|
|
|
|
#include <ctype.h>
|
|
#include <stdarg.h>
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <limits.h>
|
|
|
|
#include "elinks.h"
|
|
|
|
#include "util/conv.h"
|
|
#include "util/error.h"
|
|
#include "util/memdebug.h"
|
|
#include "util/memory.h"
|
|
#include "util/string.h"
|
|
#include "util/snprintf.h"
|
|
|
|
|
|
/* This file looks to be slowly being overloaded by a lot of various stuff,
|
|
* like memory managment, stubs, tools, granular and non-granular strings,
|
|
* struct string object... Perhaps util/memory.* and util/stubs.* (stubs.h
|
|
* probably included in elinks.h, it's important enough) would be nice to
|
|
* have. --pasky */
|
|
|
|
|
|
#define string_assert(f, l, x, o) \
|
|
if ((assert_failed = !(x))) { \
|
|
errfile = f, errline = l, \
|
|
elinks_internal("[%s] assertion %s failed!", o, #x); \
|
|
}
|
|
|
|
#ifdef DEBUG_MEMLEAK
|
|
|
|
char *
|
|
debug_memacpy(const char *f, int l, const char *src, int len)
|
|
{
|
|
char *m;
|
|
|
|
string_assert(f, l, len >= 0, "memacpy");
|
|
if_assert_failed len = 0;
|
|
|
|
m = (char *)debug_mem_alloc(f, l, len + 1);
|
|
if (!m) return NULL;
|
|
|
|
if (src && len) memcpy(m, src, len);
|
|
m[len] = '\0';
|
|
|
|
return m;
|
|
}
|
|
|
|
char *
|
|
debug_stracpy(const char *f, int l, const char *src)
|
|
{
|
|
string_assert(f, l, src, "stracpy");
|
|
if_assert_failed return NULL;
|
|
|
|
return debug_memacpy(f, l, src, strlen(src));
|
|
}
|
|
|
|
#else /* DEBUG_MEMLEAK */
|
|
|
|
char *
|
|
memacpy(const char *src, int len)
|
|
{
|
|
char *m;
|
|
|
|
assertm(len >= 0, "[memacpy]");
|
|
if_assert_failed { len = 0; }
|
|
|
|
m = (char *)mem_alloc(len + 1);
|
|
if (!m) return NULL;
|
|
|
|
if (src && len) memcpy(m, src, len);
|
|
m[len] = 0;
|
|
|
|
return m;
|
|
}
|
|
|
|
char *
|
|
stracpy(const char *src)
|
|
{
|
|
assertm(src, "[stracpy]");
|
|
if_assert_failed return NULL;
|
|
|
|
return memacpy(src, strlen(src));
|
|
}
|
|
|
|
#endif /* DEBUG_MEMLEAK */
|
|
|
|
|
|
void
|
|
add_to_strn(char **dst, const char *src)
|
|
{
|
|
char *newdst;
|
|
int dstlen;
|
|
int srclen;
|
|
|
|
assertm(*dst && src, "[add_to_strn]");
|
|
if_assert_failed return;
|
|
|
|
dstlen = strlen(*dst);
|
|
srclen = strlen(src) + 1; /* Include the NUL char! */
|
|
newdst = (char *)mem_realloc(*dst, dstlen + srclen);
|
|
if (!newdst) return;
|
|
|
|
memcpy(newdst + dstlen, src, srclen);
|
|
*dst = newdst;
|
|
}
|
|
|
|
char *
|
|
insert_in_string(char **dst, int pos,
|
|
const char *seq, int seqlen)
|
|
{
|
|
int dstlen = strlen(*dst);
|
|
char *string = (char *)mem_realloc(*dst, dstlen + seqlen + 1);
|
|
|
|
if (!string) return NULL;
|
|
|
|
memmove(string + pos + seqlen, string + pos, dstlen - pos + 1);
|
|
memcpy(string + pos, seq, seqlen);
|
|
*dst = string;
|
|
|
|
return string;
|
|
}
|
|
|
|
char *
|
|
straconcat(const char *str, ...)
|
|
{
|
|
va_list ap;
|
|
const char *a;
|
|
char *s;
|
|
unsigned int len;
|
|
|
|
assertm(str != NULL, "[straconcat]");
|
|
if_assert_failed { return NULL; }
|
|
|
|
len = strlen(str);
|
|
s = (char *)mem_alloc(len + 1);
|
|
if (!s) return NULL;
|
|
|
|
if (len) memcpy(s, str, len);
|
|
|
|
va_start(ap, str);
|
|
while ((a = va_arg(ap, const char *))) {
|
|
unsigned int l = strlen(a);
|
|
char *ns;
|
|
|
|
if (!l) continue;
|
|
|
|
ns = (char *)mem_realloc(s, len + 1 + l);
|
|
if (!ns) {
|
|
mem_free(s);
|
|
va_end(ap);
|
|
return NULL;
|
|
}
|
|
|
|
s = ns;
|
|
memcpy(s + len, a, l);
|
|
len += l;
|
|
}
|
|
va_end(ap);
|
|
|
|
s[len] = '\0';
|
|
return s;
|
|
}
|
|
|
|
int
|
|
xstrcmp(const char *s1, const char *s2)
|
|
{
|
|
if (!s1) return -!!s2;
|
|
if (!s2) return 1;
|
|
return strcmp(s1, s2);
|
|
}
|
|
|
|
char *
|
|
safe_strncpy(char *dst, const char *src, size_t dst_size)
|
|
{
|
|
assertm(dst && src && dst_size > 0, "[safe_strncpy]");
|
|
if_assert_failed return NULL;
|
|
|
|
strncpy(dst, src, dst_size);
|
|
dst[dst_size - 1] = '\0';
|
|
|
|
return dst;
|
|
}
|
|
|
|
#define strlcmp_device(c,s1,n1,s2,n2,t1,t2) { \
|
|
size_t p; \
|
|
int d; \
|
|
\
|
|
/* XXX: The return value is inconsistent. Hrmpf. Making it consistent
|
|
* would make the @n1 != @n2 case significantly more expensive, though.
|
|
* So noone should better rely on the return value actually meaning
|
|
* anything quantitatively. --pasky */ \
|
|
\
|
|
if (!s1 || !s2) \
|
|
return 1; \
|
|
\
|
|
/* n1,n2 is unsigned, so don't assume -1 < 0 ! >:) */ \
|
|
\
|
|
/* TODO: Don't precompute strlen()s but rather make the loop smarter.
|
|
* --pasky */ \
|
|
if (n1 == -1) n1 = strlen(s1); \
|
|
if (n2 == -1) n2 = strlen(s2); \
|
|
\
|
|
string_assert(errfile, errline, n1 >= 0 && n2 >= 0, c); \
|
|
\
|
|
d = n1 - n2; \
|
|
if (d) return d; \
|
|
\
|
|
for (p = 0; p < n1 && s1[p] && s2[p]; p++) { \
|
|
d = t1 - t2; \
|
|
if (d) return d; \
|
|
} \
|
|
return 0; \
|
|
}
|
|
|
|
int
|
|
elinks_strlcmp(const char *s1, size_t n1,
|
|
const char *s2, size_t n2)
|
|
{
|
|
strlcmp_device("strlcmp", s1, n1, s2, n2, s1[p], s2[p]);
|
|
}
|
|
|
|
int
|
|
elinks_strlcasecmp(const char *s1, size_t n1,
|
|
const char *s2, size_t n2,
|
|
const int locale_indep)
|
|
{
|
|
if (locale_indep) {
|
|
strlcmp_device("strlcasecmp", s1, n1, s2, n2, c_toupper(s1[p]), c_toupper(s2[p]));
|
|
}
|
|
else {
|
|
strlcmp_device("strlcasecmp", s1, n1, s2, n2, toupper(s1[p]), toupper(s2[p]));
|
|
}
|
|
}
|
|
|
|
/* strlcasestr - adapted from c_strcasestr */
|
|
char *
|
|
elinks_strlcasestr(const char *haystack, const int haystackl,
|
|
const char *needle, const int needlel)
|
|
{
|
|
size_t haystack_length = haystackl == -1 ? strlen(haystack) : haystackl;
|
|
size_t needle_length = needlel == -1 ? strlen(needle) : needlel;
|
|
int i;
|
|
|
|
if (haystack_length < needle_length)
|
|
return NULL;
|
|
|
|
for (i = haystack_length - needle_length + 1; i; i--) {
|
|
if (!c_strncasecmp(haystack, needle, needle_length))
|
|
return (char *) haystack;
|
|
haystack++;
|
|
}
|
|
|
|
return NULL;
|
|
}
|
|
|
|
int
|
|
c_strcasecmp(const char *s1, const char *s2)
|
|
{
|
|
for (;; s1++, s2++) {
|
|
unsigned char c1 = c_tolower(*(const char *) s1);
|
|
unsigned char c2 = c_tolower(*(const char *) s2);
|
|
|
|
if (c1 != c2)
|
|
return (c1 < c2) ? -1: +1;
|
|
if (c1 == '\0')
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
int c_strncasecmp(const char *s1, const char *s2, size_t n)
|
|
{
|
|
for (; n > 0; n--, s1++, s2++) {
|
|
unsigned char c1 = c_tolower(*(const char *) s1);
|
|
unsigned char c2 = c_tolower(*(const char *) s2);
|
|
|
|
if (c1 != c2)
|
|
return (c1 < c2) ? -1: +1;
|
|
if (c1 == '\0')
|
|
return 0;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
/* c_strcasestr - adapted from src/osdep/stub.c */
|
|
char * c_strcasestr(const char *haystack, const char *needle)
|
|
{
|
|
size_t haystack_length = strlen(haystack);
|
|
size_t needle_length = strlen(needle);
|
|
int i;
|
|
|
|
if (haystack_length < needle_length)
|
|
return NULL;
|
|
|
|
for (i = haystack_length - needle_length + 1; i; i--) {
|
|
if (!c_strncasecmp(haystack, needle, needle_length))
|
|
return (char *) haystack;
|
|
haystack++;
|
|
}
|
|
|
|
return NULL;
|
|
}
|
|
|
|
/* The new string utilities: */
|
|
|
|
/* TODO Currently most of the functions use add_bytes_to_string() as a backend
|
|
* instead we should optimize each function. */
|
|
|
|
NONSTATIC_INLINE struct string *
|
|
#ifdef DEBUG_MEMLEAK
|
|
init_string__(const char *file, int line, struct string *string)
|
|
#else
|
|
init_string(struct string *string)
|
|
#endif
|
|
{
|
|
assertm(string != NULL, "[init_string]");
|
|
if_assert_failed { return NULL; }
|
|
|
|
string->length = 0;
|
|
#ifdef DEBUG_MEMLEAK
|
|
string->source = (char *)debug_mem_alloc(file, line, STRING_GRANULARITY + 1);
|
|
#else
|
|
string->source = (char *)mem_alloc(STRING_GRANULARITY + 1);
|
|
#endif
|
|
if (!string->source) return NULL;
|
|
|
|
*string->source = '\0';
|
|
|
|
set_string_magic(string);
|
|
|
|
return string;
|
|
}
|
|
|
|
NONSTATIC_INLINE void
|
|
done_string(struct string *string)
|
|
{
|
|
assertm(string != NULL, "[done_string]");
|
|
if_assert_failed { return; }
|
|
|
|
if (string->source) {
|
|
/* We only check the magic if we have to free anything so
|
|
* that done_string() can be called multiple times without
|
|
* blowing up something */
|
|
check_string_magic(string);
|
|
mem_free(string->source);
|
|
}
|
|
|
|
/* Blast everything including the magic */
|
|
memset(string, 0, sizeof(*string));
|
|
}
|
|
|
|
/** @relates string */
|
|
NONSTATIC_INLINE struct string *
|
|
add_to_string(struct string *string, const char *source)
|
|
{
|
|
assertm(string && source, "[add_to_string]");
|
|
if_assert_failed { return NULL; }
|
|
|
|
check_string_magic(string);
|
|
|
|
if (!*source) return string;
|
|
|
|
return add_bytes_to_string(string, source, strlen(source));
|
|
}
|
|
|
|
/** @relates string */
|
|
NONSTATIC_INLINE struct string *
|
|
add_crlf_to_string(struct string *string)
|
|
{
|
|
assertm(string != NULL, "[add_crlf_to_string]");
|
|
if_assert_failed { return NULL; }
|
|
|
|
check_string_magic(string);
|
|
|
|
if (!realloc_string(string, string->length + 2))
|
|
return NULL;
|
|
|
|
string->source[string->length++] = ASCII_CR;
|
|
string->source[string->length++] = ASCII_LF;
|
|
string->source[string->length] = '\0';
|
|
|
|
return string;
|
|
}
|
|
|
|
/** @relates string */
|
|
NONSTATIC_INLINE struct string *
|
|
add_string_to_string(struct string *string, const struct string *from)
|
|
{
|
|
assertm(string && from, "[add_string_to_string]");
|
|
if_assert_failed { return NULL; }
|
|
|
|
check_string_magic(string);
|
|
check_string_magic(from);
|
|
|
|
if (!from->length) return string; /* optimization only */
|
|
|
|
return add_bytes_to_string(string, from->source, from->length);
|
|
}
|
|
|
|
/** @relates string */
|
|
struct string *
|
|
add_file_to_string(struct string *string, const char *filename)
|
|
{
|
|
FILE *file;
|
|
off_t filelen;
|
|
int newlength;
|
|
|
|
assertm(string && filename, "[add_file_to_string]");
|
|
if_assert_failed { return NULL; }
|
|
|
|
check_string_magic(string);
|
|
|
|
file = fopen(filename, "rb");
|
|
if (!file) return NULL;
|
|
|
|
if (fseeko(file, 0, SEEK_END)) goto err;
|
|
|
|
filelen = ftello(file);
|
|
if (filelen == -1) goto err;
|
|
|
|
if (fseeko(file, 0, SEEK_SET)) goto err;
|
|
|
|
newlength = string->length + filelen;
|
|
if (!realloc_string(string, newlength)) goto err;
|
|
|
|
string->length += fread(string->source + string->length, 1,
|
|
(size_t) filelen, file);
|
|
string->source[string->length] = 0;
|
|
fclose(file);
|
|
|
|
if (string->length != newlength) goto err;
|
|
|
|
return string;
|
|
|
|
err:
|
|
fclose(file);
|
|
|
|
return NULL;
|
|
}
|
|
|
|
struct string *
|
|
string_concat(struct string *string, ...)
|
|
{
|
|
va_list ap;
|
|
const char *source;
|
|
|
|
assertm(string != NULL, "[string_concat]");
|
|
if_assert_failed { return NULL; }
|
|
|
|
check_string_magic(string);
|
|
|
|
va_start(ap, string);
|
|
while ((source = va_arg(ap, const char *)))
|
|
if (*source)
|
|
add_to_string(string, source);
|
|
|
|
va_end(ap);
|
|
|
|
return string;
|
|
}
|
|
|
|
/** @relates string */
|
|
NONSTATIC_INLINE struct string *
|
|
add_char_to_string(struct string *string, unsigned char character)
|
|
{
|
|
assertm(string && character, "[add_char_to_string]");
|
|
if_assert_failed { return NULL; }
|
|
|
|
check_string_magic(string);
|
|
|
|
if (!realloc_string(string, string->length + 1))
|
|
return NULL;
|
|
|
|
string->source[string->length++] = character;
|
|
string->source[string->length] = '\0';
|
|
|
|
return string;
|
|
}
|
|
|
|
NONSTATIC_INLINE struct string *
|
|
add_xchar_to_string(struct string *string, unsigned char character, int times)
|
|
{
|
|
int newlength;
|
|
|
|
assertm(string && character && times >= 0, "[add_xchar_to_string]");
|
|
if_assert_failed { return NULL; }
|
|
|
|
check_string_magic(string);
|
|
|
|
if (!times) return string;
|
|
|
|
newlength = string->length + times;
|
|
if (!realloc_string(string, newlength))
|
|
return NULL;
|
|
|
|
memset(string->source + string->length, character, times);
|
|
string->length = newlength;
|
|
string->source[newlength] = '\0';
|
|
|
|
return string;
|
|
}
|
|
|
|
/** Add printf()-style format string to @a string. */
|
|
struct string *
|
|
add_format_to_string(struct string *string, const char *format, ...)
|
|
{
|
|
int newlength;
|
|
int width;
|
|
va_list ap;
|
|
|
|
assertm(string && format, "[add_format_to_string]");
|
|
if_assert_failed { return NULL; }
|
|
|
|
check_string_magic(string);
|
|
|
|
va_start(ap, format);
|
|
width = vsnprintf(NULL, 0, format, ap);
|
|
va_end(ap);
|
|
if (width <= 0) return NULL;
|
|
|
|
newlength = string->length + width;
|
|
if (!realloc_string(string, newlength))
|
|
return NULL;
|
|
|
|
va_start(ap, format);
|
|
vsnprintf(&string->source[string->length], width + 1, format, ap);
|
|
va_end(ap);
|
|
|
|
string->length = newlength;
|
|
string->source[newlength] = '\0';
|
|
|
|
return string;
|
|
}
|
|
|
|
void
|
|
string_replace(struct string *res, struct string *inp, struct string *what, struct string *repl)
|
|
{
|
|
struct string tmp;
|
|
struct string tmp2;
|
|
char *head;
|
|
char *found;
|
|
char *ins;
|
|
char *tmp_cnt;
|
|
|
|
if (!init_string(&tmp)) {
|
|
return;
|
|
};
|
|
if (!init_string(&tmp2)) {
|
|
done_string(&tmp);
|
|
return;
|
|
}
|
|
|
|
add_string_to_string(&tmp, inp);
|
|
|
|
head = tmp.source;
|
|
int count = 0;
|
|
ins = head;
|
|
if (what->length==0)
|
|
{
|
|
add_string_to_string(res, inp);
|
|
return;
|
|
}
|
|
|
|
// count occurence of string in input
|
|
for (count = 0; (tmp_cnt = strstr(ins, what->source)); ++count)
|
|
{
|
|
ins = tmp_cnt + what->length;
|
|
}
|
|
|
|
for (int i=0;i<count;i++) {
|
|
// find occurence of string
|
|
found=strstr(head,what->source);
|
|
// count chars before and after occurence
|
|
int bf_len=found-tmp.source;
|
|
int af_len=tmp.length-bf_len-what->length;
|
|
// move head by what
|
|
found+=what->length;
|
|
// join the before, needle and after to res
|
|
add_bytes_to_string(&tmp2,tmp.source,bf_len);
|
|
add_bytes_to_string(&tmp2,repl->source,repl->length);
|
|
add_bytes_to_string(&tmp2,found,af_len);
|
|
// clear tmp string and tmp2 string
|
|
done_string(&tmp);
|
|
if (!init_string(&tmp)) {
|
|
done_string(&tmp2);
|
|
return;
|
|
}
|
|
add_string_to_string(&tmp, &tmp2);
|
|
done_string(&tmp2);
|
|
if (!init_string(&tmp2)) {
|
|
done_string(&tmp);
|
|
return;
|
|
}
|
|
//printf("TMP: %s |\n",tmp.source);
|
|
head = tmp.source;
|
|
}
|
|
add_string_to_string(res, &tmp);
|
|
|
|
done_string(&tmp);
|
|
done_string(&tmp2);
|
|
}
|
|
|
|
struct string *
|
|
add_to_string_list(LIST_OF(struct string_list_item) *list,
|
|
const char *source, int length)
|
|
{
|
|
struct string_list_item *item;
|
|
struct string *string;
|
|
|
|
assertm(list && source, "[add_to_string_list]");
|
|
if_assert_failed return NULL;
|
|
|
|
item = (struct string_list_item *)mem_alloc(sizeof(*item));
|
|
if (!item) return NULL;
|
|
|
|
string = &item->string;
|
|
if (length < 0) length = strlen(source);
|
|
|
|
if (!init_string(string)
|
|
|| !add_bytes_to_string(string, source, length)) {
|
|
done_string(string);
|
|
mem_free(item);
|
|
return NULL;
|
|
}
|
|
|
|
add_to_list_end(*list, item);
|
|
return string;
|
|
}
|
|
|
|
/** @relates string_list_item */
|
|
void
|
|
free_string_list(LIST_OF(struct string_list_item) *list)
|
|
{
|
|
assertm(list != NULL, "[free_string_list]");
|
|
if_assert_failed return;
|
|
|
|
while (!list_empty(*list)) {
|
|
struct string_list_item *item = (struct string_list_item *)list->next;
|
|
|
|
del_from_list(item);
|
|
done_string(&item->string);
|
|
mem_free(item);
|
|
}
|
|
}
|