ref: 78f40b98dbd8ceb0e1bae3a88a89ff7919a6bda1
dir: /include-demo/stringutil.h/
#ifndef STRUTIL_H
#define STRUTIL_H
#include <string.h>
#include <stdlib.h>
#include <stdio.h>
#include <ctype.h>
/*
 * Allocator hooks used by the helpers in this header.
 * Each macro is only defined here if the including code has not already
 * defined it, so a project can substitute its own allocator by defining
 * STRUTIL_ALLOC / STRUTIL_FREE / STRUTIL_REALLOC before including this file.
 * The defaults forward to malloc, free and realloc from <stdlib.h>.
 */
#ifndef STRUTIL_ALLOC
#define STRUTIL_ALLOC(s) malloc(s)
#endif
#ifndef STRUTIL_FREE
#define STRUTIL_FREE(s) free(s)
#endif
#ifndef STRUTIL_REALLOC
#define STRUTIL_REALLOC(s, t) realloc(s,t)
#endif
/*
 * Short aliases for the strcatalloc* family:
 *   strcata   -> strcatalloc
 *   strcataf1 -> strcatallocf1
 *   strcataf2 -> strcatallocf2
 *   strcatafb -> strcatallocfb
 * Define STRUTIL_NO_SHORT_NAMES before including this header to leave the
 * short names undefined.
 */
#ifndef STRUTIL_NO_SHORT_NAMES
#define strcata strcatalloc
#define strcataf1 strcatallocf1
#define strcataf2 strcatallocf2
#define strcatafb strcatallocfb
#endif
/*
 * Concatenate two strings into a freshly allocated buffer.
 *
 * s1, s2: NUL-terminated strings; neither is modified or released.
 * Returns a new string "s1s2" obtained from STRUTIL_ALLOC, or NULL when the
 * allocation fails. The caller owns the result.
 */
static char* strcatalloc(const char* s1, const char* s2){
    const size_t len1 = strlen(s1);
    const size_t len2 = strlen(s2);
    char* joined = STRUTIL_ALLOC(len1 + len2 + 1);
    if(!joined){
        return NULL;
    }
    memcpy(joined, s1, len1);
    /* len2 + 1 also copies the terminating NUL of s2. */
    memcpy(joined + len1, s2, len2 + 1);
    return joined;
}
/*
 * Append s2 to s1 by growing s1 in place with STRUTIL_REALLOC.
 *
 * s1: NUL-terminated string in a buffer that STRUTIL_REALLOC may resize;
 *     on success the caller must use the returned pointer instead of s1.
 * s2: NUL-terminated string to append; it is not released. s2 may be the
 *     very same pointer as s1 (the string is then doubled); other pointers
 *     into s1's buffer are not supported.
 * Returns the resized string, or NULL when the reallocation fails. On
 * failure nothing has been appended, and (assuming STRUTIL_REALLOC follows
 * realloc semantics) s1 is still allocated and still owned by the caller.
 */
static char* strcatallocf1(char* s1, const char* s2){
    const size_t len1 = strlen(s1);
    const size_t len2 = strlen(s2);
    /* Remember aliasing now: after the realloc the old s1 value may dangle. */
    const int aliased = (s2 == s1);
    char* d = STRUTIL_REALLOC(s1, len1 + len2 + 1);
    if(!d){
        return NULL;
    }
    if(aliased){
        s2 = d;
    }
    /* Source and destination never overlap: the source ends at or before d+len1. */
    memcpy(d + len1, s2, len2);
    d[len1 + len2] = '\0';
    return d;
}
/*
 * Concatenate s1 and s2 into a new buffer and release s2.
 *
 * s1: NUL-terminated string; left untouched.
 * s2: NUL-terminated string that is passed to STRUTIL_FREE before
 *     returning, whether or not the allocation succeeded.
 * Returns the new string "s1s2" from STRUTIL_ALLOC, or NULL on allocation
 * failure.
 */
static char* strcatallocf2(const char* s1, char* s2){
    const size_t n1 = strlen(s1);
    const size_t n2 = strlen(s2);
    char* result = STRUTIL_ALLOC(n1 + n2 + 1);
    if(result != NULL){
        memcpy(result, s1, n1);
        /* n2 + 1 brings the terminating NUL along. */
        memcpy(result + n1, s2, n2 + 1);
    }
    STRUTIL_FREE(s2);
    return result;
}
/*
 * Concatenate s1 and s2 into a new buffer and release both inputs.
 *
 * s1, s2: NUL-terminated strings; both are passed to STRUTIL_FREE before
 *         returning, whether or not the allocation succeeded. Passing the
 *         same pointer for both is allowed; it is then released only once.
 * Returns the new string "s1s2" from STRUTIL_ALLOC, or NULL on allocation
 * failure.
 */
static char* strcatallocfb(char* s1, char* s2){
    char* d = STRUTIL_ALLOC(strlen(s1) + strlen(s2) + 1);
    if(d){
        strcpy(d, s1);
        strcat(d, s2);
    }
    STRUTIL_FREE(s1);
    /* Guard against a double free when the caller passed one string twice. */
    if(s2 != s1){
        STRUTIL_FREE(s2);
    }
    return d;
}
/*
 * Copy the first len bytes of in into a new buffer and NUL-terminate it.
 *
 * in:  source bytes; need not be NUL-terminated. May be NULL only when
 *      len is 0.
 * len: number of bytes to copy.
 * Returns a buffer of len + 1 bytes, or NULL if the size cannot be
 * represented or the allocation fails.
 *
 * NOTE(review): the buffer comes from malloc() directly, not from
 * STRUTIL_ALLOC like the other allocating helpers in this header, so it
 * must be released with free(). Kept as-is so existing callers keep working.
 */
static char* str_null_terminated_alloc(const char* in, unsigned int len){
    /* Do the +1 in size_t so that len == UINT_MAX cannot wrap to a 0-byte request
       on platforms where size_t is wider than unsigned int. */
    const size_t total = (size_t)len + 1;
    char* d;
    if(total == 0){ /* wrapped: size_t is no wider than unsigned int */
        return NULL;
    }
    d = malloc(total);
    if(d){
        if(len != 0){ /* avoid memcpy with a possibly NULL source */
            memcpy(d, in, len);
        }
        d[len] = '\0';
    }
    return d;
}
/*
 * Test whether str begins with pre.
 *
 * Returns 1 when every character of pre matches the start of str
 * (an empty pre always matches), 0 otherwise.
 */
static unsigned int strprefix(const char *pre, const char *str)
{
    const size_t prefix_len = strlen(pre);
    /* strncmp stops at str's terminator, so a str shorter than pre can never compare equal. */
    if(strncmp(pre, str, prefix_len) != 0){
        return 0;
    }
    return 1;
}
/*
 * String equality test.
 *
 * Returns 1 when pre and str hold exactly the same characters, 0 otherwise.
 */
static unsigned int streq(const char *pre, const char *str)
{
    if(strcmp(pre, str) != 0){
        return 0u;
    }
    return 1u;
}
/*
 * Find the first occurrence of subtext inside text.
 *
 * Returns the zero-based index of the first match, or -1 when subtext does
 * not occur in text. An empty subtext matches at index 0 (including when
 * text is empty as well).
 *
 * Uses strstr so that matches which require backtracking are found, e.g.
 * "aab" inside "aaab" is reported at index 1.
 */
static long strfind(const char* text, const char* subtext){
    const char* hit = strstr(text, subtext);
    if(!hit){
        return -1;
    }
    return (long)(hit - text);
}
/*
 * Read characters from f into buf until the terminator, end of file, a read
 * error, or a full buffer.
 *
 * f:          stream to read from.
 * buf:        destination with room for buflen bytes.
 * buflen:     capacity of buf; at most buflen - 1 characters are stored.
 *             When buflen is 0 nothing is read or written.
 * terminator: character that ends the read; it is consumed from the stream
 *             but not stored.
 * Returns the number of characters stored. buf is NUL-terminated right
 * after the last stored character.
 */
static unsigned long read_until_terminator(FILE* f, char* buf, const unsigned long buflen, char terminator){
    unsigned long i = 0;
    int c; /* int, so EOF can be told apart from a valid 0xFF byte */
    if(buflen == 0){
        return 0;
    }
    while(i < buflen - 1){
        c = fgetc(f);
        /* feof() only turns true after a read has failed, so test the
           return value itself instead of storing a bogus byte. */
        if(c == EOF){
            break;
        }
        if((char)c == terminator){
            break;
        }
        buf[i++] = (char)c;
    }
    buf[i] = '\0';
    return i;
}
/*
 * Read characters from f into a growing heap buffer until the terminator,
 * end of file or a read error.
 *
 * f:          stream to read from.
 * lenout:     receives the number of characters stored (excluding the NUL);
 *             it is only written on success.
 * terminator: character that ends the read; it is consumed but not stored.
 * initsize:   initial buffer capacity in bytes; 0 is treated as 1. The
 *             capacity doubles whenever the buffer is full.
 * Returns a NUL-terminated buffer obtained from STRUTIL_ALLOC /
 * STRUTIL_REALLOC which the caller must release, or NULL when an allocation
 * fails (any partially filled buffer is released first).
 */
static char* read_until_terminator_alloced(FILE* f, unsigned long* lenout, char terminator, unsigned long initsize){
    int c; /* int, so EOF can be told apart from a valid 0xFF byte */
    char* buf;
    char* grown;
    unsigned long bcap = initsize;
    unsigned long blen = 0;
    if(bcap == 0){
        bcap = 1; /* always leave room for the terminating NUL */
    }
    buf = STRUTIL_ALLOC(bcap);
    if(!buf){
        return NULL;
    }
    for(;;){
        c = fgetc(f);
        /* feof() only turns true after a failed read, so check the result itself. */
        if(c == EOF || (char)c == terminator){
            break;
        }
        if(blen == (bcap - 1)){ /* Grow the buffer, keeping one byte for the NUL. */
            bcap <<= 1;
            grown = STRUTIL_REALLOC(buf, bcap);
            if(!grown){
                /* Release through the same allocator family that created buf. */
                STRUTIL_FREE(buf);
                return NULL;
            }
            buf = grown;
        }
        buf[blen++] = (char)c;
    }
    buf[blen] = '\0';
    *lenout = blen;
    return buf;
}
/*
 * Read the whole of f into a newly allocated, NUL-terminated buffer.
 *
 * f:   open stream; NULL is accepted and yields NULL (len is not touched).
 *      The stream is rewound to its start before reading.
 * len: receives the number of bytes actually read (the NUL is not counted);
 *      it is set to 0 when the function fails after the NULL check.
 * Returns a buffer obtained from STRUTIL_ALLOC which the caller must
 * release, or NULL if the file size cannot be determined or the allocation
 * fails. If fewer bytes than the reported size could be read, the bytes
 * that were read are returned and *len reflects that shorter count; callers
 * that care can inspect ferror(f).
 */
static void* read_file_into_alloced_buffer(FILE* f, unsigned long* len){
    char* buf;
    long size;
    size_t nread;
    if(!f){
        return NULL;
    }
    *len = 0;
    if(fseek(f, 0, SEEK_END) != 0){
        return NULL;
    }
    size = ftell(f);
    if(size < 0){ /* ftell reports failure as -1; never turn that into a length */
        return NULL;
    }
    if(fseek(f, 0, SEEK_SET) != 0){
        return NULL;
    }
    buf = STRUTIL_ALLOC((unsigned long)size + 1);
    if(!buf){
        return NULL;
    }
    nread = fread(buf, 1, (size_t)size, f);
    /* Terminate after what was really read so no uninitialised tail is exposed. */
    buf[nread] = '\0';
    *len = (unsigned long)nread;
    return buf;
}
/*
GEK'S SIMPLE TEXT COMPRESSION SCHEME - LIMITATIONS
* Token names must be alphabetic (a-z, A-Z).
* The token mark must be escaped with a backslash.
* A token name that is a substring of another token name must be listed after that longer name.
*/
/*
 * Helper for strencodealloc: append s to *out using strcatallocf1.
 * Does nothing when *out is already NULL. When the append fails, the old
 * buffer is released and *out becomes NULL. Returns 1 on success, 0 otherwise.
 */
static int strencode_append_(char** out, const char* s){
    char* grown;
    if(!*out){
        return 0;
    }
    grown = strcatallocf1(*out, s);
    if(!grown){
        STRUTIL_FREE(*out);
        *out = NULL;
        return 0;
    }
    *out = grown;
    return 1;
}
/*
 * Encode inbuf by replacing runs of known substrings with short token names.
 *
 * inbuf:   NUL-terminated text to encode.
 * tokens:  array of 2*ntokens strings; tokens[2*j] is the name of token j
 *          and tokens[2*j+1] is the text that the token stands for.
 *          Tokens whose text is empty are never matched.
 * ntokens: number of name/text pairs in tokens.
 * esc:     escape character.
 * tokmark: token mark character.
 *
 * Output layout:
 *   <esc><tokmark>
 *   for every token: <name><decimal length of text><tokmark><text>
 *   <esc>
 *   body: a run of a token's text becomes <tokmark>[repeat count]<name>
 *         (the count is written only when it is greater than 1); a literal
 *         esc or tokmark character is preceded by esc; every other
 *         character is copied unchanged.
 *
 * Returns the encoded string (release it with STRUTIL_FREE), or NULL when
 * an allocation fails.
 */
static char* strencodealloc(const char* inbuf, const char** tokens, unsigned long ntokens, char esc, char tokmark){
    unsigned long lenin;
    unsigned long i;
    unsigned long j;
    char c_str[512];
    char* out;

    lenin = strlen(inbuf);

    /* Header start. The terminator must be written explicitly: c_str is an
       uninitialised automatic array. */
    c_str[0] = esc;
    c_str[1] = tokmark;
    c_str[2] = '\0';
    out = strcatalloc(c_str, "");

    /* Token table. */
    for(j = 0; j < ntokens; j++){
        strencode_append_(&out, tokens[2*j]);
        sprintf(c_str, "%lu", (unsigned long)strlen(tokens[2*j+1]));
        strencode_append_(&out, c_str);
        c_str[0] = tokmark;
        c_str[1] = '\0';
        strencode_append_(&out, c_str);
        strencode_append_(&out, tokens[2*j+1]);
    }
    /* End of the token table. */
    c_str[0] = esc;
    c_str[1] = '\0';
    strencode_append_(&out, c_str);

    /* Body. The loop stops early once an append has failed (out == NULL). */
    for(i = 0; out && i < lenin; i++){
        unsigned long t;
        for(t = 0; t < ntokens; t++){ /* t - the token we are processing. */
            const char* value = tokens[t*2+1];
            unsigned long h, curtoklen, howmany = 1;
            if(!strprefix(value, inbuf+i)){
                continue;
            }
            curtoklen = strlen(value); /* Length of the text we are counting. */
            if(curtoklen == 0){
                continue; /* an empty text would never advance the input */
            }
            /* Count how many times the text repeats back to back. */
            for(h = 1; i + h*curtoklen < lenin; h++){
                if(!strprefix(value, inbuf + i + h*curtoklen)){
                    break;
                }
                howmany++;
            }
            /* We know what token and how many, write it to out. */
            c_str[0] = tokmark;
            c_str[1] = '\0';
            strencode_append_(&out, c_str);
            if(howmany > 1){
                sprintf(c_str, "%lu", (unsigned long)howmany);
                strencode_append_(&out, c_str);
            }
            strencode_append_(&out, tokens[t*2]);
            i += howmany*curtoklen;
            /* NOTE: scanning goes on with the later-listed tokens at the new
               position, and the character found there afterwards is written
               literally below. This reproduces the encoder's established
               output; tokens listed earlier are not retried at that position. */
        }
        /* Test if we need to escape the character. */
        if(inbuf[i] == esc || inbuf[i] == tokmark){
            c_str[0] = esc;
            c_str[1] = '\0';
            strencode_append_(&out, c_str);
        }
        /* Write the character at the current position out. When a token ended
           exactly at the end of the input this is the NUL and appends nothing. */
        c_str[0] = inbuf[i];
        c_str[1] = '\0';
        strencode_append_(&out, c_str);
    }
    return out;
}
/* Fetch the next input character into c, or leave through the cleanup label
   once the terminating NUL has already been consumed. Local to strdecodealloc. */
#define STRDECODE_NEXT_() do{ if(i <= lenin){ c = inbuf[i++]; } else { goto end; } }while(0)
/*
 * Decode a string produced by strencodealloc.
 *
 * inbuf: NUL-terminated encoded text. Its first character is taken as the
 *        escape character and its second as the token mark; a token table
 *        (<name><decimal length><tokmark><text> per token) follows, closed
 *        by the escape character, and then the encoded body.
 *        inbuf is only read, never modified.
 *
 * Returns a newly allocated string with the decoded text (release it with
 * STRUTIL_FREE). If the token table is malformed or the input ends early,
 * whatever was decoded up to that point is returned. Returns NULL when
 * inbuf is NULL, shorter than three characters, or an allocation fails.
 */
static char* strdecodealloc(char* inbuf){
    unsigned long lenin, ntokens = 0;
    char* out = NULL;
    char* grown;
    char** tokens = NULL;
    char** tokens_grown;
    char esc, tokmark, c;
    long doescape;
    unsigned long vv, l, i = 2;
    char c_str[2] = {0,0};

    /* Validate before reading inbuf[0]/inbuf[1] and before allocating anything. */
    if(!inbuf){
        return NULL;
    }
    lenin = strlen(inbuf);
    if(lenin < 3){
        return NULL;
    }
    esc = inbuf[0];
    tokmark = inbuf[1];
    out = strcatalloc("","");
    if(!out){
        return NULL;
    }

    /* ---- Token table: repeated until the closing escape character. ---- */
    STRDECODE_NEXT_(); /* has to occur before the loop. */
    while(c != esc){
        tokens_grown = STRUTIL_REALLOC(tokens, (ntokens + 1) * 2 * sizeof(char*));
        if(!tokens_grown){
            goto oom;
        }
        tokens = tokens_grown;
        tokens[ntokens*2] = strcatalloc("","");
        tokens[ntokens*2+1] = strcatalloc("","");
        ntokens++; /* both slots are now owned by the cleanup code */
        if(!tokens[(ntokens-1)*2] || !tokens[(ntokens-1)*2+1]){
            goto oom;
        }
        /* Token name: one or more alphabetic characters. */
        if(!isalpha((unsigned char)c)){
            goto end;
        }
        while(isalpha((unsigned char)c)){
            c_str[0] = c;
            grown = strcatallocf1(tokens[(ntokens-1)*2], c_str);
            if(!grown){
                goto oom;
            }
            tokens[(ntokens-1)*2] = grown;
            STRDECODE_NEXT_();
        }
        /* Decimal length of the token's text. */
        l = 0;
        if(!isdigit((unsigned char)c)){
            goto end;
        }
        while(isdigit((unsigned char)c) && c != tokmark){
            l *= 10;
            l += (unsigned long)(c - '0');
            STRDECODE_NEXT_();
        }
        /* c now holds the separator after the length; the next l characters are the text. */
        for(vv = 0; vv < l; vv++){
            STRDECODE_NEXT_();
            c_str[0] = c;
            grown = strcatallocf1(tokens[(ntokens-1)*2+1], c_str);
            if(!grown){
                goto oom;
            }
            tokens[(ntokens-1)*2+1] = grown;
        }
        STRDECODE_NEXT_();
    }

    /* ---- Body. c is the character being processed, i indexes the next one. ---- */
    STRDECODE_NEXT_();
    doescape = 0;
    while(i <= lenin){
        if(!doescape && c == esc){
            /* The following character is to be copied literally. */
            doescape = 1;
            STRDECODE_NEXT_();
            continue;
        }
        if(!doescape && c == tokmark){
            /* Handle digits prefixing a token. */
            unsigned long t, count = 0;
            STRDECODE_NEXT_();
            if(isdigit((unsigned char)c)){
                while(isdigit((unsigned char)c)){
                    count *= 10;
                    count += (unsigned long)(c - '0');
                    STRDECODE_NEXT_();
                }
            }else{
                count = 1;
            }
            i--; /* step back so that i indexes the first character of the name */
            for(t = 0; t < ntokens; t++){
                if(strprefix(tokens[t*2], inbuf+i)){
                    unsigned long q;
                    for(q = 0; q < count; q++){
                        grown = strcatallocf1(out, tokens[t*2+1]);
                        if(!grown){
                            goto oom;
                        }
                        out = grown;
                    }
                    i += strlen(tokens[t*2]);
                    break; /* the first matching name wins */
                }
            }
            if(i <= lenin){
                c = inbuf[i++];
            }
            continue;
        }else{
            /* Ordinary or escaped character: copy it through. */
            c_str[0] = c;
            grown = strcatallocf1(out, c_str);
            if(!grown){
                goto oom;
            }
            out = grown;
            doescape = 0;
            STRDECODE_NEXT_();
        }
    }
    goto end;
oom:
    /* Allocation failure: drop the partial result and report NULL. */
    STRUTIL_FREE(out);
    out = NULL;
end:
    if(tokens){
        unsigned long j;
        for(j = 0; j < ntokens; j++){
            STRUTIL_FREE(tokens[j*2]);
            STRUTIL_FREE(tokens[j*2+1]);
        }
        STRUTIL_FREE(tokens);
    }
    return out;
}
#undef STRDECODE_NEXT_
#endif