ref: 55c02ff080dfe0abd113a2d930c39f2da6e9316b
dir: /include-demo/stringutil.h/
#ifndef STRUTIL_H
#define STRUTIL_H

/*
 * Small header-only collection of C string helpers: allocating
 * concatenation, prefix/substring tests, stream reading helpers, and a
 * simple token-substitution text encoder/decoder.
 *
 * Every function is `static`, so each translation unit that includes this
 * header gets its own private copy.
 *
 * Define STRUTIL_ALLOC / STRUTIL_FREE / STRUTIL_REALLOC before including
 * this header to route all allocations through a custom allocator.
 * Define STRUTIL_NO_SHORT_NAMES to suppress the strcata* aliases.
 */

#include <string.h>
#include <stdlib.h>
#include <stdio.h>
#include <ctype.h>

#ifndef STRUTIL_ALLOC
#define STRUTIL_ALLOC(s) malloc(s)
#endif

#ifndef STRUTIL_FREE
#define STRUTIL_FREE(s) free(s)
#endif

#ifndef STRUTIL_REALLOC
#define STRUTIL_REALLOC(s, t) realloc(s,t)
#endif

#ifndef STRUTIL_NO_SHORT_NAMES
#define strcata strcatalloc
#define strcataf1 strcatallocf1
#define strcataf2 strcatallocf2
#define strcatafb strcatallocfb
#endif

/*
 * Concatenate s1 and s2 into a newly allocated string.
 * Neither argument is modified or freed.
 * Returns the new string (caller frees with STRUTIL_FREE) or NULL if the
 * allocation fails.
 */
static char* strcatalloc(const char* s1, const char* s2){
	size_t len1 = strlen(s1);
	size_t len2 = strlen(s2);
	char* d = STRUTIL_ALLOC(len1 + len2 + 1);
	if(d){
		memcpy(d, s1, len1);
		memcpy(d + len1, s2, len2 + 1); /* +1 copies the terminator */
	}
	return d;
}

/*
 * Append s2 to s1, consuming s1 ("free first").
 * s1 must have been obtained from the STRUTIL allocator; it is resized in
 * place when possible. After the call s1 must not be used any more:
 *  - on success the (possibly moved) result is returned;
 *  - on allocation failure s1 is freed and NULL is returned.
 * A NULL s1 yields NULL, so `out = strcatallocf1(out, x)` chains propagate
 * an earlier failure instead of dereferencing NULL.
 */
static char* strcatallocf1(char* s1, const char* s2){
	size_t len1;
	size_t len2;
	char* d;
	if(!s1) return NULL;
	len1 = strlen(s1);
	len2 = strlen(s2);
	d = STRUTIL_REALLOC(s1, len1 + len2 + 1);
	if(!d){
		/* realloc leaves the old block alive on failure; release it so the
		 * usual `x = strcatallocf1(x, ...)` pattern does not leak. */
		STRUTIL_FREE(s1);
		return NULL;
	}
	memcpy(d + len1, s2, len2 + 1);
	return d;
}

/*
 * Concatenate s1 and s2 into a newly allocated string, consuming s2
 * ("free second"). s2 is always freed, also when the allocation fails.
 * A NULL s2 yields NULL.
 */
static char* strcatallocf2(const char* s1, char* s2){
	char* d = NULL;
	if(s2) d = strcatalloc(s1, s2);
	STRUTIL_FREE(s2);
	return d;
}

/*
 * Concatenate s1 and s2 into a newly allocated string, consuming both
 * ("free both"). Both arguments are always freed, also on failure.
 * If either argument is NULL the result is NULL.
 */
static char* strcatallocfb(char* s1, char* s2){
	char* d = NULL;
	if(s1 && s2) d = strcatalloc(s1, s2);
	STRUTIL_FREE(s1);
	STRUTIL_FREE(s2);
	return d;
}

/*
 * Copy the first `len` bytes of `in` into a newly allocated buffer and
 * append a terminating NUL. `in` does not need to be NUL-terminated.
 * Returns NULL if the allocation fails.
 */
static char* str_null_terminated_alloc(const char* in, unsigned int len){
	/* Widen before adding 1 so len == UINT_MAX cannot wrap to 0. */
	char* d = STRUTIL_ALLOC((size_t)len + 1);
	if(d){
		memcpy(d, in, len);
		d[len] = '\0';
	}
	return d;
}

/* Returns 1 if `str` begins with `pre`, 0 otherwise. */
static unsigned int strprefix(const char *pre, const char *str)
{
	size_t lenpre = strlen(pre);
	size_t lenstr = strlen(str);
	if(lenstr < lenpre) return 0;
	return memcmp(pre, str, lenpre) == 0;
}

/* Returns 1 if the two strings are equal, 0 otherwise. */
static unsigned int streq(const char *pre, const char *str)
{
	return strcmp(pre, str) == 0;
}

/*
 * Find the first occurrence of `subtext` in `text`.
 * Returns the zero-based offset of the match, or -1 if there is none.
 * An empty `subtext` matches at offset 0.
 */
static long strfind(const char* text, const char* subtext){
	const char* hit = strstr(text, subtext);
	if(!hit) return -1;
	return (long)(hit - text);
}

/*
 * Read characters from `f` into `buf` until `terminator`, end of file, a
 * read error, or until buflen-1 characters have been stored.
 * The terminator is consumed from the stream but not stored.
 * `buf` is always NUL-terminated directly after the last stored character
 * (when buflen > 0).
 * Returns the number of characters stored, excluding the NUL.
 */
static unsigned long read_until_terminator(FILE* f, char* buf, const unsigned long buflen, char terminator){
	unsigned long i = 0;
	int c; /* int, not char: fgetc returns EOF out of band */
	if(buflen == 0) return 0; /* no room even for the NUL */
	while(i < buflen - 1){
		c = fgetc(f);
		if(c == EOF) break;
		if((char)c == terminator) break;
		buf[i++] = (char)c;
	}
	buf[i] = '\0';
	return i;
}

/*
 * Like read_until_terminator, but stores the data in a heap buffer that is
 * grown (by doubling) as needed.
 *  f          stream to read from
 *  lenout     if not NULL, receives the number of characters stored
 *  terminator character that ends the read; consumed, not stored
 *  initsize   initial buffer capacity in bytes (0 is treated as 1)
 * Returns a NUL-terminated buffer (caller frees with STRUTIL_FREE), or NULL
 * if an allocation fails; *lenout is not written in that case.
 */
static char* read_until_terminator_alloced(FILE* f, unsigned long* lenout, char terminator, unsigned long initsize){
	int c;
	char* buf;
	char* grown;
	unsigned long bcap = initsize ? initsize : 1;
	unsigned long newcap;
	unsigned long blen = 0;
	buf = STRUTIL_ALLOC(bcap);
	if(!buf) return NULL;
	for(;;){
		c = fgetc(f);
		if(c == EOF) break;
		if((char)c == terminator) break;
		if(blen + 1 >= bcap){
			/* Need room for this character plus the final NUL. */
			newcap = bcap << 1;
			if(newcap <= bcap){ /* capacity overflowed */
				STRUTIL_FREE(buf);
				return NULL;
			}
			grown = STRUTIL_REALLOC(buf, newcap);
			if(!grown){
				STRUTIL_FREE(buf);
				return NULL;
			}
			buf = grown;
			bcap = newcap;
		}
		buf[blen++] = (char)c;
	}
	buf[blen] = '\0';
	if(lenout) *lenout = blen;
	return buf;
}

/*
 * Read the entire contents of `f` (from the beginning) into a newly
 * allocated buffer. One extra NUL byte is appended after the data so the
 * result can be used as a C string when the file contains no NUL bytes.
 *  f    open, seekable stream; NULL yields NULL
 *  len  receives the number of bytes actually read (0 on failure)
 * Returns the buffer (caller frees with STRUTIL_FREE) or NULL if seeking,
 * allocating or reading fails.
 */
static void* read_file_into_alloced_buffer(FILE* f, unsigned long* len){
	char* buf;
	long fsize;
	size_t nread;
	if(!f || !len) return NULL;
	*len = 0;
	if(fseek(f, 0, SEEK_END) != 0) return NULL;
	fsize = ftell(f);
	if(fsize < 0) return NULL;
	if(fseek(f, 0, SEEK_SET) != 0) return NULL;
	buf = STRUTIL_ALLOC((size_t)fsize + 1);
	if(!buf) return NULL;
	nread = fread(buf, 1, (size_t)fsize, f);
	if(nread < (size_t)fsize && ferror(f)){
		STRUTIL_FREE(buf);
		return NULL;
	}
	/* Terminate after what was really read; a text-mode stream may deliver
	 * fewer bytes than ftell reported. */
	buf[nread] = '\0';
	*len = (unsigned long)nread;
	return buf;
}

/* Private helper: append one character to an owned string (see strcatallocf1). */
static char* strutil_append_char(char* s, char c){
	char tmp[2];
	tmp[0] = c;
	tmp[1] = '\0';
	return strcatallocf1(s, tmp);
}

/* Private helper: allocate a NUL-terminated copy of src[0..n). */
static char* strutil_copy_range(const char* src, unsigned long n){
	char* d = STRUTIL_ALLOC((size_t)n + 1);
	if(d){
		memcpy(d, src, n);
		d[n] = '\0';
	}
	return d;
}

/*
 * GEK'S SIMPLE TEXT COMPRESSION SCHEMA
 *
 * Encoded layout:
 *   <esc><tokmark>                          the two control characters
 *   { <name><decimal length><tokmark><value> }   one entry per token
 *   <esc>                                   end of the token table
 *   body: literal characters, where
 *         <esc><c>                 is the literal character c, and
 *         <tokmark>[count]<name>   is the token's value repeated count
 *                                  times (count omitted means 1).
 *
 * LIMITATIONS
 * Token names must be alphabetic (a-z, A-Z).
 * Literal token marks (and escape characters) in the text are written
 * with the escape character in front of them.
 * Token names which are substrings of other ones must be listed later.
 */

/*
 * Encode `inbuf` using the scheme described above.
 *  inbuf    NUL-terminated text to encode
 *  tokens   array of 2*ntokens strings: tokens[2*k] is the name and
 *           tokens[2*k+1] the text it stands for
 *  ntokens  number of name/value pairs
 *  esc      escape character
 *  tokmark  token mark character
 * Tokens are tried in list order at every input position; consecutive
 * repetitions of the matched value are folded into a single counted
 * reference. Tokens with an empty value are listed in the table but never
 * matched.
 * Returns a newly allocated string (caller frees with STRUTIL_FREE), or
 * NULL if an allocation fails.
 */
static char* strencodealloc(const char* inbuf, const char** tokens, unsigned long ntokens, char esc, char tokmark){
	unsigned long lenin = strlen(inbuf);
	unsigned long i;
	unsigned long t;
	char numbuf[32]; /* large enough for any unsigned long in decimal */
	char* out;

	numbuf[0] = esc;
	numbuf[1] = tokmark;
	numbuf[2] = '\0';
	out = strcatalloc(numbuf, "");

	/* Token table. */
	for(t = 0; t < ntokens; t++){
		out = strcatallocf1(out, tokens[2*t]);
		sprintf(numbuf, "%lu", (unsigned long)strlen(tokens[2*t+1]));
		out = strcatallocf1(out, numbuf);
		out = strutil_append_char(out, tokmark);
		out = strcatallocf1(out, tokens[2*t+1]);
	}
	out = strutil_append_char(out, esc);

	/* Body. Stop early once an append has failed (out == NULL). */
	i = 0;
	while(out && i < lenin){
		int matched = 0;
		for(t = 0; t < ntokens; t++){
			const char* value = tokens[2*t+1];
			unsigned long vlen = strlen(value);
			unsigned long howmany;
			/* An empty value would match everywhere without consuming
			 * input, so it can never be used. */
			if(vlen == 0) continue;
			if(strncmp(value, inbuf + i, vlen) != 0) continue;
			/* Count back-to-back repetitions of this value. */
			howmany = 1;
			while(i + howmany*vlen < lenin &&
			      strncmp(value, inbuf + i + howmany*vlen, vlen) == 0)
				howmany++;
			out = strutil_append_char(out, tokmark);
			if(howmany > 1){
				sprintf(numbuf, "%lu", howmany);
				out = strcatallocf1(out, numbuf);
			}
			out = strcatallocf1(out, tokens[2*t]);
			i += howmany*vlen;
			matched = 1;
			break;
		}
		if(matched) continue; /* retry every token at the new position */
		/* No token here: emit the character, escaped if it is special. */
		if(inbuf[i] == esc || inbuf[i] == tokmark)
			out = strutil_append_char(out, esc);
		out = strutil_append_char(out, inbuf[i]);
		i++;
	}
	return out;
}

/*
 * Decode a string produced by strencodealloc.
 *  inbuf  NUL-terminated encoded text; it is only read
 * Returns a newly allocated string (caller frees with STRUTIL_FREE).
 * Returns NULL if inbuf is NULL, shorter than three characters, or if an
 * allocation fails. If the token table is malformed an empty string is
 * returned.
 */
static char* strdecodealloc(char* inbuf){
	unsigned long lenin;
	unsigned long ntokens = 0;
	unsigned long i;
	unsigned long t;
	unsigned long q;
	unsigned long l;
	char** tokens = NULL;
	char** grown;
	char* out;
	char esc;
	char tokmark;

	if(!inbuf) return NULL;
	lenin = strlen(inbuf);
	if(lenin < 3) return NULL; /* needs at least <esc><tokmark><esc> */
	esc = inbuf[0];
	tokmark = inbuf[1];
	out = strcatalloc("", "");
	if(!out) return NULL;

	/* Token table: entries until the closing escape character.
	 * Invariant: i <= lenin, so inbuf[i] is at worst the terminating NUL. */
	i = 2;
	while(inbuf[i] != esc){
		unsigned long namestart = i;
		unsigned long namelen;

		while(isalpha((unsigned char)inbuf[i])) i++;
		namelen = i - namestart;
		if(namelen == 0) goto end; /* malformed table */

		if(!isdigit((unsigned char)inbuf[i])) goto end;
		l = 0;
		while(isdigit((unsigned char)inbuf[i]) && inbuf[i] != tokmark){
			l = l*10 + (unsigned long)(inbuf[i] - '0');
			i++;
		}
		if(inbuf[i] != tokmark) goto end;
		i++;
		if(l > lenin - i) goto end; /* value would run past the input */

		grown = STRUTIL_REALLOC(tokens, (ntokens + 1) * 2 * sizeof(char*));
		if(!grown) goto fail;
		tokens = grown;
		tokens[ntokens*2] = strutil_copy_range(inbuf + namestart, namelen);
		tokens[ntokens*2+1] = strutil_copy_range(inbuf + i, l);
		ntokens++; /* counted first so `end` frees both slots */
		if(!tokens[(ntokens-1)*2] || !tokens[(ntokens-1)*2+1]) goto fail;
		i += l;
	}
	i++; /* skip the escape character that closes the table */

	/* Body. */
	while(i < lenin){
		char c = inbuf[i];
		if(c == esc){
			/* Escaped character: copy the next one verbatim. */
			i++;
			if(i >= lenin) break;
			out = strutil_append_char(out, inbuf[i]);
			i++;
		} else if(c == tokmark){
			/* Token reference with an optional repeat count. */
			i++;
			if(isdigit((unsigned char)inbuf[i])){
				l = 0;
				while(isdigit((unsigned char)inbuf[i])){
					l = l*10 + (unsigned long)(inbuf[i] - '0');
					i++;
				}
			} else {
				l = 1;
			}
			/* First token whose name is a prefix of the input wins.
			 * If none matches, the following characters are decoded as
			 * ordinary body text. */
			for(t = 0; t < ntokens; t++){
				unsigned long namelen = strlen(tokens[t*2]);
				if(strncmp(tokens[t*2], inbuf + i, namelen) == 0){
					for(q = 0; q < l && out; q++)
						out = strcatallocf1(out, tokens[t*2+1]);
					i += namelen;
					break;
				}
			}
		} else {
			out = strutil_append_char(out, c);
			i++;
		}
		if(!out) goto end; /* allocation failure while appending */
	}
	goto end;

fail:
	STRUTIL_FREE(out);
	out = NULL;

end:
	if(tokens){
		for(t = 0; t < ntokens; t++){
			STRUTIL_FREE(tokens[t*2]);
			STRUTIL_FREE(tokens[t*2+1]);
		}
		STRUTIL_FREE(tokens);
	}
	return out;
}

#endif