src/ucx/string.c

Tue, 23 Aug 2016 13:49:38 +0200

author
Mike Becker <universe@uap-core.de>
date
Tue, 23 Aug 2016 13:49:38 +0200
changeset 39
ac35daceb24c
permissions
-rw-r--r--

adds UCX + changes how the input file is read (uses a consecutive memory area now)

universe@39 1 /*
universe@39 2 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER.
universe@39 3 *
universe@39 4 * Copyright 2015 Olaf Wintermann. All rights reserved.
universe@39 5 *
universe@39 6 * Redistribution and use in source and binary forms, with or without
universe@39 7 * modification, are permitted provided that the following conditions are met:
universe@39 8 *
universe@39 9 * 1. Redistributions of source code must retain the above copyright
universe@39 10 * notice, this list of conditions and the following disclaimer.
universe@39 11 *
universe@39 12 * 2. Redistributions in binary form must reproduce the above copyright
universe@39 13 * notice, this list of conditions and the following disclaimer in the
universe@39 14 * documentation and/or other materials provided with the distribution.
universe@39 15 *
universe@39 16 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
universe@39 17 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
universe@39 18 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
universe@39 19 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
universe@39 20 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
universe@39 21 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
universe@39 22 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
universe@39 23 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
universe@39 24 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
universe@39 25 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
universe@39 26 * POSSIBILITY OF SUCH DAMAGE.
universe@39 27 */
universe@39 28
universe@39 29 #include <stdlib.h>
universe@39 30 #include <string.h>
universe@39 31 #include <stdarg.h>
universe@39 32 #include <ctype.h>
universe@39 33
universe@39 34 #include "string.h"
universe@39 35 #include "allocator.h"
universe@39 36
universe@39 37 sstr_t sstr(char *cstring) {
universe@39 38 sstr_t string;
universe@39 39 string.ptr = cstring;
universe@39 40 string.length = strlen(cstring);
universe@39 41 return string;
universe@39 42 }
universe@39 43
universe@39 44 sstr_t sstrn(char *cstring, size_t length) {
universe@39 45 sstr_t string;
universe@39 46 string.ptr = cstring;
universe@39 47 string.length = length;
universe@39 48 return string;
universe@39 49 }
universe@39 50
universe@39 51 size_t sstrnlen(size_t n, sstr_t s, ...) {
universe@39 52 va_list ap;
universe@39 53 size_t size = s.length;
universe@39 54 va_start(ap, s);
universe@39 55
universe@39 56 for (size_t i = 1 ; i < n ; i++) {
universe@39 57 sstr_t str = va_arg(ap, sstr_t);
universe@39 58 size += str.length;
universe@39 59 }
universe@39 60 va_end(ap);
universe@39 61
universe@39 62 return size;
universe@39 63 }
universe@39 64
universe@39 65 static sstr_t sstrvcat_a(
universe@39 66 UcxAllocator *a,
universe@39 67 size_t count,
universe@39 68 sstr_t s1,
universe@39 69 sstr_t s2,
universe@39 70 va_list ap) {
universe@39 71 sstr_t str;
universe@39 72 str.ptr = NULL;
universe@39 73 str.length = 0;
universe@39 74 if(count < 2) {
universe@39 75 return str;
universe@39 76 }
universe@39 77
universe@39 78 sstr_t *strings = (sstr_t*) calloc(count, sizeof(sstr_t));
universe@39 79 if(!strings) {
universe@39 80 return str;
universe@39 81 }
universe@39 82
universe@39 83 // get all args and overall length
universe@39 84 strings[0] = s1;
universe@39 85 strings[1] = s2;
universe@39 86 size_t strlen = s1.length + s2.length;
universe@39 87 for (size_t i=2;i<count;i++) {
universe@39 88 sstr_t s = va_arg (ap, sstr_t);
universe@39 89 strings[i] = s;
universe@39 90 strlen += s.length;
universe@39 91 }
universe@39 92
universe@39 93 // create new string
universe@39 94 str.ptr = (char*) almalloc(a, strlen + 1);
universe@39 95 str.length = strlen;
universe@39 96 if(!str.ptr) {
universe@39 97 free(strings);
universe@39 98 str.length = 0;
universe@39 99 return str;
universe@39 100 }
universe@39 101
universe@39 102 // concatenate strings
universe@39 103 size_t pos = 0;
universe@39 104 for (size_t i=0;i<count;i++) {
universe@39 105 sstr_t s = strings[i];
universe@39 106 memcpy(str.ptr + pos, s.ptr, s.length);
universe@39 107 pos += s.length;
universe@39 108 }
universe@39 109
universe@39 110 str.ptr[str.length] = '\0';
universe@39 111
universe@39 112 free(strings);
universe@39 113
universe@39 114 return str;
universe@39 115 }
universe@39 116
universe@39 117 sstr_t sstrcat(size_t count, sstr_t s1, sstr_t s2, ...) {
universe@39 118 va_list ap;
universe@39 119 va_start(ap, s2);
universe@39 120 sstr_t s = sstrvcat_a(ucx_default_allocator(), count, s1, s2, ap);
universe@39 121 va_end(ap);
universe@39 122 return s;
universe@39 123 }
universe@39 124
universe@39 125 sstr_t sstrcat_a(UcxAllocator *a, size_t count, sstr_t s1, sstr_t s2, ...) {
universe@39 126 va_list ap;
universe@39 127 va_start(ap, s2);
universe@39 128 sstr_t s = sstrvcat_a(a, count, s1, s2, ap);
universe@39 129 va_end(ap);
universe@39 130 return s;
universe@39 131 }
universe@39 132
universe@39 133 sstr_t sstrsubs(sstr_t s, size_t start) {
universe@39 134 return sstrsubsl (s, start, s.length-start);
universe@39 135 }
universe@39 136
universe@39 137 sstr_t sstrsubsl(sstr_t s, size_t start, size_t length) {
universe@39 138 sstr_t new_sstr;
universe@39 139 if (start >= s.length) {
universe@39 140 new_sstr.ptr = NULL;
universe@39 141 new_sstr.length = 0;
universe@39 142 } else {
universe@39 143 if (length > s.length-start) {
universe@39 144 length = s.length-start;
universe@39 145 }
universe@39 146 new_sstr.ptr = &s.ptr[start];
universe@39 147 new_sstr.length = length;
universe@39 148 }
universe@39 149 return new_sstr;
universe@39 150 }
universe@39 151
universe@39 152 sstr_t sstrchr(sstr_t s, int c) {
universe@39 153 for(size_t i=0;i<s.length;i++) {
universe@39 154 if(s.ptr[i] == c) {
universe@39 155 return sstrsubs(s, i);
universe@39 156 }
universe@39 157 }
universe@39 158 sstr_t n;
universe@39 159 n.ptr = NULL;
universe@39 160 n.length = 0;
universe@39 161 return n;
universe@39 162 }
universe@39 163
universe@39 164 sstr_t sstrrchr(sstr_t s, int c) {
universe@39 165 if (s.length > 0) {
universe@39 166 for(size_t i=s.length;i>0;i--) {
universe@39 167 if(s.ptr[i-1] == c) {
universe@39 168 return sstrsubs(s, i-1);
universe@39 169 }
universe@39 170 }
universe@39 171 }
universe@39 172 sstr_t n;
universe@39 173 n.ptr = NULL;
universe@39 174 n.length = 0;
universe@39 175 return n;
universe@39 176 }
universe@39 177
universe@39 178 sstr_t sstrstr(sstr_t string, sstr_t match) {
universe@39 179 if (match.length == 0) {
universe@39 180 return string;
universe@39 181 }
universe@39 182
universe@39 183 for (size_t i = 0 ; i < string.length ; i++) {
universe@39 184 sstr_t substr = sstrsubs(string, i);
universe@39 185 if (sstrprefix(substr, match)) {
universe@39 186 return substr;
universe@39 187 }
universe@39 188 }
universe@39 189
universe@39 190 sstr_t emptystr;
universe@39 191 emptystr.length = 0;
universe@39 192 emptystr.ptr = NULL;
universe@39 193 return emptystr;
universe@39 194 }
universe@39 195
universe@39 196 sstr_t* sstrsplit(sstr_t s, sstr_t d, ssize_t *n) {
universe@39 197 return sstrsplit_a(ucx_default_allocator(), s, d, n);
universe@39 198 }
universe@39 199
universe@39 200 sstr_t* sstrsplit_a(UcxAllocator *allocator, sstr_t s, sstr_t d, ssize_t *n) {
universe@39 201 if (s.length == 0 || d.length == 0) {
universe@39 202 *n = -1;
universe@39 203 return NULL;
universe@39 204 }
universe@39 205
universe@39 206 sstr_t* result;
universe@39 207 ssize_t nmax = *n;
universe@39 208 *n = 1;
universe@39 209
universe@39 210 /* special case: exact match - no processing needed */
universe@39 211 if (sstrcmp(s, d) == 0) {
universe@39 212 *n = 0;
universe@39 213 return NULL;
universe@39 214 }
universe@39 215 sstr_t sv = sstrdup(s);
universe@39 216 if (sv.length == 0) {
universe@39 217 *n = -2;
universe@39 218 return NULL;
universe@39 219 }
universe@39 220
universe@39 221 for (size_t i = 0 ; i < s.length ; i++) {
universe@39 222 sstr_t substr = sstrsubs(sv, i);
universe@39 223 if (sstrprefix(substr, d)) {
universe@39 224 (*n)++;
universe@39 225 for (size_t j = 0 ; j < d.length ; j++) {
universe@39 226 sv.ptr[i+j] = 0;
universe@39 227 }
universe@39 228 i += d.length - 1; // -1, because the loop will do a i++
universe@39 229 }
universe@39 230 if ((*n) == nmax) break;
universe@39 231 }
universe@39 232 result = (sstr_t*) almalloc(allocator, sizeof(sstr_t)*(*n));
universe@39 233
universe@39 234 if (result) {
universe@39 235 char *pptr = sv.ptr;
universe@39 236 for (ssize_t i = 0 ; i < *n ; i++) {
universe@39 237 size_t l = strlen(pptr);
universe@39 238 char* ptr = (char*) almalloc(allocator, l + 1);
universe@39 239 if (ptr) {
universe@39 240 memcpy(ptr, pptr, l);
universe@39 241 ptr[l] = 0;
universe@39 242
universe@39 243 result[i] = sstrn(ptr, l);
universe@39 244 pptr += l + d.length;
universe@39 245 } else {
universe@39 246 for (ssize_t j = i-1 ; j >= 0 ; j--) {
universe@39 247 alfree(allocator, result[j].ptr);
universe@39 248 }
universe@39 249 alfree(allocator, result);
universe@39 250 *n = -2;
universe@39 251 break;
universe@39 252 }
universe@39 253 }
universe@39 254 } else {
universe@39 255 *n = -2;
universe@39 256 }
universe@39 257
universe@39 258 free(sv.ptr);
universe@39 259
universe@39 260 return result;
universe@39 261 }
universe@39 262
universe@39 263 int sstrcmp(sstr_t s1, sstr_t s2) {
universe@39 264 if (s1.length == s2.length) {
universe@39 265 return memcmp(s1.ptr, s2.ptr, s1.length);
universe@39 266 } else if (s1.length > s2.length) {
universe@39 267 return 1;
universe@39 268 } else {
universe@39 269 return -1;
universe@39 270 }
universe@39 271 }
universe@39 272
universe@39 273 int sstrcasecmp(sstr_t s1, sstr_t s2) {
universe@39 274 if (s1.length == s2.length) {
universe@39 275 #ifdef _WIN32
universe@39 276 return _strnicmp(s1.ptr, s2.ptr, s1.length);
universe@39 277 #else
universe@39 278 return strncasecmp(s1.ptr, s2.ptr, s1.length);
universe@39 279 #endif
universe@39 280 } else if (s1.length > s2.length) {
universe@39 281 return 1;
universe@39 282 } else {
universe@39 283 return -1;
universe@39 284 }
universe@39 285 }
universe@39 286
universe@39 287 sstr_t sstrdup(sstr_t s) {
universe@39 288 return sstrdup_a(ucx_default_allocator(), s);
universe@39 289 }
universe@39 290
universe@39 291 sstr_t sstrdup_a(UcxAllocator *allocator, sstr_t s) {
universe@39 292 sstr_t newstring;
universe@39 293 newstring.ptr = (char*)almalloc(allocator, s.length + 1);
universe@39 294 if (newstring.ptr) {
universe@39 295 newstring.length = s.length;
universe@39 296 newstring.ptr[newstring.length] = 0;
universe@39 297
universe@39 298 memcpy(newstring.ptr, s.ptr, s.length);
universe@39 299 } else {
universe@39 300 newstring.length = 0;
universe@39 301 }
universe@39 302
universe@39 303 return newstring;
universe@39 304 }
universe@39 305
universe@39 306 sstr_t sstrtrim(sstr_t string) {
universe@39 307 sstr_t newstr = string;
universe@39 308
universe@39 309 while (newstr.length > 0 && isspace(*newstr.ptr)) {
universe@39 310 newstr.ptr++;
universe@39 311 newstr.length--;
universe@39 312 }
universe@39 313 while (newstr.length > 0 && isspace(newstr.ptr[newstr.length-1])) {
universe@39 314 newstr.length--;
universe@39 315 }
universe@39 316
universe@39 317 return newstr;
universe@39 318 }
universe@39 319
universe@39 320 int sstrprefix(sstr_t string, sstr_t prefix) {
universe@39 321 if (string.length == 0) {
universe@39 322 return prefix.length == 0;
universe@39 323 }
universe@39 324 if (prefix.length == 0) {
universe@39 325 return 1;
universe@39 326 }
universe@39 327
universe@39 328 if (prefix.length > string.length) {
universe@39 329 return 0;
universe@39 330 } else {
universe@39 331 return memcmp(string.ptr, prefix.ptr, prefix.length) == 0;
universe@39 332 }
universe@39 333 }
universe@39 334
universe@39 335 int sstrsuffix(sstr_t string, sstr_t suffix) {
universe@39 336 if (string.length == 0) {
universe@39 337 return suffix.length == 0;
universe@39 338 }
universe@39 339 if (suffix.length == 0) {
universe@39 340 return 1;
universe@39 341 }
universe@39 342
universe@39 343 if (suffix.length > string.length) {
universe@39 344 return 0;
universe@39 345 } else {
universe@39 346 return memcmp(string.ptr+string.length-suffix.length,
universe@39 347 suffix.ptr, suffix.length) == 0;
universe@39 348 }
universe@39 349 }
universe@39 350
universe@39 351 sstr_t sstrlower(sstr_t string) {
universe@39 352 sstr_t ret = sstrdup(string);
universe@39 353 for (size_t i = 0; i < ret.length ; i++) {
universe@39 354 ret.ptr[i] = tolower(ret.ptr[i]);
universe@39 355 }
universe@39 356 return ret;
universe@39 357 }
universe@39 358
universe@39 359 sstr_t sstrlower_a(UcxAllocator *allocator, sstr_t string) {
universe@39 360 sstr_t ret = sstrdup_a(allocator, string);
universe@39 361 for (size_t i = 0; i < ret.length ; i++) {
universe@39 362 ret.ptr[i] = tolower(ret.ptr[i]);
universe@39 363 }
universe@39 364 return ret;
universe@39 365 }
universe@39 366
universe@39 367 sstr_t sstrupper(sstr_t string) {
universe@39 368 sstr_t ret = sstrdup(string);
universe@39 369 for (size_t i = 0; i < ret.length ; i++) {
universe@39 370 ret.ptr[i] = toupper(ret.ptr[i]);
universe@39 371 }
universe@39 372 return ret;
universe@39 373 }
universe@39 374
universe@39 375 sstr_t sstrupper_a(UcxAllocator *allocator, sstr_t string) {
universe@39 376 sstr_t ret = sstrdup_a(allocator, string);
universe@39 377 for (size_t i = 0; i < ret.length ; i++) {
universe@39 378 ret.ptr[i] = toupper(ret.ptr[i]);
universe@39 379 }
universe@39 380 return ret;
universe@39 381 }

mercurial