Mon, 20 Feb 2017 16:57:09 +0100
reimplementation of sstrsplit
1 /*
2 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER.
3 *
4 * Copyright 2016 Olaf Wintermann. All rights reserved.
5 *
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions are met:
8 *
9 * 1. Redistributions of source code must retain the above copyright
10 * notice, this list of conditions and the following disclaimer.
11 *
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 *
16 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
17 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
20 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
21 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
22 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
23 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
24 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
25 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
26 * POSSIBILITY OF SUCH DAMAGE.
27 */
29 #include <stdlib.h>
30 #include <string.h>
31 #include <stdarg.h>
32 #include <ctype.h>
34 #include "string.h"
35 #include "allocator.h"
37 sstr_t sstr(char *cstring) {
38 sstr_t string;
39 string.ptr = cstring;
40 string.length = strlen(cstring);
41 return string;
42 }
44 sstr_t sstrn(char *cstring, size_t length) {
45 sstr_t string;
46 string.ptr = cstring;
47 string.length = length;
48 return string;
49 }
51 size_t sstrnlen(size_t n, sstr_t s, ...) {
52 va_list ap;
53 size_t size = s.length;
54 va_start(ap, s);
56 for (size_t i = 1 ; i < n ; i++) {
57 sstr_t str = va_arg(ap, sstr_t);
58 size += str.length;
59 }
60 va_end(ap);
62 return size;
63 }
65 static sstr_t sstrvcat_a(
66 UcxAllocator *a,
67 size_t count,
68 sstr_t s1,
69 sstr_t s2,
70 va_list ap) {
71 sstr_t str;
72 str.ptr = NULL;
73 str.length = 0;
74 if(count < 2) {
75 return str;
76 }
78 sstr_t *strings = (sstr_t*) calloc(count, sizeof(sstr_t));
79 if(!strings) {
80 return str;
81 }
83 // get all args and overall length
84 strings[0] = s1;
85 strings[1] = s2;
86 size_t strlen = s1.length + s2.length;
87 for (size_t i=2;i<count;i++) {
88 sstr_t s = va_arg (ap, sstr_t);
89 strings[i] = s;
90 strlen += s.length;
91 }
93 // create new string
94 str.ptr = (char*) almalloc(a, strlen + 1);
95 str.length = strlen;
96 if(!str.ptr) {
97 free(strings);
98 str.length = 0;
99 return str;
100 }
102 // concatenate strings
103 size_t pos = 0;
104 for (size_t i=0;i<count;i++) {
105 sstr_t s = strings[i];
106 memcpy(str.ptr + pos, s.ptr, s.length);
107 pos += s.length;
108 }
110 str.ptr[str.length] = '\0';
112 free(strings);
114 return str;
115 }
117 sstr_t sstrcat(size_t count, sstr_t s1, sstr_t s2, ...) {
118 va_list ap;
119 va_start(ap, s2);
120 sstr_t s = sstrvcat_a(ucx_default_allocator(), count, s1, s2, ap);
121 va_end(ap);
122 return s;
123 }
125 sstr_t sstrcat_a(UcxAllocator *a, size_t count, sstr_t s1, sstr_t s2, ...) {
126 va_list ap;
127 va_start(ap, s2);
128 sstr_t s = sstrvcat_a(a, count, s1, s2, ap);
129 va_end(ap);
130 return s;
131 }
133 sstr_t sstrsubs(sstr_t s, size_t start) {
134 return sstrsubsl (s, start, s.length-start);
135 }
137 sstr_t sstrsubsl(sstr_t s, size_t start, size_t length) {
138 sstr_t new_sstr;
139 if (start >= s.length) {
140 new_sstr.ptr = NULL;
141 new_sstr.length = 0;
142 } else {
143 if (length > s.length-start) {
144 length = s.length-start;
145 }
146 new_sstr.ptr = &s.ptr[start];
147 new_sstr.length = length;
148 }
149 return new_sstr;
150 }
152 sstr_t sstrchr(sstr_t s, int c) {
153 for(size_t i=0;i<s.length;i++) {
154 if(s.ptr[i] == c) {
155 return sstrsubs(s, i);
156 }
157 }
158 sstr_t n;
159 n.ptr = NULL;
160 n.length = 0;
161 return n;
162 }
164 sstr_t sstrrchr(sstr_t s, int c) {
165 if (s.length > 0) {
166 for(size_t i=s.length;i>0;i--) {
167 if(s.ptr[i-1] == c) {
168 return sstrsubs(s, i-1);
169 }
170 }
171 }
172 sstr_t n;
173 n.ptr = NULL;
174 n.length = 0;
175 return n;
176 }
178 sstr_t sstrstr(sstr_t string, sstr_t match) {
179 if (match.length == 0) {
180 return string;
181 }
183 for (size_t i = 0 ; i < string.length ; i++) {
184 sstr_t substr = sstrsubs(string, i);
185 if (sstrprefix(substr, match)) {
186 return substr;
187 }
188 }
190 sstr_t emptystr;
191 emptystr.length = 0;
192 emptystr.ptr = NULL;
193 return emptystr;
194 }
196 sstr_t* sstrsplit(sstr_t s, sstr_t d, ssize_t *n) {
197 return sstrsplit_a(ucx_default_allocator(), s, d, n);
198 }
200 sstr_t* sstrsplit_a(UcxAllocator *allocator, sstr_t s, sstr_t d, ssize_t *n) {
201 if (s.length == 0 || d.length == 0) {
202 *n = -1;
203 return NULL;
204 }
206 /* special cases: delimiter is at least as large as the string */
207 if (d.length >= s.length) {
208 /* exact match */
209 if (sstrcmp(s, d) == 0) {
210 *n = 0;
211 return NULL;
212 } else /* no match possible */ {
213 *n = 1;
214 sstr_t *result = (sstr_t*) almalloc(allocator, sizeof(sstr_t));
215 *result = sstrdup_a(allocator, s);
216 return result;
217 }
218 }
220 ssize_t nmax = *n;
221 sstr_t* result = (sstr_t*) almalloc(allocator, sizeof(sstr_t));
223 if (result) {
224 sstr_t curpos = s;
225 ssize_t j = 1;
226 while (1) {
227 sstr_t match = sstrstr(curpos, d);
228 if (match.length > 0) {
229 /* is this our last try? */
230 if (nmax == 0 || j < nmax) {
231 /* copy the current string to the array */
232 sstr_t item = sstrn(curpos.ptr, match.ptr - curpos.ptr);
233 result[j-1] = sstrdup_a(allocator, item);
234 size_t processed = item.length + d.length;
235 curpos.ptr += processed;
236 curpos.length -= processed;
238 /* allocate memory for the next string */
239 j++;
240 sstr_t* reallocated = (sstr_t*)
241 alrealloc(allocator, result, j*sizeof(sstr_t));
242 if (reallocated) {
243 result = reallocated;
244 } else {
245 for (ssize_t i = 0 ; i < j-1 ; i++) {
246 alfree(allocator, result[i].ptr);
247 }
248 alfree(allocator, result);
249 *n = -2;
250 return NULL;
251 }
252 } else {
253 /* nmax reached, copy the _full_ remaining string */
254 result[j-1] = sstrdup_a(allocator, curpos);
255 break;
256 }
257 } else {
258 /* no more matches, copy last string */
259 result[j-1] = sstrdup_a(allocator, curpos);
260 break;
261 }
262 }
263 *n = j;
264 } else {
265 *n = -2;
266 }
268 return result;
269 }
271 int sstrcmp(sstr_t s1, sstr_t s2) {
272 if (s1.length == s2.length) {
273 return memcmp(s1.ptr, s2.ptr, s1.length);
274 } else if (s1.length > s2.length) {
275 return 1;
276 } else {
277 return -1;
278 }
279 }
281 int sstrcasecmp(sstr_t s1, sstr_t s2) {
282 if (s1.length == s2.length) {
283 #ifdef _WIN32
284 return _strnicmp(s1.ptr, s2.ptr, s1.length);
285 #else
286 return strncasecmp(s1.ptr, s2.ptr, s1.length);
287 #endif
288 } else if (s1.length > s2.length) {
289 return 1;
290 } else {
291 return -1;
292 }
293 }
295 sstr_t sstrdup(sstr_t s) {
296 return sstrdup_a(ucx_default_allocator(), s);
297 }
299 sstr_t sstrdup_a(UcxAllocator *allocator, sstr_t s) {
300 sstr_t newstring;
301 newstring.ptr = (char*)almalloc(allocator, s.length + 1);
302 if (newstring.ptr) {
303 newstring.length = s.length;
304 newstring.ptr[newstring.length] = 0;
306 memcpy(newstring.ptr, s.ptr, s.length);
307 } else {
308 newstring.length = 0;
309 }
311 return newstring;
312 }
314 sstr_t sstrtrim(sstr_t string) {
315 sstr_t newstr = string;
317 while (newstr.length > 0 && isspace(*newstr.ptr)) {
318 newstr.ptr++;
319 newstr.length--;
320 }
321 while (newstr.length > 0 && isspace(newstr.ptr[newstr.length-1])) {
322 newstr.length--;
323 }
325 return newstr;
326 }
328 int sstrprefix(sstr_t string, sstr_t prefix) {
329 if (string.length == 0) {
330 return prefix.length == 0;
331 }
332 if (prefix.length == 0) {
333 return 1;
334 }
336 if (prefix.length > string.length) {
337 return 0;
338 } else {
339 return memcmp(string.ptr, prefix.ptr, prefix.length) == 0;
340 }
341 }
343 int sstrsuffix(sstr_t string, sstr_t suffix) {
344 if (string.length == 0) {
345 return suffix.length == 0;
346 }
347 if (suffix.length == 0) {
348 return 1;
349 }
351 if (suffix.length > string.length) {
352 return 0;
353 } else {
354 return memcmp(string.ptr+string.length-suffix.length,
355 suffix.ptr, suffix.length) == 0;
356 }
357 }
359 sstr_t sstrlower(sstr_t string) {
360 sstr_t ret = sstrdup(string);
361 for (size_t i = 0; i < ret.length ; i++) {
362 ret.ptr[i] = tolower(ret.ptr[i]);
363 }
364 return ret;
365 }
367 sstr_t sstrlower_a(UcxAllocator *allocator, sstr_t string) {
368 sstr_t ret = sstrdup_a(allocator, string);
369 for (size_t i = 0; i < ret.length ; i++) {
370 ret.ptr[i] = tolower(ret.ptr[i]);
371 }
372 return ret;
373 }
375 sstr_t sstrupper(sstr_t string) {
376 sstr_t ret = sstrdup(string);
377 for (size_t i = 0; i < ret.length ; i++) {
378 ret.ptr[i] = toupper(ret.ptr[i]);
379 }
380 return ret;
381 }
383 sstr_t sstrupper_a(UcxAllocator *allocator, sstr_t string) {
384 sstr_t ret = sstrdup_a(allocator, string);
385 for (size_t i = 0; i < ret.length ; i++) {
386 ret.ptr[i] = toupper(ret.ptr[i]);
387 }
388 return ret;
389 }