Mon, 20 Feb 2017 15:25:28 +0100
Improves handling of the special cases in sstrsplit where the delimiter size is >= the string size.
1 /*
2 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER.
3 *
4 * Copyright 2016 Olaf Wintermann. All rights reserved.
5 *
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions are met:
8 *
9 * 1. Redistributions of source code must retain the above copyright
10 * notice, this list of conditions and the following disclaimer.
11 *
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 *
16 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
17 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
20 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
21 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
22 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
23 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
24 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
25 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
26 * POSSIBILITY OF SUCH DAMAGE.
27 */
29 #include <stdlib.h>
30 #include <string.h>
31 #include <stdarg.h>
32 #include <ctype.h>
34 #include "string.h"
35 #include "allocator.h"
37 sstr_t sstr(char *cstring) {
38 sstr_t string;
39 string.ptr = cstring;
40 string.length = strlen(cstring);
41 return string;
42 }
44 sstr_t sstrn(char *cstring, size_t length) {
45 sstr_t string;
46 string.ptr = cstring;
47 string.length = length;
48 return string;
49 }
51 size_t sstrnlen(size_t n, sstr_t s, ...) {
52 va_list ap;
53 size_t size = s.length;
54 va_start(ap, s);
56 for (size_t i = 1 ; i < n ; i++) {
57 sstr_t str = va_arg(ap, sstr_t);
58 size += str.length;
59 }
60 va_end(ap);
62 return size;
63 }
65 static sstr_t sstrvcat_a(
66 UcxAllocator *a,
67 size_t count,
68 sstr_t s1,
69 sstr_t s2,
70 va_list ap) {
71 sstr_t str;
72 str.ptr = NULL;
73 str.length = 0;
74 if(count < 2) {
75 return str;
76 }
78 sstr_t *strings = (sstr_t*) calloc(count, sizeof(sstr_t));
79 if(!strings) {
80 return str;
81 }
83 // get all args and overall length
84 strings[0] = s1;
85 strings[1] = s2;
86 size_t strlen = s1.length + s2.length;
87 for (size_t i=2;i<count;i++) {
88 sstr_t s = va_arg (ap, sstr_t);
89 strings[i] = s;
90 strlen += s.length;
91 }
93 // create new string
94 str.ptr = (char*) almalloc(a, strlen + 1);
95 str.length = strlen;
96 if(!str.ptr) {
97 free(strings);
98 str.length = 0;
99 return str;
100 }
102 // concatenate strings
103 size_t pos = 0;
104 for (size_t i=0;i<count;i++) {
105 sstr_t s = strings[i];
106 memcpy(str.ptr + pos, s.ptr, s.length);
107 pos += s.length;
108 }
110 str.ptr[str.length] = '\0';
112 free(strings);
114 return str;
115 }
117 sstr_t sstrcat(size_t count, sstr_t s1, sstr_t s2, ...) {
118 va_list ap;
119 va_start(ap, s2);
120 sstr_t s = sstrvcat_a(ucx_default_allocator(), count, s1, s2, ap);
121 va_end(ap);
122 return s;
123 }
125 sstr_t sstrcat_a(UcxAllocator *a, size_t count, sstr_t s1, sstr_t s2, ...) {
126 va_list ap;
127 va_start(ap, s2);
128 sstr_t s = sstrvcat_a(a, count, s1, s2, ap);
129 va_end(ap);
130 return s;
131 }
133 sstr_t sstrsubs(sstr_t s, size_t start) {
134 return sstrsubsl (s, start, s.length-start);
135 }
137 sstr_t sstrsubsl(sstr_t s, size_t start, size_t length) {
138 sstr_t new_sstr;
139 if (start >= s.length) {
140 new_sstr.ptr = NULL;
141 new_sstr.length = 0;
142 } else {
143 if (length > s.length-start) {
144 length = s.length-start;
145 }
146 new_sstr.ptr = &s.ptr[start];
147 new_sstr.length = length;
148 }
149 return new_sstr;
150 }
152 sstr_t sstrchr(sstr_t s, int c) {
153 for(size_t i=0;i<s.length;i++) {
154 if(s.ptr[i] == c) {
155 return sstrsubs(s, i);
156 }
157 }
158 sstr_t n;
159 n.ptr = NULL;
160 n.length = 0;
161 return n;
162 }
164 sstr_t sstrrchr(sstr_t s, int c) {
165 if (s.length > 0) {
166 for(size_t i=s.length;i>0;i--) {
167 if(s.ptr[i-1] == c) {
168 return sstrsubs(s, i-1);
169 }
170 }
171 }
172 sstr_t n;
173 n.ptr = NULL;
174 n.length = 0;
175 return n;
176 }
178 sstr_t sstrstr(sstr_t string, sstr_t match) {
179 if (match.length == 0) {
180 return string;
181 }
183 for (size_t i = 0 ; i < string.length ; i++) {
184 sstr_t substr = sstrsubs(string, i);
185 if (sstrprefix(substr, match)) {
186 return substr;
187 }
188 }
190 sstr_t emptystr;
191 emptystr.length = 0;
192 emptystr.ptr = NULL;
193 return emptystr;
194 }
196 sstr_t* sstrsplit(sstr_t s, sstr_t d, ssize_t *n) {
197 return sstrsplit_a(ucx_default_allocator(), s, d, n);
198 }
200 sstr_t* sstrsplit_a(UcxAllocator *allocator, sstr_t s, sstr_t d, ssize_t *n) {
201 if (s.length == 0 || d.length == 0) {
202 *n = -1;
203 return NULL;
204 }
206 /* special cases: delimiter is at least as large as the string */
207 if (d.length >= s.length) {
208 /* exact match */
209 if (sstrcmp(s, d) == 0) {
210 *n = 0;
211 return NULL;
212 } else /* no match possible */ {
213 *n = 1;
214 sstr_t *result = (sstr_t*) almalloc(allocator, sizeof(sstr_t));
215 result->ptr = (char*) almalloc(allocator, 1+s.length);
216 memcpy(result->ptr, s.ptr, s.length);
217 result->ptr[s.length] = '\0';
218 result->length = s.length;
219 return result;
220 }
221 }
223 sstr_t* result;
224 ssize_t nmax = *n;
225 *n = 1;
227 sstr_t sv = sstrdup(s);
228 if (sv.length == 0) {
229 *n = -2;
230 return NULL;
231 }
233 for (size_t i = 0 ; i < s.length ; i++) {
234 sstr_t substr = sstrsubs(sv, i);
235 if (sstrprefix(substr, d)) {
236 (*n)++;
237 for (size_t j = 0 ; j < d.length ; j++) {
238 sv.ptr[i+j] = 0;
239 }
240 i += d.length - 1; // -1, because the loop will do a i++
241 }
242 if ((*n) == nmax) break;
243 }
244 result = (sstr_t*) almalloc(allocator, sizeof(sstr_t)*(*n));
246 if (result) {
247 char *pptr = sv.ptr;
248 for (ssize_t i = 0 ; i < *n ; i++) {
249 size_t l = strlen(pptr);
250 char* ptr = (char*) almalloc(allocator, l + 1);
251 if (ptr) {
252 memcpy(ptr, pptr, l);
253 ptr[l] = '\0';
255 result[i] = sstrn(ptr, l);
256 pptr += l + d.length;
257 } else {
258 for (ssize_t j = i-1 ; j >= 0 ; j--) {
259 alfree(allocator, result[j].ptr);
260 }
261 alfree(allocator, result);
262 *n = -2;
263 break;
264 }
265 }
266 } else {
267 *n = -2;
268 }
270 free(sv.ptr);
272 return result;
273 }
275 int sstrcmp(sstr_t s1, sstr_t s2) {
276 if (s1.length == s2.length) {
277 return memcmp(s1.ptr, s2.ptr, s1.length);
278 } else if (s1.length > s2.length) {
279 return 1;
280 } else {
281 return -1;
282 }
283 }
285 int sstrcasecmp(sstr_t s1, sstr_t s2) {
286 if (s1.length == s2.length) {
287 #ifdef _WIN32
288 return _strnicmp(s1.ptr, s2.ptr, s1.length);
289 #else
290 return strncasecmp(s1.ptr, s2.ptr, s1.length);
291 #endif
292 } else if (s1.length > s2.length) {
293 return 1;
294 } else {
295 return -1;
296 }
297 }
299 sstr_t sstrdup(sstr_t s) {
300 return sstrdup_a(ucx_default_allocator(), s);
301 }
303 sstr_t sstrdup_a(UcxAllocator *allocator, sstr_t s) {
304 sstr_t newstring;
305 newstring.ptr = (char*)almalloc(allocator, s.length + 1);
306 if (newstring.ptr) {
307 newstring.length = s.length;
308 newstring.ptr[newstring.length] = 0;
310 memcpy(newstring.ptr, s.ptr, s.length);
311 } else {
312 newstring.length = 0;
313 }
315 return newstring;
316 }
318 sstr_t sstrtrim(sstr_t string) {
319 sstr_t newstr = string;
321 while (newstr.length > 0 && isspace(*newstr.ptr)) {
322 newstr.ptr++;
323 newstr.length--;
324 }
325 while (newstr.length > 0 && isspace(newstr.ptr[newstr.length-1])) {
326 newstr.length--;
327 }
329 return newstr;
330 }
332 int sstrprefix(sstr_t string, sstr_t prefix) {
333 if (string.length == 0) {
334 return prefix.length == 0;
335 }
336 if (prefix.length == 0) {
337 return 1;
338 }
340 if (prefix.length > string.length) {
341 return 0;
342 } else {
343 return memcmp(string.ptr, prefix.ptr, prefix.length) == 0;
344 }
345 }
347 int sstrsuffix(sstr_t string, sstr_t suffix) {
348 if (string.length == 0) {
349 return suffix.length == 0;
350 }
351 if (suffix.length == 0) {
352 return 1;
353 }
355 if (suffix.length > string.length) {
356 return 0;
357 } else {
358 return memcmp(string.ptr+string.length-suffix.length,
359 suffix.ptr, suffix.length) == 0;
360 }
361 }
363 sstr_t sstrlower(sstr_t string) {
364 sstr_t ret = sstrdup(string);
365 for (size_t i = 0; i < ret.length ; i++) {
366 ret.ptr[i] = tolower(ret.ptr[i]);
367 }
368 return ret;
369 }
371 sstr_t sstrlower_a(UcxAllocator *allocator, sstr_t string) {
372 sstr_t ret = sstrdup_a(allocator, string);
373 for (size_t i = 0; i < ret.length ; i++) {
374 ret.ptr[i] = tolower(ret.ptr[i]);
375 }
376 return ret;
377 }
379 sstr_t sstrupper(sstr_t string) {
380 sstr_t ret = sstrdup(string);
381 for (size_t i = 0; i < ret.length ; i++) {
382 ret.ptr[i] = toupper(ret.ptr[i]);
383 }
384 return ret;
385 }
387 sstr_t sstrupper_a(UcxAllocator *allocator, sstr_t string) {
388 sstr_t ret = sstrdup_a(allocator, string);
389 for (size_t i = 0; i < ret.length ; i++) {
390 ret.ptr[i] = toupper(ret.ptr[i]);
391 }
392 return ret;
393 }