src/cx/string.h

Fri, 21 Apr 2023 20:28:55 +0200

author
Mike Becker <universe@uap-core.de>
date
Fri, 21 Apr 2023 20:28:55 +0200
changeset 693
494d9b20b99e
parent 684
380bd45bc94a
child 697
ebdce4bf262b
permissions
-rw-r--r--

fix missing const qualifier for allocator

universe@576 1 /*
universe@576 2 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER.
universe@576 3 *
universe@576 4 * Copyright 2021 Mike Becker, Olaf Wintermann All rights reserved.
universe@576 5 *
universe@576 6 * Redistribution and use in source and binary forms, with or without
universe@576 7 * modification, are permitted provided that the following conditions are met:
universe@576 8 *
universe@576 9 * 1. Redistributions of source code must retain the above copyright
universe@576 10 * notice, this list of conditions and the following disclaimer.
universe@576 11 *
universe@576 12 * 2. Redistributions in binary form must reproduce the above copyright
universe@576 13 * notice, this list of conditions and the following disclaimer in the
universe@576 14 * documentation and/or other materials provided with the distribution.
universe@576 15 *
universe@576 16 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
universe@576 17 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
universe@576 18 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
universe@576 19 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
universe@576 20 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
universe@576 21 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
universe@576 22 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
universe@576 23 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
universe@576 24 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
universe@576 25 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
universe@576 26 * POSSIBILITY OF SUCH DAMAGE.
universe@576 27 */
universe@576 28 /**
universe@576 29 * \file string.h
universe@576 30 * \brief Strings that know their length.
universe@576 31 * \author Mike Becker
universe@576 32 * \author Olaf Wintermann
universe@576 33 * \version 3.0
universe@576 34 * \copyright 2-Clause BSD License
universe@576 35 */
universe@576 36
universe@576 37 #ifndef UCX_STRING_H
universe@576 38 #define UCX_STRING_H
universe@576 39
universe@576 40 #include "common.h"
universe@576 41 #include "allocator.h"
universe@576 42
universe@576 43 /**
universe@576 44 * The UCX string structure for mutable strings.
universe@576 45 */
universe@577 46 struct cx_mutstr_s {
universe@576 47 /**
universe@576 48 * A pointer to the string.
universe@576 49 * \note The string is not necessarily zero-terminated.
universe@576 50 * Always use the length.
universe@576 51 */
universe@576 52 char *ptr;
universe@576 53 /** The length of the string in bytes */
universe@576 54 size_t length;
universe@577 55 };
universe@576 56
universe@576 57 /**
universe@576 58 * A mutable string.
universe@576 59 */
universe@576 60 typedef struct cx_mutstr_s cxmutstr;
universe@576 61
universe@576 62 /**
universe@576 63 * The UCX string structure for immutable (constant) strings.
universe@576 64 */
universe@577 65 struct cx_string_s {
universe@576 66 /**
universe@576 67 * A pointer to the immutable string.
universe@576 68 * \note The string is not necessarily zero-terminated.
universe@576 69 * Always use the length.
universe@576 70 */
universe@576 71 char const *ptr;
universe@576 72 /** The length of the string in bytes */
universe@576 73 size_t length;
universe@577 74 };
universe@576 75
universe@576 76 /**
universe@576 77 * An immutable string.
universe@576 78 */
universe@576 79 typedef struct cx_string_s cxstring;
universe@576 80
universe@583 81 /**
universe@645 82 * Context for string tokenizing.
universe@645 83 */
universe@645 84 struct cx_strtok_ctx_s {
universe@645 85 /**
universe@645 86 * The string to tokenize.
universe@645 87 */
universe@645 88 cxstring str;
universe@645 89 /**
universe@645 90 * The primary delimiter.
universe@645 91 */
universe@645 92 cxstring delim;
universe@645 93 /**
universe@645 94 * Optional array of additional delimiters.
universe@645 95 */
universe@645 96 cxstring const *delim_more;
universe@645 97 /**
universe@645 98 * Number of elements in the array of additional delimiters.
universe@645 99 */
universe@645 100 size_t delim_more_count;
universe@645 101 /**
universe@645 102 * Position of the currently active token in the source string.
universe@645 103 */
universe@645 104 size_t pos;
universe@645 105 /**
universe@645 106 * Position of the next delimiter in the source string.
universe@645 107 *
universe@645 108 * If the tokenizer has not yet returned a token, the content of this field
universe@645 109 * is undefined. If the tokenizer reached the end of the string, this field
universe@645 110 * contains the length of the source string.
universe@645 111 */
universe@645 112 size_t delim_pos;
universe@645 113 /**
universe@645 114 * The position of the next token in the source string.
universe@645 115 */
universe@645 116 size_t next_pos;
universe@645 117 /**
universe@645 118 * The number of tokens found so far.
universe@645 119 */
universe@645 120 size_t found;
universe@645 121 /**
universe@645 122 * The maximum number of tokens that shall be returned.
universe@645 123 */
universe@645 124 size_t limit;
universe@645 125 };
universe@645 126
universe@645 127 /**
universe@645 128 * A string tokenizing context.
universe@645 129 */
universe@645 130 typedef struct cx_strtok_ctx_s CxStrtokCtx;
universe@645 131
universe@684 132 #ifdef __cplusplus
universe@684 133 extern "C" {
universe@684 134
universe@684 135 /**
universe@684 136 * A literal initializer for a UCX string structure (C++ variant).
universe@684 137 * The argument MUST be a string \em literal; its length is taken with sizeof.
universe@684 138 * @param literal the string literal
universe@684 139 */
universe@684 140 #define CX_STR(literal) cxstring{literal, sizeof(literal) - 1}
universe@684 141
universe@684 142 #else // __cplusplus
universe@684 143
universe@645 144 /**
universe@583 145 * A literal initializer for a UCX string structure.
universe@583 146 *
universe@583 147 * The argument MUST be a string \em literal; its length is taken with sizeof.
universe@583 148 *
universe@583 149 * @param literal the string literal
universe@583 150 */
universe@684 151 #define CX_STR(literal) (cxstring){literal, sizeof(literal) - 1}
universe@583 152
universe@576 153 #endif
universe@576 154
universe@576 155
universe@576 156 /**
universe@576 157 * Wraps a mutable string that must be zero-terminated.
universe@576 158 *
universe@576 159 * The length is implicitly inferred by using a call to \c strlen().
universe@576 160 *
universe@576 161 * \note the wrapped string will share the specified pointer to the string.
universe@576 162 * If you do want a copy, use cx_strdup() on the return value of this function.
universe@576 163 *
universe@576 164 * If you need to wrap a constant string, use cx_str().
universe@576 165 *
universe@584 166 * @param cstring the string to wrap, must be zero-terminated
universe@576 167 * @return the wrapped string
universe@576 168 *
universe@576 169 * @see cx_mutstrn()
universe@576 170 */
universe@584 171 __attribute__((__warn_unused_result__, __nonnull__))
universe@576 172 cxmutstr cx_mutstr(char *cstring);
universe@576 173
universe@576 174 /**
universe@576 175 * Wraps a string that does not need to be zero-terminated.
universe@576 176 *
universe@576 177 * The argument may be \c NULL if the length is zero.
universe@576 178 *
universe@576 179 * \note the wrapped string will share the specified pointer to the string.
universe@576 180 * If you do want a copy, use cx_strdup() on the return value of this function.
universe@576 181 *
universe@576 182 * If you need to wrap a constant string, use cx_strn().
universe@576 183 *
universe@584 184 * @param cstring the string to wrap (or \c NULL, only if the length is zero)
universe@576 185 * @param length the length of the string
universe@576 186 * @return the wrapped string
universe@576 187 *
universe@576 188 * @see cx_mutstr()
universe@576 189 */
universe@576 190 __attribute__((__warn_unused_result__))
universe@576 191 cxmutstr cx_mutstrn(
universe@576 192 char *cstring,
universe@576 193 size_t length
universe@576 194 );
universe@576 195
universe@576 196 /**
universe@576 197 * Wraps a string that must be zero-terminated.
universe@576 198 *
universe@576 199 * The length is implicitly inferred by using a call to \c strlen().
universe@576 200 *
universe@576 201 * \note the wrapped string will share the specified pointer to the string.
universe@576 202 * If you do want a copy, use cx_strdup() on the return value of this function.
universe@576 203 *
universe@576 204 * If you need to wrap a non-constant string, use cx_mutstr().
universe@576 205 *
universe@584 206 * @param cstring the string to wrap, must be zero-terminated
universe@576 207 * @return the wrapped string
universe@576 208 *
universe@576 209 * @see cx_strn()
universe@576 210 */
universe@584 211 __attribute__((__warn_unused_result__, __nonnull__))
universe@576 212 cxstring cx_str(char const *cstring);
universe@576 213
universe@576 214
universe@576 215 /**
universe@576 216 * Wraps a string that does not need to be zero-terminated.
universe@576 217 *
universe@576 218 * The argument may be \c NULL if the length is zero.
universe@576 219 *
universe@576 220 * \note the wrapped string will share the specified pointer to the string.
universe@576 221 * If you do want a copy, use cx_strdup() on the return value of this function.
universe@576 222 *
universe@576 223 * If you need to wrap a non-constant string, use cx_mutstrn().
universe@576 224 *
universe@584 225 * @param cstring the string to wrap (or \c NULL, only if the length is zero)
universe@576 226 * @param length the length of the string
universe@576 227 * @return the wrapped string
universe@576 228 *
universe@576 229 * @see cx_str()
universe@576 230 */
universe@576 231 __attribute__((__warn_unused_result__))
universe@576 232 cxstring cx_strn(
universe@576 233 char const *cstring,
universe@576 234 size_t length
universe@576 235 );
universe@576 236
universe@576 237 /**
universe@576 238 * Casts a mutable string to an immutable string.
universe@576 239 *
universe@576 240 * \note This is not actually a cast. Instead, you get a copy
universe@576 241 * of the struct with the desired pointer type. Both structs still
universe@576 242 * point to the same location, though!
universe@576 243 *
universe@576 244 * @param str the mutable string to cast
universe@576 245 * @return an immutable string pointing to the same location as \p str
universe@576 246 */
universe@576 247 __attribute__((__warn_unused_result__))
universe@576 248 cxstring cx_strcast(cxmutstr str);
universe@576 249
universe@576 250 /**
universe@576 251 * Passes the pointer in this string to \c free().
universe@576 252 *
universe@576 253 * The pointer in the struct is set to \c NULL and the length is set to zero.
universe@576 254 *
universe@576 255 * \note There is no implementation for cxstring, because it is unlikely that
universe@576 256 * you ever have a \c char \c const* you are really supposed to free. If you
universe@576 257 * encounter such a situation, you should double-check your code.
universe@576 258 *
universe@576 259 * @param str the string to free
universe@576 260 */
universe@583 261 __attribute__((__nonnull__))
universe@576 262 void cx_strfree(cxmutstr *str);
universe@576 263
universe@576 264 /**
universe@583 265 * Passes the pointer in this string to the allocator's free function.
universe@583 266 *
universe@583 267 * The pointer in the struct is set to \c NULL and the length is set to zero.
universe@583 268 *
universe@583 269 * \note There is no implementation for cxstring, because it is unlikely that
universe@583 270 * you ever have a \c char \c const* you are really supposed to free. If you
universe@583 271 * encounter such a situation, you should double-check your code.
universe@583 272 *
universe@583 273 * @param alloc the allocator
universe@583 274 * @param str the string to free
universe@583 275 */
universe@583 276 __attribute__((__nonnull__))
universe@583 277 void cx_strfree_a(
universe@693 278 CxAllocator const *alloc,
universe@583 279 cxmutstr *str
universe@583 280 );
universe@583 281
universe@583 282 /**
universe@576 283 * Returns the accumulated length of all specified strings.
universe@576 284 *
universe@576 285 * \attention if the count argument is larger than the number of the
universe@576 286 * specified strings, the behavior is undefined.
universe@576 287 *
universe@576 288 * @param count the total number of specified strings
universe@576 289 * @param ... all strings
universe@576 290 * @return the accumulated length of all strings
universe@576 291 */
universe@576 292 __attribute__((__warn_unused_result__))
universe@576 293 size_t cx_strlen(
universe@576 294 size_t count,
universe@576 295 ...
universe@576 296 );
universe@576 297
universe@576 298 /**
universe@576 299 * Concatenates two or more strings.
universe@576 300 *
universe@576 301 * The resulting string will be allocated by the specified allocator.
universe@576 302 * So developers \em must pass the return value to cx_strfree_a() eventually.
universe@576 303 *
universe@576 304 * \note It is guaranteed that there is only one allocation.
universe@589 305 * It is also guaranteed that the returned string is zero-terminated.
universe@576 306 *
universe@576 307 * @param alloc the allocator to use
universe@576 308 * @param count the total number of strings to concatenate
universe@576 309 * @param ... all strings
universe@576 310 * @return the concatenated string
universe@576 311 */
universe@576 312 __attribute__((__warn_unused_result__, __nonnull__))
universe@576 313 cxmutstr cx_strcat_a(
universe@693 314 CxAllocator const *alloc,
universe@576 315 size_t count,
universe@576 316 ...
universe@576 317 );
universe@576 318
universe@576 319 /**
universe@576 320 * Concatenates two or more strings.
universe@576 321 *
universe@576 322 * The resulting string will be allocated by standard \c malloc().
universe@576 323 * So developers \em must pass the return value to cx_strfree() eventually.
universe@576 324 *
universe@589 325 * \note It is guaranteed that there is only one allocation.
universe@589 326 * It is also guaranteed that the returned string is zero-terminated.
universe@589 327 *
universe@576 328 * @param count the total number of strings to concatenate
universe@576 329 * @param ... all strings
universe@576 330 * @return the concatenated string
universe@576 331 */
universe@576 332 #define cx_strcat(count, ...) \
universe@576 333 cx_strcat_a(cxDefaultAllocator, count, __VA_ARGS__)
universe@576 334
universe@576 335 /**
universe@576 336 * Returns a substring starting at the specified location.
universe@576 337 *
universe@576 338 * \attention the new string references the same memory area as the
universe@576 339 * input string and is usually \em not zero-terminated.
universe@576 340 * Use cx_strdup() to get a copy.
universe@576 341 *
universe@576 342 * @param string input string
universe@576 343 * @param start start location of the substring
universe@576 344 * @return a substring of \p string starting at \p start
universe@576 345 *
universe@576 346 * @see cx_strsubsl()
universe@576 347 * @see cx_strsubs_m()
universe@576 348 * @see cx_strsubsl_m()
universe@576 349 */
universe@576 350 __attribute__((__warn_unused_result__))
universe@576 351 cxstring cx_strsubs(
universe@576 352 cxstring string,
universe@576 353 size_t start
universe@576 354 );
universe@576 355
universe@576 356 /**
universe@576 357 * Returns a substring starting at the specified location.
universe@576 358 *
universe@576 359 * The returned string will be limited to \p length bytes or the number
universe@576 360 * of bytes available in \p string, whichever is smaller.
universe@576 361 *
universe@576 362 * \attention the new string references the same memory area as the
universe@576 363 * input string and is usually \em not zero-terminated.
universe@576 364 * Use cx_strdup() to get a copy.
universe@576 365 *
universe@576 366 * @param string input string
universe@576 367 * @param start start location of the substring
universe@576 368 * @param length the maximum length of the returned string
universe@576 369 * @return a substring of \p string starting at \p start
universe@576 370 *
universe@576 371 * @see cx_strsubs()
universe@576 372 * @see cx_strsubs_m()
universe@576 373 * @see cx_strsubsl_m()
universe@576 374 */
universe@576 375 __attribute__((__warn_unused_result__))
universe@576 376 cxstring cx_strsubsl(
universe@576 377 cxstring string,
universe@576 378 size_t start,
universe@576 379 size_t length
universe@576 380 );
universe@576 381
universe@576 382 /**
universe@576 383 * Returns a substring starting at the specified location.
universe@576 384 *
universe@576 385 * \attention the new string references the same memory area as the
universe@576 386 * input string and is usually \em not zero-terminated.
universe@576 387 * Use cx_strdup() to get a copy.
universe@576 388 *
universe@576 389 * @param string input string
universe@576 390 * @param start start location of the substring
universe@576 391 * @return a substring of \p string starting at \p start
universe@576 392 *
universe@576 393 * @see cx_strsubsl_m()
universe@576 394 * @see cx_strsubs()
universe@576 395 * @see cx_strsubsl()
universe@576 396 */
universe@576 397 __attribute__((__warn_unused_result__))
universe@576 398 cxmutstr cx_strsubs_m(
universe@576 399 cxmutstr string,
universe@576 400 size_t start
universe@576 401 );
universe@576 402
universe@576 403 /**
universe@576 404 * Returns a substring starting at the specified location.
universe@576 405 *
universe@576 406 * The returned string will be limited to \p length bytes or the number
universe@576 407 * of bytes available in \p string, whichever is smaller.
universe@576 408 *
universe@576 409 * \attention the new string references the same memory area as the
universe@576 410 * input string and is usually \em not zero-terminated.
universe@576 411 * Use cx_strdup() to get a copy.
universe@576 412 *
universe@576 413 * @param string input string
universe@576 414 * @param start start location of the substring
universe@576 415 * @param length the maximum length of the returned string
universe@576 416 * @return a substring of \p string starting at \p start
universe@576 417 *
universe@576 418 * @see cx_strsubs_m()
universe@576 419 * @see cx_strsubs()
universe@576 420 * @see cx_strsubsl()
universe@576 421 */
universe@576 422 __attribute__((__warn_unused_result__))
universe@576 423 cxmutstr cx_strsubsl_m(
universe@576 424 cxmutstr string,
universe@576 425 size_t start,
universe@576 426 size_t length
universe@576 427 );
universe@576 428
universe@576 429 /**
universe@576 430 * Returns a substring starting at the location of the first occurrence of the
universe@576 431 * specified character.
universe@576 432 *
universe@576 433 * If the string does not contain the character, an empty string is returned.
universe@576 434 *
universe@576 435 * @param string the string where to locate the character
universe@576 436 * @param chr the character to locate
universe@576 437 * @return a substring starting at the first location of \p chr
universe@576 438 *
universe@576 439 * @see cx_strchr_m()
universe@576 440 */
universe@576 441 __attribute__((__warn_unused_result__))
universe@576 442 cxstring cx_strchr(
universe@576 443 cxstring string,
universe@576 444 int chr
universe@576 445 );
universe@576 446
universe@576 447 /**
universe@576 448 * Returns a substring starting at the location of the first occurrence of the
universe@576 449 * specified character.
universe@576 450 *
universe@576 451 * If the string does not contain the character, an empty string is returned.
universe@576 452 *
universe@576 453 * @param string the string where to locate the character
universe@576 454 * @param chr the character to locate
universe@576 455 * @return a substring starting at the first location of \p chr
universe@576 456 *
universe@576 457 * @see cx_strchr()
universe@576 458 */
universe@576 459 __attribute__((__warn_unused_result__))
universe@576 460 cxmutstr cx_strchr_m(
universe@576 461 cxmutstr string,
universe@576 462 int chr
universe@576 463 );
universe@576 464
universe@576 465 /**
universe@576 466 * Returns a substring starting at the location of the last occurrence of the
universe@576 467 * specified character.
universe@576 468 *
universe@576 469 * If the string does not contain the character, an empty string is returned.
universe@576 470 *
universe@576 471 * @param string the string where to locate the character
universe@576 472 * @param chr the character to locate
universe@576 473 * @return a substring starting at the last location of \p chr
universe@576 474 *
universe@576 475 * @see cx_strrchr_m()
universe@576 476 */
universe@576 477 __attribute__((__warn_unused_result__))
universe@576 478 cxstring cx_strrchr(
universe@576 479 cxstring string,
universe@576 480 int chr
universe@576 481 );
universe@576 482
universe@576 483 /**
universe@576 484 * Returns a substring starting at the location of the last occurrence of the
universe@576 485 * specified character.
universe@576 486 *
universe@576 487 * If the string does not contain the character, an empty string is returned.
universe@576 488 *
universe@576 489 * @param string the string where to locate the character
universe@576 490 * @param chr the character to locate
universe@576 491 * @return a substring starting at the last location of \p chr
universe@576 492 *
universe@576 493 * @see cx_strrchr()
universe@576 494 */
universe@576 495 __attribute__((__warn_unused_result__))
universe@576 496 cxmutstr cx_strrchr_m(
universe@576 497 cxmutstr string,
universe@576 498 int chr
universe@576 499 );
universe@576 500
universe@576 501 /**
universe@576 502 * Returns a substring starting at the location of the first occurrence of the
universe@576 503 * specified string.
universe@576 504 *
universe@576 505 * If \p haystack does not contain \p needle, an empty string is returned.
universe@576 506 *
universe@576 507 * If \p needle is an empty string, the complete \p haystack is
universe@576 508 * returned.
universe@576 509 *
universe@576 510 * @param haystack the string to be scanned
universe@576 511 * @param needle string containing the sequence of characters to match
universe@576 512 * @return a substring starting at the first occurrence of
universe@576 513 * \p needle, or an empty string, if the sequence is not
universe@576 514 * contained
universe@576 515 * @see cx_strstr_m()
universe@576 516 */
universe@576 517 __attribute__((__warn_unused_result__))
universe@576 518 cxstring cx_strstr(
universe@576 519 cxstring haystack,
universe@576 520 cxstring needle
universe@576 521 );
universe@576 522
universe@576 523 /**
universe@576 524 * Returns a substring starting at the location of the first occurrence of the
universe@576 525 * specified string.
universe@576 526 *
universe@576 527 * If \p haystack does not contain \p needle, an empty string is returned.
universe@576 528 *
universe@576 529 * If \p needle is an empty string, the complete \p haystack is
universe@576 530 * returned.
universe@576 531 *
universe@576 532 * @param haystack the string to be scanned
universe@576 533 * @param needle string containing the sequence of characters to match
universe@576 534 * @return a substring starting at the first occurrence of
universe@576 535 * \p needle, or an empty string, if the sequence is not
universe@576 536 * contained
universe@576 537 * @see cx_strstr()
universe@576 538 */
universe@576 539 __attribute__((__warn_unused_result__))
universe@576 540 cxmutstr cx_strstr_m(
universe@576 541 cxmutstr haystack,
universe@576 542 cxstring needle
universe@576 543 );
universe@576 544
universe@576 545 /**
universe@576 546 * Splits a given string using a delimiter string.
universe@576 547 *
universe@576 548 * \note The resulting array contains strings that point to the source
universe@576 549 * \p string. Use cx_strdup() to get copies.
universe@576 550 *
universe@576 551 * @param string the string to split
universe@576 552 * @param delim the delimiter
universe@576 553 * @param limit the maximum number of split items
universe@576 554 * @param output a pre-allocated array of at least \p limit length
universe@576 555 * @return the actual number of split items
universe@576 556 */
universe@576 557 __attribute__((__warn_unused_result__, __nonnull__))
universe@576 558 size_t cx_strsplit(
universe@576 559 cxstring string,
universe@576 560 cxstring delim,
universe@576 561 size_t limit,
universe@576 562 cxstring *output
universe@576 563 );
universe@576 564
universe@576 565 /**
universe@576 566 * Splits a given string using a delimiter string.
universe@576 567 *
universe@576 568 * The array pointed to by \p output will be allocated by \p allocator.
universe@576 569 *
universe@576 570 * \note The resulting array contains strings that point to the source
universe@576 571 * \p string. Use cx_strdup() to get copies.
universe@576 572 *
universe@576 573 * \attention If allocation fails, the \c NULL pointer will be written to
universe@576 574 * \p output and the number returned will be zero.
universe@576 575 *
universe@576 576 * @param allocator the allocator to use for allocating the resulting array
universe@576 577 * @param string the string to split
universe@576 578 * @param delim the delimiter
universe@576 579 * @param limit the maximum number of split items
universe@576 580 * @param output a pointer where the address of the allocated array shall be
universe@576 581 * written to
universe@576 582 * @return the actual number of split items
universe@576 583 */
universe@576 584 __attribute__((__warn_unused_result__, __nonnull__))
universe@576 585 size_t cx_strsplit_a(
universe@693 586 CxAllocator const *allocator,
universe@576 587 cxstring string,
universe@576 588 cxstring delim,
universe@576 589 size_t limit,
universe@576 590 cxstring **output
universe@576 591 );
universe@576 592
universe@576 593
universe@576 594 /**
universe@576 595 * Splits a given string using a delimiter string.
universe@576 596 *
universe@576 597 * \note The resulting array contains strings that point to the source
universe@576 598 * \p string. Use cx_strdup() to get copies.
universe@576 599 *
universe@576 600 * @param string the string to split
universe@576 601 * @param delim the delimiter
universe@576 602 * @param limit the maximum number of split items
universe@576 603 * @param output a pre-allocated array of at least \p limit length
universe@576 604 * @return the actual number of split items
universe@576 605 */
universe@576 606 __attribute__((__warn_unused_result__, __nonnull__))
universe@576 607 size_t cx_strsplit_m(
universe@576 608 cxmutstr string,
universe@576 609 cxstring delim,
universe@576 610 size_t limit,
universe@576 611 cxmutstr *output
universe@576 612 );
universe@576 613
universe@576 614 /**
universe@576 615 * Splits a given string using a delimiter string.
universe@576 616 *
universe@576 617 * The array pointed to by \p output will be allocated by \p allocator.
universe@576 618 *
universe@576 619 * \note The resulting array contains strings that point to the source
universe@576 620 * \p string. Use cx_strdup() to get copies.
universe@576 621 *
universe@576 622 * \attention If allocation fails, the \c NULL pointer will be written to
universe@576 623 * \p output and the number returned will be zero.
universe@576 624 *
universe@576 625 * @param allocator the allocator to use for allocating the resulting array
universe@576 626 * @param string the string to split
universe@576 627 * @param delim the delimiter
universe@576 628 * @param limit the maximum number of split items
universe@576 629 * @param output a pointer where the address of the allocated array shall be
universe@576 630 * written to
universe@576 631 * @return the actual number of split items
universe@576 632 */
universe@576 633 __attribute__((__warn_unused_result__, __nonnull__))
universe@576 634 size_t cx_strsplit_ma(
universe@693 635 CxAllocator const *allocator,
universe@576 636 cxmutstr string,
universe@576 637 cxstring delim,
universe@576 638 size_t limit,
universe@576 639 cxmutstr **output
universe@576 640 );
universe@576 641
universe@576 642 /**
universe@576 643 * Compares two strings.
universe@576 644 *
universe@576 645 * @param s1 the first string
universe@576 646 * @param s2 the second string
universe@576 647 * @return negative if \p s1 is smaller than \p s2, positive if \p s1 is larger
universe@576 648 * than \p s2, zero if both strings are equal
universe@576 649 */
universe@576 650 __attribute__((__warn_unused_result__))
universe@576 651 int cx_strcmp(
universe@576 652 cxstring s1,
universe@576 653 cxstring s2
universe@576 654 );
universe@576 655
universe@576 656 /**
universe@576 657 * Compares two strings ignoring case.
universe@576 658 *
universe@576 659 * @param s1 the first string
universe@576 660 * @param s2 the second string
universe@576 661 * @return negative if \p s1 is smaller than \p s2, positive if \p s1 is larger
universe@576 662 * than \p s2, zero if both strings are equal ignoring case
universe@576 663 */
universe@576 664 __attribute__((__warn_unused_result__))
universe@576 665 int cx_strcasecmp(
universe@576 666 cxstring s1,
universe@576 667 cxstring s2
universe@576 668 );
universe@576 669
universe@657 670 /**
universe@657 671 * Compares two strings.
universe@657 672 *
universe@677 673 * This function has a compatible signature for the use as a cx_compare_func.
universe@657 674 *
universe@657 675 * @param s1 pointer to the first string
universe@657 676 * @param s2 pointer to the second string
universe@657 677 * @return negative if \p s1 is smaller than \p s2, positive if \p s1 is larger
universe@657 678 * than \p s2, zero if both strings are equal
universe@657 679 */
universe@657 680 __attribute__((__warn_unused_result__, __nonnull__))
universe@657 681 int cx_strcmp_p(
universe@657 682 void const *s1,
universe@657 683 void const *s2
universe@657 684 );
universe@657 685
universe@657 686 /**
universe@657 687 * Compares two strings ignoring case.
universe@657 688 *
universe@677 689 * This function has a compatible signature for the use as a cx_compare_func.
universe@657 690 *
universe@657 691 * @param s1 pointer to the first string
universe@657 692 * @param s2 pointer to the second string
universe@657 693 * @return negative if \p s1 is smaller than \p s2, positive if \p s1 is larger
universe@657 694 * than \p s2, zero if both strings are equal ignoring case
universe@657 695 */
universe@657 696 __attribute__((__warn_unused_result__, __nonnull__))
universe@657 697 int cx_strcasecmp_p(
universe@657 698 void const *s1,
universe@657 699 void const *s2
universe@657 700 );
universe@657 701
universe@576 702
universe@576 703 /**
universe@576 704 * Creates a duplicate of the specified string.
universe@576 705 *
universe@576 706 * The new string will contain a copy allocated by \p allocator.
universe@576 707 *
universe@589 708 * \note The returned string is guaranteed to be zero-terminated.
universe@576 709 *
universe@576 710 * @param allocator the allocator to use
universe@576 711 * @param string the string to duplicate
universe@576 712 * @return a duplicate of the string
universe@576 713 * @see cx_strdup()
universe@576 714 */
universe@576 715 __attribute__((__warn_unused_result__, __nonnull__))
universe@576 716 cxmutstr cx_strdup_a(
universe@693 717 CxAllocator const *allocator,
universe@576 718 cxstring string
universe@576 719 );
universe@576 720
universe@576 721 /**
universe@578 722 * Creates a duplicate of the specified string.
universe@578 723 *
universe@578 724 * The new string will contain a copy allocated by \c cxDefaultAllocator (standard
universe@578 725 * \c malloc()). Developers therefore \em must pass the return value to cx_strfree().
universe@578 726 *
universe@589 727 * \note The returned string is guaranteed to be zero-terminated.
universe@578 728 *
universe@578 729 * @param string the string to duplicate
universe@578 730 * @return a duplicate of the string
universe@578 731 * @see cx_strdup_a()
universe@578 732 */
universe@578 733 #define cx_strdup(string) cx_strdup_a(cxDefaultAllocator, string)
universe@578 734
universe@578 735 /**
universe@576 736 * Returns the string with leading and trailing spaces omitted.
universe@576 737 *
universe@576 738 * \note The returned string references the same memory as \p string, thus you
universe@576 739 * must \em not free the returned memory.
universe@576 740 *
universe@576 741 * @param string the string that shall be trimmed
universe@576 742 * @return the trimmed string
universe@576 743 */
universe@576 744 __attribute__((__warn_unused_result__))
universe@576 745 cxstring cx_strtrim(cxstring string);
universe@576 746
universe@576 747 /**
universe@576 748 * Returns the mutable string with leading and trailing spaces omitted.
universe@576 749 *
universe@576 750 * \note The returned string references the same memory as \p string, thus you
universe@576 751 * must \em not free the returned memory.
universe@576 752 *
universe@576 753 * @param string the mutable string that shall be trimmed
universe@576 754 * @return the trimmed string
universe@576 755 */
universe@576 756 __attribute__((__warn_unused_result__))
universe@576 757 cxmutstr cx_strtrim_m(cxmutstr string);
universe@576 758
universe@576 759 /**
universe@576 760 * Checks whether a string has a specific prefix.
universe@576 761 *
universe@576 762 * @param string the string to check
universe@576 763 * @param prefix the prefix the string should have
universe@576 764 * @return \c true if and only if the string has the specified prefix,
universe@576 765 * \c false otherwise
universe@576 766 */
universe@576 767 __attribute__((__warn_unused_result__))
universe@576 768 bool cx_strprefix(
universe@576 769 cxstring string,
universe@576 770 cxstring prefix
universe@576 771 );
universe@576 772
universe@576 773 /**
universe@576 774 * Checks whether a string has a specific suffix.
universe@576 775 *
universe@576 776 * @param string the string to check
universe@576 777 * @param suffix the suffix the string should have
universe@576 778 * @return \c true if and only if the string has the specified suffix,
universe@576 779 * \c false otherwise
universe@576 780 */
universe@576 781 __attribute__((__warn_unused_result__))
universe@581 782 bool cx_strsuffix(
universe@576 783 cxstring string,
universe@576 784 cxstring suffix
universe@576 785 );
universe@576 786
universe@576 787 /**
universe@576 788 * Checks whether a string has a specific prefix, ignoring the case.
universe@576 789 *
universe@576 790 * @param string the string to check
universe@576 791 * @param prefix the prefix the string should have
universe@576 792 * @return \c true if and only if the string has the specified prefix
universe@576 793 * (ignoring the case), \c false otherwise
universe@576 794 */
universe@576 795 __attribute__((__warn_unused_result__))
universe@581 796 bool cx_strcaseprefix(
universe@576 797 cxstring string,
universe@576 798 cxstring prefix
universe@576 799 );
universe@576 800
universe@576 801 /**
universe@576 802 * Checks whether a string has a specific suffix, ignoring the case.
universe@576 803 *
universe@576 804 * @param string the string to check
universe@576 805 * @param suffix the suffix the string should have
universe@576 806 * @return \c true if and only if the string has the specified suffix
universe@576 807 * (ignoring the case), \c false otherwise
universe@576 808 */
universe@576 809 __attribute__((__warn_unused_result__))
universe@581 810 bool cx_strcasesuffix(
universe@576 811 cxstring string,
universe@576 812 cxstring suffix
universe@576 813 );
universe@576 814
universe@576 815 /**
universe@576 816 * Converts the string to lower case.
universe@576 817 *
universe@576 818 * The change is made in-place. If you want a copy, use cx_strdup() first.
universe@576 819 *
universe@576 820 * @param string the string to modify
universe@576 821 * @see cx_strdup()
universe@576 822 */
universe@576 823 void cx_strlower(cxmutstr string);
universe@576 824
universe@576 825 /**
universe@576 826 * Converts the string to upper case.
universe@576 827 *
universe@576 828 * The change is made in-place. If you want a copy, use cx_strdup() first.
universe@576 829 *
universe@576 830 * @param string the string to modify
universe@576 831 * @see cx_strdup()
universe@576 832 */
universe@576 833 void cx_strupper(cxmutstr string);
universe@576 834
universe@576 835 /**
universe@576 836 * Replaces a pattern in a string with another string.
universe@576 837 *
universe@576 838 * The pattern is taken literally and is not a regular expression.
universe@576 839 * Replaces at most \p replmax occurrences.
universe@576 840 *
universe@589 841 * The returned string will be allocated by \p allocator and is guaranteed
universe@589 842 * to be zero-terminated.
universe@576 843 *
universe@576 844 * If allocation fails, or the input string is empty,
universe@583 845 * the returned string will be empty.
universe@576 846 *
universe@576 847 * @param allocator the allocator to use (must not be \c NULL)
universe@576 848 * @param str the string where replacements should be applied
universe@576 849 * @param pattern the pattern to search for
universe@576 850 * @param replacement the replacement string
universe@576 851 * @param replmax maximum number of replacements
universe@576 852 * @return the resulting string after applying the replacements
universe@576 853 */
universe@576 854 __attribute__((__warn_unused_result__, __nonnull__))
universe@583 855 cxmutstr cx_strreplacen_a(
universe@693 856 CxAllocator const *allocator,
universe@576 857 cxstring str,
universe@576 858 cxstring pattern,
universe@576 859 cxstring replacement,
universe@576 860 size_t replmax
universe@576 861 );
universe@576 862
universe@578 863 /**
universe@578 864 * Replaces a pattern in a string with another string.
universe@578 865 *
universe@578 866 * The pattern is taken literally and is not a regular expression.
universe@578 867 * Replaces at most \p replmax occurrences.
universe@578 868 *
universe@589 869 * The returned string will be allocated by \c cxDefaultAllocator (\c malloc())
universe@589 870 * and is guaranteed to be zero-terminated.
universe@578 871 *
universe@578 872 * If allocation fails, or the input string is empty,
universe@583 873 * the returned string will be empty.
universe@578 874 *
universe@578 875 * @param str the string where replacements should be applied
universe@578 876 * @param pattern the pattern to search for
universe@578 877 * @param replacement the replacement string
universe@578 878 * @param replmax maximum number of replacements
universe@578 879 * @return the resulting string after applying the replacements
universe@578 880 */
universe@583 881 #define cx_strreplacen(str, pattern, replacement, replmax) \
universe@583 882 cx_strreplacen_a(cxDefaultAllocator, str, pattern, replacement, replmax)
universe@583 883
universe@583 884 /**
universe@583 885 * Replaces a pattern in a string with another string.
universe@583 886 *
universe@583 887 * The pattern is taken literally and is not a regular expression.
universe@583 888 * The number of replacements is not limited (\c SIZE_MAX is passed as the maximum).
universe@589 889 * The returned string will be allocated by \p allocator and is guaranteed
universe@589 890 * to be zero-terminated.
universe@583 891 *
universe@583 892 * If allocation fails, or the input string is empty,
universe@583 893 * the returned string will be empty.
universe@583 894 *
universe@583 895 * @param allocator the allocator to use
universe@583 896 * @param str the string where replacements should be applied
universe@583 897 * @param pattern the pattern to search for
universe@583 898 * @param replacement the replacement string
universe@583 899 * @return the resulting string after applying the replacements
universe@583 900 */
universe@583 901 #define cx_strreplace_a(allocator, str, pattern, replacement) \
universe@583 902 cx_strreplacen_a(allocator, str, pattern, replacement, SIZE_MAX)
universe@583 903
universe@583 904 /**
universe@583 905 * Replaces a pattern in a string with another string.
universe@583 906 *
universe@583 907 * The pattern is taken literally and is not a regular expression.
universe@583 908 * The number of replacements is not limited (\c SIZE_MAX is passed as the maximum).
universe@583 909 *
universe@589 910 * The returned string will be allocated by \c cxDefaultAllocator (\c malloc())
universe@589 911 * and is guaranteed to be zero-terminated.
universe@583 912 *
universe@583 913 * If allocation fails, or the input string is empty,
universe@583 914 * the returned string will be empty.
universe@583 915 *
universe@583 916 * @param str the string where replacements should be applied
universe@583 917 * @param pattern the pattern to search for
universe@583 918 * @param replacement the replacement string
universe@583 919 * @return the resulting string after applying the replacements
universe@583 920 */
universe@583 921 #define cx_strreplace(str, pattern, replacement) \
universe@583 922 cx_strreplacen_a(cxDefaultAllocator, str, pattern, replacement, SIZE_MAX)
universe@578 923
universe@645 924 /**
universe@645 925 * Creates a string tokenization context.
universe@645 926 *
universe@645 927 * @param str the string to tokenize
universe@645 928 * @param delim the delimiter (must not be empty)
universe@645 929 * @param limit the maximum number of tokens that shall be returned
universe@645 930 * @return a new string tokenization context for \p str
universe@645 931 */
universe@645 932 __attribute__((__warn_unused_result__))
universe@645 933 CxStrtokCtx cx_strtok(
universe@645 934 cxstring str,
universe@645 935 cxstring delim,
universe@645 936 size_t limit
universe@645 937 );
universe@645 938
universe@645 939 /**
universe@645 940 * Creates a string tokenization context for a mutable string.
universe@645 941 *
universe@645 942 * @param str the mutable string to tokenize
universe@645 943 * @param delim the delimiter (must not be empty)
universe@645 944 * @param limit the maximum number of tokens that shall be returned
universe@645 945 * @return a new string tokenization context for \p str
universe@645 946 */
universe@645 947 __attribute__((__warn_unused_result__))
universe@645 948 CxStrtokCtx cx_strtok_m(
universe@645 949 cxmutstr str,
universe@645 950 cxstring delim,
universe@645 951 size_t limit
universe@645 952 );
universe@645 953
universe@645 954 /**
universe@645 955 * Returns the next token.
universe@645 956 *
universe@645 957 * The token will point to the source string.
universe@645 958 *
universe@645 959 * @param ctx the tokenization context (must not be \c NULL)
universe@645 960 * @param token a pointer to memory where the next token shall be stored (must not be \c NULL)
universe@645 961 * @return \c true if successful, \c false if the limit or the end of the string
universe@645 962 * has been reached
universe@645 963 */
universe@645 964 __attribute__((__warn_unused_result__, __nonnull__))
universe@645 965 bool cx_strtok_next(
universe@645 966 CxStrtokCtx *ctx,
universe@645 967 cxstring *token
universe@645 968 );
universe@645 969
universe@645 970 /**
universe@645 971 * Returns the next token of a mutable string.
universe@645 972 *
universe@645 973 * The token will point to the source string.
universe@645 974 * If the context was not initialized over a mutable string (see cx_strtok_m()),
universe@645 975 * modifying the data of the returned token is undefined behavior.
universe@645 976 *
universe@645 977 * @param ctx the tokenization context (must not be \c NULL)
universe@645 978 * @param token a pointer to memory where the next token shall be stored (must not be \c NULL)
universe@645 979 * @return \c true if successful, \c false if the limit or the end of the string
universe@645 980 * has been reached
universe@645 981 */
universe@645 982 __attribute__((__warn_unused_result__, __nonnull__))
universe@645 983 bool cx_strtok_next_m(
universe@645 984 CxStrtokCtx *ctx,
universe@645 985 cxmutstr *token
universe@645 986 );
universe@645 987
universe@645 988 /**
universe@645 989 * Defines an array of additional delimiters for the specified tokenization context.
universe@645 990 *
universe@645 991 * @param ctx the tokenization context (must not be \c NULL)
universe@645 992 * @param delim array of additional delimiters (must not be \c NULL)
universe@645 993 * @param count number of elements in the array
universe@645 994 */
universe@645 995 __attribute__((__nonnull__))
universe@645 996 void cx_strtok_delim(
universe@645 997 CxStrtokCtx *ctx,
universe@645 998 cxstring const *delim,
universe@645 999 size_t count
universe@645 1000 );
universe@645 1001
universe@645 1002
universe@576 1003 #ifdef __cplusplus
universe@576 1004 } // extern "C"
universe@576 1005 #endif
universe@576 1006
universe@576 1007 #endif //UCX_STRING_H

mercurial