src/ucx/map.h

Wed, 02 May 2018 16:14:40 +0200

author
Mike Becker <universe@uap-core.de>
date
Wed, 02 May 2018 16:14:40 +0200
changeset 277
f819fe5e20f5
parent 259
2f5dea574a75
child 327
fbc33813265b
permissions
-rw-r--r--

makes destructor functions for *_free_content() optional + more documentation for UcxProperties

olaf@2 1 /*
universe@103 2 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER.
universe@103 3 *
universe@259 4 * Copyright 2017 Mike Becker, Olaf Wintermann All rights reserved.
universe@103 5 *
universe@103 6 * Redistribution and use in source and binary forms, with or without
universe@103 7 * modification, are permitted provided that the following conditions are met:
universe@103 8 *
universe@103 9 * 1. Redistributions of source code must retain the above copyright
universe@103 10 * notice, this list of conditions and the following disclaimer.
universe@103 11 *
universe@103 12 * 2. Redistributions in binary form must reproduce the above copyright
universe@103 13 * notice, this list of conditions and the following disclaimer in the
universe@103 14 * documentation and/or other materials provided with the distribution.
universe@103 15 *
universe@103 16 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
universe@103 17 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
universe@103 18 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
universe@103 19 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
universe@103 20 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
universe@103 21 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
universe@103 22 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
universe@103 23 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
universe@103 24 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
universe@103 25 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
universe@103 26 * POSSIBILITY OF SUCH DAMAGE.
olaf@2 27 */
olaf@2 28
universe@136 29 /**
universe@136 30 * @file map.h
universe@136 31 *
universe@136 32 * Hash map implementation.
universe@136 33 *
universe@136 34 * This implementation uses murmur hash 2 and separate chaining with linked
universe@136 35 * lists.
universe@136 36 *
universe@136 37 * @author Mike Becker
universe@136 38 * @author Olaf Wintermann
universe@136 39 */
universe@136 40
olaf@120 41 #ifndef UCX_MAP_H
olaf@120 42 #define UCX_MAP_H
olaf@2 43
universe@259 44 #include "ucx.h"
universe@259 45 #include "string.h"
universe@259 46 #include "allocator.h"
universe@41 47 #include <stdio.h>
olaf@20 48
olaf@2 49 #ifdef __cplusplus
olaf@2 50 extern "C" {
olaf@2 51 #endif
olaf@2 52
/**
 * Loop statement for UCX maps.
 *
 * The <code>key</code> variable is implicitly defined as a UcxKey that is
 * scoped to the loop, but the <code>value</code> variable must be already
 * declared as type information cannot be inferred. The address of
 * <code>value</code> is cast to <code>void**</code>, so it has to be an
 * lvalue of pointer type.
 *
 * The macro expands to a <code>for</code> header only; the statement or block
 * that follows it becomes the loop body.
 *
 * @param key the variable name for the key
 * @param value the variable name for the value
 * @param iter a UcxMapIterator (an lvalue, since its address is taken)
 * @see ucx_map_iterator()
 */
#define UCX_MAP_FOREACH(key,value,iter) \
    for (UcxKey key; ucx_map_iter_next(&(iter), &key, (void**)&(value));)
olaf@31 67
universe@138 68 /** Type for the UCX map. @see UcxMap */
olaf@31 69 typedef struct UcxMap UcxMap;
universe@146 70
universe@225 71 /** Type for a key of a UcxMap. @see UcxKey */
olaf@31 72 typedef struct UcxKey UcxKey;
universe@146 73
universe@225 74 /** Type for an element of a UcxMap. @see UcxMapElement */
olaf@31 75 typedef struct UcxMapElement UcxMapElement;
universe@146 76
universe@225 77 /** Type for an iterator over a UcxMap. @see UcxMapIterator */
olaf@31 78 typedef struct UcxMapIterator UcxMapIterator;
olaf@2 79
universe@138 80 /** Structure for the UCX map. */
olaf@20 81 struct UcxMap {
universe@138 82 /** An allocator that is used for the map elements. */
olaf@107 83 UcxAllocator *allocator;
universe@138 84 /** The array of map element lists. */
universe@29 85 UcxMapElement **map;
universe@138 86 /** The size of the map is the length of the element list array. */
olaf@20 87 size_t size;
universe@138 88 /** The count of elements currently stored in this map. */
olaf@45 89 size_t count;
olaf@20 90 };
olaf@2 91
universe@225 92 /** Structure for a key of a UcxMap. */
olaf@20 93 struct UcxKey {
universe@138 94 /** The key data. */
olaf@20 95 void *data;
universe@138 96 /** The length of the key data. */
olaf@20 97 size_t len;
universe@138 98 /** The hash value of the key data. */
olaf@20 99 int hash;
olaf@20 100 };
olaf@20 101
universe@225 102 /** Structure for an element of a UcxMap. */
olaf@20 103 struct UcxMapElement {
universe@138 104 /** The value data. */
olaf@20 105 void *data;
universe@146 106
universe@138 107 /** A pointer to the next element in the current list. */
olaf@20 108 UcxMapElement *next;
universe@146 109
universe@138 110 /** The corresponding key. */
olaf@20 111 UcxKey key;
olaf@20 112 };
olaf@20 113
universe@225 114 /** Structure for an iterator over a UcxMap. */
olaf@31 115 struct UcxMapIterator {
universe@138 116 /** The map to iterate over. */
olaf@31 117 UcxMap *map;
universe@146 118
universe@138 119 /** The current map element. */
olaf@31 120 UcxMapElement *cur;
universe@146 121
universe@138 122 /**
universe@138 123 * The current index of the element list array.
universe@138 124 * <b>Attention: </b> this is <b>NOT</b> the element index! Do <b>NOT</b>
universe@138 125 * manually iterate over the map by increasing this index. Use
universe@138 126 * ucx_map_iter_next().
universe@138 127 * @see UcxMap.map*/
universe@95 128 size_t index;
olaf@31 129 };
olaf@31 130
universe@136 131 /**
universe@136 132 * Creates a new hash map with the specified size.
universe@136 133 * @param size the size of the hash map
universe@136 134 * @return a pointer to the new hash map
universe@136 135 */
universe@136 136 UcxMap *ucx_map_new(size_t size);
olaf@20 137
universe@136 138 /**
universe@225 139 * Creates a new hash map with the specified size using a UcxAllocator.
olaf@137 140 * @param allocator the allocator to use
universe@136 141 * @param size the size of the hash map
universe@136 142 * @return a pointer to the new hash map
universe@136 143 */
olaf@137 144 UcxMap *ucx_map_new_a(UcxAllocator *allocator, size_t size);
universe@136 145
universe@136 146 /**
universe@136 147 * Frees a hash map.
universe@136 148 *
universe@208 149 * <b>Note:</b> the contents are <b>not</b> freed, use ucx_map_free_content()
universe@208 150 * before calling this function to achieve that.
universe@136 151 *
universe@136 152 * @param map the map to be freed
universe@208 153 * @see ucx_map_free_content()
universe@136 154 */
universe@29 155 void ucx_map_free(UcxMap *map);
universe@136 156
universe@138 157 /**
universe@208 158 * Frees the contents of a hash map.
universe@208 159 *
universe@208 160 * This is a convenience function that iterates over the map and passes all
universe@277 161 * values to the specified destructor function.
universe@277 162 *
universe@277 163 * If no destructor is specified (<code>NULL</code>), the free() function of
universe@277 164 * the map's own allocator is used.
universe@208 165 *
universe@209 166 * You must ensure that it is valid to pass each value in the map to the same
universe@209 167 * destructor function.
universe@208 168 *
universe@208 169 * You should free or clear the map afterwards, as the contents will be invalid.
universe@208 170 *
universe@208 171 * @param map for which the contents shall be freed
universe@277 172 * @param destr optional pointer to a destructor function
universe@208 173 * @see ucx_map_free()
universe@208 174 * @see ucx_map_clear()
universe@208 175 */
universe@209 176 void ucx_map_free_content(UcxMap *map, ucx_destructor destr);
universe@208 177
universe@208 178 /**
universe@206 179 * Clears a hash map.
universe@206 180 *
universe@208 181 * <b>Note:</b> the contents are <b>not</b> freed, use ucx_map_free_content()
universe@208 182 * before calling this function to achieve that.
universe@206 183 *
universe@208 184 * @param map the map to be cleared
universe@208 185 * @see ucx_map_free_content()
universe@206 186 */
universe@206 187 void ucx_map_clear(UcxMap *map);
universe@206 188
universe@208 189
universe@206 190 /**
universe@138 191 * Copies contents from a map to another map using a copy function.
universe@138 192 *
universe@138 193 * <b>Note:</b> The destination map does not need to be empty. However, if it
universe@138 194 * contains data with keys that are also present in the source map, the contents
universe@138 195 * are overwritten.
universe@138 196 *
universe@138 197 * @param from the source map
universe@138 198 * @param to the destination map
universe@138 199 * @param fnc the copy function or <code>NULL</code> if the pointer address
universe@138 200 * shall be copied
universe@138 201 * @param data additional data for the copy function
universe@138 202 * @return 0 on success or a non-zero value on memory allocation errors
universe@138 203 */
universe@253 204 int ucx_map_copy(UcxMap *from, UcxMap *to, copy_func fnc, void *data);
universe@138 205
universe@138 206 /**
universe@138 207 * Clones the map and rehashes if necessary.
universe@138 208 *
universe@138 209 * <b>Note:</b> In contrast to ucx_map_rehash() the load factor is irrelevant.
universe@138 210 * This function <i>always</i> ensures a new UcxMap.size of at least
universe@138 211 * 2.5*UcxMap.count.
universe@138 212 *
universe@138 213 * @param map the map to clone
universe@138 214 * @param fnc the copy function to use or <code>NULL</code> if the new and
universe@138 215 * the old map shall share the data pointers
universe@138 216 * @param data additional data for the copy function
universe@138 217 * @return the cloned map
universe@138 218 * @see ucx_map_copy()
universe@138 219 */
olaf@44 220 UcxMap *ucx_map_clone(UcxMap *map, copy_func fnc, void *data);
universe@138 221
universe@138 222 /**
universe@138 223 * Increases size of the hash map, if necessary.
universe@138 224 *
universe@138 225 * The load value is 0.75*UcxMap.size. If the element count exceeds the load
universe@138 226 * value, the map needs to be rehashed. Otherwise no action is performed and
universe@138 227 * this function simply returns 0.
universe@138 228 *
universe@138 229 * The rehashing process ensures that UcxMap.size is at least
universe@138 230 * 2.5*UcxMap.count, so there is enough room for additional elements without
universe@138 231 * needing to rehash again soon.
universe@138 232 *
universe@138 233 * You can use this function to dramatically increase access performance.
universe@138 234 *
universe@138 235 * @param map the map to rehash
universe@138 236 * @return 1, if a memory allocation error occurred, 0 otherwise
universe@138 237 */
olaf@52 238 int ucx_map_rehash(UcxMap *map);
olaf@20 239
universe@138 240 /**
universe@138 241 * Puts a key/value-pair into the map.
universe@138 242 *
universe@138 243 * @param map the map
universe@138 244 * @param key the key
universe@138 245 * @param value the value
universe@138 246 * @return 0 on success, non-zero value on failure
universe@138 247 */
universe@138 248 int ucx_map_put(UcxMap *map, UcxKey key, void *value);
universe@138 249
universe@138 250 /**
universe@138 251 * Retrieves a value by using a key.
universe@138 252 *
universe@138 253 * @param map the map
universe@138 254 * @param key the key
universe@138 255 * @return the value
universe@138 256 */
olaf@20 257 void* ucx_map_get(UcxMap *map, UcxKey key);
universe@138 258
universe@138 259 /**
universe@138 260 * Removes a key/value-pair from the map by using the key.
universe@138 261 *
universe@138 262 * @param map the map
universe@138 263 * @param key the key
universe@138 264 * @return the removed value
universe@138 265 */
universe@53 266 void* ucx_map_remove(UcxMap *map, UcxKey key);
olaf@20 267
/**
 * Shorthand for putting data with a sstr_t key into the map.
 *
 * The key expression is expanded twice (once for <code>ptr</code> and once
 * for <code>length</code>), so it must not have side effects.
 *
 * @param map the map
 * @param key the key (a sstr_t value)
 * @param value the value; it is cast to <code>void*</code>
 * @return 0 on success, non-zero value on failure
 * @see ucx_map_put()
 */
#define ucx_map_sstr_put(map, key, value) \
    ucx_map_put(map, ucx_key((key).ptr, (key).length), (void*)(value))
universe@146 278
/**
 * Shorthand for putting data with a C string key into the map.
 *
 * The key length is determined with strlen(). The key expression is expanded
 * twice (once as data pointer and once as strlen() argument), so it must not
 * have side effects.
 *
 * @param map the map
 * @param key the key (a zero-terminated C string)
 * @param value the value; it is cast to <code>void*</code>
 * @return 0 on success, non-zero value on failure
 * @see ucx_map_put()
 */
#define ucx_map_cstr_put(map, key, value) \
    ucx_map_put(map, ucx_key((void*)(key), strlen(key)), (void*)(value))
universe@146 289
/**
 * Shorthand for putting data with an integer key into the map.
 *
 * The address of <code>key</code> is taken and its length is determined with
 * <code>sizeof(key)</code>. Therefore <code>key</code> must be an lvalue, and
 * the same key type should be used for put, get and remove.
 *
 * @param map the map
 * @param key the key (an integer variable)
 * @param value the value; it is cast to <code>void*</code>
 * @return 0 on success, non-zero value on failure
 * @see ucx_map_put()
 */
#define ucx_map_int_put(map, key, value) \
    ucx_map_put(map, ucx_key((void*)&(key), sizeof(key)), (void*)(value))
olaf@78 300
/**
 * Shorthand for getting data from the map with a sstr_t key.
 *
 * The key expression is expanded twice (once for <code>ptr</code> and once
 * for <code>length</code>), so it must not have side effects.
 *
 * @param map the map
 * @param key the key (a sstr_t value)
 * @return the value
 * @see ucx_map_get()
 */
#define ucx_map_sstr_get(map, key) \
    ucx_map_get(map, ucx_key((key).ptr, (key).length))
universe@146 310
/**
 * Shorthand for getting data from the map with a C string key.
 *
 * The key length is determined with strlen(). The key expression is expanded
 * twice (once as data pointer and once as strlen() argument), so it must not
 * have side effects.
 *
 * @param map the map
 * @param key the key (a zero-terminated C string)
 * @return the value
 * @see ucx_map_get()
 */
#define ucx_map_cstr_get(map, key) \
    ucx_map_get(map, ucx_key((void*)(key), strlen(key)))
universe@146 320
/**
 * Shorthand for getting data from the map with an integer key.
 *
 * The address of <code>key</code> is taken and its length is determined with
 * <code>sizeof(key)</code>, exactly as ucx_map_int_put() and
 * ucx_map_int_remove() do, so that a key of any integer type is looked up
 * with the same length it was stored with. <code>key</code> must be an
 * lvalue.
 *
 * @param map the map
 * @param key the key (an integer variable)
 * @return the value
 * @see ucx_map_get()
 */
#define ucx_map_int_get(map, key) \
    ucx_map_get(map, ucx_key((void*)&(key), sizeof(key)))
universe@146 330
universe@136 331 /**
universe@136 332 * Shorthand for removing data from the map with a sstr_t key.
universe@136 333 * @param map the map
universe@136 334 * @param key the key
universe@138 335 * @return the removed value
universe@136 336 * @see ucx_map_remove()
universe@136 337 */
universe@136 338 #define ucx_map_sstr_remove(map, key) \
universe@136 339 ucx_map_remove(map, ucx_key(key.ptr, key.length))
universe@146 340
universe@136 341 /**
universe@136 342 * Shorthand for removing data from the map with a C string key.
universe@136 343 * @param map the map
universe@136 344 * @param key the key
universe@138 345 * @return the removed value
universe@136 346 * @see ucx_map_remove()
universe@136 347 */
universe@136 348 #define ucx_map_cstr_remove(map, key) \
universe@136 349 ucx_map_remove(map, ucx_key((void*)key, strlen(key)))
universe@146 350
/**
 * Shorthand for removing data from the map with an integer key.
 *
 * The address of <code>key</code> is taken and its length is determined with
 * <code>sizeof(key)</code>. Therefore <code>key</code> must be an lvalue, and
 * it should have the same type that was used when the entry was put into the
 * map.
 *
 * @param map the map
 * @param key the key (an integer variable)
 * @return the removed value
 * @see ucx_map_remove()
 */
#define ucx_map_int_remove(map, key) \
    ucx_map_remove(map, ucx_key((void*)&(key), sizeof(key)))
olaf@20 360
universe@138 361 /**
universe@225 362 * Creates a UcxKey based on the given data.
universe@138 363 *
universe@138 364 * This function implicitly computes the hash.
universe@138 365 *
universe@138 366 * @param data the data for the key
universe@138 367 * @param len the length of the data
universe@225 368 * @return a UcxKey with implicitly computed hash
universe@138 369 * @see ucx_hash()
universe@138 370 */
olaf@20 371 UcxKey ucx_key(void *data, size_t len);
olaf@20 372
universe@138 373 /**
universe@138 374 * Computes a murmur hash-2.
universe@138 375 *
universe@138 376 * @param data the data to hash
universe@138 377 * @param len the length of the data
universe@138 378 * @return the murmur hash-2 of the data
universe@138 379 */
universe@67 380 int ucx_hash(const char *data, size_t len);
olaf@2 381
universe@138 382 /**
universe@138 383 * Creates an iterator for a map.
universe@138 384 *
universe@225 385 * <b>Note:</b> A UcxMapIterator iterates over all elements in all element
universe@138 386 * lists successively. Therefore the order highly depends on the key hashes and
universe@138 387 * may vary under different map sizes. So generally you may <b>NOT</b> rely on
universe@138 388 * the iteration order.
universe@138 389 *
universe@138 390 * <b>Note:</b> The iterator is <b>NOT</b> initialized. You need to call
universe@138 391 * ucx_map_iter_next() at least once before accessing any information. However,
universe@225 392 * it is not recommended to access the fields of a UcxMapIterator directly.
universe@138 393 *
universe@138 394 * @param map the map to create the iterator for
universe@138 395 * @return a new iterator for the map; call ucx_map_iter_next() to advance it
universe@138 396 * to the first element
universe@138 397 * @see ucx_map_iter_next()
universe@138 398 */
olaf@31 399 UcxMapIterator ucx_map_iterator(UcxMap *map);
olaf@31 400
universe@138 401 /**
universe@138 402 * Proceeds to the next element of the map (if any).
universe@138 403 *
universe@138 404 * Subsequent calls on the same iterator proceed to the next element and
universe@138 405 * store the key/value-pair into the memory specified as arguments of this
universe@138 406 * function.
universe@138 407 *
universe@138 408 * If no further elements are found, this function returns zero and leaves the
universe@138 409 * last found key/value-pair in memory.
universe@138 410 *
universe@138 411 * @param iterator the iterator to use
universe@138 412 * @param key a pointer to the memory where to store the key
universe@138 413 * @param value a pointer to the memory where to store the value
universe@138 414 * @return 1, if another element was found, 0 if all elements have been processed
universe@138 415 * @see ucx_map_iterator()
universe@138 416 */
universe@138 417 int ucx_map_iter_next(UcxMapIterator *iterator, UcxKey *key, void **value);
olaf@31 418
universe@42 419
olaf@2 420 #ifdef __cplusplus
olaf@2 421 }
olaf@2 422 #endif
olaf@2 423
olaf@120 424 #endif /* UCX_MAP_H */
olaf@2 425

mercurial