ht.h 5.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195
  1. #ifndef HT_H
  2. #define HT_H
  3. #include <stdint.h>
  4. #include <stddef.h>
  5. #include <stdlib.h>
  6. #include <string.h>
  7. #include "da.h"
  /* Map `typeof` onto the `__typeof__` spelling unless a macro named
   * `typeof` already exists. */
  #if !defined(typeof)
  #  define typeof __typeof__
  #endif

  /* Token-pasting helpers. CONCAT forwards to CONCAT_INNER so that both
   * arguments are macro-expanded before they are pasted together. */
  #define CONCAT_INNER(lhs, rhs) lhs ## rhs
  #define CONCAT(lhs, rhs) CONCAT_INNER(lhs, rhs)

  /* Builds an identifier made of `prefix` followed by the current value of
   * __COUNTER__ (a compiler-provided counter macro). */
  #define UNIQUE_NAME(prefix) CONCAT(prefix, __COUNTER__)
  /* Hash callback type: takes a pointer to the key bytes and the key
   * length, returns a 64-bit hash value. */
  typedef uint64_t (*ht_hash_func)(const char *key, size_t key_size);

  /* Hash that HT_CREATE installs in a new table. Its definition is only
   * compiled when HT_IMP or IMP is defined. */
  uint64_t ht_default_hash(const char *str, size_t str_size);
  /*
   * HT_DEF_STRUCT(type, name)
   *
   * Declares two tagged structs: `struct name##_item`, one slot of the
   * table, and `struct name`, the table itself. `type` is the type of the
   * stored value. The expansion ends without a semicolon; the caller
   * writes it.
   */
  #define HT_DEF_STRUCT(type, name) \
      struct name##_item { \
          struct { \
              const char *data;  /* key pointer exactly as given to HT_SET */ \
              size_t size;       /* key length as given to HT_SET */ \
          } key_str; \
          uint64_t key;          /* hash of the key; 0 marks an empty slot */ \
          type data;             /* stored value */ \
          void *next;            /* only ever set to NULL by this header */ \
      }; \
      struct name { \
          struct name##_item *items;          /* array of `cap` slots */ \
          size_t size;                        /* number of stored entries */ \
          size_t cap;                         /* number of slots */ \
          DA_DEF_STRUCT_ITEM(uint64_t, keys); /* hashes of the stored keys */ \
          ht_hash_func hash;                  /* hash callback */ \
          size_t collisions;                  /* probe steps taken so far */ \
      }
  /*
   * HT_DEF_STRUCT_ITEM(type, name)
   *
   * Declares an object (variable or struct member) called `name` whose
   * type is an anonymous hash-table struct with the same fields as the
   * table produced by HT_DEF_STRUCT. `type` is the type of the stored
   * value. The expansion ends without a semicolon; the caller writes it.
   */
  #define HT_DEF_STRUCT_ITEM(type, name) \
      struct { \
          struct { \
              struct { \
                  const char *data;  /* key pointer exactly as given to HT_SET */ \
                  size_t size;       /* key length as given to HT_SET */ \
              } key_str; \
              uint64_t key;          /* hash of the key; 0 marks an empty slot */ \
              type data;             /* stored value */ \
              void *next;            /* only ever set to NULL by this header */ \
          } *items;                           /* array of `cap` slots */ \
          size_t size;                        /* number of stored entries */ \
          size_t cap;                         /* number of slots */ \
          DA_DEF_STRUCT_ITEM(uint64_t, keys); /* hashes of the stored keys */ \
          ht_hash_func hash;                  /* hash callback */ \
          size_t collisions;                  /* probe steps taken so far */ \
      } name
  /*
   * HT_CREATE(ht, init_cap)
   *
   * Initializes the table `ht` (an lvalue declared with HT_DEF_STRUCT or
   * HT_DEF_STRUCT_ITEM) with `init_cap` zero-filled slots, no entries, a
   * collision counter of 0 and ht_default_hash as hash callback.
   *
   * A requested capacity of 0 is raised to 1: slot indices are computed
   * with `% cap`, and doubling a capacity of 0 would never grow the table.
   *
   * The calloc result is not checked here; callers that need to detect
   * allocation failure can test `(ht).items` afterwards.
   * DA_CREATE comes from da.h (presumably it initializes the `keys` list;
   * confirm against da.h).
   */
  #define HT_CREATE(ht, init_cap) \
      do { \
          (ht).cap = (init_cap); \
          if ( (ht).cap == 0 ) { \
              (ht).cap = 1; \
          } \
          (ht).size = 0; \
          (ht).collisions = 0; \
          (ht).items = calloc((ht).cap, sizeof(*(ht).items)); \
          (ht).hash = ht_default_hash; \
          DA_CREATE((ht).keys); \
      } while(0)
  /*
   * HT_DESTROY(ht)
   *
   * Releases the slot array and the key list of `ht`. Both pointers are
   * reset to NULL afterwards so that a repeated HT_DESTROY on the same
   * table is harmless (free(NULL) is a no-op) instead of a double free.
   * The keys themselves are not freed: the table only stores the key
   * pointers it was given.
   */
  #define HT_DESTROY(ht) \
      do { \
          free((ht).items); \
          (ht).items = NULL; \
          free((ht).keys.items); \
          (ht).keys.items = NULL; \
      } while(0)
  /*
   * _HT_INC_CAP(ht, _ht, _it, _i, _j, _k)
   *
   * Implementation of HT_INC_CAP; the trailing parameters are the names of
   * the temporaries it declares. Builds a table with twice the capacity
   * (or capacity 1 when the current capacity is 0), re-inserts every entry
   * listed in `(ht).keys` using the stored hash values, then destroys the
   * old storage and assigns the new table to `ht`.
   *
   * The hash callback of `ht` is carried over to the new table; HT_CREATE
   * alone would reset it to ht_default_hash. The collision counter of the
   * new table starts at 0 and counts the probe steps of the re-insertion.
   *
   * Allocation failure of the new table is not handled.
   */
  #define _HT_INC_CAP(ht, _ht, _it, _i, _j, _k) \
      do { \
          typeof((ht)) _ht = {0}; \
          HT_CREATE(_ht, (ht).cap ? (ht).cap * 2 : 1); \
          _ht.hash = (ht).hash; \
          for ( size_t _i = 0; _i < (ht).keys.size; ++_i ) { \
              uint64_t _k = (ht).keys.items[_i]; \
              /* Find the destination slot in the new table with the */ \
              /* same probe sequence HT_SET uses. */ \
              uint64_t _j = _k; \
              typeof(*_ht.items) *_it = &_ht.items[_j % _ht.cap]; \
              while ( _it->key != 0 && _it->key != _k ) { \
                  _it = &_ht.items[(++_j) % _ht.cap]; \
                  ++_ht.collisions; \
              } \
              /* Find the slot that holds this hash in the old table. */ \
              _j = _k; \
              while ( (ht).items[_j % (ht).cap].key != _k ) { \
                  ++_j; \
              } \
              DA_APPEND(_ht.keys, _k); \
              *_it = (ht).items[_j % (ht).cap]; \
              _it->next = NULL; \
              ++_ht.size; \
          } \
          HT_DESTROY(ht); \
          (ht) = _ht; \
      } while(0)

  /* HT_INC_CAP(ht): grows `ht`; see _HT_INC_CAP. Supplies freshly
   * generated names for the temporaries. */
  #define HT_INC_CAP(ht) \
      _HT_INC_CAP(ht, UNIQUE_NAME(_ht), UNIQUE_NAME(_it), \
                  UNIQUE_NAME(_i), UNIQUE_NAME(_j), UNIQUE_NAME(_k))
  96. #include <stdio.h>
  /*
   * _HT_SET(ht, _key, _key_size, val, _k, _it, _i, _kd, _ks)
   *
   * Implementation of HT_SET; the trailing parameters are the names of the
   * temporaries it declares.
   *
   * Grows the table first when one more entry would fill it, hashes the
   * key with `(ht).hash`, and walks the slots linearly from
   * `hash % cap` until it meets either an empty slot (key == 0) or a slot
   * holding the same hash. Every probe step increments `(ht).collisions`.
   * An existing entry only has its value replaced; a new entry records the
   * key pointer, key length and hash, appends the hash to `(ht).keys` and
   * increments `(ht).size`.
   *
   * `_key` and `_key_size` are evaluated exactly once (into `_kd`/`_ks`),
   * so arguments with side effects are safe. `val` is evaluated once, and
   * for a new entry before `(ht).size` is incremented.
   *
   * Entries are identified by their hash value alone, and a hash of 0 is
   * indistinguishable from an empty slot. The key bytes are not copied;
   * only the pointer is stored.
   */
  #define _HT_SET(ht, _key, _key_size, val, _k, _it, _i, _kd, _ks) \
      do { \
          if ( (ht).size + 1 >= (ht).cap ) { \
              HT_INC_CAP(ht); \
          } \
          const char *_kd = (_key); \
          size_t _ks = (_key_size); \
          uint64_t _k = (ht).hash(_kd, _ks); \
          typeof(*(ht).items) *_it = &(ht).items[_k % (ht).cap]; \
          uint64_t _i = _k; \
          while ( _it->key != 0 && _it->key != _k ) { \
              _it = &(ht).items[(++_i) % (ht).cap]; \
              ++(ht).collisions; \
          } \
          if ( _it->key == _k ) { \
              _it->data = (val); \
          } else { \
              DA_APPEND((ht).keys, _k); \
              _it->key_str.data = _kd; \
              _it->key_str.size = _ks; \
              _it->key = _k; \
              _it->data = (val); \
              _it->next = NULL; \
              ++(ht).size; \
          } \
      } while(0)

  /* HT_SET(ht, key, key_size, val): stores `val` under the key given by
   * the `key_size` bytes at `key`; see _HT_SET. */
  #define HT_SET(ht, key, key_size, val) \
      _HT_SET(ht, key, key_size, val, \
              UNIQUE_NAME(_k), UNIQUE_NAME(_it), UNIQUE_NAME(_i), \
              UNIQUE_NAME(_kd), UNIQUE_NAME(_ks))
  /*
   * _HT_GET(ht, _key, _key_size, ret, _k, _it, _i)
   *
   * Implementation of HT_GET; the trailing parameters are the names of the
   * temporaries it declares.
   *
   * Hashes the key with `(ht).hash` and follows the same linear probe
   * sequence as HT_SET, starting at `hash % cap`, until it reaches a slot
   * with the same hash or an empty slot (key == 0). Reading only the first
   * slot would return another entry's value whenever HT_SET had to move
   * the key past an occupied slot.
   *
   * `ret` is assigned the value of the slot the probe stopped at. For a
   * key that is not in the table this is an empty slot, whose contents are
   * the zero bytes calloc produced in HT_CREATE.
   */
  #define _HT_GET(ht, _key, _key_size, ret, _k, _it, _i) \
      do { \
          uint64_t _k = (ht).hash((_key), (_key_size)); \
          uint64_t _i = _k; \
          typeof(*(ht).items) *_it = &(ht).items[_i % (ht).cap]; \
          while ( _it->key != 0 && _it->key != _k ) { \
              _it = &(ht).items[(++_i) % (ht).cap]; \
          } \
          (ret) = _it->data; \
      } while(0)

  /* HT_GET(ht, key, key_size, ret): looks up the key given by the
   * `key_size` bytes at `key` and assigns its value to `ret`; see
   * _HT_GET. */
  #define HT_GET(ht, key, key_size, ret) \
      _HT_GET(ht, key, key_size, ret, \
              UNIQUE_NAME(_k), UNIQUE_NAME(_it), UNIQUE_NAME(_i))
  132. #if defined(HT_IMP) || defined(IMP)
  /*
   * Default hash for the table macros.
   *
   * Packs the first four and the last four bytes of the key into the eight
   * byte lanes of a 64-bit value (first byte in the top lane, last byte in
   * the bottom lane), then adds the fifth byte, the fifth-from-last byte
   * and the middle byte, each scaled by a small prime. Positions that do
   * not exist in a short key fall back to byte 0.
   *
   * Bytes are read as unsigned char so that values >= 0x80 are not
   * sign-extended into the neighbouring lanes; the result is therefore the
   * same whether plain char is signed or unsigned.
   *
   * str:      key bytes; not read when str_size is 0.
   * str_size: number of bytes in the key.
   *
   * Returns the hash, which is never 0: the table treats a stored hash of
   * 0 as "empty slot", so 0 is replaced by 1 (also returned for an empty
   * key).
   */
  uint64_t
  ht_default_hash(const char *str, size_t str_size)
  {
      const unsigned char *s = (const unsigned char *)str;
      const size_t n = str_size;
      uint64_t k;

      if ( n == 0 ) {
          return 1;
      }

      k  = (uint64_t)s[0] << 56;
      k |= (uint64_t)s[n > 1 ? 1 : 0] << 48;
      k |= (uint64_t)s[n > 2 ? 2 : 0] << 40;
      k |= (uint64_t)s[n > 3 ? 3 : 0] << 32;
      k |= (uint64_t)s[n >= 4 ? n - 4 : 0] << 24;
      k |= (uint64_t)s[n >= 3 ? n - 3 : 0] << 16;
      k |= (uint64_t)s[n >= 2 ? n - 2 : 0] << 8;
      k |= (uint64_t)s[n - 1];

      k += (uint64_t)s[n > 4 ? 4 : 0] * 31;
      k += (uint64_t)s[n >= 5 ? n - 5 : 0] * 13;
      k += (uint64_t)s[n / 2] * 41;

      return k != 0 ? k : 1;
  }
  165. #endif /* defined(HT_IMP) || defined(IMP) */
  /* CONCAT, CONCAT_INNER and UNIQUE_NAME are deliberately left defined.
   * HT_INC_CAP, HT_SET and HT_GET mention UNIQUE_NAME in their replacement
   * lists, and the preprocessor resolves that name where those macros are
   * used, not where they are defined. Undefining the helpers at the end of
   * this header would leave UNIQUE_NAME(...) unexpanded in every later use
   * of the table macros. */
  169. #endif