| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378 |
- /* Simple speed tests for hashtables. */
- #include <ccan/htable/htable_type.h>
- #include <ccan/htable/htable.c>
- #include <ccan/hash/hash.h>
- #include <stdio.h>
- #include <stdlib.h>
- #include <string.h>
- #include <time.h>
- #include <unistd.h>
- #include <sys/time.h>
/* Running tally of hash_obj() calls; main() zeroes it before a phase and
 * prints it afterwards as that phase's rehash count. */
static size_t hashcount = 0;
/* One benchmark element stored in the hash table. */
struct object {
	/* Lookup key; exposed to the table through objkey(). */
	unsigned int key;
	/* Payload.  main() points this back at the object itself, so a
	 * lookup result can be sanity-checked against the expected address. */
	struct object *self;
};
- static const unsigned int *objkey(const struct object *obj)
- {
- return &obj->key;
- }
- static size_t hash_obj(const unsigned int *key)
- {
- hashcount++;
- return hashl(key, 1, 0);
- }
- static bool cmp(const struct object *object, const unsigned int *key)
- {
- return object->key == *key;
- }
- HTABLE_DEFINE_TYPE(struct object, objkey, hash_obj, cmp, obj);
/*
 * Count the set bits in @val.
 *
 * Uses the compiler builtin when the build configuration advertises it
 * (HAVE_BUILTIN_POPCOUNTL).  Otherwise falls back to a parallel reduction:
 * each step sums adjacent bit-fields of width 1, 2, 4, 8, 16 and 32, so
 * the shift distance has to double at every step.
 */
static unsigned int popcount(unsigned long val)
{
#if HAVE_BUILTIN_POPCOUNTL
	return __builtin_popcountl(val);
#else
	/* Widen to (at least) 64 bits so a single reduction serves both
	 * 32-bit and 64-bit long; with a 32-bit long the upper half is
	 * simply zero and contributes nothing. */
	unsigned long long v = val;

	v = (v & 0x5555555555555555ULL)
		+ ((v >> 1) & 0x5555555555555555ULL);
	v = (v & 0x3333333333333333ULL)
		+ ((v >> 2) & 0x3333333333333333ULL);
	v = (v & 0x0F0F0F0F0F0F0F0FULL)
		+ ((v >> 4) & 0x0F0F0F0F0F0F0F0FULL);
	v = (v & 0x00FF00FF00FF00FFULL)
		+ ((v >> 8) & 0x00FF00FF00FF00FFULL);
	v = (v & 0x0000FFFF0000FFFFULL)
		+ ((v >> 16) & 0x0000FFFF0000FFFFULL);
	v = (v & 0x00000000FFFFFFFFULL)
		+ ((v >> 32) & 0x00000000FFFFFFFFULL);
	return (unsigned int)v;
#endif
}
- static size_t perfect(const struct htable *ht)
- {
- size_t i, placed_perfect = 0;
- for (i = 0; i < ((size_t)1 << ht->bits); i++) {
- if (!entry_is_valid(ht->table[i]))
- continue;
- if (hash_bucket(ht, ht->rehash(get_raw_ptr(ht, ht->table[i]),
- ht->priv)) == i) {
- assert((ht->table[i] & ht->perfect_bit)
- == ht->perfect_bit);
- placed_perfect++;
- }
- }
- return placed_perfect;
- }
- static size_t count_deleted(const struct htable *ht)
- {
- size_t i, delete_markers = 0;
- for (i = 0; i < ((size_t)1 << ht->bits); i++) {
- if (ht->table[i] == HTABLE_DELETED)
- delete_markers++;
- }
- return delete_markers;
- }
/*
 * Nanoseconds per operation.
 *
 * @start, @stop: timestamps taken immediately before and after the
 *                measured loop.
 * @num: number of operations the loop performed.
 *
 * Returns the elapsed time divided by @num, in nanoseconds.  Returns 0
 * when @num is 0 or when @stop is not later than @start, since neither
 * case yields a value that can be converted to size_t.
 */
static size_t normalize(const struct timeval *start,
			const struct timeval *stop,
			unsigned int num)
{
	double usec;

	if (num == 0)
		return 0;

	/* Floating point is more accurate here, and doing the scaling in
	 * double also keeps tv_sec * 1000000 from overflowing a narrow
	 * integer type. */
	usec = (double)(stop->tv_sec - start->tv_sec) * 1000000.0
		+ (double)(stop->tv_usec - start->tv_usec);
	if (usec <= 0)
		return 0;

	return (size_t)(usec / num * 1000);
}
- static size_t worst_run(struct htable *ht, size_t *deleted)
- {
- size_t longest = 0, len = 0, this_del = 0, i;
- *deleted = 0;
- /* This doesn't take into account end-wrap, but gives an idea. */
- for (i = 0; i < ((size_t)1 << ht->bits); i++) {
- if (ht->table[i]) {
- len++;
- if (ht->table[i] == HTABLE_DELETED)
- this_del++;
- } else {
- if (len > longest) {
- longest = len;
- *deleted = this_del;
- }
- len = 0;
- this_del = 0;
- }
- }
- return longest;
- }
- int main(int argc, char *argv[])
- {
- struct object *objs;
- size_t i, j, num, deleted;
- struct timeval start, stop;
- struct htable_obj *ht;
- struct htable *htr;
- bool make_dumb = false;
- if (argv[1] && strcmp(argv[1], "--dumb") == 0) {
- argv++;
- make_dumb = true;
- }
- num = argv[1] ? atoi(argv[1]) : 1000000;
- objs = calloc(num, sizeof(objs[0]));
- for (i = 0; i < num; i++) {
- objs[i].key = i;
- objs[i].self = &objs[i];
- }
- ht = htable_obj_new();
- htr = (void *)ht;
- printf("Initial insert: ");
- fflush(stdout);
- gettimeofday(&start, NULL);
- for (i = 0; i < num; i++)
- htable_obj_add(ht, objs[i].self);
- gettimeofday(&stop, NULL);
- printf(" %zu ns\n", normalize(&start, &stop, num));
- printf("Details: hash size %u, mask bits %u, perfect %.0f%%\n",
- 1U << htr->bits, popcount(htr->common_mask),
- perfect(htr) * 100.0 / htr->elems);
- if (make_dumb) {
- /* Screw with mask, to hobble us. */
- update_common(htr, (void *)~htr->common_bits);
- printf("Details: DUMB MODE: mask bits %u\n",
- popcount(htr->common_mask));
- }
- printf("Initial lookup (match): ");
- fflush(stdout);
- gettimeofday(&start, NULL);
- for (i = 0; i < num; i++)
- if (htable_obj_get(ht, &i)->self != objs[i].self)
- abort();
- gettimeofday(&stop, NULL);
- printf(" %zu ns\n", normalize(&start, &stop, num));
- printf("Initial lookup (miss): ");
- fflush(stdout);
- gettimeofday(&start, NULL);
- for (i = 0; i < num; i++) {
- unsigned int n = i + num;
- if (htable_obj_get(ht, &n))
- abort();
- }
- gettimeofday(&stop, NULL);
- printf(" %zu ns\n", normalize(&start, &stop, num));
- /* Lookups in order are very cache-friendly for judy; try random */
- printf("Initial lookup (random): ");
- fflush(stdout);
- gettimeofday(&start, NULL);
- for (i = 0, j = 0; i < num; i++, j = (j + 10007) % num)
- if (htable_obj_get(ht, &j)->self != &objs[j])
- abort();
- gettimeofday(&stop, NULL);
- printf(" %zu ns\n", normalize(&start, &stop, num));
- hashcount = 0;
- printf("Initial delete all: ");
- fflush(stdout);
- gettimeofday(&start, NULL);
- for (i = 0; i < num; i++)
- if (!htable_obj_del(ht, objs[i].self))
- abort();
- gettimeofday(&stop, NULL);
- printf(" %zu ns\n", normalize(&start, &stop, num));
- printf("Details: rehashes %zu\n", hashcount);
- printf("Initial re-inserting: ");
- fflush(stdout);
- gettimeofday(&start, NULL);
- for (i = 0; i < num; i++)
- htable_obj_add(ht, objs[i].self);
- gettimeofday(&stop, NULL);
- printf(" %zu ns\n", normalize(&start, &stop, num));
- hashcount = 0;
- printf("Deleting first half: ");
- fflush(stdout);
- gettimeofday(&start, NULL);
- for (i = 0; i < num; i+=2)
- if (!htable_obj_del(ht, objs[i].self))
- abort();
- gettimeofday(&stop, NULL);
- printf(" %zu ns\n", normalize(&start, &stop, num));
- printf("Details: rehashes %zu, delete markers %zu\n",
- hashcount, count_deleted(htr));
- printf("Adding (a different) half: ");
- fflush(stdout);
- for (i = 0; i < num; i+=2)
- objs[i].key = num+i;
- gettimeofday(&start, NULL);
- for (i = 0; i < num; i+=2)
- htable_obj_add(ht, objs[i].self);
- gettimeofday(&stop, NULL);
- printf(" %zu ns\n", normalize(&start, &stop, num));
- printf("Details: delete markers %zu, perfect %.0f%%\n",
- count_deleted(htr), perfect(htr) * 100.0 / htr->elems);
- printf("Lookup after half-change (match): ");
- fflush(stdout);
- gettimeofday(&start, NULL);
- for (i = 1; i < num; i+=2)
- if (htable_obj_get(ht, &i)->self != objs[i].self)
- abort();
- for (i = 0; i < num; i+=2) {
- unsigned int n = i + num;
- if (htable_obj_get(ht, &n)->self != objs[i].self)
- abort();
- }
- gettimeofday(&stop, NULL);
- printf(" %zu ns\n", normalize(&start, &stop, num));
- printf("Lookup after half-change (miss): ");
- fflush(stdout);
- gettimeofday(&start, NULL);
- for (i = 0; i < num; i++) {
- unsigned int n = i + num * 2;
- if (htable_obj_get(ht, &n))
- abort();
- }
- gettimeofday(&stop, NULL);
- printf(" %zu ns\n", normalize(&start, &stop, num));
- /* Hashtables with delete markers can fill with markers over time.
- * so do some changes to see how it operates in long-term. */
- for (i = 0; i < 5; i++) {
- if (i == 0) {
- /* We don't measure this: jmap is different. */
- printf("Details: initial churn\n");
- } else {
- printf("Churning %s time: ",
- i == 1 ? "second"
- : i == 2 ? "third"
- : i == 3 ? "fourth"
- : "fifth");
- fflush(stdout);
- }
- gettimeofday(&start, NULL);
- for (j = 0; j < num; j++) {
- if (!htable_obj_del(ht, &objs[j]))
- abort();
- objs[j].key = num*i+j;
- if (!htable_obj_add(ht, &objs[j]))
- abort();
- }
- gettimeofday(&stop, NULL);
- if (i != 0)
- printf(" %zu ns\n", normalize(&start, &stop, num));
- }
- /* Spread out the keys more to try to make it harder. */
- printf("Details: reinserting with spread\n");
- for (i = 0; i < num; i++) {
- if (!htable_obj_del(ht, objs[i].self))
- abort();
- objs[i].key = num * 5 + i * 9;
- if (!htable_obj_add(ht, objs[i].self))
- abort();
- }
- printf("Details: delete markers %zu, perfect %.0f%%\n",
- count_deleted(htr), perfect(htr) * 100.0 / htr->elems);
- i = worst_run(htr, &deleted);
- printf("Details: worst run %zu (%zu deleted)\n", i, deleted);
- printf("Lookup after churn & spread (match): ");
- fflush(stdout);
- gettimeofday(&start, NULL);
- for (i = 0; i < num; i++) {
- unsigned int n = num * 5 + i * 9;
- if (htable_obj_get(ht, &n)->self != objs[i].self)
- abort();
- }
- gettimeofday(&stop, NULL);
- printf(" %zu ns\n", normalize(&start, &stop, num));
- printf("Lookup after churn & spread (miss): ");
- fflush(stdout);
- gettimeofday(&start, NULL);
- for (i = 0; i < num; i++) {
- unsigned int n = num * (5 + 9) + i * 9;
- if (htable_obj_get(ht, &n))
- abort();
- }
- gettimeofday(&stop, NULL);
- printf(" %zu ns\n", normalize(&start, &stop, num));
- printf("Lookup after churn & spread (random): ");
- fflush(stdout);
- gettimeofday(&start, NULL);
- for (i = 0, j = 0; i < num; i++, j = (j + 10007) % num) {
- unsigned int n = num * 5 + j * 9;
- if (htable_obj_get(ht, &n)->self != &objs[j])
- abort();
- }
- gettimeofday(&stop, NULL);
- printf(" %zu ns\n", normalize(&start, &stop, num));
- hashcount = 0;
- printf("Deleting half after churn & spread: ");
- fflush(stdout);
- gettimeofday(&start, NULL);
- for (i = 0; i < num; i+=2)
- if (!htable_obj_del(ht, objs[i].self))
- abort();
- gettimeofday(&stop, NULL);
- printf(" %zu ns\n", normalize(&start, &stop, num));
- printf("Adding (a different) half after churn & spread: ");
- fflush(stdout);
- for (i = 0; i < num; i+=2)
- objs[i].key = num*6+i*9;
- gettimeofday(&start, NULL);
- for (i = 0; i < num; i+=2)
- htable_obj_add(ht, objs[i].self);
- gettimeofday(&stop, NULL);
- printf(" %zu ns\n", normalize(&start, &stop, num));
- printf("Details: delete markers %zu, perfect %.0f%%\n",
- count_deleted(htr), perfect(htr) * 100.0 / htr->elems);
- return 0;
- }
|