2 * Resizable, Scalable, Concurrent Hash Table
4 * Copyright (c) 2014-2015 Thomas Graf <tgraf@suug.ch>
5 * Copyright (c) 2008-2014 Patrick McHardy <kaber@trash.net>
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License version 2 as
9 * published by the Free Software Foundation.
12 /**************************************************************************
14 **************************************************************************/
16 #include <linux/init.h>
17 #include <linux/jhash.h>
18 #include <linux/kernel.h>
19 #include <linux/kthread.h>
20 #include <linux/module.h>
21 #include <linux/rcupdate.h>
22 #include <linux/rhashtable.h>
23 #include <linux/semaphore.h>
24 #include <linux/slab.h>
25 #include <linux/sched.h>
26 #include <linux/random.h>
27 #include <linux/vmalloc.h>
/* Upper bound applied to the requested entry count (see the min() in test_rht_init()). */
29 #define MAX_ENTRIES 1000000
/*
 * Sentinel stored in value.id: the lookup and removal paths in this file skip
 * or treat as "must not be found" any object whose id equals this value, and
 * threadfunc() writes it into an object after removing it from the table.
 */
30 #define TEST_INSERT_FAIL INT_MAX
/*
 * Module parameters that configure the test run. Every parameter is
 * registered with a permission argument of 0.
 *
 * NOTE(review): the definitions of `runs` and `size` are not visible in this
 * view even though both are registered below and read in test_rht_init();
 * the defining lines appear to be missing here - confirm against the full
 * file.
 */
/* Requested number of entries; test_rht_init() checks it for < 0 and caps it at MAX_ENTRIES. */
32 static int parm_entries = 50000;
33 module_param(parm_entries, int, 0);
34 MODULE_PARM_DESC(parm_entries, "Number of entries to add (default: 50000)");
37 module_param(runs, int, 0);
38 MODULE_PARM_DESC(runs, "Number of test runs per variant (default: 4)");
/* 0 means "derive from the entry count": test_rht_init() falls back to roundup_pow_of_two(). */
40 static int max_size = 0;
41 module_param(max_size, int, 0);
42 MODULE_PARM_DESC(max_size, "Maximum table size (default: calculated)");
/* Copied into test_rht_params.automatic_shrinking by test_rht_init(). */
44 static bool shrinking = false;
45 module_param(shrinking, bool, 0);
46 MODULE_PARM_DESC(shrinking, "Enable automatic shrinking (default: off)");
49 module_param(size, int, 0);
50 MODULE_PARM_DESC(size, "Initial size hint of table (default: 8)");
/* Number of worker threads started by test_rht_init() for the concurrent test. */
52 static int tcount = 10;
53 module_param(tcount, int, 0);
54 MODULE_PARM_DESC(tcount, "Number of threads to spawn (default: 10)");
/* Consulted by insert_retry() when an insertion returns -ENOMEM. */
56 static bool enomem_retry = false;
57 module_param(enomem_retry, bool, 0);
58 MODULE_PARM_DESC(enomem_retry, "Retry insert even if -ENOMEM was returned (default: off)");
/*
 * NOTE(review): only member lines of the test structures are visible here;
 * the struct headers, closing braces and any shorter members are missing
 * from this view. The attribution below is inferred from how the members are
 * used elsewhere in the file - confirm against the full file.
 */
/* struct test_obj members (see offsetof() in test_rht_params): key, then hash-chain linkage. */
66 struct test_obj_val value;
67 struct rhash_head node;
/* struct test_obj_rhl members (see offsetof() in test_rht_params_dup): key, then rhlist linkage. */
71 struct test_obj_val value;
72 struct rhlist_head list_node;
/* struct thread_data members: the kthread handle and the slice of objects owned by that thread. */
78 struct task_struct *task;
79 struct test_obj *objs;
/*
 * Object hash callback installed in test_rht_params_dup.
 *
 * @data: object being hashed, interpreted as a struct test_obj_rhl.
 * @len, @seed: not used by the visible body.
 *
 * Returns (value.id % 10) shifted left by RHT_HASH_RESERVED_SPACE, so ids
 * that are equal modulo 10 (for example 1 and 21, as used by
 * test_insert_duplicates_run()) produce the same hash.
 */
82 static u32 my_hashfn(const void *data, u32 len, u32 seed)
84 const struct test_obj_rhl *obj = data;
86 return (obj->value.id % 10) << RHT_HASH_RESERVED_SPACE;
/*
 * Object compare callback installed in test_rht_params_dup.
 *
 * @arg: compare argument; arg->key is read as a struct test_obj_val.
 * @obj: candidate object, interpreted as a struct test_obj_rhl.
 *
 * Returns the difference between the object's value.id and the key's id,
 * which is 0 exactly when the two ids are equal. Only id takes part in the
 * comparison; tid is not looked at.
 *
 * NOTE(review): if id is a signed int, the subtraction can overflow for ids
 * that are far apart; the visible callers only use small ids - confirm
 * before reusing this with arbitrary keys.
 */
89 static int my_cmpfn(struct rhashtable_compare_arg *arg, const void *obj)
91 const struct test_obj_rhl *test_obj = obj;
92 const struct test_obj_val *val = arg->key;
94 return test_obj->value.id - val->id;
/*
 * Table parameters for the struct test_obj based tests: the key is the whole
 * embedded struct test_obj_val and the hash linkage is the `node` member.
 *
 * This object is deliberately not const: test_rht_init() fills in
 * automatic_shrinking, max_size and nelem_hint from the module parameters,
 * test_rhashtable_max() overrides max_size, and test_rhltable() clears
 * nulls_base before using it with the rhltable API.
 *
 * NOTE(review): some initializer lines and the closing brace are not visible
 * in this view.
 */
97 static struct rhashtable_params test_rht_params = {
98 .head_offset = offsetof(struct test_obj, node),
99 .key_offset = offsetof(struct test_obj, value),
100 .key_len = sizeof(struct test_obj_val),
102 .nulls_base = (3U << RHT_BASE_SHIFT),
/*
 * Table parameters for the duplicate-insertion test (test_insert_dup()):
 * objects are struct test_obj_rhl linked through `list_node`, hashed with
 * my_hashfn() and compared with my_cmpfn(), with automatic shrinking off.
 *
 * NOTE(review): some initializer lines and the closing brace are not visible
 * in this view.
 */
105 static struct rhashtable_params test_rht_params_dup = {
106 .head_offset = offsetof(struct test_obj_rhl, list_node),
107 .key_offset = offsetof(struct test_obj_rhl, value),
108 .key_len = sizeof(struct test_obj_val),
110 .obj_hashfn = my_hashfn,
111 .obj_cmpfn = my_cmpfn,
113 .automatic_shrinking = false,
/*
 * Semaphores used around worker-thread start-up in the concurrent test.
 *
 * prestart_sem is initialised to (1 - tcount) by test_rht_init(), which then
 * blocks on it after spawning the threads. startup_sem starts at 0 and each
 * worker blocks on it at the top of threadfunc().
 *
 * NOTE(review): the matching up() calls are not visible in this view.
 */
116 static struct semaphore prestart_sem;
117 static struct semaphore startup_sem = __SEMAPHORE_INITIALIZER(startup_sem, 0);
/*
 * Insert @obj into @ht with rhashtable_insert_fast(), repeating the attempt
 * for as long as the call returns -EBUSY.
 *
 * @ht:     table to insert into.
 * @obj:    object whose `node` member is linked into the table.
 * @params: table parameters, passed by value to the inline fast path.
 *
 * When the insertion returns -ENOMEM and the enomem_retry module parameter
 * is set, a dedicated branch is taken; its body is not visible in this view
 * (presumably it counts the event in enomem_retries and forces another
 * attempt - TODO confirm).
 *
 * Returns the error code if the final attempt failed, otherwise `retries`.
 * NOTE(review): `retries` starts at -1 and its update is not visible here;
 * callers add a non-negative return to their retry totals.
 */
119 static int insert_retry(struct rhashtable *ht, struct test_obj *obj,
120 const struct rhashtable_params params)
122 int err, retries = -1, enomem_retries = 0;
127 err = rhashtable_insert_fast(ht, &obj->node, params);
128 if (err == -ENOMEM && enomem_retry) {
132 } while (err == -EBUSY);
135 pr_info(" %u insertions retried after -ENOMEM\n",
138 return err ? : retries;
/*
 * Look up one key per index in [0, entries) and compare the result with what
 * is expected to be in the table.
 *
 * @ht:      table to query.
 * @array:   objects that were offered for insertion; array[i / 2] is checked
 *           for the TEST_INSERT_FAIL marker.
 * @entries: number of indexes to probe.
 *
 * Even indexes are expected to be present and odd ones absent. Three kinds
 * of mismatch are reported with pr_warn(): an expected key that is missing,
 * an unexpected key that is found, and a found object whose value.id differs
 * from the probed index.
 *
 * NOTE(review): the key initializer, the statement executed for objects
 * marked TEST_INSERT_FAIL, and the return statements are not visible in this
 * view.
 */
141 static int __init test_rht_lookup(struct rhashtable *ht, struct test_obj *array,
142 unsigned int entries)
146 for (i = 0; i < entries; i++) {
147 struct test_obj *obj;
148 bool expected = !(i % 2);
149 struct test_obj_val key = {
153 if (array[i / 2].value.id == TEST_INSERT_FAIL)
156 obj = rhashtable_lookup_fast(ht, &key, test_rht_params);
158 if (expected && !obj) {
159 pr_warn("Test failed: Could not find key %u\n", key.id);
161 } else if (!expected && obj) {
162 pr_warn("Test failed: Unexpected entry found for key %u\n",
165 } else if (expected && obj) {
166 if (obj->value.id != i) {
167 pr_warn("Test failed: Lookup value mismatch %u!=%u\n",
/*
 * Walk the whole table with the rhashtable walker API and cross-check the
 * number of objects seen against ht->nelems and against @entries.
 *
 * @ht:      table to traverse.
 * @entries: number of objects the caller believes are in the table.
 *
 * A walker result of -EAGAIN is logged as an encountered resize, any other
 * error pointer is reported as a failure. The totals are printed afterwards
 * and a mismatch produces a "Test failed" warning.
 *
 * NOTE(review): the statements that update `total` and `chain_len` are not
 * visible in this view. `err` is declared unsigned although it receives the
 * return value of rhashtable_walk_init(). The two pr_warn() strings without
 * a trailing "\n" may be merged with later log output.
 */
179 static void test_bucket_stats(struct rhashtable *ht, unsigned int entries)
181 unsigned int err, total = 0, chain_len = 0;
182 struct rhashtable_iter hti;
183 struct rhash_head *pos;
185 err = rhashtable_walk_init(ht, &hti, GFP_KERNEL);
187 pr_warn("Test failed: allocation error");
191 rhashtable_walk_start(&hti);
193 while ((pos = rhashtable_walk_next(&hti))) {
194 if (PTR_ERR(pos) == -EAGAIN) {
195 pr_info("Info: encountered resize\n");
198 } else if (IS_ERR(pos)) {
199 pr_warn("Test failed: rhashtable_walk_next() error: %ld\n",
207 rhashtable_walk_stop(&hti);
208 rhashtable_walk_exit(&hti);
210 pr_info(" Traversal complete: counted=%u, nelems=%u, entries=%d, table-jumps=%u\n",
211 total, atomic_read(&ht->nelems), entries, chain_len);
213 if (total != atomic_read(&ht->nelems) || total != entries)
214 pr_warn("Test failed: Total count mismatch ^^^");
/*
 * Single-threaded functional test of one table instance.
 *
 * @ht:      initialised table to exercise.
 * @array:   backing storage for the objects; array[i] receives id i * 2.
 * @entries: number of objects to insert and later delete.
 *
 * Sequence: insert @entries objects with even ids through insert_retry(),
 * check the traversal statistics, run test_rht_lookup(), check the
 * statistics again, then look up and remove every object that is not marked
 * TEST_INSERT_FAIL. The time between the start of the insertions and the end
 * of the deletions is logged in nanoseconds.
 *
 * NOTE(review): the return statements are not visible in this view; the
 * caller stores the s64 result in `time` and reports it as a return code on
 * failure. The loop-local `obj` in the insertion loop shadows the function
 * level `obj` used by the deletion loop.
 */
217 static s64 __init test_rhashtable(struct rhashtable *ht, struct test_obj *array,
218 unsigned int entries)
220 struct test_obj *obj;
222 unsigned int i, insert_retries = 0;
227 * Insert entries into table with all keys even numbers
229 pr_info(" Adding %d keys\n", entries);
230 start = ktime_get_ns();
231 for (i = 0; i < entries; i++) {
232 struct test_obj *obj = &array[i];
234 obj->value.id = i * 2;
235 err = insert_retry(ht, obj, test_rht_params);
237 insert_retries += err;
243 pr_info(" %u insertions retried due to memory pressure\n",
246 test_bucket_stats(ht, entries);
248 test_rht_lookup(ht, array, entries);
251 test_bucket_stats(ht, entries);
253 pr_info(" Deleting %d keys\n", entries);
254 for (i = 0; i < entries; i++) {
255 struct test_obj_val key = {
259 if (array[i].value.id != TEST_INSERT_FAIL) {
260 obj = rhashtable_lookup_fast(ht, &key, test_rht_params);
263 rhashtable_remove_fast(ht, &obj->node, test_rht_params);
269 end = ktime_get_ns();
270 pr_info(" Duration of test: %lld ns\n", end - start);
/*
 * File-scope tables: `ht` is used by test_rht_init(), test_rhashtable_max()
 * and the worker threads; `rhlt` is the rhltable exercised by
 * test_rhltable().
 */
275 static struct rhashtable ht;
276 static struct rhltable rhlt;
/*
 * Exercise the rhltable (hash list) interface on the file-scope `rhlt`.
 *
 * @entries: number of struct test_obj_rhl objects to allocate and cycle
 *           through the table.
 *
 * obj_in_table is a bitmap with one bit per object index; it mirrors which
 * objects the test believes are currently linked into the table, and the
 * results of insert/remove calls are checked against it.
 *
 * NOTE(review): several short lines (declarations, the assignment of `k`,
 * error returns, and any release of obj_in_table) are not visible in this
 * view, so the exact error paths and return value cannot be described from
 * here.
 */
278 static int __init test_rhltable(unsigned int entries)
280 struct test_obj_rhl *rhl_test_objects;
281 unsigned long *obj_in_table;
282 unsigned int i, j, k;
/* Zeroed storage for the objects and for the presence bitmap. */
288 rhl_test_objects = vzalloc(array_size(entries,
289 sizeof(*rhl_test_objects)));
290 if (!rhl_test_objects)
294 obj_in_table = vzalloc(array_size(sizeof(unsigned long),
295 BITS_TO_LONGS(entries)));
/* NOTE(review): this writes to the shared global test_rht_params and does not restore it. */
299 /* nulls_base not supported in rhlist interface */
300 test_rht_params.nulls_base = 0;
301 err = rhltable_init(&rhlt, &test_rht_params);
/* Phase 1: insert every object, all with value.id = k, and mark it present. */
307 for (i = 0; i < entries; i++) {
308 rhl_test_objects[i].value.id = k;
309 err = rhltable_insert(&rhlt, &rhl_test_objects[i].list_node,
311 if (WARN(err, "error %d on element %d\n", err, i))
314 set_bit(i, obj_in_table);
/*
 * Phase 2: for each index, look the key up, verify that already removed
 * objects are no longer on the list and that object i still is, then remove
 * object i and clear its bit.
 */
320 pr_info("test %d add/delete pairs into rhlist\n", entries);
321 for (i = 0; i < entries; i++) {
322 struct rhlist_head *h, *pos;
323 struct test_obj_rhl *obj;
324 struct test_obj_val key = {
330 h = rhltable_lookup(&rhlt, &key, test_rht_params);
331 if (WARN(!h, "key not found during iteration %d of %d", i, entries)) {
338 rhl_for_each_entry_rcu(obj, pos, h, list_node) {
339 if (WARN(pos == &rhl_test_objects[j].list_node, "old element found, should be gone"))
348 rhl_for_each_entry_rcu(obj, pos, h, list_node) {
349 if (pos == &rhl_test_objects[i].list_node) {
357 if (WARN(!found, "element %d not found", i))
360 err = rhltable_remove(&rhlt, &rhl_test_objects[i].list_node, test_rht_params);
361 WARN(err, "rhltable_remove: err %d for iteration %d\n", err, i);
363 clear_bit(i, obj_in_table);
/* Phase 3: the table should now be empty according to the bitmap; insert everything again. */
369 for (i = 0; i < entries; i++) {
370 WARN(test_bit(i, obj_in_table), "elem %d allegedly still present", i);
372 err = rhltable_insert(&rhlt, &rhl_test_objects[i].list_node,
374 if (WARN(err, "error %d on element %d\n", err, i))
377 set_bit(i, obj_in_table);
/*
 * Phase 4: random removals and insertions on randomly chosen indexes, each
 * checked against the bitmap. NOTE(review): the loop-local `u32 i` shadows
 * the function-level `i`; the conditions selecting each operation are not
 * visible in this view.
 */
380 pr_info("test %d random rhlist add/delete operations\n", entries);
381 for (j = 0; j < entries; j++) {
382 u32 i = prandom_u32_max(entries);
383 u32 prand = prandom_u32();
388 prand = prandom_u32();
395 err = rhltable_remove(&rhlt, &rhl_test_objects[i].list_node, test_rht_params);
396 if (test_bit(i, obj_in_table)) {
397 clear_bit(i, obj_in_table);
398 if (WARN(err, "cannot remove element at slot %d", i))
401 if (WARN(err != -ENOENT, "removed non-existant element %d, error %d not %d",
411 err = rhltable_insert(&rhlt, &rhl_test_objects[i].list_node, test_rht_params);
413 if (WARN(test_and_set_bit(i, obj_in_table), "succeeded to insert same object %d", i))
416 if (WARN(!test_bit(i, obj_in_table), "failed to insert object %d", i))
425 i = prandom_u32_max(entries);
426 if (test_bit(i, obj_in_table)) {
427 err = rhltable_remove(&rhlt, &rhl_test_objects[i].list_node, test_rht_params);
428 WARN(err, "cannot remove element at slot %d", i);
430 clear_bit(i, obj_in_table);
432 err = rhltable_insert(&rhlt, &rhl_test_objects[i].list_node, test_rht_params);
433 WARN(err, "failed to insert object %d", i);
435 set_bit(i, obj_in_table);
/* Phase 5: remove every index; objects not marked present must yield -ENOENT. */
439 for (i = 0; i < entries; i++) {
441 err = rhltable_remove(&rhlt, &rhl_test_objects[i].list_node, test_rht_params);
442 if (test_bit(i, obj_in_table)) {
443 if (WARN(err, "cannot remove element at slot %d", i))
446 if (WARN(err != -ENOENT, "removed non-existant element, error %d not %d",
/* Tear the table down and release the object array. */
452 rhltable_destroy(&rhlt);
454 vfree(rhl_test_objects);
/*
 * Check that a table refuses to grow past its element limit.
 *
 * @array:   object storage; indexes 0..ht.max_elems are used.
 * @entries: entry count from which the table's max_size is derived.
 *
 * Sets test_rht_params.max_size to roundup_pow_of_two(entries / 8),
 * initialises the file-scope `ht`, inserts ht.max_elems objects with even
 * ids, and then attempts one more insertion. The log message shows that the
 * extra insertion is expected to fail with -E2BIG. The table is destroyed
 * before returning.
 *
 * NOTE(review): this overwrites max_size in the shared global
 * test_rht_params. The error checks and return statements are not visible in
 * this view; the caller treats a return of 0 as "limit respected".
 */
459 static int __init test_rhashtable_max(struct test_obj *array,
460 unsigned int entries)
462 unsigned int i, insert_retries = 0;
465 test_rht_params.max_size = roundup_pow_of_two(entries / 8);
466 err = rhashtable_init(&ht, &test_rht_params);
470 for (i = 0; i < ht.max_elems; i++) {
471 struct test_obj *obj = &array[i];
473 obj->value.id = i * 2;
474 err = insert_retry(&ht, obj, test_rht_params);
476 insert_retries += err;
481 err = insert_retry(&ht, &array[ht.max_elems], test_rht_params);
485 pr_info("insert element %u should have failed with %d, got %d\n",
486 ht.max_elems, -E2BIG, err);
491 rhashtable_destroy(&ht);
/*
 * Dump the contents of an rhltable to the kernel log for debugging.
 *
 * @rhlt: table to dump.
 *
 * Iterates over every bucket of the current bucket table, follows each hash
 * chain until a nulls marker, and for every chain entry follows the attached
 * rhlist, appending "val <id> (tid=<tid>)" for each object to a text buffer
 * that is printed once at the end with KERN_ERR.
 *
 * NOTE(review): the declaration of `buff`, the assignment of `ht`, the
 * update of `cnt` and the return statement are not visible in this view;
 * test_insert_dup() compares the return value with the number of inserted
 * objects, so it is presumably the count of objects printed - TODO confirm.
 *
 * NOTE(review): every sprintf() below passes `buff` as both the destination
 * and a "%s" source argument. Copying between overlapping objects is
 * undefined behaviour for sprintf() per the C standard, and none of the
 * writes is bounded by the buffer size. Appending at a tracked offset with a
 * bounded formatter would avoid both problems.
 */
496 static unsigned int __init print_ht(struct rhltable *rhlt)
498 struct rhashtable *ht;
499 const struct bucket_table *tbl;
501 unsigned int i, cnt = 0;
504 tbl = rht_dereference(ht->tbl, ht);
505 for (i = 0; i < tbl->size; i++) {
506 struct rhash_head *pos, *next;
507 struct test_obj_rhl *p;
509 pos = rht_dereference(tbl->buckets[i], ht);
510 next = !rht_is_a_nulls(pos) ? rht_dereference(pos->next, ht) : NULL;
512 if (!rht_is_a_nulls(pos)) {
513 sprintf(buff, "%s\nbucket[%d] -> ", buff, i);
516 while (!rht_is_a_nulls(pos)) {
517 struct rhlist_head *list = container_of(pos, struct rhlist_head, rhead);
518 sprintf(buff, "%s[[", buff);
521 list = rht_dereference(list->next, ht);
522 p = rht_obj(ht, pos);
524 sprintf(buff, "%s val %d (tid=%d)%s", buff, p->value.id, p->value.tid,
530 next = !rht_is_a_nulls(pos) ?
531 rht_dereference(pos->next, ht) : NULL;
533 sprintf(buff, "%s]]%s", buff, !rht_is_a_nulls(pos) ? " -> " : "");
536 printk(KERN_ERR "\n---- ht: ----%s\n-------------\n", buff);
/*
 * Insert the first `cnt` objects of @rhl_test_objects into a fresh, local
 * rhltable configured with test_rht_params_dup and verify that all of them
 * end up in the table.
 *
 * Each object gets value.tid set to its index. Two insertion calls appear
 * below: rhashtable_insert_slow() with a key pointer computed from the
 * object, and rhltable_insert(). The WARN text labels the run as "slow" or
 * "fast" depending on `slow`.
 *
 * After the insertions the table is dumped with print_ht() and a warning is
 * raised when the number it returns differs from `cnt`; the table is then
 * destroyed.
 *
 * NOTE(review): the rest of the parameter list, the condition that selects
 * between the two insertion calls, and the return statements are not visible
 * in this view.
 */
541 static int __init test_insert_dup(struct test_obj_rhl *rhl_test_objects,
544 struct rhltable rhlt;
549 err = rhltable_init(&rhlt, &test_rht_params_dup);
553 for (i = 0; i < cnt; i++) {
554 rhl_test_objects[i].value.tid = i;
555 key = rht_obj(&rhlt.ht, &rhl_test_objects[i].list_node.rhead);
556 key += test_rht_params_dup.key_offset;
559 err = PTR_ERR(rhashtable_insert_slow(&rhlt.ht, key,
560 &rhl_test_objects[i].list_node.rhead));
564 err = rhltable_insert(&rhlt,
565 &rhl_test_objects[i].list_node,
566 test_rht_params_dup);
567 if (WARN(err, "error %d on element %d/%d (%s)\n", err, i, cnt, slow? "slow" : "fast"))
571 ret = print_ht(&rhlt);
572 WARN(ret != cnt, "missing rhltable elements (%d != %d, %s)\n", ret, cnt, slow? "slow" : "fast");
575 rhltable_destroy(&rhlt);
/*
 * Driver for the duplicate-insertion test.
 *
 * Builds three on-stack objects: ids 1 and 21 differ but hash identically
 * under my_hashfn() (both are 1 modulo 10), and the third object repeats the
 * id of the first. test_insert_dup() is then run with the first two and with
 * all three objects, once per insertion mode (last argument false, then
 * true).
 *
 * NOTE(review): the results of the test_insert_dup() calls are not used in
 * the visible lines, and the return statement is not visible in this view.
 */
580 static int __init test_insert_duplicates_run(void)
582 struct test_obj_rhl rhl_test_objects[3] = {};
584 pr_info("test inserting duplicates\n");
586 /* two different values that map to same bucket */
587 rhl_test_objects[0].value.id = 1;
588 rhl_test_objects[1].value.id = 21;
590 /* and another duplicate with same as [0] value
591 * which will be second on the bucket list */
592 rhl_test_objects[2].value.id = rhl_test_objects[0].value.id;
594 test_insert_dup(rhl_test_objects, 2, false);
595 test_insert_dup(rhl_test_objects, 3, false);
596 test_insert_dup(rhl_test_objects, 2, true);
597 test_insert_dup(rhl_test_objects, 3, true);
/*
 * Verify, from a worker thread, that the shared table `ht` agrees with the
 * thread's own bookkeeping.
 *
 * @tdata: per-thread data; tdata->objs[i].value.id == TEST_INSERT_FAIL marks
 *         an object that must not be in the table.
 *
 * For each of the thread's entries a key is looked up and one of three
 * errors may be logged: an object was found although it is marked
 * TEST_INSERT_FAIL, an object was not found although it should be present,
 * or the found object's value differs byte-wise from the key.
 *
 * NOTE(review): the key initializer, the error accounting and the return
 * statement are not visible in this view; callers treat a non-zero result as
 * a failed lookup test - TODO confirm.
 */
602 static int thread_lookup_test(struct thread_data *tdata)
604 unsigned int entries = tdata->entries;
607 for (i = 0; i < entries; i++) {
608 struct test_obj *obj;
609 struct test_obj_val key = {
614 obj = rhashtable_lookup_fast(&ht, &key, test_rht_params);
615 if (obj && (tdata->objs[i].value.id == TEST_INSERT_FAIL)) {
616 pr_err(" found unexpected object %d-%d\n", key.tid, key.id);
618 } else if (!obj && (tdata->objs[i].value.id != TEST_INSERT_FAIL)) {
619 pr_err(" object %d-%d not found!\n", key.tid, key.id);
621 } else if (obj && memcmp(&obj->value, &key, sizeof(key))) {
622 pr_err(" wrong object returned (got %d-%d, expected %d-%d)\n",
623 obj->value.tid, obj->value.id, key.tid, key.id);
/*
 * Body of each worker kthread in the concurrent test.
 *
 * @data: pointer to this thread's struct thread_data.
 *
 * NOTE(review): error-path jumps, the statement executed inside the final
 * wait loop, and the return statement are not visible in this view.
 */
632 static int threadfunc(void *data)
634 int i, step, err = 0, insert_retries = 0;
635 struct thread_data *tdata = data;
/* Block until the start-up semaphore is released; a failed wait is only logged. */
638 if (down_interruptible(&startup_sem))
639 pr_err(" thread[%d]: down_interruptible failed\n", tdata->id);
/* Insert this thread's objects, keyed by (id = index, tid = thread id). */
641 for (i = 0; i < tdata->entries; i++) {
642 tdata->objs[i].value.id = i;
643 tdata->objs[i].value.tid = tdata->id;
644 err = insert_retry(&ht, &tdata->objs[i], test_rht_params);
646 insert_retries += err;
648 pr_err(" thread[%d]: rhashtable_insert_fast failed\n",
654 pr_info(" thread[%d]: %u insertions retried due to memory pressure\n",
655 tdata->id, insert_retries);
/* Everything just inserted must be found again. */
657 err = thread_lookup_test(tdata);
659 pr_err(" thread[%d]: rhashtable_lookup_test failed\n",
/*
 * Remove the objects in passes with a shrinking stride (10 down to 1),
 * skipping objects already marked TEST_INSERT_FAIL and marking each removed
 * object with that sentinel so later passes and lookups ignore it.
 */
664 for (step = 10; step > 0; step--) {
665 for (i = 0; i < tdata->entries; i += step) {
666 if (tdata->objs[i].value.id == TEST_INSERT_FAIL)
668 err = rhashtable_remove_fast(&ht, &tdata->objs[i].node,
671 pr_err(" thread[%d]: rhashtable_remove_fast failed\n",
675 tdata->objs[i].value.id = TEST_INSERT_FAIL;
/* Re-check lookups against the updated markers. */
679 err = thread_lookup_test(tdata);
681 pr_err(" thread[%d]: rhashtable_lookup_test (2) failed\n",
/* Stay alive until test_rht_init() calls kthread_stop() on this task. */
687 while (!kthread_should_stop()) {
688 set_current_state(TASK_INTERRUPTIBLE);
/*
 * Module init: run the whole rhashtable test suite.
 *
 * Order of the visible steps: single-threaded runs of test_rhashtable()
 * (`runs` times), the max-size test, the duplicate-insertion test, the
 * concurrent test with `tcount` worker threads, and finally the rhltable
 * test.
 *
 * NOTE(review): error returns, memory releases, counters and the final
 * return statement are not visible in this view.
 */
694 static int __init test_rht_init(void)
696 unsigned int entries;
697 int i, err, started_threads = 0, failed_threads = 0;
699 struct thread_data *tdata;
700 struct test_obj *objs;
/* Negative counts get special handling (not visible here); larger ones are capped at MAX_ENTRIES. */
702 if (parm_entries < 0)
705 entries = min(parm_entries, MAX_ENTRIES);
/* Transfer the module parameters into the shared table parameters. */
707 test_rht_params.automatic_shrinking = shrinking;
708 test_rht_params.max_size = max_size ? : roundup_pow_of_two(entries);
709 test_rht_params.nelem_hint = size;
/* Object storage for the single-threaded tests: max_size + 1 zeroed objects. */
711 objs = vzalloc(array_size(sizeof(struct test_obj),
712 test_rht_params.max_size + 1));
716 pr_info("Running rhashtable test nelem=%d, max_size=%d, shrinking=%d\n",
717 size, max_size, shrinking);
/* Each run starts from zeroed objects and a freshly initialised table. */
719 for (i = 0; i < runs; i++) {
722 pr_info("Test %02d:\n", i);
723 memset(objs, 0, test_rht_params.max_size * sizeof(struct test_obj));
725 err = rhashtable_init(&ht, &test_rht_params);
727 pr_warn("Test failed: Unable to initialize hashtable: %d\n",
732 time = test_rhashtable(&ht, objs, entries);
733 rhashtable_destroy(&ht);
736 pr_warn("Test failed: return code %lld\n", time);
/* test_rhashtable_max() returning 0 means the size limit was enforced. */
743 pr_info("test if its possible to exceed max_size %d: %s\n",
744 test_rht_params.max_size, test_rhashtable_max(objs, entries) == 0 ?
745 "no, ok" : "YES, failed");
/* NOTE(review): this divides by `runs`; confirm that runs == 0 cannot reach this line. */
748 do_div(total_time, runs);
749 pr_info("Average test time: %llu\n", total_time);
751 test_insert_duplicates_run();
/*
 * Concurrent test set-up: per-thread bookkeeping plus tcount * entries
 * objects. NOTE(review): `objs` is assigned a new allocation here; confirm
 * that the earlier array is released first (no release is visible in this
 * view).
 */
756 pr_info("Testing concurrent rhashtable access from %d threads\n",
758 sema_init(&prestart_sem, 1 - tcount);
759 tdata = vzalloc(array_size(tcount, sizeof(struct thread_data)));
762 objs = vzalloc(array3_size(sizeof(struct test_obj), tcount, entries));
768 test_rht_params.max_size = max_size ? :
769 roundup_pow_of_two(tcount * entries);
770 err = rhashtable_init(&ht, &test_rht_params);
772 pr_warn("Test failed: Unable to initialize hashtable: %d\n",
/*
 * Spawn the workers; thread i owns objs[i * entries .. (i + 1) * entries).
 * NOTE(review): the thread name format reads "thrad" - looks like a typo for
 * "thread".
 */
778 for (i = 0; i < tcount; i++) {
780 tdata[i].entries = entries;
781 tdata[i].objs = objs + i * entries;
782 tdata[i].task = kthread_run(threadfunc, &tdata[i],
783 "rhashtable_thrad[%d]", i);
784 if (IS_ERR(tdata[i].task))
785 pr_err(" kthread_run failed for thread %d\n", i);
/* Wait on prestart_sem; the body of the following per-thread loop is not visible here. */
789 if (down_interruptible(&prestart_sem))
790 pr_err(" down interruptible failed\n");
791 for (i = 0; i < tcount; i++)
/* Stop every thread that was successfully created and report non-zero exit codes. */
793 for (i = 0; i < tcount; i++) {
794 if (IS_ERR(tdata[i].task))
796 if ((err = kthread_stop(tdata[i].task))) {
797 pr_warn("Test failed: thread %d returned: %d\n",
802 rhashtable_destroy(&ht);
807 * rhltable_remove is very expensive, default values can cause test
808 * to run for 2 minutes or more, use a smaller number instead.
810 err = test_rhltable(entries / 16);
811 pr_info("Started %d threads, %d failed, rhltable test returns %d\n",
812 started_threads, failed_threads, err);
/*
 * Module exit handler. NOTE(review): its body is not visible in this view.
 */
816 static void __exit test_rht_exit(void)
/* Register the init/exit entry points and declare the module licence. */
820 module_init(test_rht_init);
821 module_exit(test_rht_exit);
823 MODULE_LICENSE("GPL v2");