/* * Copyright 2017 Advanced Micro Devices, Inc. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), * to deal in the Software without restriction, including without limitation * the rights to use, copy, modify, merge, publish, distribute, sublicense, * and/or sell copies of the Software, and to permit persons to whom the * Software is furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice shall be included in * all copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR * OTHER DEALINGS IN THE SOFTWARE. * */ #include #include #include #include #include #include #include #include /** * chash_table_alloc - Allocate closed hash table * @table: Pointer to the table structure * @bits: Table size will be 2^bits entries * @key_size: Size of hash keys in bytes, 4 or 8 * @value_size: Size of data values in bytes, can be 0 */ int chash_table_alloc(struct chash_table *table, u8 bits, u8 key_size, unsigned int value_size, gfp_t gfp_mask) { if (bits > 31) return -EINVAL; if (key_size != 4 && key_size != 8) return -EINVAL; table->data = kcalloc(__CHASH_DATA_SIZE(bits, key_size, value_size), sizeof(long), gfp_mask); if (!table->data) return -ENOMEM; __CHASH_TABLE_INIT(table->table, table->data, bits, key_size, value_size); return 0; } EXPORT_SYMBOL(chash_table_alloc); /** * chash_table_free - Free closed hash table * @table: Pointer to the table structure */ void chash_table_free(struct chash_table *table) { kfree(table->data); } EXPORT_SYMBOL(chash_table_free); #ifdef CONFIG_CHASH_STATS #define DIV_FRAC(nom, denom, quot, frac, frac_digits) do { \ u64 __nom = (nom); \ u64 __denom = (denom); \ u64 __quot, __frac; \ u32 __rem; \ \ while (__denom >> 32) { \ __nom >>= 1; \ __denom >>= 1; \ } \ __quot = __nom; \ __rem = do_div(__quot, __denom); \ __frac = __rem * (frac_digits) + (__denom >> 1); \ do_div(__frac, __denom); \ (quot) = __quot; \ (frac) = __frac; \ } while (0) void __chash_table_dump_stats(struct __chash_table *table) { struct chash_iter iter = CHASH_ITER_INIT(table, 0); u32 filled = 0, empty = 0, tombstones = 0; u64 quot1, quot2; u32 frac1, frac2; do { if (chash_iter_is_valid(iter)) filled++; else if (chash_iter_is_empty(iter)) empty++; else tombstones++; CHASH_ITER_INC(iter); } while (iter.slot); pr_debug("chash: key size %u, value size %u\n", table->key_size, table->value_size); pr_debug(" Slots total/filled/empty/tombstones: %u / %u / %u / %u\n", 1 << table->bits, filled, empty, tombstones); if (table->hits > 0) { DIV_FRAC(table->hits_steps, table->hits, quot1, frac1, 1000); DIV_FRAC(table->hits * 1000, table->hits_time_ns, quot2, frac2, 1000); } else { quot1 = quot2 = 0; frac1 = frac2 = 0; } pr_debug(" Hits (avg.cost, rate): %llu (%llu.%03u, %llu.%03u M/s)\n", table->hits, quot1, frac1, quot2, frac2); if (table->miss > 0) { DIV_FRAC(table->miss_steps, table->miss, quot1, frac1, 1000); DIV_FRAC(table->miss * 1000, table->miss_time_ns, quot2, frac2, 1000); } else { quot1 = quot2 = 0; frac1 = frac2 = 0; } pr_debug(" Misses (avg.cost, rate): %llu (%llu.%03u, %llu.%03u M/s)\n", table->miss, quot1, frac1, quot2, frac2); if (table->hits + table->miss > 0) { DIV_FRAC(table->hits_steps + table->miss_steps, table->hits + table->miss, quot1, frac1, 1000); DIV_FRAC((table->hits + table->miss) * 1000, (table->hits_time_ns + table->miss_time_ns), quot2, frac2, 1000); } else { quot1 = quot2 = 0; frac1 = frac2 = 0; } pr_debug(" Total (avg.cost, rate): %llu (%llu.%03u, %llu.%03u M/s)\n", table->hits + table->miss, quot1, frac1, quot2, frac2); if (table->relocs > 0) { DIV_FRAC(table->hits + table->miss, table->relocs, quot1, frac1, 1000); DIV_FRAC(table->reloc_dist, table->relocs, quot2, frac2, 1000); pr_debug(" Relocations (freq, avg.dist): %llu (1:%llu.%03u, %llu.%03u)\n", table->relocs, quot1, frac1, quot2, frac2); } else { pr_debug(" No relocations\n"); } } EXPORT_SYMBOL(__chash_table_dump_stats); #undef DIV_FRAC #endif #define CHASH_INC(table, a) ((a) = ((a) + 1) & (table)->size_mask) #define CHASH_ADD(table, a, b) (((a) + (b)) & (table)->size_mask) #define CHASH_SUB(table, a, b) (((a) - (b)) & (table)->size_mask) #define CHASH_IN_RANGE(table, slot, first, last) \ (CHASH_SUB(table, slot, first) <= CHASH_SUB(table, last, first)) /*#define CHASH_DEBUG Uncomment this to enable verbose debug output*/ #ifdef CHASH_DEBUG static void chash_table_dump(struct __chash_table *table) { struct chash_iter iter = CHASH_ITER_INIT(table, 0); do { if ((iter.slot & 3) == 0) pr_debug("%04x: ", iter.slot); if (chash_iter_is_valid(iter)) pr_debug("[%016llx] ", chash_iter_key(iter)); else if (chash_iter_is_empty(iter)) pr_debug("[ ] "); else pr_debug("[ ] "); if ((iter.slot & 3) == 3) pr_debug("\n"); CHASH_ITER_INC(iter); } while (iter.slot); if ((iter.slot & 3) != 0) pr_debug("\n"); } static int chash_table_check(struct __chash_table *table) { u32 hash; struct chash_iter iter = CHASH_ITER_INIT(table, 0); struct chash_iter cur = CHASH_ITER_INIT(table, 0); do { if (!chash_iter_is_valid(iter)) { CHASH_ITER_INC(iter); continue; } hash = chash_iter_hash(iter); CHASH_ITER_SET(cur, hash); while (cur.slot != iter.slot) { if (chash_iter_is_empty(cur)) { pr_err("Path to element at %x with hash %x broken at slot %x\n", iter.slot, hash, cur.slot); chash_table_dump(table); return -EINVAL; } CHASH_ITER_INC(cur); } CHASH_ITER_INC(iter); } while (iter.slot); return 0; } #endif static void chash_iter_relocate(struct chash_iter dst, struct chash_iter src) { BUG_ON(src.table == dst.table && src.slot == dst.slot); BUG_ON(src.table->key_size != dst.table->key_size); BUG_ON(src.table->value_size != dst.table->value_size); if (dst.table->key_size == 4) dst.table->keys32[dst.slot] = src.table->keys32[src.slot]; else dst.table->keys64[dst.slot] = src.table->keys64[src.slot]; if (dst.table->value_size) memcpy(chash_iter_value(dst), chash_iter_value(src), dst.table->value_size); chash_iter_set_valid(dst); chash_iter_set_invalid(src); #ifdef CONFIG_CHASH_STATS if (src.table == dst.table) { dst.table->relocs++; dst.table->reloc_dist += CHASH_SUB(dst.table, src.slot, dst.slot); } #endif } /** * __chash_table_find - Helper for looking up a hash table entry * @iter: Pointer to hash table iterator * @key: Key of the entry to find * @for_removal: set to true if the element will be removed soon * * Searches for an entry in the hash table with a given key. iter must * be initialized by the caller to point to the home position of the * hypothetical entry, i.e. it must be initialized with the hash table * and the key's hash as the initial slot for the search. * * This function also does some local clean-up to speed up future * look-ups by relocating entries to better slots and removing * tombstones that are no longer needed. * * If @for_removal is true, the function avoids relocating the entry * that is being returned. * * Returns 0 if the search is successful. In this case iter is updated * to point to the found entry. Otherwise %-EINVAL is returned and the * iter is updated to point to the first available slot for the given * key. If the table is full, the slot is set to -1. */ static int chash_table_find(struct chash_iter *iter, u64 key, bool for_removal) { #ifdef CONFIG_CHASH_STATS u64 ts1 = local_clock(); #endif u32 hash = iter->slot; struct chash_iter first_redundant = CHASH_ITER_INIT(iter->table, -1); int first_avail = (for_removal ? -2 : -1); while (!chash_iter_is_valid(*iter) || chash_iter_key(*iter) != key) { if (chash_iter_is_empty(*iter)) { /* Found an empty slot, which ends the * search. Clean up any preceding tombstones * that are no longer needed because they lead * to no-where */ if ((int)first_redundant.slot < 0) goto not_found; while (first_redundant.slot != iter->slot) { if (!chash_iter_is_valid(first_redundant)) chash_iter_set_empty(first_redundant); CHASH_ITER_INC(first_redundant); } #ifdef CHASH_DEBUG chash_table_check(iter->table); #endif goto not_found; } else if (!chash_iter_is_valid(*iter)) { /* Found a tombstone. Remember it as candidate * for relocating the entry we're looking for * or for adding a new entry with the given key */ if (first_avail == -1) first_avail = iter->slot; /* Or mark it as the start of a series of * potentially redundant tombstones */ else if (first_redundant.slot == -1) CHASH_ITER_SET(first_redundant, iter->slot); } else if (first_redundant.slot >= 0) { /* Found a valid, occupied slot with a * preceding series of tombstones. Relocate it * to a better position that no longer depends * on those tombstones */ u32 cur_hash = chash_iter_hash(*iter); if (!CHASH_IN_RANGE(iter->table, cur_hash, first_redundant.slot + 1, iter->slot)) { /* This entry has a hash at or before * the first tombstone we found. We * can relocate it to that tombstone * and advance to the next tombstone */ chash_iter_relocate(first_redundant, *iter); do { CHASH_ITER_INC(first_redundant); } while (chash_iter_is_valid(first_redundant)); } else if (cur_hash != iter->slot) { /* Relocate entry to its home position * or as close as possible so it no * longer depends on any preceding * tombstones */ struct chash_iter new_iter = CHASH_ITER_INIT(iter->table, cur_hash); while (new_iter.slot != iter->slot && chash_iter_is_valid(new_iter)) CHASH_ITER_INC(new_iter); if (new_iter.slot != iter->slot) chash_iter_relocate(new_iter, *iter); } } CHASH_ITER_INC(*iter); if (iter->slot == hash) { iter->slot = -1; goto not_found; } } #ifdef CONFIG_CHASH_STATS iter->table->hits++; iter->table->hits_steps += CHASH_SUB(iter->table, iter->slot, hash) + 1; #endif if (first_avail >= 0) { CHASH_ITER_SET(first_redundant, first_avail); chash_iter_relocate(first_redundant, *iter); iter->slot = first_redundant.slot; iter->mask = first_redundant.mask; } #ifdef CONFIG_CHASH_STATS iter->table->hits_time_ns += local_clock() - ts1; #endif return 0; not_found: #ifdef CONFIG_CHASH_STATS iter->table->miss++; iter->table->miss_steps += (iter->slot < 0) ? (1 << iter->table->bits) : CHASH_SUB(iter->table, iter->slot, hash) + 1; #endif if (first_avail >= 0) CHASH_ITER_SET(*iter, first_avail); #ifdef CONFIG_CHASH_STATS iter->table->miss_time_ns += local_clock() - ts1; #endif return -EINVAL; } int __chash_table_copy_in(struct __chash_table *table, u64 key, const void *value) { u32 hash = (table->key_size == 4) ? hash_32(key, table->bits) : hash_64(key, table->bits); struct chash_iter iter = CHASH_ITER_INIT(table, hash); int r = chash_table_find(&iter, key, false); /* Found an existing entry */ if (!r) { if (value && table->value_size) memcpy(chash_iter_value(iter), value, table->value_size); return 1; } /* Is there a place to add a new entry? */ if (iter.slot < 0) { pr_err("Hash table overflow\n"); return -ENOMEM; } chash_iter_set_valid(iter); if (table->key_size == 4) table->keys32[iter.slot] = key; else table->keys64[iter.slot] = key; if (value && table->value_size) memcpy(chash_iter_value(iter), value, table->value_size); return 0; } EXPORT_SYMBOL(__chash_table_copy_in); int __chash_table_copy_out(struct __chash_table *table, u64 key, void *value, bool remove) { u32 hash = (table->key_size == 4) ? hash_32(key, table->bits) : hash_64(key, table->bits); struct chash_iter iter = CHASH_ITER_INIT(table, hash); int r = chash_table_find(&iter, key, remove); if (r < 0) return r; if (value && table->value_size) memcpy(value, chash_iter_value(iter), table->value_size); if (remove) chash_iter_set_invalid(iter); return iter.slot; } EXPORT_SYMBOL(__chash_table_copy_out); #ifdef CONFIG_CHASH_SELFTEST /** * chash_self_test - Run a self-test of the hash table implementation * @bits: Table size will be 2^bits entries * @key_size: Size of hash keys in bytes, 4 or 8 * @min_fill: Minimum fill level during the test * @max_fill: Maximum fill level during the test * @iterations: Number of test iterations * * The test adds and removes entries from a hash table, cycling the * fill level between min_fill and max_fill entries. Also tests lookup * and value retrieval. */ static int __init chash_self_test(u8 bits, u8 key_size, int min_fill, int max_fill, u64 iterations) { struct chash_table table; int ret; u64 add_count, rmv_count; u64 value; if (key_size == 4 && iterations > 0xffffffff) return -EINVAL; if (min_fill >= max_fill) return -EINVAL; ret = chash_table_alloc(&table, bits, key_size, sizeof(u64), GFP_KERNEL); if (ret) { pr_err("chash_table_alloc failed: %d\n", ret); return ret; } for (add_count = 0, rmv_count = 0; add_count < iterations; add_count++) { /* When we hit the max_fill level, remove entries down * to min_fill */ if (add_count - rmv_count == max_fill) { u64 find_count = rmv_count; /* First try to find all entries that we're * about to remove, confirm their value, test * writing them back a second time. */ for (; add_count - find_count > min_fill; find_count++) { ret = chash_table_copy_out(&table, find_count, &value); if (ret < 0) { pr_err("chash_table_copy_out failed: %d\n", ret); goto out; } if (value != ~find_count) { pr_err("Wrong value retrieved for key 0x%llx, expected 0x%llx got 0x%llx\n", find_count, ~find_count, value); #ifdef CHASH_DEBUG chash_table_dump(&table.table); #endif ret = -EFAULT; goto out; } ret = chash_table_copy_in(&table, find_count, &value); if (ret != 1) { pr_err("copy_in second time returned %d, expected 1\n", ret); ret = -EFAULT; goto out; } } /* Remove them until we hit min_fill level */ for (; add_count - rmv_count > min_fill; rmv_count++) { ret = chash_table_remove(&table, rmv_count, NULL); if (ret < 0) { pr_err("chash_table_remove failed: %d\n", ret); goto out; } } } /* Add a new value */ value = ~add_count; ret = chash_table_copy_in(&table, add_count, &value); if (ret != 0) { pr_err("copy_in first time returned %d, expected 0\n", ret); ret = -EFAULT; goto out; } } chash_table_dump_stats(&table); chash_table_reset_stats(&table); out: chash_table_free(&table); return ret; } static unsigned int chash_test_bits = 10; MODULE_PARM_DESC(test_bits, "Selftest number of hash bits ([4..20], default=10)"); module_param_named(test_bits, chash_test_bits, uint, 0444); static unsigned int chash_test_keysize = 8; MODULE_PARM_DESC(test_keysize, "Selftest keysize (4 or 8, default=8)"); module_param_named(test_keysize, chash_test_keysize, uint, 0444); static unsigned int chash_test_minfill; MODULE_PARM_DESC(test_minfill, "Selftest minimum #entries (default=50%)"); module_param_named(test_minfill, chash_test_minfill, uint, 0444); static unsigned int chash_test_maxfill; MODULE_PARM_DESC(test_maxfill, "Selftest maximum #entries (default=80%)"); module_param_named(test_maxfill, chash_test_maxfill, uint, 0444); static unsigned long chash_test_iters; MODULE_PARM_DESC(test_iters, "Selftest iterations (default=1000 x #entries)"); module_param_named(test_iters, chash_test_iters, ulong, 0444); static int __init chash_init(void) { int ret; u64 ts1_ns; /* Skip self test on user errors */ if (chash_test_bits < 4 || chash_test_bits > 20) { pr_err("chash: test_bits out of range [4..20].\n"); return 0; } if (chash_test_keysize != 4 && chash_test_keysize != 8) { pr_err("chash: test_keysize invalid. Must be 4 or 8.\n"); return 0; } if (!chash_test_minfill) chash_test_minfill = (1 << chash_test_bits) / 2; if (!chash_test_maxfill) chash_test_maxfill = (1 << chash_test_bits) * 4 / 5; if (!chash_test_iters) chash_test_iters = (1 << chash_test_bits) * 1000; if (chash_test_minfill >= (1 << chash_test_bits)) { pr_err("chash: test_minfill too big. Must be < table size.\n"); return 0; } if (chash_test_maxfill >= (1 << chash_test_bits)) { pr_err("chash: test_maxfill too big. Must be < table size.\n"); return 0; } if (chash_test_minfill >= chash_test_maxfill) { pr_err("chash: test_minfill must be < test_maxfill.\n"); return 0; } if (chash_test_keysize == 4 && chash_test_iters > 0xffffffff) { pr_err("chash: test_iters must be < 4G for 4 byte keys.\n"); return 0; } ts1_ns = local_clock(); ret = chash_self_test(chash_test_bits, chash_test_keysize, chash_test_minfill, chash_test_maxfill, chash_test_iters); if (!ret) { u64 ts_delta_us = local_clock() - ts1_ns; u64 iters_per_second = (u64)chash_test_iters * 1000000; do_div(ts_delta_us, 1000); do_div(iters_per_second, ts_delta_us); pr_info("chash: self test took %llu us, %llu iterations/s\n", ts_delta_us, iters_per_second); } else { pr_err("chash: self test failed: %d\n", ret); } return ret; } module_init(chash_init); #endif /* CONFIG_CHASH_SELFTEST */ MODULE_DESCRIPTION("Closed hash table"); MODULE_LICENSE("GPL and additional rights");