Contributors: 1
Author Tokens Token Proportion Commits Commit Proportion
Felix Kuhling 2759 100.00% 2 100.00%
Total 2759 2


/*
 * Copyright 2017 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 */

#include <linux/types.h>
#include <linux/hash.h>
#include <linux/bug.h>
#include <linux/slab.h>
#include <linux/module.h>
#include <linux/sched/clock.h>
#include <asm/div64.h>
#include <linux/chash.h>

/**
 * chash_table_alloc - Allocate closed hash table
 * @table: Pointer to the table structure
 * @bits: Table size will be 2^bits entries
 * @key_size: Size of hash keys in bytes, 4 or 8
 * @value_size: Size of data values in bytes, can be 0
 */
int chash_table_alloc(struct chash_table *table, u8 bits, u8 key_size,
		      unsigned int value_size, gfp_t gfp_mask)
{
	if (bits > 31)
		return -EINVAL;

	if (key_size != 4 && key_size != 8)
		return -EINVAL;

	table->data = kcalloc(__CHASH_DATA_SIZE(bits, key_size, value_size),
		       sizeof(long), gfp_mask);
	if (!table->data)
		return -ENOMEM;

	__CHASH_TABLE_INIT(table->table, table->data,
			   bits, key_size, value_size);

	return 0;
}
EXPORT_SYMBOL(chash_table_alloc);

/**
 * chash_table_free - Free closed hash table
 * @table: Pointer to the table structure
 */
void chash_table_free(struct chash_table *table)
{
	kfree(table->data);
}
EXPORT_SYMBOL(chash_table_free);

#ifdef CONFIG_CHASH_STATS

#define DIV_FRAC(nom, denom, quot, frac, frac_digits) do {		\
		u64 __nom = (nom);					\
		u64 __denom = (denom);					\
		u64 __quot, __frac;					\
		u32 __rem;						\
									\
		while (__denom >> 32) {					\
			__nom   >>= 1;					\
			__denom >>= 1;					\
		}							\
		__quot = __nom;						\
		__rem  = do_div(__quot, __denom);			\
		__frac = __rem * (frac_digits) + (__denom >> 1);	\
		do_div(__frac, __denom);				\
		(quot) = __quot;					\
		(frac) = __frac;					\
	} while (0)

void __chash_table_dump_stats(struct __chash_table *table)
{
	struct chash_iter iter = CHASH_ITER_INIT(table, 0);
	u32 filled = 0, empty = 0, tombstones = 0;
	u64 quot1, quot2;
	u32 frac1, frac2;

	do {
		if (chash_iter_is_valid(iter))
			filled++;
		else if (chash_iter_is_empty(iter))
			empty++;
		else
			tombstones++;
		CHASH_ITER_INC(iter);
	} while (iter.slot);

	pr_debug("chash: key size %u, value size %u\n",
		 table->key_size, table->value_size);
	pr_debug("  Slots total/filled/empty/tombstones: %u / %u / %u / %u\n",
		 1 << table->bits, filled, empty, tombstones);
	if (table->hits > 0) {
		DIV_FRAC(table->hits_steps, table->hits, quot1, frac1, 1000);
		DIV_FRAC(table->hits * 1000, table->hits_time_ns,
			 quot2, frac2, 1000);
	} else {
		quot1 = quot2 = 0;
		frac1 = frac2 = 0;
	}
	pr_debug("  Hits   (avg.cost, rate): %llu (%llu.%03u, %llu.%03u M/s)\n",
		 table->hits, quot1, frac1, quot2, frac2);
	if (table->miss > 0) {
		DIV_FRAC(table->miss_steps, table->miss, quot1, frac1, 1000);
		DIV_FRAC(table->miss * 1000, table->miss_time_ns,
			 quot2, frac2, 1000);
	} else {
		quot1 = quot2 = 0;
		frac1 = frac2 = 0;
	}
	pr_debug("  Misses (avg.cost, rate): %llu (%llu.%03u, %llu.%03u M/s)\n",
		 table->miss, quot1, frac1, quot2, frac2);
	if (table->hits + table->miss > 0) {
		DIV_FRAC(table->hits_steps + table->miss_steps,
			 table->hits + table->miss, quot1, frac1, 1000);
		DIV_FRAC((table->hits + table->miss) * 1000,
			 (table->hits_time_ns + table->miss_time_ns),
			 quot2, frac2, 1000);
	} else {
		quot1 = quot2 = 0;
		frac1 = frac2 = 0;
	}
	pr_debug("  Total  (avg.cost, rate): %llu (%llu.%03u, %llu.%03u M/s)\n",
		 table->hits + table->miss, quot1, frac1, quot2, frac2);
	if (table->relocs > 0) {
		DIV_FRAC(table->hits + table->miss, table->relocs,
			 quot1, frac1, 1000);
		DIV_FRAC(table->reloc_dist, table->relocs, quot2, frac2, 1000);
		pr_debug("  Relocations (freq, avg.dist): %llu (1:%llu.%03u, %llu.%03u)\n",
			 table->relocs, quot1, frac1, quot2, frac2);
	} else {
		pr_debug("  No relocations\n");
	}
}
EXPORT_SYMBOL(__chash_table_dump_stats);

#undef DIV_FRAC
#endif

#define CHASH_INC(table, a) ((a) = ((a) + 1) & (table)->size_mask)
#define CHASH_ADD(table, a, b) (((a) + (b)) & (table)->size_mask)
#define CHASH_SUB(table, a, b) (((a) - (b)) & (table)->size_mask)
#define CHASH_IN_RANGE(table, slot, first, last) \
	(CHASH_SUB(table, slot, first) <= CHASH_SUB(table, last, first))

/*#define CHASH_DEBUG Uncomment this to enable verbose debug output*/
#ifdef CHASH_DEBUG
static void chash_table_dump(struct __chash_table *table)
{
	struct chash_iter iter = CHASH_ITER_INIT(table, 0);

	do {
		if ((iter.slot & 3) == 0)
			pr_debug("%04x: ", iter.slot);

		if (chash_iter_is_valid(iter))
			pr_debug("[%016llx] ", chash_iter_key(iter));
		else if (chash_iter_is_empty(iter))
			pr_debug("[    <empty>     ] ");
		else
			pr_debug("[  <tombstone>   ] ");

		if ((iter.slot & 3) == 3)
			pr_debug("\n");

		CHASH_ITER_INC(iter);
	} while (iter.slot);

	if ((iter.slot & 3) != 0)
		pr_debug("\n");
}

static int chash_table_check(struct __chash_table *table)
{
	u32 hash;
	struct chash_iter iter = CHASH_ITER_INIT(table, 0);
	struct chash_iter cur = CHASH_ITER_INIT(table, 0);

	do {
		if (!chash_iter_is_valid(iter)) {
			CHASH_ITER_INC(iter);
			continue;
		}

		hash = chash_iter_hash(iter);
		CHASH_ITER_SET(cur, hash);
		while (cur.slot != iter.slot) {
			if (chash_iter_is_empty(cur)) {
				pr_err("Path to element at %x with hash %x broken at slot %x\n",
				       iter.slot, hash, cur.slot);
				chash_table_dump(table);
				return -EINVAL;
			}
			CHASH_ITER_INC(cur);
		}

		CHASH_ITER_INC(iter);
	} while (iter.slot);

	return 0;
}
#endif

static void chash_iter_relocate(struct chash_iter dst, struct chash_iter src)
{
	BUG_ON(src.table == dst.table && src.slot == dst.slot);
	BUG_ON(src.table->key_size != dst.table->key_size);
	BUG_ON(src.table->value_size != dst.table->value_size);

	if (dst.table->key_size == 4)
		dst.table->keys32[dst.slot] = src.table->keys32[src.slot];
	else
		dst.table->keys64[dst.slot] = src.table->keys64[src.slot];

	if (dst.table->value_size)
		memcpy(chash_iter_value(dst), chash_iter_value(src),
		       dst.table->value_size);

	chash_iter_set_valid(dst);
	chash_iter_set_invalid(src);

#ifdef CONFIG_CHASH_STATS
	if (src.table == dst.table) {
		dst.table->relocs++;
		dst.table->reloc_dist +=
			CHASH_SUB(dst.table, src.slot, dst.slot);
	}
#endif
}

/**
 * __chash_table_find - Helper for looking up a hash table entry
 * @iter: Pointer to hash table iterator
 * @key: Key of the entry to find
 * @for_removal: set to true if the element will be removed soon
 *
 * Searches for an entry in the hash table with a given key. iter must
 * be initialized by the caller to point to the home position of the
 * hypothetical entry, i.e. it must be initialized with the hash table
 * and the key's hash as the initial slot for the search.
 *
 * This function also does some local clean-up to speed up future
 * look-ups by relocating entries to better slots and removing
 * tombstones that are no longer needed.
 *
 * If @for_removal is true, the function avoids relocating the entry
 * that is being returned.
 *
 * Returns 0 if the search is successful. In this case iter is updated
 * to point to the found entry. Otherwise %-EINVAL is returned and the
 * iter is updated to point to the first available slot for the given
 * key. If the table is full, the slot is set to -1.
 */
static int chash_table_find(struct chash_iter *iter, u64 key,
			    bool for_removal)
{
#ifdef CONFIG_CHASH_STATS
	u64 ts1 = local_clock();
#endif
	u32 hash = iter->slot;
	struct chash_iter first_redundant = CHASH_ITER_INIT(iter->table, -1);
	int first_avail = (for_removal ? -2 : -1);

	while (!chash_iter_is_valid(*iter) || chash_iter_key(*iter) != key) {
		if (chash_iter_is_empty(*iter)) {
			/* Found an empty slot, which ends the
			 * search. Clean up any preceding tombstones
			 * that are no longer needed because they lead
			 * to no-where
			 */
			if ((int)first_redundant.slot < 0)
				goto not_found;
			while (first_redundant.slot != iter->slot) {
				if (!chash_iter_is_valid(first_redundant))
					chash_iter_set_empty(first_redundant);
				CHASH_ITER_INC(first_redundant);
			}
#ifdef CHASH_DEBUG
			chash_table_check(iter->table);
#endif
			goto not_found;
		} else if (!chash_iter_is_valid(*iter)) {
			/* Found a tombstone. Remember it as candidate
			 * for relocating the entry we're looking for
			 * or for adding a new entry with the given key
			 */
			if (first_avail == -1)
				first_avail = iter->slot;
			/* Or mark it as the start of a series of
			 * potentially redundant tombstones
			 */
			else if (first_redundant.slot == -1)
				CHASH_ITER_SET(first_redundant, iter->slot);
		} else if (first_redundant.slot >= 0) {
			/* Found a valid, occupied slot with a
			 * preceding series of tombstones. Relocate it
			 * to a better position that no longer depends
			 * on those tombstones
			 */
			u32 cur_hash = chash_iter_hash(*iter);

			if (!CHASH_IN_RANGE(iter->table, cur_hash,
					    first_redundant.slot + 1,
					    iter->slot)) {
				/* This entry has a hash at or before
				 * the first tombstone we found. We
				 * can relocate it to that tombstone
				 * and advance to the next tombstone
				 */
				chash_iter_relocate(first_redundant, *iter);
				do {
					CHASH_ITER_INC(first_redundant);
				} while (chash_iter_is_valid(first_redundant));
			} else if (cur_hash != iter->slot) {
				/* Relocate entry to its home position
				 * or as close as possible so it no
				 * longer depends on any preceding
				 * tombstones
				 */
				struct chash_iter new_iter =
					CHASH_ITER_INIT(iter->table, cur_hash);

				while (new_iter.slot != iter->slot &&
				       chash_iter_is_valid(new_iter))
					CHASH_ITER_INC(new_iter);

				if (new_iter.slot != iter->slot)
					chash_iter_relocate(new_iter, *iter);
			}
		}

		CHASH_ITER_INC(*iter);
		if (iter->slot == hash) {
			iter->slot = -1;
			goto not_found;
		}
	}

#ifdef CONFIG_CHASH_STATS
	iter->table->hits++;
	iter->table->hits_steps += CHASH_SUB(iter->table, iter->slot, hash) + 1;
#endif

	if (first_avail >= 0) {
		CHASH_ITER_SET(first_redundant, first_avail);
		chash_iter_relocate(first_redundant, *iter);
		iter->slot = first_redundant.slot;
		iter->mask = first_redundant.mask;
	}

#ifdef CONFIG_CHASH_STATS
	iter->table->hits_time_ns += local_clock() - ts1;
#endif

	return 0;

not_found:
#ifdef CONFIG_CHASH_STATS
	iter->table->miss++;
	iter->table->miss_steps += (iter->slot < 0) ?
		(1 << iter->table->bits) :
		CHASH_SUB(iter->table, iter->slot, hash) + 1;
#endif

	if (first_avail >= 0)
		CHASH_ITER_SET(*iter, first_avail);

#ifdef CONFIG_CHASH_STATS
	iter->table->miss_time_ns += local_clock() - ts1;
#endif

	return -EINVAL;
}

int __chash_table_copy_in(struct __chash_table *table, u64 key,
			  const void *value)
{
	u32 hash = (table->key_size == 4) ?
		hash_32(key, table->bits) : hash_64(key, table->bits);
	struct chash_iter iter = CHASH_ITER_INIT(table, hash);
	int r = chash_table_find(&iter, key, false);

	/* Found an existing entry */
	if (!r) {
		if (value && table->value_size)
			memcpy(chash_iter_value(iter), value,
			       table->value_size);
		return 1;
	}

	/* Is there a place to add a new entry? */
	if (iter.slot < 0) {
		pr_err("Hash table overflow\n");
		return -ENOMEM;
	}

	chash_iter_set_valid(iter);

	if (table->key_size == 4)
		table->keys32[iter.slot] = key;
	else
		table->keys64[iter.slot] = key;
	if (value && table->value_size)
		memcpy(chash_iter_value(iter), value, table->value_size);

	return 0;
}
EXPORT_SYMBOL(__chash_table_copy_in);

int __chash_table_copy_out(struct __chash_table *table, u64 key,
			   void *value, bool remove)
{
	u32 hash = (table->key_size == 4) ?
		hash_32(key, table->bits) : hash_64(key, table->bits);
	struct chash_iter iter = CHASH_ITER_INIT(table, hash);
	int r = chash_table_find(&iter, key, remove);

	if (r < 0)
		return r;

	if (value && table->value_size)
		memcpy(value, chash_iter_value(iter), table->value_size);

	if (remove)
		chash_iter_set_invalid(iter);

	return iter.slot;
}
EXPORT_SYMBOL(__chash_table_copy_out);

#ifdef CONFIG_CHASH_SELFTEST
/**
 * chash_self_test - Run a self-test of the hash table implementation
 * @bits: Table size will be 2^bits entries
 * @key_size: Size of hash keys in bytes, 4 or 8
 * @min_fill: Minimum fill level during the test
 * @max_fill: Maximum fill level during the test
 * @iterations: Number of test iterations
 *
 * The test adds and removes entries from a hash table, cycling the
 * fill level between min_fill and max_fill entries. Also tests lookup
 * and value retrieval.
 */
static int __init chash_self_test(u8 bits, u8 key_size,
				  int min_fill, int max_fill,
				  u64 iterations)
{
	struct chash_table table;
	int ret;
	u64 add_count, rmv_count;
	u64 value;

	if (key_size == 4 && iterations > 0xffffffff)
		return -EINVAL;
	if (min_fill >= max_fill)
		return -EINVAL;

	ret = chash_table_alloc(&table, bits, key_size, sizeof(u64),
				GFP_KERNEL);
	if (ret) {
		pr_err("chash_table_alloc failed: %d\n", ret);
		return ret;
	}

	for (add_count = 0, rmv_count = 0; add_count < iterations;
	     add_count++) {
		/* When we hit the max_fill level, remove entries down
		 * to min_fill
		 */
		if (add_count - rmv_count == max_fill) {
			u64 find_count = rmv_count;

			/* First try to find all entries that we're
			 * about to remove, confirm their value, test
			 * writing them back a second time.
			 */
			for (; add_count - find_count > min_fill;
			     find_count++) {
				ret = chash_table_copy_out(&table, find_count,
							   &value);
				if (ret < 0) {
					pr_err("chash_table_copy_out failed: %d\n",
					       ret);
					goto out;
				}
				if (value != ~find_count) {
					pr_err("Wrong value retrieved for key 0x%llx, expected 0x%llx got 0x%llx\n",
					       find_count, ~find_count, value);
#ifdef CHASH_DEBUG
					chash_table_dump(&table.table);
#endif
					ret = -EFAULT;
					goto out;
				}
				ret = chash_table_copy_in(&table, find_count,
							  &value);
				if (ret != 1) {
					pr_err("copy_in second time returned %d, expected 1\n",
					       ret);
					ret = -EFAULT;
					goto out;
				}
			}
			/* Remove them until we hit min_fill level */
			for (; add_count - rmv_count > min_fill; rmv_count++) {
				ret = chash_table_remove(&table, rmv_count,
							 NULL);
				if (ret < 0) {
					pr_err("chash_table_remove failed: %d\n",
					       ret);
					goto out;
				}
			}
		}

		/* Add a new value */
		value = ~add_count;
		ret = chash_table_copy_in(&table, add_count, &value);
		if (ret != 0) {
			pr_err("copy_in first time returned %d, expected 0\n",
			       ret);
			ret = -EFAULT;
			goto out;
		}
	}

	chash_table_dump_stats(&table);
	chash_table_reset_stats(&table);

out:
	chash_table_free(&table);
	return ret;
}

static unsigned int chash_test_bits = 10;
MODULE_PARM_DESC(test_bits,
		 "Selftest number of hash bits ([4..20], default=10)");
module_param_named(test_bits, chash_test_bits, uint, 0444);

static unsigned int chash_test_keysize = 8;
MODULE_PARM_DESC(test_keysize, "Selftest keysize (4 or 8, default=8)");
module_param_named(test_keysize, chash_test_keysize, uint, 0444);

static unsigned int chash_test_minfill;
MODULE_PARM_DESC(test_minfill, "Selftest minimum #entries (default=50%)");
module_param_named(test_minfill, chash_test_minfill, uint, 0444);

static unsigned int chash_test_maxfill;
MODULE_PARM_DESC(test_maxfill, "Selftest maximum #entries (default=80%)");
module_param_named(test_maxfill, chash_test_maxfill, uint, 0444);

static unsigned long chash_test_iters;
MODULE_PARM_DESC(test_iters, "Selftest iterations (default=1000 x #entries)");
module_param_named(test_iters, chash_test_iters, ulong, 0444);

static int __init chash_init(void)
{
	int ret;
	u64 ts1_ns;

	/* Skip self test on user errors */
	if (chash_test_bits < 4 || chash_test_bits > 20) {
		pr_err("chash: test_bits out of range [4..20].\n");
		return 0;
	}
	if (chash_test_keysize != 4 && chash_test_keysize != 8) {
		pr_err("chash: test_keysize invalid. Must be 4 or 8.\n");
		return 0;
	}

	if (!chash_test_minfill)
		chash_test_minfill = (1 << chash_test_bits) / 2;
	if (!chash_test_maxfill)
		chash_test_maxfill = (1 << chash_test_bits) * 4 / 5;
	if (!chash_test_iters)
		chash_test_iters = (1 << chash_test_bits) * 1000;

	if (chash_test_minfill >= (1 << chash_test_bits)) {
		pr_err("chash: test_minfill too big. Must be < table size.\n");
		return 0;
	}
	if (chash_test_maxfill >= (1 << chash_test_bits)) {
		pr_err("chash: test_maxfill too big. Must be < table size.\n");
		return 0;
	}
	if (chash_test_minfill >= chash_test_maxfill) {
		pr_err("chash: test_minfill must be < test_maxfill.\n");
		return 0;
	}
	if (chash_test_keysize == 4 && chash_test_iters > 0xffffffff) {
		pr_err("chash: test_iters must be < 4G for 4 byte keys.\n");
		return 0;
	}

	ts1_ns = local_clock();
	ret = chash_self_test(chash_test_bits, chash_test_keysize,
			      chash_test_minfill, chash_test_maxfill,
			      chash_test_iters);
	if (!ret) {
		u64 ts_delta_us = local_clock() - ts1_ns;
		u64 iters_per_second = (u64)chash_test_iters * 1000000;

		do_div(ts_delta_us, 1000);
		do_div(iters_per_second, ts_delta_us);
		pr_info("chash: self test took %llu us, %llu iterations/s\n",
			ts_delta_us, iters_per_second);
	} else {
		pr_err("chash: self test failed: %d\n", ret);
	}

	return ret;
}

module_init(chash_init);

#endif /* CONFIG_CHASH_SELFTEST */

MODULE_DESCRIPTION("Closed hash table");
MODULE_LICENSE("GPL and additional rights");