NetBSD/usr.bin/config/hash.c

/*	$NetBSD: hash.c,v 1.11 2014/10/29 17:14:50 christos Exp $	*/

/*
 * Copyright (c) 1992, 1993
 *	The Regents of the University of California.  All rights reserved.
 *
 * This software was developed by the Computer Systems Engineering group
 * at Lawrence Berkeley Laboratory under DARPA contract BG 91-66 and
 * contributed to Berkeley.
 *
 * All advertising materials mentioning features or use of this software
 * must display the following acknowledgement:
 *	This product includes software developed by the University of
 *	California, Lawrence Berkeley Laboratories.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 *	from: @(#)hash.c	8.1 (Berkeley) 6/6/93
 */

#if HAVE_NBTOOL_CONFIG_H
#include "nbtool_config.h"
#endif

#include <sys/cdefs.h>
__RCSID("$NetBSD: hash.c,v 1.11 2014/10/29 17:14:50 christos Exp $");

#include <sys/param.h>
#include <assert.h>
#include <stdlib.h>
#include <string.h>
#include <util.h>
#include "defs.h"

/*
 * Interned strings are kept in a hash table.  By making each string
 * unique, the program can compare strings by comparing pointers.
 */
struct hashent {
	// XXXLUKEM: a SIMPLEQ might be more appropriate
	TAILQ_ENTRY(hashent) h_next;
	const char *h_names[2];		/* the string */
#define	h_name1	h_names[0]
#define	h_name2	h_names[1]
#define	h_name	h_name1
	u_int	h_hash;			/* its hash value */
	void	*h_value;		/* other values (for name=value) */
};
struct hashtab {
	size_t	ht_size;		/* size (power of 2) */
	size_t	ht_mask;		/* == ht_size - 1 */
	size_t	ht_used;		/* number of entries used */
	size_t	ht_lim;			/* when to expand */
	TAILQ_HEAD(hashenthead, hashent) *ht_tab;
};

static struct hashtab strings;

/*
 * HASHFRACTION controls ht_lim, which in turn controls the average chain
 * length.  We allow a few entries, on average, as comparing them is usually
 * cheap (the h_hash values prevent a strcmp).
 */
#define	HASHFRACTION(sz) ((sz) * 3 / 2)

static void			ht_expand(struct hashtab *);
static void			ht_init(struct hashtab *, size_t);
static inline u_int		hash(u_int, const char *);
static inline u_int		hash2(u_int, const char *, const char *);
static inline struct hashent   *newhashent(const char *, u_int);

/*
 * Initialize a new hash table.  The size must be a power of 2.
 */
static void
ht_init(struct hashtab *ht, size_t sz)
{
	u_int n;

	ht->ht_tab = emalloc(sz * sizeof (ht->ht_tab[0]));
	ht->ht_size = sz;
	ht->ht_mask = sz - 1;
	for (n = 0; n < sz; n++)
		TAILQ_INIT(&ht->ht_tab[n]);
	ht->ht_used = 0;
	ht->ht_lim = HASHFRACTION(sz);
}

/*
 * Expand an existing hash table.
 */
static void
ht_expand(struct hashtab *ht)
{
	struct hashenthead *h, *oldh;
	struct hashent *p;
	size_t n, i;

	n = ht->ht_size * 2;
	h = emalloc(n * sizeof *h);
	for (i = 0; i < n; i++)
		TAILQ_INIT(&h[i]);
	oldh = ht->ht_tab;
	n--;
	for (i = 0; i < ht->ht_size; i++) {
		while ((p = TAILQ_FIRST(&oldh[i])) != NULL) {
			TAILQ_REMOVE(&oldh[i], p, h_next);
				// XXXLUKEM: really should be TAILQ_INSERT_TAIL
			TAILQ_INSERT_HEAD(&h[p->h_hash & n], p, h_next);
		}
	}
	free(ht->ht_tab);
	ht->ht_tab = h;
	ht->ht_mask = n;
	ht->ht_size = ++n;
	ht->ht_lim = HASHFRACTION(n);
}

/*
 * Make a new hash entry, setting its h_next to NULL.
 * If the free list is not empty, use the first entry from there,
 * otherwise allocate a new entry.
 */
static inline struct hashent *
newhashent2(const char *name1, const char *name2, u_int h)
{
	struct hashent *hp;

	hp = ecalloc(1, sizeof(*hp));

	hp->h_name1 = name1;
	hp->h_name2 = name2;
	hp->h_hash = h;
	return (hp);
}

static inline struct hashent *
newhashent(const char *name, u_int h)
{
	return newhashent2(name, NULL, h);
}

static inline u_int
hv(u_int h, char c)
{
	return (h << 5) + h + (unsigned char)c;
}

/*
 * Hash a string.
 */
static inline u_int
hash(u_int h, const char *str)
{

	while (str && *str)
		h = hv(h, *str++);
	return (h);
}

#define	HASH2DELIM	' '

static inline u_int
hash2(u_int h, const char *str1, const char *str2)
{

	h = hash(h, str1);
	h = hv(h, HASH2DELIM);
	h = hash(h, str2);
	return (h);
}

void
initintern(void)
{

	ht_init(&strings, 128);
}

/*
 * Generate a single unique copy of the given string.  We expect this
 * function to be used frequently, so it should be fast.
 */
const char *
intern(const char *s)
{
	struct hashtab *ht;
	struct hashent *hp;
	struct hashenthead *hpp;
	u_int h;
	char *p;

	ht = &strings;
	h = hash2(0, s, NULL);
	hpp = &ht->ht_tab[h & ht->ht_mask];
	TAILQ_FOREACH(hp, hpp, h_next) {
		if (hp->h_hash == h && strcmp(hp->h_name, s) == 0)
			return (hp->h_name);
	}
	p = estrdup(s);
	hp = newhashent(p, h);
	TAILQ_INSERT_TAIL(hpp, hp, h_next);
	if (++ht->ht_used > ht->ht_lim)
		ht_expand(ht);
	return (p);
}

struct hashtab *
ht_new(void)
{
	struct hashtab *ht;

	ht = ecalloc(1, sizeof *ht);
	ht_init(ht, 8);
	return (ht);
}

void
ht_free(struct hashtab *ht)
{
	size_t i;
	struct hashent *hp;
	struct hashenthead *hpp;

	for (i = 0; i < ht->ht_size; i++) {
		hpp = &ht->ht_tab[i];
		while ((hp = TAILQ_FIRST(hpp)) != NULL) {
			TAILQ_REMOVE(hpp, hp, h_next);
			free(hp);
			ht->ht_used--;
		}
	}

	assert(ht->ht_used == 0);
	free(ht->ht_tab);
	free(ht);
}

/*
 * Insert and/or replace.
 */
int
ht_insrep2(struct hashtab *ht, const char *nam1, const char *nam2, void *val, int replace)
{
	struct hashent *hp;
	struct hashenthead *hpp;
	u_int h;

	h = hash2(0, nam1, nam2);
	hpp = &ht->ht_tab[h & ht->ht_mask];
	TAILQ_FOREACH(hp, hpp, h_next) {
		if (hp->h_name1 == nam1 &&
		    hp->h_name2 == nam2) {
			if (replace)
				hp->h_value = val;
			return (1);
		}
	}
	hp = newhashent2(nam1, nam2, h);
	TAILQ_INSERT_TAIL(hpp, hp, h_next);
	hp->h_value = val;
	if (++ht->ht_used > ht->ht_lim)
		ht_expand(ht);
	return (0);
}

int
ht_insrep(struct hashtab *ht, const char *nam, void *val, int replace)
{
	return ht_insrep2(ht, nam, NULL, val, replace);
}

/*
 * Remove.
 */
int
ht_remove2(struct hashtab *ht, const char *name1, const char *name2)
{
	struct hashent *hp;
	struct hashenthead *hpp;
	u_int h;

	h = hash2(0, name1, name2);
	hpp = &ht->ht_tab[h & ht->ht_mask];

	TAILQ_FOREACH(hp, hpp, h_next) {
		if (hp->h_name1 != name1 || hp->h_name2 != name2)
			continue;
		TAILQ_REMOVE(hpp, hp, h_next);

		free(hp);
		ht->ht_used--;
		return (0);
	}
	return (1);
}

int
ht_remove(struct hashtab *ht, const char *name)
{
	return ht_remove2(ht, name, NULL);
}

void *
ht_lookup2(struct hashtab *ht, const char *nam1, const char *nam2)
{
	struct hashent *hp;
	struct hashenthead *hpp;
	u_int h;

	h = hash2(0, nam1, nam2);
	hpp = &ht->ht_tab[h & ht->ht_mask];
	TAILQ_FOREACH(hp, hpp, h_next)
		if (hp->h_name == nam1)
			return (hp->h_value);
	return (NULL);
}

void *
ht_lookup(struct hashtab *ht, const char *nam)
{
	return ht_lookup2(ht, nam, NULL);
}

/*
 * first parameter to callback is the entry name from the hash table
 * second parameter is the value from the hash table
 * third argument is passed through from the "arg" parameter to ht_enumerate()
 */

int
ht_enumerate2(struct hashtab *ht, ht_callback2 cbfunc2, void *arg)
{
	struct hashent *hp;
	struct hashenthead *hpp;
	size_t i;
	int rval = 0;

	for (i = 0; i < ht->ht_size; i++) {
		hpp = &ht->ht_tab[i];
		TAILQ_FOREACH(hp, hpp, h_next)
			rval += (*cbfunc2)(hp->h_name1, hp->h_name2, hp->h_value, arg);
	}
	return rval;
}

int
ht_enumerate(struct hashtab *ht, ht_callback cbfunc, void *arg)
{
	struct hashent *hp;
	struct hashenthead *hpp;
	size_t i;
	int rval = 0;

	for (i = 0; i < ht->ht_size; i++) {
		hpp = &ht->ht_tab[i];
		TAILQ_FOREACH(hp, hpp, h_next)
			rval += (*cbfunc)(hp->h_name, hp->h_value, arg);
	}
	return rval;
}

/************************************************************/

/*
 * Type-safe wrappers.
 */

#define DEFHASH(HT, VT) \
	struct HT {						\
		struct hashtab imp;				\
	};							\
								\
	struct HT *						\
	HT##_create(void)					\
	{							\
		struct HT *tbl;					\
								\
		tbl = ecalloc(1, sizeof(*tbl));			\
		ht_init(&tbl->imp, 8);				\
		return tbl;					\
	}							\
								\
	int							\
	HT##_insert(struct HT *tbl, const char *name, struct VT *val) \
	{							\
		return ht_insert(&tbl->imp, name, val);		\
	}							\
								\
	int							\
	HT##_replace(struct HT *tbl, const char *name, struct VT *val) \
	{							\
		return ht_replace(&tbl->imp, name, val);	\
	}							\
								\
	int							\
	HT##_remove(struct HT *tbl, const char *name)		\
	{							\
		return ht_remove(&tbl->imp, name);		\
	}							\
								\
	struct VT *						\
	HT##_lookup(struct HT *tbl, const char *name)		\
	{							\
		return ht_lookup(&tbl->imp, name);		\
	}							\
								\
	struct HT##_enumcontext {				\
		int (*func)(const char *, struct VT *, void *);	\
		void *userctx;					\
	};							\
								\
	static int						\
	HT##_enumerate_thunk(const char *name, void *value, void *voidctx) \
	{							\
		struct HT##_enumcontext *ctx = voidctx;		\
								\
		return ctx->func(name, value, ctx->userctx);	\
	}							\
								\
	int							\
	HT##_enumerate(struct HT *tbl,				\
		      int (*func)(const char *, struct VT *, void *), \
		      void *userctx)				\
	{							\
		struct HT##_enumcontext ctx;			\
								\
		ctx.func = func;				\
		ctx.userctx = userctx;				\
		return ht_enumerate(&tbl->imp, HT##_enumerate_thunk, &ctx); \
	}

DEFHASH(nvhash, nvlist);
DEFHASH(dlhash, defoptlist);