Home | History | Annotate | Line # | Download | only in npf
npf_tableset.c revision 1.22
      1  1.22   rmind /*	$NetBSD: npf_tableset.c,v 1.22 2014/08/11 01:54:12 rmind Exp $	*/
      2   1.1   rmind 
      3   1.1   rmind /*-
      4  1.21   rmind  * Copyright (c) 2009-2014 The NetBSD Foundation, Inc.
      5   1.1   rmind  * All rights reserved.
      6   1.1   rmind  *
      7   1.1   rmind  * This material is based upon work partially supported by The
      8   1.1   rmind  * NetBSD Foundation under a contract with Mindaugas Rasiukevicius.
      9   1.1   rmind  *
     10   1.1   rmind  * Redistribution and use in source and binary forms, with or without
     11   1.1   rmind  * modification, are permitted provided that the following conditions
     12   1.1   rmind  * are met:
     13   1.1   rmind  * 1. Redistributions of source code must retain the above copyright
     14   1.1   rmind  *    notice, this list of conditions and the following disclaimer.
     15   1.1   rmind  * 2. Redistributions in binary form must reproduce the above copyright
     16   1.1   rmind  *    notice, this list of conditions and the following disclaimer in the
     17   1.1   rmind  *    documentation and/or other materials provided with the distribution.
     18   1.1   rmind  *
     19   1.1   rmind  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20   1.1   rmind  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21   1.1   rmind  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22   1.1   rmind  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23   1.1   rmind  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24   1.1   rmind  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25   1.1   rmind  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26   1.1   rmind  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27   1.1   rmind  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28   1.1   rmind  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29   1.1   rmind  * POSSIBILITY OF SUCH DAMAGE.
     30   1.1   rmind  */
     31   1.1   rmind 
     32   1.1   rmind /*
     33   1.4   rmind  * NPF tableset module.
     34   1.1   rmind  *
     35  1.15   rmind  * Notes
     36  1.15   rmind  *
     37  1.15   rmind  *	The tableset is an array of tables.  After the creation, the array
     38  1.15   rmind  *	is immutable.  The caller is responsible to synchronise the access
     39  1.15   rmind  *	to the tableset.  The table can either be a hash or a tree.  Its
     40  1.15   rmind  *	entries are protected by a read-write lock.
     41   1.1   rmind  */
     42   1.1   rmind 
     43   1.1   rmind #include <sys/cdefs.h>
     44  1.22   rmind __KERNEL_RCSID(0, "$NetBSD: npf_tableset.c,v 1.22 2014/08/11 01:54:12 rmind Exp $");
     45   1.1   rmind 
     46   1.1   rmind #include <sys/param.h>
     47  1.10   rmind #include <sys/types.h>
     48   1.1   rmind 
     49   1.1   rmind #include <sys/atomic.h>
     50   1.1   rmind #include <sys/hash.h>
     51  1.21   rmind #include <sys/cdbr.h>
     52   1.1   rmind #include <sys/kmem.h>
     53  1.21   rmind #include <sys/malloc.h>
     54   1.1   rmind #include <sys/pool.h>
     55   1.1   rmind #include <sys/queue.h>
     56   1.1   rmind #include <sys/rwlock.h>
     57   1.1   rmind #include <sys/systm.h>
     58   1.1   rmind #include <sys/types.h>
     59   1.1   rmind 
     60   1.1   rmind #include "npf_impl.h"
     61   1.1   rmind 
/*
 * A single table entry.  The linkage is a union because an entry lives
 * either on a hash bucket list (te_hashent) or in a ptree (te_node),
 * depending on the storage type of the table which owns it.
 */
typedef struct npf_tblent {
	union {
		LIST_ENTRY(npf_tblent) te_hashent;
		pt_node_t	te_node;
	} /* C11 */;
	/* Length of the address in bytes, followed by the address itself. */
	int			te_alen;
	npf_addr_t		te_addr;
} npf_tblent_t;

/* Head of a hash bucket: a list of table entries. */
LIST_HEAD(npf_hashl, npf_tblent);
     72   1.1   rmind 
struct npf_table {
	/*
	 * The storage type can be: a) hash b) tree c) cdb.
	 * There are separate trees for IPv4 and IPv6.
	 * Only the union member matching t_type is valid.
	 */
	union {
		struct {
			/* Hash: bucket array and the mask used to index it. */
			struct npf_hashl *t_hashl;
			u_long		t_hashmask;
		};
		struct {
			/* Tree: index 0 is IPv4, index 1 is IPv6. */
			pt_tree_t	t_tree[2];
		};
		struct {
			/*
			 * CDB: the raw memory blob, its size and the reader
			 * handle opened on top of it.
			 */
			void *		t_blob;
			size_t		t_bsize;
			struct cdbr *	t_cdb;
		};
	} /* C11 */;

	/*
	 * Table ID, type and lock.  The ID may change during the
	 * config reload, it is protected by the npf_config_lock.
	 */
	int			t_type;
	u_int			t_id;
	krwlock_t		t_lock;

	/* The number of items, reference count and table name. */
	u_int			t_nitems;
	u_int			t_refcnt;
	char			t_name[NPF_TABLE_MAXNAMELEN];
};
    106  1.19   rmind 
/*
 * The tableset: a slot count followed by a flexible array of table
 * pointers indexed by table ID.  An unused slot holds NULL.
 */
struct npf_tableset {
	u_int			ts_nitems;
	npf_table_t *		ts_map[];
};
    111   1.1   rmind 
/*
 * NPF_TABLESET_SIZE: size in bytes of a tableset with 'n' table slots.
 *
 * The offset of the n-th element of the flexible array member is already
 * a byte count (the header plus n pointers), so it must not be scaled by
 * the pointer size again.
 */
#define	NPF_TABLESET_SIZE(n)	\
    (offsetof(npf_tableset_t, ts_map[n]))
    114  1.19   rmind 
/*
 * Map the address length in bytes to the index of the per-family tree:
 * a 4-byte (IPv4) address yields 0 and a 16-byte (IPv6) address yields 1.
 */
#define	NPF_ADDRLEN2TREE(alen)	((alen) >> 4)

/* Pool cache from which the table entries (npf_tblent_t) are allocated. */
static pool_cache_t		tblent_cache	__read_mostly;
    118   1.1   rmind 
/*
 * npf_tableset_sysinit: initialise tableset structures.
 *
 * Creates the pool cache used to allocate the table entries.
 */
void
npf_tableset_sysinit(void)
{
	tblent_cache = pool_cache_init(sizeof(npf_tblent_t), coherency_unit,
	    0, 0, "npftblpl", NULL, IPL_NONE, NULL, NULL, NULL);
}
    128   1.1   rmind 
/*
 * npf_tableset_sysfini: destroy the pool cache of the table entries.
 */
void
npf_tableset_sysfini(void)
{
	pool_cache_destroy(tblent_cache);
}
    134   1.1   rmind 
    135   1.1   rmind npf_tableset_t *
    136  1.19   rmind npf_tableset_create(u_int nitems)
    137   1.1   rmind {
    138  1.19   rmind 	npf_tableset_t *ts = kmem_zalloc(NPF_TABLESET_SIZE(nitems), KM_SLEEP);
    139  1.19   rmind 	ts->ts_nitems = nitems;
    140  1.19   rmind 	return ts;
    141   1.1   rmind }
    142   1.1   rmind 
    143   1.1   rmind void
    144  1.19   rmind npf_tableset_destroy(npf_tableset_t *ts)
    145   1.1   rmind {
    146   1.1   rmind 	/*
    147  1.19   rmind 	 * Destroy all tables (no references should be held, since the
    148  1.19   rmind 	 * ruleset should be destroyed before).
    149   1.1   rmind 	 */
    150  1.19   rmind 	for (u_int tid = 0; tid < ts->ts_nitems; tid++) {
    151  1.19   rmind 		npf_table_t *t = ts->ts_map[tid];
    152  1.19   rmind 
    153  1.17   rmind 		if (t && atomic_dec_uint_nv(&t->t_refcnt) == 0) {
    154   1.1   rmind 			npf_table_destroy(t);
    155   1.1   rmind 		}
    156   1.1   rmind 	}
    157  1.19   rmind 	kmem_free(ts, NPF_TABLESET_SIZE(ts->ts_nitems));
    158   1.1   rmind }
    159   1.1   rmind 
    160   1.1   rmind /*
    161   1.1   rmind  * npf_tableset_insert: insert the table into the specified tableset.
    162   1.1   rmind  *
    163  1.13   rmind  * => Returns 0 on success.  Fails and returns error if ID is already used.
    164   1.1   rmind  */
    165   1.1   rmind int
    166  1.19   rmind npf_tableset_insert(npf_tableset_t *ts, npf_table_t *t)
    167   1.1   rmind {
    168   1.1   rmind 	const u_int tid = t->t_id;
    169   1.1   rmind 	int error;
    170   1.1   rmind 
    171  1.19   rmind 	KASSERT((u_int)tid < ts->ts_nitems);
    172   1.1   rmind 
    173  1.19   rmind 	if (ts->ts_map[tid] == NULL) {
    174  1.17   rmind 		atomic_inc_uint(&t->t_refcnt);
    175  1.19   rmind 		ts->ts_map[tid] = t;
    176   1.1   rmind 		error = 0;
    177   1.1   rmind 	} else {
    178   1.1   rmind 		error = EEXIST;
    179   1.1   rmind 	}
    180   1.1   rmind 	return error;
    181   1.1   rmind }
    182   1.1   rmind 
    183   1.1   rmind /*
    184  1.19   rmind  * npf_tableset_getbyname: look for a table in the set given the name.
    185  1.19   rmind  */
    186  1.19   rmind npf_table_t *
    187  1.19   rmind npf_tableset_getbyname(npf_tableset_t *ts, const char *name)
    188  1.19   rmind {
    189  1.19   rmind 	npf_table_t *t;
    190  1.19   rmind 
    191  1.19   rmind 	for (u_int tid = 0; tid < ts->ts_nitems; tid++) {
    192  1.19   rmind 		if ((t = ts->ts_map[tid]) == NULL)
    193  1.19   rmind 			continue;
    194  1.19   rmind 		if (strcmp(name, t->t_name) == 0)
    195  1.19   rmind 			return t;
    196  1.19   rmind 	}
    197  1.19   rmind 	return NULL;
    198  1.19   rmind }
    199  1.19   rmind 
    200  1.19   rmind npf_table_t *
    201  1.19   rmind npf_tableset_getbyid(npf_tableset_t *ts, u_int tid)
    202  1.19   rmind {
    203  1.19   rmind 	if (__predict_true(tid < ts->ts_nitems)) {
    204  1.19   rmind 		return ts->ts_map[tid];
    205  1.19   rmind 	}
    206  1.19   rmind 	return NULL;
    207  1.19   rmind }
    208  1.19   rmind 
    209  1.19   rmind /*
    210  1.15   rmind  * npf_tableset_reload: iterate all tables and if the new table is of the
    211  1.15   rmind  * same type and has no items, then we preserve the old one and its entries.
    212  1.15   rmind  *
    213  1.15   rmind  * => The caller is responsible for providing synchronisation.
    214  1.15   rmind  */
    215  1.15   rmind void
    216  1.19   rmind npf_tableset_reload(npf_tableset_t *nts, npf_tableset_t *ots)
    217  1.15   rmind {
    218  1.19   rmind 	for (u_int tid = 0; tid < nts->ts_nitems; tid++) {
    219  1.19   rmind 		npf_table_t *t, *ot;
    220  1.19   rmind 
    221  1.19   rmind 		if ((t = nts->ts_map[tid]) == NULL) {
    222  1.19   rmind 			continue;
    223  1.19   rmind 		}
    224  1.15   rmind 
    225  1.19   rmind 		/* If our table has entries, just load it. */
    226  1.19   rmind 		if (t->t_nitems) {
    227  1.15   rmind 			continue;
    228  1.15   rmind 		}
    229  1.19   rmind 
    230  1.19   rmind 		/* Look for a currently existing table with such name. */
    231  1.19   rmind 		ot = npf_tableset_getbyname(ots, t->t_name);
    232  1.19   rmind 		if (ot == NULL) {
    233  1.19   rmind 			/* Not found: we have a new table. */
    234  1.19   rmind 			continue;
    235  1.19   rmind 		}
    236  1.19   rmind 
    237  1.19   rmind 		/* Found.  Did the type change? */
    238  1.19   rmind 		if (t->t_type != ot->t_type) {
    239  1.19   rmind 			/* Yes, load the new. */
    240  1.15   rmind 			continue;
    241  1.15   rmind 		}
    242  1.17   rmind 
    243  1.17   rmind 		/*
    244  1.19   rmind 		 * Preserve the current table.  Acquire a reference since
    245  1.19   rmind 		 * we are keeping it in the old table set.  Update its ID.
    246  1.17   rmind 		 */
    247  1.17   rmind 		atomic_inc_uint(&ot->t_refcnt);
    248  1.19   rmind 		nts->ts_map[tid] = ot;
    249  1.19   rmind 
    250  1.19   rmind 		KASSERT(npf_config_locked_p());
    251  1.19   rmind 		ot->t_id = tid;
    252  1.17   rmind 
    253  1.21   rmind 		/* Destroy the new table (we hold the only reference). */
    254  1.17   rmind 		t->t_refcnt--;
    255  1.15   rmind 		npf_table_destroy(t);
    256  1.15   rmind 	}
    257  1.15   rmind }
    258  1.15   rmind 
    259  1.22   rmind int
    260  1.22   rmind npf_tableset_export(const npf_tableset_t *ts, prop_array_t tables)
    261  1.20   rmind {
    262  1.20   rmind 	const npf_table_t *t;
    263  1.20   rmind 
    264  1.20   rmind 	KASSERT(npf_config_locked_p());
    265  1.20   rmind 
    266  1.20   rmind 	for (u_int tid = 0; tid < ts->ts_nitems; tid++) {
    267  1.20   rmind 		if ((t = ts->ts_map[tid]) == NULL) {
    268  1.20   rmind 			continue;
    269  1.20   rmind 		}
    270  1.20   rmind 		prop_dictionary_t tdict = prop_dictionary_create();
    271  1.20   rmind 		prop_dictionary_set_cstring(tdict, "name", t->t_name);
    272  1.20   rmind 		prop_dictionary_set_uint32(tdict, "type", t->t_type);
    273  1.20   rmind 		prop_dictionary_set_uint32(tdict, "id", tid);
    274  1.20   rmind 
    275  1.20   rmind 		prop_array_add(tables, tdict);
    276  1.20   rmind 		prop_object_release(tdict);
    277  1.20   rmind 	}
    278  1.22   rmind 	return 0;
    279  1.20   rmind }
    280  1.20   rmind 
/*
 * A few helper routines.
 */
    284   1.1   rmind 
    285  1.13   rmind static npf_tblent_t *
    286  1.13   rmind table_hash_lookup(const npf_table_t *t, const npf_addr_t *addr,
    287  1.13   rmind     const int alen, struct npf_hashl **rhtbl)
    288   1.1   rmind {
    289  1.13   rmind 	const uint32_t hidx = hash32_buf(addr, alen, HASH32_BUF_INIT);
    290  1.13   rmind 	struct npf_hashl *htbl = &t->t_hashl[hidx & t->t_hashmask];
    291  1.13   rmind 	npf_tblent_t *ent;
    292   1.1   rmind 
    293  1.13   rmind 	/*
    294  1.13   rmind 	 * Lookup the hash table and check for duplicates.
    295  1.13   rmind 	 * Note: mask is ignored for the hash storage.
    296  1.13   rmind 	 */
    297  1.21   rmind 	LIST_FOREACH(ent, htbl, te_hashent) {
    298  1.13   rmind 		if (ent->te_alen != alen) {
    299  1.13   rmind 			continue;
    300  1.13   rmind 		}
    301  1.13   rmind 		if (memcmp(&ent->te_addr, addr, alen) == 0) {
    302  1.13   rmind 			break;
    303  1.13   rmind 		}
    304  1.13   rmind 	}
    305  1.13   rmind 	*rhtbl = htbl;
    306  1.13   rmind 	return ent;
    307   1.1   rmind }
    308   1.1   rmind 
    309  1.13   rmind static void
    310  1.18   rmind table_hash_destroy(npf_table_t *t)
    311  1.18   rmind {
    312  1.18   rmind 	for (unsigned n = 0; n <= t->t_hashmask; n++) {
    313  1.18   rmind 		npf_tblent_t *ent;
    314  1.18   rmind 
    315  1.18   rmind 		while ((ent = LIST_FIRST(&t->t_hashl[n])) != NULL) {
    316  1.21   rmind 			LIST_REMOVE(ent, te_hashent);
    317  1.18   rmind 			pool_cache_put(tblent_cache, ent);
    318  1.18   rmind 		}
    319  1.18   rmind 	}
    320  1.18   rmind }
    321  1.18   rmind 
    322  1.18   rmind static void
    323  1.13   rmind table_tree_destroy(pt_tree_t *tree)
    324   1.1   rmind {
    325  1.13   rmind 	npf_tblent_t *ent;
    326   1.1   rmind 
    327  1.13   rmind 	while ((ent = ptree_iterate(tree, NULL, PT_ASCENDING)) != NULL) {
    328  1.13   rmind 		ptree_remove_node(tree, ent);
    329  1.13   rmind 		pool_cache_put(tblent_cache, ent);
    330  1.13   rmind 	}
    331   1.1   rmind }
    332   1.1   rmind 
    333   1.1   rmind /*
    334   1.1   rmind  * npf_table_create: create table with a specified ID.
    335   1.1   rmind  */
    336   1.1   rmind npf_table_t *
    337  1.21   rmind npf_table_create(const char *name, u_int tid, int type,
    338  1.21   rmind     void *blob, size_t size)
    339   1.1   rmind {
    340   1.1   rmind 	npf_table_t *t;
    341   1.1   rmind 
    342  1.19   rmind 	t = kmem_zalloc(sizeof(npf_table_t), KM_SLEEP);
    343  1.19   rmind 	strlcpy(t->t_name, name, NPF_TABLE_MAXNAMELEN);
    344   1.1   rmind 
    345   1.1   rmind 	switch (type) {
    346   1.9   rmind 	case NPF_TABLE_TREE:
    347  1.13   rmind 		ptree_init(&t->t_tree[0], &npf_table_ptree_ops,
    348  1.13   rmind 		    (void *)(sizeof(struct in_addr) / sizeof(uint32_t)),
    349  1.21   rmind 		    offsetof(npf_tblent_t, te_node),
    350  1.13   rmind 		    offsetof(npf_tblent_t, te_addr));
    351  1.13   rmind 		ptree_init(&t->t_tree[1], &npf_table_ptree_ops,
    352  1.13   rmind 		    (void *)(sizeof(struct in6_addr) / sizeof(uint32_t)),
    353  1.21   rmind 		    offsetof(npf_tblent_t, te_node),
    354  1.13   rmind 		    offsetof(npf_tblent_t, te_addr));
    355   1.1   rmind 		break;
    356   1.1   rmind 	case NPF_TABLE_HASH:
    357  1.21   rmind 		t->t_hashl = hashinit(1024, HASH_LIST, true, &t->t_hashmask);
    358   1.1   rmind 		if (t->t_hashl == NULL) {
    359   1.1   rmind 			kmem_free(t, sizeof(npf_table_t));
    360   1.1   rmind 			return NULL;
    361   1.1   rmind 		}
    362   1.1   rmind 		break;
    363  1.21   rmind 	case NPF_TABLE_CDB:
    364  1.21   rmind 		t->t_blob = blob;
    365  1.21   rmind 		t->t_bsize = size;
    366  1.21   rmind 		t->t_cdb = cdbr_open_mem(blob, size, CDBR_DEFAULT, NULL, NULL);
    367  1.21   rmind 		if (t->t_cdb == NULL) {
    368  1.21   rmind 			kmem_free(t, sizeof(npf_table_t));
    369  1.21   rmind 			free(blob, M_TEMP);
    370  1.21   rmind 			return NULL;
    371  1.21   rmind 		}
    372  1.21   rmind 		t->t_nitems = cdbr_entries(t->t_cdb);
    373  1.21   rmind 		break;
    374   1.1   rmind 	default:
    375   1.1   rmind 		KASSERT(false);
    376   1.1   rmind 	}
    377   1.1   rmind 	rw_init(&t->t_lock);
    378   1.1   rmind 	t->t_type = type;
    379   1.1   rmind 	t->t_id = tid;
    380  1.15   rmind 
    381   1.1   rmind 	return t;
    382   1.1   rmind }
    383   1.1   rmind 
    384   1.1   rmind /*
    385   1.1   rmind  * npf_table_destroy: free all table entries and table itself.
    386   1.1   rmind  */
    387   1.1   rmind void
    388   1.1   rmind npf_table_destroy(npf_table_t *t)
    389   1.1   rmind {
    390  1.17   rmind 	KASSERT(t->t_refcnt == 0);
    391   1.1   rmind 
    392   1.1   rmind 	switch (t->t_type) {
    393  1.15   rmind 	case NPF_TABLE_HASH:
    394  1.18   rmind 		table_hash_destroy(t);
    395   1.1   rmind 		hashdone(t->t_hashl, HASH_LIST, t->t_hashmask);
    396   1.1   rmind 		break;
    397  1.15   rmind 	case NPF_TABLE_TREE:
    398  1.13   rmind 		table_tree_destroy(&t->t_tree[0]);
    399  1.13   rmind 		table_tree_destroy(&t->t_tree[1]);
    400   1.1   rmind 		break;
    401  1.21   rmind 	case NPF_TABLE_CDB:
    402  1.21   rmind 		cdbr_close(t->t_cdb);
    403  1.21   rmind 		free(t->t_blob, M_TEMP);
    404  1.21   rmind 		break;
    405   1.1   rmind 	default:
    406   1.1   rmind 		KASSERT(false);
    407   1.1   rmind 	}
    408   1.1   rmind 	rw_destroy(&t->t_lock);
    409   1.1   rmind 	kmem_free(t, sizeof(npf_table_t));
    410   1.1   rmind }
    411   1.1   rmind 
    412   1.1   rmind /*
    413  1.19   rmind  * npf_table_check: validate the name, ID and type.
    414  1.13   rmind  */
    415   1.1   rmind int
    416  1.19   rmind npf_table_check(npf_tableset_t *ts, const char *name, u_int tid, int type)
    417   1.1   rmind {
    418  1.19   rmind 	if ((u_int)tid >= ts->ts_nitems) {
    419   1.1   rmind 		return EINVAL;
    420   1.1   rmind 	}
    421  1.19   rmind 	if (ts->ts_map[tid] != NULL) {
    422   1.1   rmind 		return EEXIST;
    423   1.1   rmind 	}
    424  1.21   rmind 	switch (type) {
    425  1.21   rmind 	case NPF_TABLE_TREE:
    426  1.21   rmind 	case NPF_TABLE_HASH:
    427  1.21   rmind 	case NPF_TABLE_CDB:
    428  1.21   rmind 		break;
    429  1.21   rmind 	default:
    430   1.1   rmind 		return EINVAL;
    431   1.1   rmind 	}
    432  1.19   rmind 	if (strlen(name) >= NPF_TABLE_MAXNAMELEN) {
    433  1.19   rmind 		return ENAMETOOLONG;
    434  1.19   rmind 	}
    435  1.19   rmind 	if (npf_tableset_getbyname(ts, name)) {
    436  1.20   rmind 		return EEXIST;
    437  1.19   rmind 	}
    438   1.1   rmind 	return 0;
    439   1.1   rmind }
    440   1.1   rmind 
    441  1.13   rmind static int
    442  1.15   rmind table_cidr_check(const u_int aidx, const npf_addr_t *addr,
    443  1.13   rmind     const npf_netmask_t mask)
    444  1.13   rmind {
    445  1.19   rmind 	if (aidx > 1) {
    446  1.13   rmind 		return EINVAL;
    447  1.13   rmind 	}
    448  1.19   rmind 	if (mask > NPF_MAX_NETMASK && mask != NPF_NO_NETMASK) {
    449  1.13   rmind 		return EINVAL;
    450  1.13   rmind 	}
    451  1.13   rmind 
    452  1.13   rmind 	/*
    453  1.13   rmind 	 * For IPv4 (aidx = 0) - 32 and for IPv6 (aidx = 1) - 128.
    454  1.13   rmind 	 * If it is a host - shall use NPF_NO_NETMASK.
    455  1.13   rmind 	 */
    456  1.13   rmind 	if (mask >= (aidx ? 128 : 32) && mask != NPF_NO_NETMASK) {
    457  1.13   rmind 		return EINVAL;
    458  1.13   rmind 	}
    459  1.13   rmind 	return 0;
    460  1.13   rmind }
    461  1.13   rmind 
    462   1.1   rmind /*
    463  1.13   rmind  * npf_table_insert: add an IP CIDR entry into the table.
    464   1.1   rmind  */
    465   1.1   rmind int
    466  1.19   rmind npf_table_insert(npf_table_t *t, const int alen,
    467   1.6  zoltan     const npf_addr_t *addr, const npf_netmask_t mask)
    468   1.1   rmind {
    469  1.13   rmind 	const u_int aidx = NPF_ADDRLEN2TREE(alen);
    470  1.13   rmind 	npf_tblent_t *ent;
    471  1.13   rmind 	int error;
    472   1.1   rmind 
    473  1.15   rmind 	error = table_cidr_check(aidx, addr, mask);
    474  1.13   rmind 	if (error) {
    475  1.13   rmind 		return error;
    476   1.8   rmind 	}
    477  1.12   rmind 	ent = pool_cache_get(tblent_cache, PR_WAITOK);
    478  1.13   rmind 	memcpy(&ent->te_addr, addr, alen);
    479  1.13   rmind 	ent->te_alen = alen;
    480   1.1   rmind 
    481  1.13   rmind 	/*
    482  1.13   rmind 	 * Insert the entry.  Return an error on duplicate.
    483  1.13   rmind 	 */
    484  1.15   rmind 	rw_enter(&t->t_lock, RW_WRITER);
    485   1.1   rmind 	switch (t->t_type) {
    486  1.13   rmind 	case NPF_TABLE_HASH: {
    487  1.13   rmind 		struct npf_hashl *htbl;
    488  1.13   rmind 
    489  1.13   rmind 		/*
    490  1.13   rmind 		 * Hash tables by the concept support only IPs.
    491  1.13   rmind 		 */
    492  1.13   rmind 		if (mask != NPF_NO_NETMASK) {
    493  1.13   rmind 			error = EINVAL;
    494  1.13   rmind 			break;
    495   1.1   rmind 		}
    496  1.13   rmind 		if (!table_hash_lookup(t, addr, alen, &htbl)) {
    497  1.21   rmind 			LIST_INSERT_HEAD(htbl, ent, te_hashent);
    498  1.15   rmind 			t->t_nitems++;
    499   1.1   rmind 		} else {
    500   1.1   rmind 			error = EEXIST;
    501   1.1   rmind 		}
    502   1.1   rmind 		break;
    503  1.13   rmind 	}
    504  1.13   rmind 	case NPF_TABLE_TREE: {
    505  1.13   rmind 		pt_tree_t *tree = &t->t_tree[aidx];
    506  1.13   rmind 		bool ok;
    507  1.13   rmind 
    508  1.13   rmind 		/*
    509  1.13   rmind 		 * If no mask specified, use maximum mask.
    510  1.13   rmind 		 */
    511  1.15   rmind 		ok = (mask != NPF_NO_NETMASK) ?
    512  1.15   rmind 		    ptree_insert_mask_node(tree, ent, mask) :
    513  1.15   rmind 		    ptree_insert_node(tree, ent);
    514  1.15   rmind 		if (ok) {
    515  1.15   rmind 			t->t_nitems++;
    516  1.15   rmind 			error = 0;
    517  1.13   rmind 		} else {
    518  1.15   rmind 			error = EEXIST;
    519   1.1   rmind 		}
    520   1.1   rmind 		break;
    521  1.13   rmind 	}
    522  1.21   rmind 	case NPF_TABLE_CDB:
    523  1.21   rmind 		error = EINVAL;
    524  1.21   rmind 		break;
    525   1.1   rmind 	default:
    526   1.1   rmind 		KASSERT(false);
    527   1.1   rmind 	}
    528  1.15   rmind 	rw_exit(&t->t_lock);
    529   1.1   rmind 
    530   1.8   rmind 	if (error) {
    531  1.12   rmind 		pool_cache_put(tblent_cache, ent);
    532   1.1   rmind 	}
    533   1.1   rmind 	return error;
    534   1.1   rmind }
    535   1.1   rmind 
    536   1.1   rmind /*
    537  1.13   rmind  * npf_table_remove: remove the IP CIDR entry from the table.
    538   1.1   rmind  */
    539   1.1   rmind int
    540  1.19   rmind npf_table_remove(npf_table_t *t, const int alen,
    541   1.6  zoltan     const npf_addr_t *addr, const npf_netmask_t mask)
    542   1.1   rmind {
    543  1.13   rmind 	const u_int aidx = NPF_ADDRLEN2TREE(alen);
    544  1.21   rmind 	npf_tblent_t *ent = NULL;
    545  1.21   rmind 	int error = ENOENT;
    546   1.1   rmind 
    547  1.15   rmind 	error = table_cidr_check(aidx, addr, mask);
    548  1.13   rmind 	if (error) {
    549  1.13   rmind 		return error;
    550   1.8   rmind 	}
    551  1.15   rmind 
    552  1.15   rmind 	rw_enter(&t->t_lock, RW_WRITER);
    553  1.13   rmind 	switch (t->t_type) {
    554  1.13   rmind 	case NPF_TABLE_HASH: {
    555  1.13   rmind 		struct npf_hashl *htbl;
    556   1.8   rmind 
    557  1.13   rmind 		ent = table_hash_lookup(t, addr, alen, &htbl);
    558  1.12   rmind 		if (__predict_true(ent != NULL)) {
    559  1.21   rmind 			LIST_REMOVE(ent, te_hashent);
    560  1.15   rmind 			t->t_nitems--;
    561   1.1   rmind 		}
    562   1.1   rmind 		break;
    563  1.13   rmind 	}
    564  1.13   rmind 	case NPF_TABLE_TREE: {
    565  1.13   rmind 		pt_tree_t *tree = &t->t_tree[aidx];
    566  1.13   rmind 
    567  1.13   rmind 		ent = ptree_find_node(tree, addr);
    568  1.12   rmind 		if (__predict_true(ent != NULL)) {
    569  1.13   rmind 			ptree_remove_node(tree, ent);
    570  1.15   rmind 			t->t_nitems--;
    571   1.1   rmind 		}
    572   1.1   rmind 		break;
    573  1.13   rmind 	}
    574  1.21   rmind 	case NPF_TABLE_CDB:
    575  1.21   rmind 		error = EINVAL;
    576  1.21   rmind 		break;
    577   1.1   rmind 	default:
    578   1.1   rmind 		KASSERT(false);
    579  1.13   rmind 		ent = NULL;
    580   1.1   rmind 	}
    581  1.15   rmind 	rw_exit(&t->t_lock);
    582   1.1   rmind 
    583  1.21   rmind 	if (ent) {
    584  1.21   rmind 		pool_cache_put(tblent_cache, ent);
    585   1.1   rmind 	}
    586  1.21   rmind 	return error;
    587   1.1   rmind }
    588   1.1   rmind 
    589   1.1   rmind /*
    590  1.13   rmind  * npf_table_lookup: find the table according to ID, lookup and match
    591  1.13   rmind  * the contents with the specified IP address.
    592   1.1   rmind  */
    593   1.1   rmind int
    594  1.19   rmind npf_table_lookup(npf_table_t *t, const int alen, const npf_addr_t *addr)
    595   1.1   rmind {
    596  1.13   rmind 	const u_int aidx = NPF_ADDRLEN2TREE(alen);
    597  1.21   rmind 	struct npf_hashl *htbl;
    598  1.21   rmind 	const void *data;
    599  1.21   rmind 	size_t dlen;
    600  1.21   rmind 	bool found;
    601   1.1   rmind 
    602  1.13   rmind 	if (__predict_false(aidx > 1)) {
    603  1.13   rmind 		return EINVAL;
    604  1.13   rmind 	}
    605  1.13   rmind 
    606   1.1   rmind 	switch (t->t_type) {
    607  1.21   rmind 	case NPF_TABLE_HASH:
    608  1.21   rmind 		rw_enter(&t->t_lock, RW_READER);
    609  1.21   rmind 		found = table_hash_lookup(t, addr, alen, &htbl) != NULL;
    610  1.21   rmind 		rw_exit(&t->t_lock);
    611   1.1   rmind 		break;
    612  1.21   rmind 	case NPF_TABLE_TREE:
    613  1.21   rmind 		rw_enter(&t->t_lock, RW_READER);
    614  1.21   rmind 		found = ptree_find_node(&t->t_tree[aidx], addr) != NULL;
    615  1.21   rmind 		rw_exit(&t->t_lock);
    616  1.21   rmind 		break;
    617  1.21   rmind 	case NPF_TABLE_CDB:
    618  1.21   rmind 		if (cdbr_find(t->t_cdb, addr, alen, &data, &dlen) == 0) {
    619  1.21   rmind 			found = dlen == alen && memcmp(addr, data, dlen) == 0;
    620  1.21   rmind 		} else {
    621  1.21   rmind 			found = false;
    622  1.21   rmind 		}
    623   1.1   rmind 		break;
    624   1.1   rmind 	default:
    625   1.1   rmind 		KASSERT(false);
    626  1.21   rmind 		found = false;
    627   1.1   rmind 	}
    628   1.1   rmind 
    629  1.21   rmind 	return found ? 0 : ENOENT;
    630   1.1   rmind }
    631  1.15   rmind 
    632  1.15   rmind static int
    633  1.21   rmind table_ent_copyout(const npf_addr_t *addr, const int alen, npf_netmask_t mask,
    634  1.15   rmind     void *ubuf, size_t len, size_t *off)
    635  1.15   rmind {
    636  1.15   rmind 	void *ubufp = (uint8_t *)ubuf + *off;
    637  1.15   rmind 	npf_ioctl_ent_t uent;
    638  1.15   rmind 
    639  1.15   rmind 	if ((*off += sizeof(npf_ioctl_ent_t)) > len) {
    640  1.15   rmind 		return ENOMEM;
    641  1.15   rmind 	}
    642  1.21   rmind 	uent.alen = alen;
    643  1.21   rmind 	memcpy(&uent.addr, addr, sizeof(npf_addr_t));
    644  1.15   rmind 	uent.mask = mask;
    645  1.15   rmind 
    646  1.15   rmind 	return copyout(&uent, ubufp, sizeof(npf_ioctl_ent_t));
    647  1.15   rmind }
    648  1.15   rmind 
    649  1.15   rmind static int
    650  1.21   rmind table_hash_list(const npf_table_t *t, void *ubuf, size_t len)
    651  1.21   rmind {
    652  1.21   rmind 	size_t off = 0;
    653  1.21   rmind 	int error = 0;
    654  1.21   rmind 
    655  1.21   rmind 	for (unsigned n = 0; n <= t->t_hashmask; n++) {
    656  1.21   rmind 		npf_tblent_t *ent;
    657  1.21   rmind 
    658  1.21   rmind 		LIST_FOREACH(ent, &t->t_hashl[n], te_hashent) {
    659  1.21   rmind 			error = table_ent_copyout(&ent->te_addr,
    660  1.21   rmind 			    ent->te_alen, 0, ubuf, len, &off);
    661  1.21   rmind 			if (error)
    662  1.21   rmind 				break;
    663  1.21   rmind 		}
    664  1.21   rmind 	}
    665  1.21   rmind 	return error;
    666  1.21   rmind }
    667  1.21   rmind 
    668  1.21   rmind static int
    669  1.15   rmind table_tree_list(pt_tree_t *tree, npf_netmask_t maxmask, void *ubuf,
    670  1.15   rmind     size_t len, size_t *off)
    671  1.15   rmind {
    672  1.15   rmind 	npf_tblent_t *ent = NULL;
    673  1.15   rmind 	int error = 0;
    674  1.15   rmind 
    675  1.15   rmind 	while ((ent = ptree_iterate(tree, ent, PT_ASCENDING)) != NULL) {
    676  1.15   rmind 		pt_bitlen_t blen;
    677  1.15   rmind 
    678  1.15   rmind 		if (!ptree_mask_node_p(tree, ent, &blen)) {
    679  1.15   rmind 			blen = maxmask;
    680  1.15   rmind 		}
    681  1.21   rmind 		error = table_ent_copyout(&ent->te_addr, ent->te_alen,
    682  1.21   rmind 		    blen, ubuf, len, off);
    683  1.21   rmind 		if (error)
    684  1.21   rmind 			break;
    685  1.21   rmind 	}
    686  1.21   rmind 	return error;
    687  1.21   rmind }
    688  1.21   rmind 
    689  1.21   rmind static int
    690  1.21   rmind table_cdb_list(npf_table_t *t, void *ubuf, size_t len)
    691  1.21   rmind {
    692  1.21   rmind 	size_t off = 0, dlen;
    693  1.21   rmind 	const void *data;
    694  1.21   rmind 	int error = 0;
    695  1.21   rmind 
    696  1.21   rmind 	for (size_t i = 0; i < t->t_nitems; i++) {
    697  1.21   rmind 		if (cdbr_get(t->t_cdb, i, &data, &dlen) != 0) {
    698  1.21   rmind 			return EINVAL;
    699  1.21   rmind 		}
    700  1.21   rmind 		error = table_ent_copyout(data, dlen, 0, ubuf, len, &off);
    701  1.15   rmind 		if (error)
    702  1.15   rmind 			break;
    703  1.15   rmind 	}
    704  1.15   rmind 	return error;
    705  1.15   rmind }
    706  1.15   rmind 
    707  1.15   rmind /*
    708  1.15   rmind  * npf_table_list: copy a list of all table entries into a userspace buffer.
    709  1.15   rmind  */
    710  1.15   rmind int
    711  1.19   rmind npf_table_list(npf_table_t *t, void *ubuf, size_t len)
    712  1.15   rmind {
    713  1.15   rmind 	size_t off = 0;
    714  1.15   rmind 	int error = 0;
    715  1.15   rmind 
    716  1.15   rmind 	rw_enter(&t->t_lock, RW_READER);
    717  1.15   rmind 	switch (t->t_type) {
    718  1.15   rmind 	case NPF_TABLE_HASH:
    719  1.21   rmind 		error = table_hash_list(t, ubuf, len);
    720  1.15   rmind 		break;
    721  1.15   rmind 	case NPF_TABLE_TREE:
    722  1.15   rmind 		error = table_tree_list(&t->t_tree[0], 32, ubuf, len, &off);
    723  1.15   rmind 		if (error)
    724  1.15   rmind 			break;
    725  1.15   rmind 		error = table_tree_list(&t->t_tree[1], 128, ubuf, len, &off);
    726  1.16   rmind 		break;
    727  1.21   rmind 	case NPF_TABLE_CDB:
    728  1.21   rmind 		error = table_cdb_list(t, ubuf, len);
    729  1.21   rmind 		break;
    730  1.15   rmind 	default:
    731  1.15   rmind 		KASSERT(false);
    732  1.15   rmind 	}
    733  1.15   rmind 	rw_exit(&t->t_lock);
    734  1.15   rmind 
    735  1.15   rmind 	return error;
    736  1.15   rmind }
    737  1.18   rmind 
    738  1.18   rmind /*
    739  1.18   rmind  * npf_table_flush: remove all table entries.
    740  1.18   rmind  */
    741  1.18   rmind int
    742  1.19   rmind npf_table_flush(npf_table_t *t)
    743  1.18   rmind {
    744  1.21   rmind 	int error = 0;
    745  1.21   rmind 
    746  1.18   rmind 	rw_enter(&t->t_lock, RW_WRITER);
    747  1.18   rmind 	switch (t->t_type) {
    748  1.18   rmind 	case NPF_TABLE_HASH:
    749  1.18   rmind 		table_hash_destroy(t);
    750  1.18   rmind 		t->t_nitems = 0;
    751  1.18   rmind 		break;
    752  1.18   rmind 	case NPF_TABLE_TREE:
    753  1.18   rmind 		table_tree_destroy(&t->t_tree[0]);
    754  1.18   rmind 		table_tree_destroy(&t->t_tree[1]);
    755  1.18   rmind 		t->t_nitems = 0;
    756  1.18   rmind 		break;
    757  1.21   rmind 	case NPF_TABLE_CDB:
    758  1.21   rmind 		error = EINVAL;
    759  1.21   rmind 		break;
    760  1.18   rmind 	default:
    761  1.18   rmind 		KASSERT(false);
    762  1.18   rmind 	}
    763  1.18   rmind 	rw_exit(&t->t_lock);
    764  1.21   rmind 	return error;
    765  1.18   rmind }
    766