Home | History | Annotate | Line # | Download | only in npf
npf_tableset.c revision 1.2.4.2
      1  1.2.4.2  uebayasi /*	$NetBSD: npf_tableset.c,v 1.2.4.2 2010/10/22 09:23:15 uebayasi Exp $	*/
      2  1.2.4.2  uebayasi 
      3  1.2.4.2  uebayasi /*-
      4  1.2.4.2  uebayasi  * Copyright (c) 2009-2010 The NetBSD Foundation, Inc.
      5  1.2.4.2  uebayasi  * All rights reserved.
      6  1.2.4.2  uebayasi  *
      7  1.2.4.2  uebayasi  * This material is based upon work partially supported by The
      8  1.2.4.2  uebayasi  * NetBSD Foundation under a contract with Mindaugas Rasiukevicius.
      9  1.2.4.2  uebayasi  *
     10  1.2.4.2  uebayasi  * Redistribution and use in source and binary forms, with or without
     11  1.2.4.2  uebayasi  * modification, are permitted provided that the following conditions
     12  1.2.4.2  uebayasi  * are met:
     13  1.2.4.2  uebayasi  * 1. Redistributions of source code must retain the above copyright
     14  1.2.4.2  uebayasi  *    notice, this list of conditions and the following disclaimer.
     15  1.2.4.2  uebayasi  * 2. Redistributions in binary form must reproduce the above copyright
     16  1.2.4.2  uebayasi  *    notice, this list of conditions and the following disclaimer in the
     17  1.2.4.2  uebayasi  *    documentation and/or other materials provided with the distribution.
     18  1.2.4.2  uebayasi  *
     19  1.2.4.2  uebayasi  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20  1.2.4.2  uebayasi  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21  1.2.4.2  uebayasi  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22  1.2.4.2  uebayasi  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23  1.2.4.2  uebayasi  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24  1.2.4.2  uebayasi  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25  1.2.4.2  uebayasi  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26  1.2.4.2  uebayasi  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27  1.2.4.2  uebayasi  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28  1.2.4.2  uebayasi  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29  1.2.4.2  uebayasi  * POSSIBILITY OF SUCH DAMAGE.
     30  1.2.4.2  uebayasi  */
     31  1.2.4.2  uebayasi 
/*
 * NPF table module.
 *
 * Lock order:
 *
 *	table_lock ->
 *		npf_table_t::t_lock
 *
 * TODO:
 * - Currently, the code only handles IPv4 CIDR blocks.
 * - Dynamic hash growing/shrinking (i.e. re-hash functionality), maybe?
 * - Dynamic array resize.
 */
     43  1.2.4.2  uebayasi 
     44  1.2.4.2  uebayasi #ifdef _KERNEL
     45  1.2.4.2  uebayasi #include <sys/cdefs.h>
     46  1.2.4.2  uebayasi __KERNEL_RCSID(0, "$NetBSD: npf_tableset.c,v 1.2.4.2 2010/10/22 09:23:15 uebayasi Exp $");
     47  1.2.4.2  uebayasi #endif
     48  1.2.4.2  uebayasi 
     49  1.2.4.2  uebayasi #include <sys/param.h>
     50  1.2.4.2  uebayasi #include <sys/kernel.h>
     51  1.2.4.2  uebayasi 
     52  1.2.4.2  uebayasi #include <sys/atomic.h>
     53  1.2.4.2  uebayasi #include <sys/hash.h>
     54  1.2.4.2  uebayasi #include <sys/kmem.h>
     55  1.2.4.2  uebayasi #include <sys/pool.h>
     56  1.2.4.2  uebayasi #include <sys/queue.h>
     57  1.2.4.2  uebayasi #include <sys/rwlock.h>
     58  1.2.4.2  uebayasi #include <sys/systm.h>
     59  1.2.4.2  uebayasi #include <sys/types.h>
     60  1.2.4.2  uebayasi 
     61  1.2.4.2  uebayasi #include "npf_impl.h"
     62  1.2.4.2  uebayasi 
     63  1.2.4.2  uebayasi /* Table entry structure. */
     64  1.2.4.2  uebayasi struct npf_tblent {
     65  1.2.4.2  uebayasi 	/* Hash/tree entry. */
     66  1.2.4.2  uebayasi 	union {
     67  1.2.4.2  uebayasi 		LIST_ENTRY(npf_tblent)	hashq;
     68  1.2.4.2  uebayasi 		struct rb_node		rbnode;
     69  1.2.4.2  uebayasi 	} te_entry;
     70  1.2.4.2  uebayasi 	/* IPv4 CIDR block. */
     71  1.2.4.2  uebayasi 	in_addr_t			te_addr;
     72  1.2.4.2  uebayasi 	in_addr_t			te_mask;
     73  1.2.4.2  uebayasi };
     74  1.2.4.2  uebayasi 
     75  1.2.4.2  uebayasi LIST_HEAD(npf_hashl, npf_tblent);
     76  1.2.4.2  uebayasi 
     77  1.2.4.2  uebayasi /* Table structure. */
     78  1.2.4.2  uebayasi struct npf_table {
     79  1.2.4.2  uebayasi 	char				t_name[16];
     80  1.2.4.2  uebayasi 	/* Lock and reference count. */
     81  1.2.4.2  uebayasi 	krwlock_t			t_lock;
     82  1.2.4.2  uebayasi 	u_int				t_refcnt;
     83  1.2.4.2  uebayasi 	/* Table ID. */
     84  1.2.4.2  uebayasi 	u_int				t_id;
     85  1.2.4.2  uebayasi 	/* The storage type can be: 1. Hash 2. RB-tree. */
     86  1.2.4.2  uebayasi 	u_int				t_type;
     87  1.2.4.2  uebayasi 	struct npf_hashl *		t_hashl;
     88  1.2.4.2  uebayasi 	u_long				t_hashmask;
     89  1.2.4.2  uebayasi 	rb_tree_t			t_rbtree;
     90  1.2.4.2  uebayasi };
     91  1.2.4.2  uebayasi 
     92  1.2.4.2  uebayasi /* Global table array and its lock. */
     93  1.2.4.2  uebayasi static npf_tableset_t *		table_array;
     94  1.2.4.2  uebayasi static krwlock_t		table_lock;
     95  1.2.4.2  uebayasi static pool_cache_t		tblent_cache;
     96  1.2.4.2  uebayasi 
     97  1.2.4.2  uebayasi /*
     98  1.2.4.2  uebayasi  * npf_table_sysinit: initialise tableset structures.
     99  1.2.4.2  uebayasi  */
    100  1.2.4.2  uebayasi int
    101  1.2.4.2  uebayasi npf_tableset_sysinit(void)
    102  1.2.4.2  uebayasi {
    103  1.2.4.2  uebayasi 
    104  1.2.4.2  uebayasi 	tblent_cache = pool_cache_init(sizeof(npf_tblent_t), coherency_unit,
    105  1.2.4.2  uebayasi 	    0, 0, "npftenpl", NULL, IPL_NONE, NULL, NULL, NULL);
    106  1.2.4.2  uebayasi 	if (tblent_cache == NULL) {
    107  1.2.4.2  uebayasi 		return ENOMEM;
    108  1.2.4.2  uebayasi 	}
    109  1.2.4.2  uebayasi 	table_array = npf_tableset_create();
    110  1.2.4.2  uebayasi 	if (table_array == NULL) {
    111  1.2.4.2  uebayasi 		pool_cache_destroy(tblent_cache);
    112  1.2.4.2  uebayasi 		return ENOMEM;
    113  1.2.4.2  uebayasi 	}
    114  1.2.4.2  uebayasi 	rw_init(&table_lock);
    115  1.2.4.2  uebayasi 	return 0;
    116  1.2.4.2  uebayasi }
    117  1.2.4.2  uebayasi 
    118  1.2.4.2  uebayasi void
    119  1.2.4.2  uebayasi npf_tableset_sysfini(void)
    120  1.2.4.2  uebayasi {
    121  1.2.4.2  uebayasi 
    122  1.2.4.2  uebayasi 	npf_tableset_destroy(table_array);
    123  1.2.4.2  uebayasi 	pool_cache_destroy(tblent_cache);
    124  1.2.4.2  uebayasi 	rw_destroy(&table_lock);
    125  1.2.4.2  uebayasi }
    126  1.2.4.2  uebayasi 
    127  1.2.4.2  uebayasi npf_tableset_t *
    128  1.2.4.2  uebayasi npf_tableset_create(void)
    129  1.2.4.2  uebayasi {
    130  1.2.4.2  uebayasi 	const size_t sz = NPF_TABLE_SLOTS * sizeof(npf_table_t *);
    131  1.2.4.2  uebayasi 
    132  1.2.4.2  uebayasi 	return kmem_zalloc(sz, KM_SLEEP);
    133  1.2.4.2  uebayasi }
    134  1.2.4.2  uebayasi 
    135  1.2.4.2  uebayasi void
    136  1.2.4.2  uebayasi npf_tableset_destroy(npf_tableset_t *tblset)
    137  1.2.4.2  uebayasi {
    138  1.2.4.2  uebayasi 	const size_t sz = NPF_TABLE_SLOTS * sizeof(npf_table_t *);
    139  1.2.4.2  uebayasi 	npf_table_t *t;
    140  1.2.4.2  uebayasi 	u_int tid;
    141  1.2.4.2  uebayasi 
    142  1.2.4.2  uebayasi 	/*
    143  1.2.4.2  uebayasi 	 * Destroy all tables (no references should be held, as ruleset
    144  1.2.4.2  uebayasi 	 * should be destroyed before).
    145  1.2.4.2  uebayasi 	 */
    146  1.2.4.2  uebayasi 	for (tid = 0; tid < NPF_TABLE_SLOTS; tid++) {
    147  1.2.4.2  uebayasi 		t = tblset[tid];
    148  1.2.4.2  uebayasi 		if (t != NULL) {
    149  1.2.4.2  uebayasi 			npf_table_destroy(t);
    150  1.2.4.2  uebayasi 		}
    151  1.2.4.2  uebayasi 	}
    152  1.2.4.2  uebayasi 	kmem_free(tblset, sz);
    153  1.2.4.2  uebayasi }
    154  1.2.4.2  uebayasi 
    155  1.2.4.2  uebayasi /*
    156  1.2.4.2  uebayasi  * npf_tableset_insert: insert the table into the specified tableset.
    157  1.2.4.2  uebayasi  *
    158  1.2.4.2  uebayasi  * => Returns 0 on success, fails and returns errno if ID is already used.
    159  1.2.4.2  uebayasi  */
    160  1.2.4.2  uebayasi int
    161  1.2.4.2  uebayasi npf_tableset_insert(npf_tableset_t *tblset, npf_table_t *t)
    162  1.2.4.2  uebayasi {
    163  1.2.4.2  uebayasi 	const u_int tid = t->t_id;
    164  1.2.4.2  uebayasi 	int error;
    165  1.2.4.2  uebayasi 
    166  1.2.4.2  uebayasi 	KASSERT((u_int)tid < NPF_TABLE_SLOTS);
    167  1.2.4.2  uebayasi 
    168  1.2.4.2  uebayasi 	if (tblset[tid] == NULL) {
    169  1.2.4.2  uebayasi 		tblset[tid] = t;
    170  1.2.4.2  uebayasi 		error = 0;
    171  1.2.4.2  uebayasi 	} else {
    172  1.2.4.2  uebayasi 		error = EEXIST;
    173  1.2.4.2  uebayasi 	}
    174  1.2.4.2  uebayasi 	return error;
    175  1.2.4.2  uebayasi }
    176  1.2.4.2  uebayasi 
    177  1.2.4.2  uebayasi /*
    178  1.2.4.2  uebayasi  * npf_tableset_reload: replace old tableset array with a new one.
    179  1.2.4.2  uebayasi  *
    180  1.2.4.2  uebayasi  * => Called from npf_ruleset_reload() with a global ruleset lock held.
    181  1.2.4.2  uebayasi  * => Returns pointer to the old tableset, caller will destroy it.
    182  1.2.4.2  uebayasi  */
    183  1.2.4.2  uebayasi npf_tableset_t *
    184  1.2.4.2  uebayasi npf_tableset_reload(npf_tableset_t *tblset)
    185  1.2.4.2  uebayasi {
    186  1.2.4.2  uebayasi 	npf_tableset_t *oldtblset;
    187  1.2.4.2  uebayasi 
    188  1.2.4.2  uebayasi 	rw_enter(&table_lock, RW_WRITER);
    189  1.2.4.2  uebayasi 	oldtblset = table_array;
    190  1.2.4.2  uebayasi 	table_array = tblset;
    191  1.2.4.2  uebayasi 	rw_exit(&table_lock);
    192  1.2.4.2  uebayasi 
    193  1.2.4.2  uebayasi 	return oldtblset;
    194  1.2.4.2  uebayasi }
    195  1.2.4.2  uebayasi 
    196  1.2.4.2  uebayasi /*
    197  1.2.4.2  uebayasi  * Red-black tree storage.
    198  1.2.4.2  uebayasi  */
    199  1.2.4.2  uebayasi 
    200  1.2.4.2  uebayasi static signed int
    201  1.2.4.2  uebayasi table_rbtree_cmp_nodes(void *ctx, const void *n1, const void *n2)
    202  1.2.4.2  uebayasi {
    203  1.2.4.2  uebayasi 	const npf_tblent_t * const te1 = n1;
    204  1.2.4.2  uebayasi 	const npf_tblent_t * const te2 = n2;
    205  1.2.4.2  uebayasi 	const in_addr_t x = te1->te_addr & te1->te_mask;
    206  1.2.4.2  uebayasi 	const in_addr_t y = te2->te_addr & te2->te_mask;
    207  1.2.4.2  uebayasi 
    208  1.2.4.2  uebayasi 	if (x < y)
    209  1.2.4.2  uebayasi 		return -1;
    210  1.2.4.2  uebayasi 	if (x > y)
    211  1.2.4.2  uebayasi 		return 1;
    212  1.2.4.2  uebayasi 	return 0;
    213  1.2.4.2  uebayasi }
    214  1.2.4.2  uebayasi 
    215  1.2.4.2  uebayasi static signed int
    216  1.2.4.2  uebayasi table_rbtree_cmp_key(void *ctx, const void *n1, const void *key)
    217  1.2.4.2  uebayasi {
    218  1.2.4.2  uebayasi 	const npf_tblent_t * const te = n1;
    219  1.2.4.2  uebayasi 	const in_addr_t x = te->te_addr & te->te_mask;
    220  1.2.4.2  uebayasi 	const in_addr_t y = *(const in_addr_t *)key;
    221  1.2.4.2  uebayasi 
    222  1.2.4.2  uebayasi 	if (x < y)
    223  1.2.4.2  uebayasi 		return -1;
    224  1.2.4.2  uebayasi 	if (x > y)
    225  1.2.4.2  uebayasi 		return 1;
    226  1.2.4.2  uebayasi 	return 0;
    227  1.2.4.2  uebayasi }
    228  1.2.4.2  uebayasi 
    229  1.2.4.2  uebayasi static const rb_tree_ops_t table_rbtree_ops = {
    230  1.2.4.2  uebayasi 	.rbto_compare_nodes = table_rbtree_cmp_nodes,
    231  1.2.4.2  uebayasi 	.rbto_compare_key = table_rbtree_cmp_key,
    232  1.2.4.2  uebayasi 	.rbto_node_offset = offsetof(npf_tblent_t, te_entry.rbnode),
    233  1.2.4.2  uebayasi 	.rbto_context = NULL
    234  1.2.4.2  uebayasi };
    235  1.2.4.2  uebayasi 
    236  1.2.4.2  uebayasi /*
    237  1.2.4.2  uebayasi  * Hash helper routine.
    238  1.2.4.2  uebayasi  */
    239  1.2.4.2  uebayasi 
    240  1.2.4.2  uebayasi static inline struct npf_hashl *
    241  1.2.4.2  uebayasi table_hash_bucket(npf_table_t *t, void *buf, size_t sz)
    242  1.2.4.2  uebayasi {
    243  1.2.4.2  uebayasi 	const uint32_t hidx = hash32_buf(buf, sz, HASH32_BUF_INIT);
    244  1.2.4.2  uebayasi 
    245  1.2.4.2  uebayasi 	return &t->t_hashl[hidx & t->t_hashmask];
    246  1.2.4.2  uebayasi }
    247  1.2.4.2  uebayasi 
    248  1.2.4.2  uebayasi /*
    249  1.2.4.2  uebayasi  * npf_table_create: create table with a specified ID.
    250  1.2.4.2  uebayasi  */
    251  1.2.4.2  uebayasi npf_table_t *
    252  1.2.4.2  uebayasi npf_table_create(u_int tid, int type, size_t hsize)
    253  1.2.4.2  uebayasi {
    254  1.2.4.2  uebayasi 	npf_table_t *t;
    255  1.2.4.2  uebayasi 
    256  1.2.4.2  uebayasi 	KASSERT((u_int)tid < NPF_TABLE_SLOTS);
    257  1.2.4.2  uebayasi 
    258  1.2.4.2  uebayasi 	t = kmem_zalloc(sizeof(npf_table_t), KM_SLEEP);
    259  1.2.4.2  uebayasi 	switch (type) {
    260  1.2.4.2  uebayasi 	case NPF_TABLE_RBTREE:
    261  1.2.4.2  uebayasi 		rb_tree_init(&t->t_rbtree, &table_rbtree_ops);
    262  1.2.4.2  uebayasi 		break;
    263  1.2.4.2  uebayasi 	case NPF_TABLE_HASH:
    264  1.2.4.2  uebayasi 		t->t_hashl = hashinit(hsize, HASH_LIST, true, &t->t_hashmask);
    265  1.2.4.2  uebayasi 		if (t->t_hashl == NULL) {
    266  1.2.4.2  uebayasi 			kmem_free(t, sizeof(npf_table_t));
    267  1.2.4.2  uebayasi 			return NULL;
    268  1.2.4.2  uebayasi 		}
    269  1.2.4.2  uebayasi 		break;
    270  1.2.4.2  uebayasi 	default:
    271  1.2.4.2  uebayasi 		KASSERT(false);
    272  1.2.4.2  uebayasi 	}
    273  1.2.4.2  uebayasi 	rw_init(&t->t_lock);
    274  1.2.4.2  uebayasi 	t->t_type = type;
    275  1.2.4.2  uebayasi 	t->t_refcnt = 1;
    276  1.2.4.2  uebayasi 	t->t_id = tid;
    277  1.2.4.2  uebayasi 	return t;
    278  1.2.4.2  uebayasi }
    279  1.2.4.2  uebayasi 
    280  1.2.4.2  uebayasi /*
    281  1.2.4.2  uebayasi  * npf_table_destroy: free all table entries and table itself.
    282  1.2.4.2  uebayasi  */
    283  1.2.4.2  uebayasi void
    284  1.2.4.2  uebayasi npf_table_destroy(npf_table_t *t)
    285  1.2.4.2  uebayasi {
    286  1.2.4.2  uebayasi 	npf_tblent_t *e;
    287  1.2.4.2  uebayasi 	u_int n;
    288  1.2.4.2  uebayasi 
    289  1.2.4.2  uebayasi 	switch (t->t_type) {
    290  1.2.4.2  uebayasi 	case NPF_TABLE_HASH:
    291  1.2.4.2  uebayasi 		for (n = 0; n <= t->t_hashmask; n++) {
    292  1.2.4.2  uebayasi 			while ((e = LIST_FIRST(&t->t_hashl[n])) != NULL) {
    293  1.2.4.2  uebayasi 				LIST_REMOVE(e, te_entry.hashq);
    294  1.2.4.2  uebayasi 				pool_cache_put(tblent_cache, e);
    295  1.2.4.2  uebayasi 			}
    296  1.2.4.2  uebayasi 		}
    297  1.2.4.2  uebayasi 		hashdone(t->t_hashl, HASH_LIST, t->t_hashmask);
    298  1.2.4.2  uebayasi 		break;
    299  1.2.4.2  uebayasi 	case NPF_TABLE_RBTREE:
    300  1.2.4.2  uebayasi 		while ((e = rb_tree_iterate(&t->t_rbtree, NULL,
    301  1.2.4.2  uebayasi 		    RB_DIR_LEFT)) != NULL) {
    302  1.2.4.2  uebayasi 			rb_tree_remove_node(&t->t_rbtree, e);
    303  1.2.4.2  uebayasi 			pool_cache_put(tblent_cache, e);
    304  1.2.4.2  uebayasi 		}
    305  1.2.4.2  uebayasi 		break;
    306  1.2.4.2  uebayasi 	default:
    307  1.2.4.2  uebayasi 		KASSERT(false);
    308  1.2.4.2  uebayasi 	}
    309  1.2.4.2  uebayasi 	rw_destroy(&t->t_lock);
    310  1.2.4.2  uebayasi 	kmem_free(t, sizeof(npf_table_t));
    311  1.2.4.2  uebayasi }
    312  1.2.4.2  uebayasi 
    313  1.2.4.2  uebayasi /*
    314  1.2.4.2  uebayasi  * npf_table_ref: holds the reference on table.
    315  1.2.4.2  uebayasi  *
    316  1.2.4.2  uebayasi  * => Table must be locked.
    317  1.2.4.2  uebayasi  */
    318  1.2.4.2  uebayasi void
    319  1.2.4.2  uebayasi npf_table_ref(npf_table_t *t)
    320  1.2.4.2  uebayasi {
    321  1.2.4.2  uebayasi 
    322  1.2.4.2  uebayasi 	KASSERT(rw_lock_held(&t->t_lock));
    323  1.2.4.2  uebayasi 	atomic_inc_uint(&t->t_refcnt);
    324  1.2.4.2  uebayasi }
    325  1.2.4.2  uebayasi 
    326  1.2.4.2  uebayasi /*
    327  1.2.4.2  uebayasi  * npf_table_unref: drop reference from the table and destroy the table if
    328  1.2.4.2  uebayasi  * it is the last reference.
    329  1.2.4.2  uebayasi  */
    330  1.2.4.2  uebayasi void
    331  1.2.4.2  uebayasi npf_table_unref(npf_table_t *t)
    332  1.2.4.2  uebayasi {
    333  1.2.4.2  uebayasi 
    334  1.2.4.2  uebayasi 	if (atomic_dec_uint_nv(&t->t_refcnt) != 0) {
    335  1.2.4.2  uebayasi 		return;
    336  1.2.4.2  uebayasi 	}
    337  1.2.4.2  uebayasi 	npf_table_destroy(t);
    338  1.2.4.2  uebayasi }
    339  1.2.4.2  uebayasi 
    340  1.2.4.2  uebayasi /*
    341  1.2.4.2  uebayasi  * npf_table_get: find the table according to ID and "get it" by locking it.
    342  1.2.4.2  uebayasi  */
    343  1.2.4.2  uebayasi npf_table_t *
    344  1.2.4.2  uebayasi npf_table_get(npf_tableset_t *tset, u_int tid)
    345  1.2.4.2  uebayasi {
    346  1.2.4.2  uebayasi 	npf_table_t *t;
    347  1.2.4.2  uebayasi 
    348  1.2.4.2  uebayasi 	if ((u_int)tid >= NPF_TABLE_SLOTS) {
    349  1.2.4.2  uebayasi 		return NULL;
    350  1.2.4.2  uebayasi 	}
    351  1.2.4.2  uebayasi 	if (tset) {
    352  1.2.4.2  uebayasi 		t = tset[tid];
    353  1.2.4.2  uebayasi 		if (t != NULL) {
    354  1.2.4.2  uebayasi 			rw_enter(&t->t_lock, RW_READER);
    355  1.2.4.2  uebayasi 		}
    356  1.2.4.2  uebayasi 		return t;
    357  1.2.4.2  uebayasi 	}
    358  1.2.4.2  uebayasi 	rw_enter(&table_lock, RW_READER);
    359  1.2.4.2  uebayasi 	t = table_array[tid];
    360  1.2.4.2  uebayasi 	if (t != NULL) {
    361  1.2.4.2  uebayasi 		rw_enter(&t->t_lock, RW_READER);
    362  1.2.4.2  uebayasi 	}
    363  1.2.4.2  uebayasi 	rw_exit(&table_lock);
    364  1.2.4.2  uebayasi 	return t;
    365  1.2.4.2  uebayasi }
    366  1.2.4.2  uebayasi 
    367  1.2.4.2  uebayasi /*
    368  1.2.4.2  uebayasi  * npf_table_put: "put table back" by unlocking it.
    369  1.2.4.2  uebayasi  */
    370  1.2.4.2  uebayasi void
    371  1.2.4.2  uebayasi npf_table_put(npf_table_t *t)
    372  1.2.4.2  uebayasi {
    373  1.2.4.2  uebayasi 
    374  1.2.4.2  uebayasi 	rw_exit(&t->t_lock);
    375  1.2.4.2  uebayasi }
    376  1.2.4.2  uebayasi 
    377  1.2.4.2  uebayasi /*
    378  1.2.4.2  uebayasi  * npf_table_check: validate ID and type.
    379  1.2.4.2  uebayasi  * */
    380  1.2.4.2  uebayasi int
    381  1.2.4.2  uebayasi npf_table_check(npf_tableset_t *tset, u_int tid, int type)
    382  1.2.4.2  uebayasi {
    383  1.2.4.2  uebayasi 
    384  1.2.4.2  uebayasi 	if ((u_int)tid >= NPF_TABLE_SLOTS) {
    385  1.2.4.2  uebayasi 		return EINVAL;
    386  1.2.4.2  uebayasi 	}
    387  1.2.4.2  uebayasi 	if (tset[tid] != NULL) {
    388  1.2.4.2  uebayasi 		return EEXIST;
    389  1.2.4.2  uebayasi 	}
    390  1.2.4.2  uebayasi 	if (type != NPF_TABLE_RBTREE && type != NPF_TABLE_HASH) {
    391  1.2.4.2  uebayasi 		return EINVAL;
    392  1.2.4.2  uebayasi 	}
    393  1.2.4.2  uebayasi 	return 0;
    394  1.2.4.2  uebayasi }
    395  1.2.4.2  uebayasi 
    396  1.2.4.2  uebayasi /*
    397  1.2.4.2  uebayasi  * npf_table_add_v4cidr: add an IPv4 CIDR into the table.
    398  1.2.4.2  uebayasi  */
    399  1.2.4.2  uebayasi int
    400  1.2.4.2  uebayasi npf_table_add_v4cidr(npf_tableset_t *tset, u_int tid,
    401  1.2.4.2  uebayasi     in_addr_t addr, in_addr_t mask)
    402  1.2.4.2  uebayasi {
    403  1.2.4.2  uebayasi 	struct npf_hashl *htbl;
    404  1.2.4.2  uebayasi 	npf_tblent_t *e, *it;
    405  1.2.4.2  uebayasi 	npf_table_t *t;
    406  1.2.4.2  uebayasi 	in_addr_t val;
    407  1.2.4.2  uebayasi 	int error = 0;
    408  1.2.4.2  uebayasi 
    409  1.2.4.2  uebayasi 	/* Allocate and setup entry. */
    410  1.2.4.2  uebayasi 	e = pool_cache_get(tblent_cache, PR_WAITOK);
    411  1.2.4.2  uebayasi 	if (e == NULL) {
    412  1.2.4.2  uebayasi 		return ENOMEM;
    413  1.2.4.2  uebayasi 	}
    414  1.2.4.2  uebayasi 	e->te_addr = addr;
    415  1.2.4.2  uebayasi 	e->te_mask = mask;
    416  1.2.4.2  uebayasi 
    417  1.2.4.2  uebayasi 	/* Locks the table. */
    418  1.2.4.2  uebayasi 	t = npf_table_get(tset, tid);
    419  1.2.4.2  uebayasi 	if (__predict_false(t == NULL)) {
    420  1.2.4.2  uebayasi 		pool_cache_put(tblent_cache, e);
    421  1.2.4.2  uebayasi 		return EINVAL;
    422  1.2.4.2  uebayasi 	}
    423  1.2.4.2  uebayasi 	switch (t->t_type) {
    424  1.2.4.2  uebayasi 	case NPF_TABLE_HASH:
    425  1.2.4.2  uebayasi 		/* Generate hash value from: address & mask. */
    426  1.2.4.2  uebayasi 		val = addr & mask;
    427  1.2.4.2  uebayasi 		htbl = table_hash_bucket(t, &val, sizeof(in_addr_t));
    428  1.2.4.2  uebayasi 		/* Lookup to check for duplicates. */
    429  1.2.4.2  uebayasi 		LIST_FOREACH(it, htbl, te_entry.hashq) {
    430  1.2.4.2  uebayasi 			if (it->te_addr == addr && it->te_mask == mask)
    431  1.2.4.2  uebayasi 				break;
    432  1.2.4.2  uebayasi 		}
    433  1.2.4.2  uebayasi 		/* If no duplicate - insert entry. */
    434  1.2.4.2  uebayasi 		if (__predict_true(it == NULL)) {
    435  1.2.4.2  uebayasi 			LIST_INSERT_HEAD(htbl, e, te_entry.hashq);
    436  1.2.4.2  uebayasi 		} else {
    437  1.2.4.2  uebayasi 			error = EEXIST;
    438  1.2.4.2  uebayasi 		}
    439  1.2.4.2  uebayasi 		break;
    440  1.2.4.2  uebayasi 	case NPF_TABLE_RBTREE:
    441  1.2.4.2  uebayasi 		/* Insert entry.  Returns false, if duplicate. */
    442  1.2.4.2  uebayasi 		if (rb_tree_insert_node(&t->t_rbtree, e) != e) {
    443  1.2.4.2  uebayasi 			error = EEXIST;
    444  1.2.4.2  uebayasi 		}
    445  1.2.4.2  uebayasi 		break;
    446  1.2.4.2  uebayasi 	default:
    447  1.2.4.2  uebayasi 		KASSERT(false);
    448  1.2.4.2  uebayasi 	}
    449  1.2.4.2  uebayasi 	npf_table_put(t);
    450  1.2.4.2  uebayasi 
    451  1.2.4.2  uebayasi 	if (__predict_false(error)) {
    452  1.2.4.2  uebayasi 		pool_cache_put(tblent_cache, e);
    453  1.2.4.2  uebayasi 	}
    454  1.2.4.2  uebayasi 	return error;
    455  1.2.4.2  uebayasi }
    456  1.2.4.2  uebayasi 
    457  1.2.4.2  uebayasi /*
    458  1.2.4.2  uebayasi  * npf_table_rem_v4cidr: remove an IPv4 CIDR from the table.
    459  1.2.4.2  uebayasi  */
    460  1.2.4.2  uebayasi int
    461  1.2.4.2  uebayasi npf_table_rem_v4cidr(npf_tableset_t *tset, u_int tid,
    462  1.2.4.2  uebayasi     in_addr_t addr, in_addr_t mask)
    463  1.2.4.2  uebayasi {
    464  1.2.4.2  uebayasi 	struct npf_hashl *htbl;
    465  1.2.4.2  uebayasi 	npf_tblent_t *e;
    466  1.2.4.2  uebayasi 	npf_table_t *t;
    467  1.2.4.2  uebayasi 	in_addr_t val;
    468  1.2.4.2  uebayasi 	int error;
    469  1.2.4.2  uebayasi 
    470  1.2.4.2  uebayasi 	e = NULL;
    471  1.2.4.2  uebayasi 
    472  1.2.4.2  uebayasi 	/* Locks the table. */
    473  1.2.4.2  uebayasi 	t = npf_table_get(tset, tid);
    474  1.2.4.2  uebayasi 	if (__predict_false(t == NULL)) {
    475  1.2.4.2  uebayasi 		return EINVAL;
    476  1.2.4.2  uebayasi 	}
    477  1.2.4.2  uebayasi 	/* Lookup & remove. */
    478  1.2.4.2  uebayasi 	switch (t->t_type) {
    479  1.2.4.2  uebayasi 	case NPF_TABLE_HASH:
    480  1.2.4.2  uebayasi 		/* Generate hash value from: (address & mask). */
    481  1.2.4.2  uebayasi 		val = addr & mask;
    482  1.2.4.2  uebayasi 		htbl = table_hash_bucket(t, &val, sizeof(in_addr_t));
    483  1.2.4.2  uebayasi 		LIST_FOREACH(e, htbl, te_entry.hashq) {
    484  1.2.4.2  uebayasi 			if (e->te_addr == addr && e->te_mask == mask)
    485  1.2.4.2  uebayasi 				break;
    486  1.2.4.2  uebayasi 		}
    487  1.2.4.2  uebayasi 		if (__predict_true(e != NULL)) {
    488  1.2.4.2  uebayasi 			LIST_REMOVE(e, te_entry.hashq);
    489  1.2.4.2  uebayasi 		} else {
    490  1.2.4.2  uebayasi 			error = ESRCH;
    491  1.2.4.2  uebayasi 		}
    492  1.2.4.2  uebayasi 		break;
    493  1.2.4.2  uebayasi 	case NPF_TABLE_RBTREE:
    494  1.2.4.2  uebayasi 		/* Key: (address & mask). */
    495  1.2.4.2  uebayasi 		val = addr & mask;
    496  1.2.4.2  uebayasi 		e = rb_tree_find_node(&t->t_rbtree, &val);
    497  1.2.4.2  uebayasi 		if (__predict_true(e != NULL)) {
    498  1.2.4.2  uebayasi 			rb_tree_remove_node(&t->t_rbtree, e);
    499  1.2.4.2  uebayasi 		} else {
    500  1.2.4.2  uebayasi 			error = ESRCH;
    501  1.2.4.2  uebayasi 		}
    502  1.2.4.2  uebayasi 		break;
    503  1.2.4.2  uebayasi 	default:
    504  1.2.4.2  uebayasi 		KASSERT(false);
    505  1.2.4.2  uebayasi 	}
    506  1.2.4.2  uebayasi 	npf_table_put(t);
    507  1.2.4.2  uebayasi 
    508  1.2.4.2  uebayasi 	/* Free table the entry. */
    509  1.2.4.2  uebayasi 	if (__predict_true(e != NULL)) {
    510  1.2.4.2  uebayasi 		pool_cache_put(tblent_cache, e);
    511  1.2.4.2  uebayasi 	}
    512  1.2.4.2  uebayasi 	return e ? 0 : -1;
    513  1.2.4.2  uebayasi }
    514  1.2.4.2  uebayasi 
    515  1.2.4.2  uebayasi /*
    516  1.2.4.2  uebayasi  * npf_table_match_v4addr: find the table according to ID, lookup and
    517  1.2.4.2  uebayasi  * match the contents with specified IPv4 address.
    518  1.2.4.2  uebayasi  */
    519  1.2.4.2  uebayasi int
    520  1.2.4.2  uebayasi npf_table_match_v4addr(u_int tid, in_addr_t ip4addr)
    521  1.2.4.2  uebayasi {
    522  1.2.4.2  uebayasi 	struct npf_hashl *htbl;
    523  1.2.4.2  uebayasi 	npf_tblent_t *e;
    524  1.2.4.2  uebayasi 	npf_table_t *t;
    525  1.2.4.2  uebayasi 
    526  1.2.4.2  uebayasi 	e = NULL;
    527  1.2.4.2  uebayasi 
    528  1.2.4.2  uebayasi 	/* Locks the table. */
    529  1.2.4.2  uebayasi 	t = npf_table_get(NULL, tid);
    530  1.2.4.2  uebayasi 	if (__predict_false(t == NULL)) {
    531  1.2.4.2  uebayasi 		return EINVAL;
    532  1.2.4.2  uebayasi 	}
    533  1.2.4.2  uebayasi 	switch (t->t_type) {
    534  1.2.4.2  uebayasi 	case NPF_TABLE_HASH:
    535  1.2.4.2  uebayasi 		htbl = table_hash_bucket(t, &ip4addr, sizeof(in_addr_t));
    536  1.2.4.2  uebayasi 		LIST_FOREACH(e, htbl, te_entry.hashq) {
    537  1.2.4.2  uebayasi 			if ((ip4addr & e->te_mask) == e->te_addr) {
    538  1.2.4.2  uebayasi 				break;
    539  1.2.4.2  uebayasi 			}
    540  1.2.4.2  uebayasi 		}
    541  1.2.4.2  uebayasi 		break;
    542  1.2.4.2  uebayasi 	case NPF_TABLE_RBTREE:
    543  1.2.4.2  uebayasi 		e = rb_tree_find_node(&t->t_rbtree, &ip4addr);
    544  1.2.4.2  uebayasi 		KASSERT((ip4addr & e->te_mask) == e->te_addr);
    545  1.2.4.2  uebayasi 		break;
    546  1.2.4.2  uebayasi 	default:
    547  1.2.4.2  uebayasi 		KASSERT(false);
    548  1.2.4.2  uebayasi 	}
    549  1.2.4.2  uebayasi 	npf_table_put(t);
    550  1.2.4.2  uebayasi 
    551  1.2.4.2  uebayasi 	return e ? 0 : -1;
    552  1.2.4.2  uebayasi }
    553