Home | History | Annotate | Line # | Download | only in npf
npf.c revision 1.2.2.1
      1  1.2.2.1  jruoho /*	$NetBSD: npf.c,v 1.2.2.1 2011/06/06 09:09:53 jruoho Exp $	*/
      2      1.1   rmind 
      3      1.1   rmind /*-
      4      1.1   rmind  * Copyright (c) 2009-2010 The NetBSD Foundation, Inc.
      5      1.1   rmind  * All rights reserved.
      6      1.1   rmind  *
      7      1.1   rmind  * This material is based upon work partially supported by The
      8      1.1   rmind  * NetBSD Foundation under a contract with Mindaugas Rasiukevicius.
      9      1.1   rmind  *
     10      1.1   rmind  * Redistribution and use in source and binary forms, with or without
     11      1.1   rmind  * modification, are permitted provided that the following conditions
     12      1.1   rmind  * are met:
     13      1.1   rmind  * 1. Redistributions of source code must retain the above copyright
     14      1.1   rmind  *    notice, this list of conditions and the following disclaimer.
     15      1.1   rmind  * 2. Redistributions in binary form must reproduce the above copyright
     16      1.1   rmind  *    notice, this list of conditions and the following disclaimer in the
     17      1.1   rmind  *    documentation and/or other materials provided with the distribution.
     18      1.1   rmind  *
     19      1.1   rmind  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20      1.1   rmind  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21      1.1   rmind  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22      1.1   rmind  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23      1.1   rmind  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24      1.1   rmind  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25      1.1   rmind  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26      1.1   rmind  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27      1.1   rmind  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28      1.1   rmind  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29      1.1   rmind  * POSSIBILITY OF SUCH DAMAGE.
     30      1.1   rmind  */
     31      1.1   rmind 
     32      1.1   rmind /*
     33      1.1   rmind  * NPF main: dynamic load/initialisation and unload routines.
     34      1.1   rmind  */
     35      1.1   rmind 
     36      1.1   rmind #include <sys/cdefs.h>
     37  1.2.2.1  jruoho __KERNEL_RCSID(0, "$NetBSD: npf.c,v 1.2.2.1 2011/06/06 09:09:53 jruoho Exp $");
     38      1.1   rmind 
     39      1.1   rmind #include <sys/param.h>
     40      1.1   rmind #include <sys/types.h>
     41      1.1   rmind 
     42      1.2   rmind #include <sys/atomic.h>
     43      1.1   rmind #include <sys/conf.h>
     44      1.1   rmind #include <sys/kauth.h>
     45      1.2   rmind #include <sys/kmem.h>
     46      1.1   rmind #include <sys/lwp.h>
     47      1.1   rmind #include <sys/module.h>
     48      1.2   rmind #include <sys/percpu.h>
     49      1.2   rmind #include <sys/rwlock.h>
     50      1.1   rmind #include <sys/socketvar.h>
     51      1.1   rmind #include <sys/uio.h>
     52      1.1   rmind 
     53      1.1   rmind #include "npf_impl.h"
     54      1.1   rmind 
     55      1.1   rmind /*
     56      1.1   rmind  * Module and device structures.
     57      1.1   rmind  */
     58      1.1   rmind MODULE(MODULE_CLASS_MISC, npf, NULL);
     59      1.1   rmind 
     60      1.1   rmind void		npfattach(int);
     61      1.1   rmind 
     62  1.2.2.1  jruoho static int	npf_fini(void);
     63      1.1   rmind static int	npf_dev_open(dev_t, int, int, lwp_t *);
     64      1.1   rmind static int	npf_dev_close(dev_t, int, int, lwp_t *);
     65      1.1   rmind static int	npf_dev_ioctl(dev_t, u_long, void *, int, lwp_t *);
     66      1.1   rmind static int	npf_dev_poll(dev_t, int, lwp_t *);
     67      1.1   rmind static int	npf_dev_read(dev_t, struct uio *, int);
     68      1.1   rmind 
     69      1.2   rmind typedef struct {
     70      1.2   rmind 	npf_ruleset_t *		n_rules;
     71      1.2   rmind 	npf_tableset_t *	n_tables;
     72      1.2   rmind 	npf_ruleset_t *		n_nat_rules;
     73      1.2   rmind } npf_core_t;
     74      1.2   rmind 
     75      1.2   rmind static void	npf_core_destroy(npf_core_t *);
     76      1.2   rmind static int	npfctl_stats(void *);
     77      1.2   rmind 
     78      1.2   rmind static krwlock_t		npf_lock		__cacheline_aligned;
     79      1.2   rmind static npf_core_t *		npf_core		__cacheline_aligned;
     80      1.2   rmind static percpu_t *		npf_stats_percpu	__read_mostly;
     81      1.2   rmind 
     82      1.1   rmind const struct cdevsw npf_cdevsw = {
     83      1.1   rmind 	npf_dev_open, npf_dev_close, npf_dev_read, nowrite, npf_dev_ioctl,
     84      1.1   rmind 	nostop, notty, npf_dev_poll, nommap, nokqfilter, D_OTHER | D_MPSAFE
     85      1.1   rmind };
     86      1.1   rmind 
     87      1.1   rmind static int
     88      1.1   rmind npf_init(void)
     89      1.1   rmind {
     90      1.1   rmind #ifdef _MODULE
     91      1.1   rmind 	devmajor_t bmajor = NODEVMAJOR, cmajor = NODEVMAJOR;
     92      1.1   rmind #endif
     93      1.2   rmind 	npf_ruleset_t *rset, *nset;
     94      1.2   rmind 	npf_tableset_t *tset;
     95      1.2   rmind 	int error = 0;
     96      1.2   rmind 
     97      1.2   rmind 	rw_init(&npf_lock);
     98      1.2   rmind 	npf_stats_percpu = percpu_alloc(NPF_STATS_SIZE);
     99      1.2   rmind 	npf_tableset_sysinit();
    100      1.2   rmind 	npf_session_sysinit();
    101      1.1   rmind 	npf_nat_sysinit();
    102      1.1   rmind 	npf_alg_sysinit();
    103      1.2   rmind 	npflogattach(1);
    104      1.2   rmind 
    105      1.2   rmind 	/* Load empty configuration. */
    106      1.2   rmind 	rset = npf_ruleset_create();
    107      1.2   rmind 	tset = npf_tableset_create();
    108      1.2   rmind 	nset = npf_ruleset_create();
    109      1.2   rmind 	npf_reload(rset, tset, nset);
    110      1.2   rmind 	KASSERT(npf_core != NULL);
    111      1.1   rmind 
    112      1.1   rmind #ifdef _MODULE
    113      1.1   rmind 	/* Attach /dev/npf device. */
    114      1.1   rmind 	error = devsw_attach("npf", NULL, &bmajor, &npf_cdevsw, &cmajor);
    115      1.1   rmind 	if (error) {
    116      1.2   rmind 		/* It will call devsw_detach(), which is safe. */
    117      1.2   rmind 		(void)npf_fini();
    118      1.1   rmind 	}
    119      1.1   rmind #endif
    120      1.1   rmind 	return error;
    121      1.1   rmind }
    122      1.1   rmind 
    123      1.1   rmind static int
    124      1.1   rmind npf_fini(void)
    125      1.1   rmind {
    126      1.1   rmind 
    127      1.2   rmind 	/*
    128      1.2   rmind 	 * At first, detach device, remove pfil hooks and unload existing
    129      1.2   rmind 	 * configuration, destroy structures.
    130      1.2   rmind 	 */
    131      1.1   rmind #ifdef _MODULE
    132      1.1   rmind 	devsw_detach(NULL, &npf_cdevsw);
    133      1.1   rmind #endif
    134      1.2   rmind 	npf_unregister_pfil();
    135      1.2   rmind 	npf_core_destroy(npf_core);
    136      1.2   rmind 	npflogdetach();
    137      1.2   rmind 
    138      1.2   rmind 	/* Note: order is particular. */
    139      1.1   rmind 	npf_nat_sysfini();
    140      1.1   rmind 	npf_alg_sysfini();
    141      1.1   rmind 	npf_session_sysfini();
    142      1.1   rmind 	npf_tableset_sysfini();
    143      1.2   rmind 	percpu_free(npf_stats_percpu, NPF_STATS_SIZE);
    144      1.2   rmind 	rw_destroy(&npf_lock);
    145      1.1   rmind 
    146      1.1   rmind 	return 0;
    147      1.1   rmind }
    148      1.1   rmind 
    149      1.1   rmind /*
    150      1.1   rmind  * Module interface.
    151      1.1   rmind  */
    152      1.1   rmind static int
    153      1.1   rmind npf_modcmd(modcmd_t cmd, void *arg)
    154      1.1   rmind {
    155      1.1   rmind 
    156      1.1   rmind 	switch (cmd) {
    157      1.1   rmind 	case MODULE_CMD_INIT:
    158      1.1   rmind 		return npf_init();
    159      1.1   rmind 	case MODULE_CMD_FINI:
    160      1.1   rmind 		return npf_fini();
    161      1.1   rmind 	default:
    162      1.1   rmind 		return ENOTTY;
    163      1.1   rmind 	}
    164      1.1   rmind 	return 0;
    165      1.1   rmind }
    166      1.1   rmind 
/*
 * npfattach: attach entry point.  Intentionally empty; 'nunits' is
 * ignored.
 */
void
npfattach(int nunits)
{

	/* Nothing to do. */
}
    173      1.1   rmind 
    174      1.1   rmind static int
    175      1.1   rmind npf_dev_open(dev_t dev, int flag, int mode, lwp_t *l)
    176      1.1   rmind {
    177      1.1   rmind 
    178      1.1   rmind 	/* Available only for super-user. */
    179      1.1   rmind 	if (kauth_authorize_generic(l->l_cred, KAUTH_GENERIC_ISSUSER, NULL)) {
    180      1.1   rmind 		return EPERM;
    181      1.1   rmind 	}
    182      1.1   rmind 	return 0;
    183      1.1   rmind }
    184      1.1   rmind 
    185      1.1   rmind static int
    186      1.1   rmind npf_dev_close(dev_t dev, int flag, int mode, lwp_t *l)
    187      1.1   rmind {
    188      1.1   rmind 
    189      1.1   rmind 	return 0;
    190      1.1   rmind }
    191      1.1   rmind 
    192      1.1   rmind static int
    193      1.1   rmind npf_dev_ioctl(dev_t dev, u_long cmd, void *data, int flag, lwp_t *l)
    194      1.1   rmind {
    195      1.1   rmind 	int error;
    196      1.1   rmind 
    197      1.1   rmind 	/* Available only for super-user. */
    198      1.1   rmind 	if (kauth_authorize_generic(l->l_cred, KAUTH_GENERIC_ISSUSER, NULL)) {
    199      1.1   rmind 		return EPERM;
    200      1.1   rmind 	}
    201      1.1   rmind 
    202      1.1   rmind 	switch (cmd) {
    203      1.1   rmind 	case IOC_NPF_VERSION:
    204      1.1   rmind 		*(int *)data = NPF_VERSION;
    205      1.1   rmind 		error = 0;
    206      1.1   rmind 		break;
    207      1.1   rmind 	case IOC_NPF_SWITCH:
    208      1.1   rmind 		error = npfctl_switch(data);
    209      1.1   rmind 		break;
    210      1.1   rmind 	case IOC_NPF_RELOAD:
    211      1.1   rmind 		error = npfctl_reload(cmd, data);
    212      1.1   rmind 		break;
    213      1.1   rmind 	case IOC_NPF_TABLE:
    214      1.1   rmind 		error = npfctl_table(data);
    215      1.1   rmind 		break;
    216      1.2   rmind 	case IOC_NPF_STATS:
    217      1.2   rmind 		error = npfctl_stats(data);
    218      1.2   rmind 		break;
    219      1.2   rmind 	case IOC_NPF_SESSIONS_SAVE:
    220      1.2   rmind 		error = npfctl_sessions_save(cmd, data);
    221      1.2   rmind 		break;
    222      1.2   rmind 	case IOC_NPF_SESSIONS_LOAD:
    223      1.2   rmind 		error = npfctl_sessions_load(cmd, data);
    224      1.2   rmind 		break;
    225  1.2.2.1  jruoho 	case IOC_NPF_UPDATE_RULE:
    226  1.2.2.1  jruoho 		error = npfctl_update_rule(cmd, data);
    227  1.2.2.1  jruoho 		break;
    228      1.1   rmind 	default:
    229      1.1   rmind 		error = ENOTTY;
    230      1.1   rmind 		break;
    231      1.1   rmind 	}
    232      1.1   rmind 	return error;
    233      1.1   rmind }
    234      1.1   rmind 
    235      1.1   rmind static int
    236      1.1   rmind npf_dev_poll(dev_t dev, int events, lwp_t *l)
    237      1.1   rmind {
    238      1.1   rmind 
    239      1.1   rmind 	return ENOTSUP;
    240      1.1   rmind }
    241      1.1   rmind 
    242      1.1   rmind static int
    243      1.1   rmind npf_dev_read(dev_t dev, struct uio *uio, int flag)
    244      1.1   rmind {
    245      1.1   rmind 
    246      1.1   rmind 	return ENOTSUP;
    247      1.1   rmind }
    248      1.2   rmind 
    249      1.2   rmind /*
    250      1.2   rmind  * NPF core loading/reloading/unloading mechanism.
    251      1.2   rmind  */
    252      1.2   rmind 
    253      1.2   rmind static void
    254      1.2   rmind npf_core_destroy(npf_core_t *nc)
    255      1.2   rmind {
    256      1.2   rmind 
    257      1.2   rmind 	npf_ruleset_destroy(nc->n_rules);
    258      1.2   rmind 	npf_ruleset_destroy(nc->n_nat_rules);
    259  1.2.2.1  jruoho 	npf_tableset_destroy(nc->n_tables);
    260      1.2   rmind 	kmem_free(nc, sizeof(npf_core_t));
    261      1.2   rmind }
    262      1.2   rmind 
    263      1.2   rmind /*
    264      1.2   rmind  * npf_reload: atomically load new ruleset, tableset and NAT policies.
    265      1.2   rmind  * Then destroy old (unloaded) structures.
    266      1.2   rmind  */
    267      1.2   rmind void
    268      1.2   rmind npf_reload(npf_ruleset_t *rset, npf_tableset_t *tset, npf_ruleset_t *nset)
    269      1.2   rmind {
    270      1.2   rmind 	npf_core_t *nc, *onc;
    271      1.2   rmind 
    272      1.2   rmind 	/* Setup a new core structure. */
    273      1.2   rmind 	nc = kmem_alloc(sizeof(npf_core_t), KM_SLEEP);
    274      1.2   rmind 	nc->n_rules = rset;
    275      1.2   rmind 	nc->n_tables = tset;
    276      1.2   rmind 	nc->n_nat_rules = nset;
    277      1.2   rmind 
    278      1.2   rmind 	/* Lock and load the core structure. */
    279      1.2   rmind 	rw_enter(&npf_lock, RW_WRITER);
    280      1.2   rmind 	onc = atomic_swap_ptr(&npf_core, nc);
    281      1.2   rmind 	if (onc) {
    282      1.2   rmind 		/* Reload only necessary NAT policies. */
    283      1.2   rmind 		npf_ruleset_natreload(nset, onc->n_nat_rules);
    284      1.2   rmind 	}
    285      1.2   rmind 	/* Unlock.  Everything goes "live" now. */
    286      1.2   rmind 	rw_exit(&npf_lock);
    287      1.2   rmind 
    288      1.2   rmind 	/* Turn on/off session tracking accordingly. */
    289      1.2   rmind 	npf_session_tracking(true);
    290      1.2   rmind 
    291      1.2   rmind 	if (onc) {
    292      1.2   rmind 		/* Destroy unloaded structures. */
    293      1.2   rmind 		npf_core_destroy(onc);
    294      1.2   rmind 	}
    295      1.2   rmind }
    296      1.2   rmind 
    297      1.2   rmind void
    298      1.2   rmind npf_core_enter(void)
    299      1.2   rmind {
    300      1.2   rmind 	rw_enter(&npf_lock, RW_READER);
    301      1.2   rmind }
    302      1.2   rmind 
    303      1.2   rmind npf_ruleset_t *
    304      1.2   rmind npf_core_ruleset(void)
    305      1.2   rmind {
    306      1.2   rmind 	KASSERT(rw_lock_held(&npf_lock));
    307      1.2   rmind 	return npf_core->n_rules;
    308      1.2   rmind }
    309      1.2   rmind 
    310      1.2   rmind npf_ruleset_t *
    311      1.2   rmind npf_core_natset(void)
    312      1.2   rmind {
    313      1.2   rmind 	KASSERT(rw_lock_held(&npf_lock));
    314      1.2   rmind 	return npf_core->n_nat_rules;
    315      1.2   rmind }
    316      1.2   rmind 
    317      1.2   rmind npf_tableset_t *
    318      1.2   rmind npf_core_tableset(void)
    319      1.2   rmind {
    320      1.2   rmind 	KASSERT(rw_lock_held(&npf_lock));
    321      1.2   rmind 	return npf_core->n_tables;
    322      1.2   rmind }
    323      1.2   rmind 
    324      1.2   rmind void
    325      1.2   rmind npf_core_exit(void)
    326      1.2   rmind {
    327      1.2   rmind 	rw_exit(&npf_lock);
    328      1.2   rmind }
    329      1.2   rmind 
    330      1.2   rmind bool
    331      1.2   rmind npf_core_locked(void)
    332      1.2   rmind {
    333      1.2   rmind 	return rw_lock_held(&npf_lock);
    334      1.2   rmind }
    335      1.2   rmind 
    336      1.2   rmind /*
    337      1.2   rmind  * NPF statistics interface.
    338      1.2   rmind  */
    339      1.2   rmind 
    340      1.2   rmind void
    341      1.2   rmind npf_stats_inc(npf_stats_t st)
    342      1.2   rmind {
    343      1.2   rmind 	uint64_t *stats = percpu_getref(npf_stats_percpu);
    344      1.2   rmind 	stats[st]++;
    345      1.2   rmind 	percpu_putref(npf_stats_percpu);
    346      1.2   rmind }
    347      1.2   rmind 
    348      1.2   rmind void
    349      1.2   rmind npf_stats_dec(npf_stats_t st)
    350      1.2   rmind {
    351      1.2   rmind 	uint64_t *stats = percpu_getref(npf_stats_percpu);
    352      1.2   rmind 	stats[st]--;
    353      1.2   rmind 	percpu_putref(npf_stats_percpu);
    354      1.2   rmind }
    355      1.2   rmind 
    356      1.2   rmind static void
    357      1.2   rmind npf_stats_collect(void *mem, void *arg, struct cpu_info *ci)
    358      1.2   rmind {
    359      1.2   rmind 	uint64_t *percpu_stats = mem, *full_stats = arg;
    360      1.2   rmind 	int i;
    361      1.2   rmind 
    362      1.2   rmind 	for (i = 0; i < NPF_STATS_COUNT; i++) {
    363      1.2   rmind 		full_stats[i] += percpu_stats[i];
    364      1.2   rmind 	}
    365      1.2   rmind }
    366      1.2   rmind 
    367      1.2   rmind /*
    368      1.2   rmind  * npfctl_stats: export collected statistics.
    369      1.2   rmind  */
    370      1.2   rmind static int
    371      1.2   rmind npfctl_stats(void *data)
    372      1.2   rmind {
    373      1.2   rmind 	uint64_t *fullst, *uptr = *(uint64_t **)data;
    374      1.2   rmind 	int error;
    375      1.2   rmind 
    376      1.2   rmind 	fullst = kmem_zalloc(NPF_STATS_SIZE, KM_SLEEP);
    377      1.2   rmind 	percpu_foreach(npf_stats_percpu, npf_stats_collect, fullst);
    378      1.2   rmind 	error = copyout(fullst, uptr, NPF_STATS_SIZE);
    379      1.2   rmind 	kmem_free(fullst, NPF_STATS_SIZE);
    380      1.2   rmind 	return error;
    381      1.2   rmind }
    382