Home | History | Annotate | Line # | Download | only in npf
npf.c revision 1.7.2.3
      1  1.7.2.3    riz /*	$NetBSD: npf.c,v 1.7.2.3 2012/07/16 22:13:27 riz Exp $	*/
      2      1.1  rmind 
      3      1.1  rmind /*-
      4      1.1  rmind  * Copyright (c) 2009-2010 The NetBSD Foundation, Inc.
      5      1.1  rmind  * All rights reserved.
      6      1.1  rmind  *
      7      1.1  rmind  * This material is based upon work partially supported by The
      8      1.1  rmind  * NetBSD Foundation under a contract with Mindaugas Rasiukevicius.
      9      1.1  rmind  *
     10      1.1  rmind  * Redistribution and use in source and binary forms, with or without
     11      1.1  rmind  * modification, are permitted provided that the following conditions
     12      1.1  rmind  * are met:
     13      1.1  rmind  * 1. Redistributions of source code must retain the above copyright
     14      1.1  rmind  *    notice, this list of conditions and the following disclaimer.
     15      1.1  rmind  * 2. Redistributions in binary form must reproduce the above copyright
     16      1.1  rmind  *    notice, this list of conditions and the following disclaimer in the
     17      1.1  rmind  *    documentation and/or other materials provided with the distribution.
     18      1.1  rmind  *
     19      1.1  rmind  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20      1.1  rmind  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21      1.1  rmind  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22      1.1  rmind  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23      1.1  rmind  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24      1.1  rmind  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25      1.1  rmind  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26      1.1  rmind  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27      1.1  rmind  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28      1.1  rmind  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29      1.1  rmind  * POSSIBILITY OF SUCH DAMAGE.
     30      1.1  rmind  */
     31      1.1  rmind 
     32      1.1  rmind /*
     33      1.1  rmind  * NPF main: dynamic load/initialisation and unload routines.
     34      1.1  rmind  */
     35      1.1  rmind 
     36      1.1  rmind #include <sys/cdefs.h>
     37  1.7.2.3    riz __KERNEL_RCSID(0, "$NetBSD: npf.c,v 1.7.2.3 2012/07/16 22:13:27 riz Exp $");
     38      1.1  rmind 
     39      1.1  rmind #include <sys/param.h>
     40      1.1  rmind #include <sys/types.h>
     41      1.1  rmind 
     42      1.2  rmind #include <sys/atomic.h>
     43      1.1  rmind #include <sys/conf.h>
     44      1.1  rmind #include <sys/kauth.h>
     45      1.2  rmind #include <sys/kmem.h>
     46      1.1  rmind #include <sys/lwp.h>
     47      1.1  rmind #include <sys/module.h>
     48      1.2  rmind #include <sys/percpu.h>
     49      1.2  rmind #include <sys/rwlock.h>
     50      1.1  rmind #include <sys/socketvar.h>
     51  1.7.2.2    riz #include <sys/sysctl.h>
     52      1.1  rmind #include <sys/uio.h>
     53      1.1  rmind 
     54      1.1  rmind #include "npf_impl.h"
     55      1.1  rmind 
     56      1.1  rmind /*
     57      1.1  rmind  * Module and device structures.
     58      1.1  rmind  */
     59      1.6   tron MODULE(MODULE_CLASS_DRIVER, npf, NULL);
     60      1.1  rmind 
     61      1.1  rmind void		npfattach(int);
     62      1.1  rmind 
     63      1.5   yamt static int	npf_fini(void);
     64      1.1  rmind static int	npf_dev_open(dev_t, int, int, lwp_t *);
     65      1.1  rmind static int	npf_dev_close(dev_t, int, int, lwp_t *);
     66      1.1  rmind static int	npf_dev_ioctl(dev_t, u_long, void *, int, lwp_t *);
     67      1.1  rmind static int	npf_dev_poll(dev_t, int, lwp_t *);
     68      1.1  rmind static int	npf_dev_read(dev_t, struct uio *, int);
     69      1.1  rmind 
     70      1.2  rmind typedef struct {
     71      1.2  rmind 	npf_ruleset_t *		n_rules;
     72      1.2  rmind 	npf_tableset_t *	n_tables;
     73      1.2  rmind 	npf_ruleset_t *		n_nat_rules;
     74  1.7.2.1    riz 	prop_dictionary_t	n_dict;
     75  1.7.2.1    riz 	bool			n_default_pass;
     76      1.2  rmind } npf_core_t;
     77      1.2  rmind 
     78      1.2  rmind static void	npf_core_destroy(npf_core_t *);
     79      1.2  rmind static int	npfctl_stats(void *);
     80      1.2  rmind 
     81      1.2  rmind static krwlock_t		npf_lock		__cacheline_aligned;
     82      1.2  rmind static npf_core_t *		npf_core		__cacheline_aligned;
     83      1.2  rmind static percpu_t *		npf_stats_percpu	__read_mostly;
     84  1.7.2.2    riz static struct sysctllog *	npf_sysctl		__read_mostly;
     85      1.2  rmind 
     86      1.1  rmind const struct cdevsw npf_cdevsw = {
     87      1.1  rmind 	npf_dev_open, npf_dev_close, npf_dev_read, nowrite, npf_dev_ioctl,
     88      1.1  rmind 	nostop, notty, npf_dev_poll, nommap, nokqfilter, D_OTHER | D_MPSAFE
     89      1.1  rmind };
     90      1.1  rmind 
     91      1.1  rmind static int
     92      1.1  rmind npf_init(void)
     93      1.1  rmind {
     94      1.1  rmind #ifdef _MODULE
     95      1.1  rmind 	devmajor_t bmajor = NODEVMAJOR, cmajor = NODEVMAJOR;
     96      1.1  rmind #endif
     97      1.2  rmind 	npf_ruleset_t *rset, *nset;
     98      1.2  rmind 	npf_tableset_t *tset;
     99  1.7.2.1    riz 	prop_dictionary_t dict;
    100      1.2  rmind 	int error = 0;
    101      1.2  rmind 
    102      1.2  rmind 	rw_init(&npf_lock);
    103      1.2  rmind 	npf_stats_percpu = percpu_alloc(NPF_STATS_SIZE);
    104  1.7.2.2    riz 	npf_sysctl = NULL;
    105  1.7.2.2    riz 
    106      1.2  rmind 	npf_tableset_sysinit();
    107      1.2  rmind 	npf_session_sysinit();
    108      1.1  rmind 	npf_nat_sysinit();
    109      1.1  rmind 	npf_alg_sysinit();
    110      1.2  rmind 	npflogattach(1);
    111      1.2  rmind 
    112      1.2  rmind 	/* Load empty configuration. */
    113  1.7.2.1    riz 	dict = prop_dictionary_create();
    114      1.2  rmind 	rset = npf_ruleset_create();
    115      1.2  rmind 	tset = npf_tableset_create();
    116      1.2  rmind 	nset = npf_ruleset_create();
    117  1.7.2.1    riz 	npf_reload(dict, rset, tset, nset, true);
    118      1.2  rmind 	KASSERT(npf_core != NULL);
    119      1.1  rmind 
    120      1.1  rmind #ifdef _MODULE
    121      1.1  rmind 	/* Attach /dev/npf device. */
    122      1.1  rmind 	error = devsw_attach("npf", NULL, &bmajor, &npf_cdevsw, &cmajor);
    123      1.1  rmind 	if (error) {
    124      1.2  rmind 		/* It will call devsw_detach(), which is safe. */
    125      1.2  rmind 		(void)npf_fini();
    126      1.1  rmind 	}
    127      1.1  rmind #endif
    128      1.1  rmind 	return error;
    129      1.1  rmind }
    130      1.1  rmind 
    131      1.1  rmind static int
    132      1.1  rmind npf_fini(void)
    133      1.1  rmind {
    134      1.1  rmind 
    135  1.7.2.1    riz 	/* At first, detach device and remove pfil hooks. */
    136      1.1  rmind #ifdef _MODULE
    137      1.1  rmind 	devsw_detach(NULL, &npf_cdevsw);
    138      1.1  rmind #endif
    139      1.2  rmind 	npflogdetach();
    140  1.7.2.1    riz 	npf_pfil_unregister();
    141      1.2  rmind 
    142  1.7.2.1    riz 	/* Flush all sessions, destroy configuration (ruleset, etc). */
    143  1.7.2.1    riz 	npf_session_tracking(false);
    144  1.7.2.1    riz 	npf_core_destroy(npf_core);
    145  1.7.2.1    riz 
    146  1.7.2.1    riz 	/* Finally, safe to destroy the subsystems. */
    147      1.1  rmind 	npf_alg_sysfini();
    148  1.7.2.1    riz 	npf_nat_sysfini();
    149      1.1  rmind 	npf_session_sysfini();
    150      1.1  rmind 	npf_tableset_sysfini();
    151  1.7.2.2    riz 
    152  1.7.2.2    riz 	if (npf_sysctl) {
    153  1.7.2.2    riz 		sysctl_teardown(&npf_sysctl);
    154  1.7.2.2    riz 	}
    155      1.2  rmind 	percpu_free(npf_stats_percpu, NPF_STATS_SIZE);
    156      1.2  rmind 	rw_destroy(&npf_lock);
    157      1.1  rmind 
    158      1.1  rmind 	return 0;
    159      1.1  rmind }
    160      1.1  rmind 
    161      1.1  rmind /*
    162      1.1  rmind  * Module interface.
    163      1.1  rmind  */
    164      1.1  rmind static int
    165      1.1  rmind npf_modcmd(modcmd_t cmd, void *arg)
    166      1.1  rmind {
    167      1.1  rmind 
    168      1.1  rmind 	switch (cmd) {
    169      1.1  rmind 	case MODULE_CMD_INIT:
    170      1.1  rmind 		return npf_init();
    171      1.1  rmind 	case MODULE_CMD_FINI:
    172      1.1  rmind 		return npf_fini();
    173  1.7.2.3    riz 	case MODULE_CMD_AUTOUNLOAD:
    174  1.7.2.3    riz 		if (npf_pfil_registered_p() || !npf_default_pass()) {
    175  1.7.2.3    riz 			return EBUSY;
    176  1.7.2.3    riz 		}
    177  1.7.2.3    riz 		break;
    178      1.1  rmind 	default:
    179      1.1  rmind 		return ENOTTY;
    180      1.1  rmind 	}
    181      1.1  rmind 	return 0;
    182      1.1  rmind }
    183      1.1  rmind 
/*
 * npfattach: attach entry point.  Intentionally does nothing; the
 * argument is ignored.
 */
void
npfattach(int nunits)
{
	(void)nunits;
}
    190      1.1  rmind 
    191      1.1  rmind static int
    192      1.1  rmind npf_dev_open(dev_t dev, int flag, int mode, lwp_t *l)
    193      1.1  rmind {
    194      1.1  rmind 
    195      1.1  rmind 	/* Available only for super-user. */
    196      1.1  rmind 	if (kauth_authorize_generic(l->l_cred, KAUTH_GENERIC_ISSUSER, NULL)) {
    197      1.1  rmind 		return EPERM;
    198      1.1  rmind 	}
    199      1.1  rmind 	return 0;
    200      1.1  rmind }
    201      1.1  rmind 
    202      1.1  rmind static int
    203      1.1  rmind npf_dev_close(dev_t dev, int flag, int mode, lwp_t *l)
    204      1.1  rmind {
    205      1.1  rmind 
    206      1.1  rmind 	return 0;
    207      1.1  rmind }
    208      1.1  rmind 
    209      1.1  rmind static int
    210      1.1  rmind npf_dev_ioctl(dev_t dev, u_long cmd, void *data, int flag, lwp_t *l)
    211      1.1  rmind {
    212      1.1  rmind 	int error;
    213      1.1  rmind 
    214      1.1  rmind 	/* Available only for super-user. */
    215      1.1  rmind 	if (kauth_authorize_generic(l->l_cred, KAUTH_GENERIC_ISSUSER, NULL)) {
    216      1.1  rmind 		return EPERM;
    217      1.1  rmind 	}
    218      1.1  rmind 
    219      1.1  rmind 	switch (cmd) {
    220      1.1  rmind 	case IOC_NPF_VERSION:
    221      1.1  rmind 		*(int *)data = NPF_VERSION;
    222      1.1  rmind 		error = 0;
    223      1.1  rmind 		break;
    224      1.1  rmind 	case IOC_NPF_SWITCH:
    225      1.1  rmind 		error = npfctl_switch(data);
    226      1.1  rmind 		break;
    227      1.1  rmind 	case IOC_NPF_RELOAD:
    228      1.1  rmind 		error = npfctl_reload(cmd, data);
    229      1.1  rmind 		break;
    230  1.7.2.1    riz 	case IOC_NPF_GETCONF:
    231  1.7.2.1    riz 		error = npfctl_getconf(cmd, data);
    232  1.7.2.1    riz 		break;
    233      1.1  rmind 	case IOC_NPF_TABLE:
    234      1.1  rmind 		error = npfctl_table(data);
    235      1.1  rmind 		break;
    236      1.2  rmind 	case IOC_NPF_STATS:
    237      1.2  rmind 		error = npfctl_stats(data);
    238      1.2  rmind 		break;
    239      1.2  rmind 	case IOC_NPF_SESSIONS_SAVE:
    240      1.2  rmind 		error = npfctl_sessions_save(cmd, data);
    241      1.2  rmind 		break;
    242      1.2  rmind 	case IOC_NPF_SESSIONS_LOAD:
    243      1.2  rmind 		error = npfctl_sessions_load(cmd, data);
    244      1.2  rmind 		break;
    245      1.4  rmind 	case IOC_NPF_UPDATE_RULE:
    246      1.4  rmind 		error = npfctl_update_rule(cmd, data);
    247      1.4  rmind 		break;
    248      1.1  rmind 	default:
    249      1.1  rmind 		error = ENOTTY;
    250      1.1  rmind 		break;
    251      1.1  rmind 	}
    252      1.1  rmind 	return error;
    253      1.1  rmind }
    254      1.1  rmind 
    255      1.1  rmind static int
    256      1.1  rmind npf_dev_poll(dev_t dev, int events, lwp_t *l)
    257      1.1  rmind {
    258      1.1  rmind 
    259      1.1  rmind 	return ENOTSUP;
    260      1.1  rmind }
    261      1.1  rmind 
/*
 * npf_dev_read: reading from /dev/npf is not supported; always returns
 * ENOTSUP and never touches the uio.
 */
static int
npf_dev_read(dev_t dev, struct uio *uio, int flag)
{
	const int error = ENOTSUP;

	return error;
}
    268      1.2  rmind 
    269      1.2  rmind /*
    270      1.2  rmind  * NPF core loading/reloading/unloading mechanism.
    271      1.2  rmind  */
    272      1.2  rmind 
    273      1.2  rmind static void
    274      1.2  rmind npf_core_destroy(npf_core_t *nc)
    275      1.2  rmind {
    276      1.2  rmind 
    277  1.7.2.1    riz 	prop_object_release(nc->n_dict);
    278      1.2  rmind 	npf_ruleset_destroy(nc->n_rules);
    279      1.2  rmind 	npf_ruleset_destroy(nc->n_nat_rules);
    280      1.3  rmind 	npf_tableset_destroy(nc->n_tables);
    281      1.2  rmind 	kmem_free(nc, sizeof(npf_core_t));
    282      1.2  rmind }
    283      1.2  rmind 
    284      1.2  rmind /*
    285      1.2  rmind  * npf_reload: atomically load new ruleset, tableset and NAT policies.
    286      1.2  rmind  * Then destroy old (unloaded) structures.
    287      1.2  rmind  */
    288      1.2  rmind void
    289  1.7.2.1    riz npf_reload(prop_dictionary_t dict, npf_ruleset_t *rset,
    290  1.7.2.1    riz     npf_tableset_t *tset, npf_ruleset_t *nset, bool flush)
    291      1.2  rmind {
    292      1.2  rmind 	npf_core_t *nc, *onc;
    293      1.2  rmind 
    294      1.2  rmind 	/* Setup a new core structure. */
    295  1.7.2.1    riz 	nc = kmem_zalloc(sizeof(npf_core_t), KM_SLEEP);
    296      1.2  rmind 	nc->n_rules = rset;
    297      1.2  rmind 	nc->n_tables = tset;
    298      1.2  rmind 	nc->n_nat_rules = nset;
    299  1.7.2.1    riz 	nc->n_dict = dict;
    300  1.7.2.1    riz 	nc->n_default_pass = flush;
    301      1.2  rmind 
    302      1.2  rmind 	/* Lock and load the core structure. */
    303      1.2  rmind 	rw_enter(&npf_lock, RW_WRITER);
    304      1.2  rmind 	onc = atomic_swap_ptr(&npf_core, nc);
    305      1.2  rmind 	if (onc) {
    306      1.2  rmind 		/* Reload only necessary NAT policies. */
    307      1.2  rmind 		npf_ruleset_natreload(nset, onc->n_nat_rules);
    308      1.2  rmind 	}
    309      1.2  rmind 	/* Unlock.  Everything goes "live" now. */
    310      1.2  rmind 	rw_exit(&npf_lock);
    311      1.2  rmind 
    312      1.2  rmind 	if (onc) {
    313      1.2  rmind 		/* Destroy unloaded structures. */
    314      1.2  rmind 		npf_core_destroy(onc);
    315      1.2  rmind 	}
    316      1.2  rmind }
    317      1.2  rmind 
    318      1.2  rmind void
    319      1.2  rmind npf_core_enter(void)
    320      1.2  rmind {
    321      1.2  rmind 	rw_enter(&npf_lock, RW_READER);
    322      1.2  rmind }
    323      1.2  rmind 
    324      1.2  rmind npf_ruleset_t *
    325      1.2  rmind npf_core_ruleset(void)
    326      1.2  rmind {
    327      1.2  rmind 	KASSERT(rw_lock_held(&npf_lock));
    328      1.2  rmind 	return npf_core->n_rules;
    329      1.2  rmind }
    330      1.2  rmind 
    331      1.2  rmind npf_ruleset_t *
    332      1.2  rmind npf_core_natset(void)
    333      1.2  rmind {
    334      1.2  rmind 	KASSERT(rw_lock_held(&npf_lock));
    335      1.2  rmind 	return npf_core->n_nat_rules;
    336      1.2  rmind }
    337      1.2  rmind 
    338      1.2  rmind npf_tableset_t *
    339      1.2  rmind npf_core_tableset(void)
    340      1.2  rmind {
    341      1.2  rmind 	KASSERT(rw_lock_held(&npf_lock));
    342      1.2  rmind 	return npf_core->n_tables;
    343      1.2  rmind }
    344      1.2  rmind 
    345      1.2  rmind void
    346      1.2  rmind npf_core_exit(void)
    347      1.2  rmind {
    348      1.2  rmind 	rw_exit(&npf_lock);
    349      1.2  rmind }
    350      1.2  rmind 
    351      1.2  rmind bool
    352      1.2  rmind npf_core_locked(void)
    353      1.2  rmind {
    354      1.2  rmind 	return rw_lock_held(&npf_lock);
    355      1.2  rmind }
    356      1.2  rmind 
    357  1.7.2.1    riz prop_dictionary_t
    358  1.7.2.1    riz npf_core_dict(void)
    359  1.7.2.1    riz {
    360  1.7.2.1    riz 	KASSERT(rw_lock_held(&npf_lock));
    361  1.7.2.1    riz 	return npf_core->n_dict;
    362  1.7.2.1    riz }
    363  1.7.2.1    riz 
    364  1.7.2.1    riz bool
    365  1.7.2.1    riz npf_default_pass(void)
    366  1.7.2.1    riz {
    367  1.7.2.1    riz 	KASSERT(rw_lock_held(&npf_lock));
    368  1.7.2.1    riz 	return npf_core->n_default_pass;
    369  1.7.2.1    riz }
    370  1.7.2.1    riz 
    371      1.2  rmind /*
    372      1.2  rmind  * NPF statistics interface.
    373      1.2  rmind  */
    374      1.2  rmind 
    375      1.2  rmind void
    376      1.2  rmind npf_stats_inc(npf_stats_t st)
    377      1.2  rmind {
    378      1.2  rmind 	uint64_t *stats = percpu_getref(npf_stats_percpu);
    379      1.2  rmind 	stats[st]++;
    380      1.2  rmind 	percpu_putref(npf_stats_percpu);
    381      1.2  rmind }
    382      1.2  rmind 
    383      1.2  rmind void
    384      1.2  rmind npf_stats_dec(npf_stats_t st)
    385      1.2  rmind {
    386      1.2  rmind 	uint64_t *stats = percpu_getref(npf_stats_percpu);
    387      1.2  rmind 	stats[st]--;
    388      1.2  rmind 	percpu_putref(npf_stats_percpu);
    389      1.2  rmind }
    390      1.2  rmind 
    391      1.2  rmind static void
    392      1.2  rmind npf_stats_collect(void *mem, void *arg, struct cpu_info *ci)
    393      1.2  rmind {
    394      1.2  rmind 	uint64_t *percpu_stats = mem, *full_stats = arg;
    395      1.2  rmind 	int i;
    396      1.2  rmind 
    397      1.2  rmind 	for (i = 0; i < NPF_STATS_COUNT; i++) {
    398      1.2  rmind 		full_stats[i] += percpu_stats[i];
    399      1.2  rmind 	}
    400      1.2  rmind }
    401      1.2  rmind 
    402      1.2  rmind /*
    403      1.2  rmind  * npfctl_stats: export collected statistics.
    404      1.2  rmind  */
    405      1.2  rmind static int
    406      1.2  rmind npfctl_stats(void *data)
    407      1.2  rmind {
    408      1.2  rmind 	uint64_t *fullst, *uptr = *(uint64_t **)data;
    409      1.2  rmind 	int error;
    410      1.2  rmind 
    411      1.2  rmind 	fullst = kmem_zalloc(NPF_STATS_SIZE, KM_SLEEP);
    412      1.2  rmind 	percpu_foreach(npf_stats_percpu, npf_stats_collect, fullst);
    413      1.2  rmind 	error = copyout(fullst, uptr, NPF_STATS_SIZE);
    414      1.2  rmind 	kmem_free(fullst, NPF_STATS_SIZE);
    415      1.2  rmind 	return error;
    416      1.2  rmind }
    417