Home | History | Annotate | Line # | Download | only in kern
uipc_accf.c revision 1.10
      1  1.10   pooka /*	$NetBSD: uipc_accf.c,v 1.10 2009/09/17 08:09:49 pooka Exp $	*/
      2   1.5      ad 
      3   1.5      ad /*-
      4   1.5      ad  * Copyright (c) 2008 The NetBSD Foundation, Inc.
      5   1.5      ad  * All rights reserved.
      6   1.5      ad  *
      7   1.5      ad  * This code is derived from software developed for The NetBSD Foundation
      8   1.5      ad  * by Andrew Doran.
      9   1.5      ad  *
     10   1.5      ad  * Redistribution and use in source and binary forms, with or without
     11   1.5      ad  * modification, are permitted provided that the following conditions
     12   1.5      ad  * are met:
     13   1.5      ad  * 1. Redistributions of source code must retain the above copyright
     14   1.5      ad  *    notice, this list of conditions and the following disclaimer.
     15   1.5      ad  * 2. Redistributions in binary form must reproduce the above copyright
     16   1.5      ad  *    notice, this list of conditions and the following disclaimer in the
     17   1.5      ad  *    documentation and/or other materials provided with the distribution.
     18   1.5      ad  *
     19   1.5      ad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20   1.5      ad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21   1.5      ad  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22   1.5      ad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23   1.5      ad  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24   1.5      ad  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25   1.5      ad  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26   1.5      ad  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27   1.5      ad  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28   1.5      ad  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29   1.5      ad  * POSSIBILITY OF SUCH DAMAGE.
     30   1.5      ad  */
     31   1.3   pooka 
     32   1.1     tls /*-
     33   1.1     tls  * Copyright (c) 2000 Paycounter, Inc.
     34   1.1     tls  * Copyright (c) 2005 Robert N. M. Watson
     35   1.1     tls  * Author: Alfred Perlstein <alfred (at) paycounter.com>, <alfred (at) FreeBSD.org>
     36   1.1     tls  * All rights reserved.
     37   1.1     tls  *
     38   1.1     tls  * Redistribution and use in source and binary forms, with or without
     39   1.1     tls  * modification, are permitted provided that the following conditions
     40   1.1     tls  * are met:
     41   1.1     tls  * 1. Redistributions of source code must retain the above copyright
     42   1.1     tls  *    notice, this list of conditions and the following disclaimer.
     43   1.1     tls  * 2. Redistributions in binary form must reproduce the above copyright
     44   1.1     tls  *    notice, this list of conditions and the following disclaimer in the
     45   1.1     tls  *    documentation and/or other materials provided with the distribution.
     46   1.1     tls  *
     47   1.1     tls  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
     48   1.1     tls  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     49   1.1     tls  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     50   1.1     tls  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     51   1.1     tls  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     52   1.1     tls  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     53   1.1     tls  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     54   1.1     tls  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     55   1.1     tls  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     56   1.1     tls  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     57   1.1     tls  * SUCH DAMAGE.
     58   1.1     tls  */
     59   1.1     tls 
     60   1.1     tls #include <sys/cdefs.h>
     61  1.10   pooka __KERNEL_RCSID(0, "$NetBSD: uipc_accf.c,v 1.10 2009/09/17 08:09:49 pooka Exp $");
     62   1.1     tls 
     63   1.1     tls #define ACCEPT_FILTER_MOD
     64   1.1     tls 
     65   1.1     tls #include <sys/param.h>
     66   1.1     tls #include <sys/systm.h>
     67   1.1     tls #include <sys/domain.h>
     68   1.1     tls #include <sys/kernel.h>
     69   1.1     tls #include <sys/lock.h>
     70   1.4     tls #include <sys/kmem.h>
     71   1.1     tls #include <sys/mbuf.h>
     72   1.5      ad #include <sys/rwlock.h>
     73   1.1     tls #include <sys/protosw.h>
     74   1.1     tls #include <sys/sysctl.h>
     75   1.1     tls #include <sys/socket.h>
     76   1.1     tls #include <sys/socketvar.h>
     77   1.1     tls #include <sys/queue.h>
     78   1.1     tls #include <sys/once.h>
     79   1.5      ad #include <sys/atomic.h>
     80   1.8      ad #include <sys/module.h>
     81   1.1     tls 
     82   1.5      ad static krwlock_t accept_filter_lock;
     83   1.1     tls 
     84   1.5      ad static LIST_HEAD(, accept_filter) accept_filtlsthd =
     85   1.5      ad     LIST_HEAD_INITIALIZER(&accept_filtlsthd);
     86   1.1     tls 
     87   1.1     tls /*
     88   1.1     tls  * Names of Accept filter sysctl objects
     89   1.1     tls  */
     90  1.10   pooka static struct sysctllog *ctllog;
     91   1.9   pooka static void
     92  1.10   pooka sysctl_net_inet_accf_setup(void)
     93   1.1     tls {
     94   1.5      ad 
     95  1.10   pooka 	sysctl_createv(&ctllog, 0, NULL, NULL,
     96   1.1     tls 		       CTLFLAG_PERMANENT,
     97   1.1     tls 		       CTLTYPE_NODE, "net", NULL,
     98   1.1     tls 		       NULL, 0, NULL, 0,
     99   1.1     tls 		       CTL_NET, CTL_EOL);
    100  1.10   pooka 	sysctl_createv(&ctllog, 0, NULL, NULL,
    101   1.1     tls 		       CTLFLAG_PERMANENT,
    102   1.1     tls 		       CTLTYPE_NODE, "inet", NULL,
    103   1.1     tls 		       NULL, 0, NULL, 0,
    104   1.1     tls 		       CTL_NET, PF_INET, CTL_EOL);
    105  1.10   pooka 	sysctl_createv(&ctllog, 0, NULL, NULL,
    106   1.1     tls 		       CTLFLAG_PERMANENT,
    107   1.1     tls 		       CTLTYPE_NODE, "accf",
    108   1.1     tls 		       SYSCTL_DESCR("Accept filters"),
    109   1.1     tls 		       NULL, 0, NULL, 0,
    110   1.1     tls 		       CTL_NET, PF_INET, SO_ACCEPTFILTER, CTL_EOL);
    111   1.1     tls }
    112   1.1     tls 
    113   1.1     tls int
    114   1.1     tls accept_filt_add(struct accept_filter *filt)
    115   1.1     tls {
    116   1.1     tls 	struct accept_filter *p;
    117   1.1     tls 
    118   1.7      ad 	accept_filter_init();
    119   1.7      ad 
    120   1.5      ad 	rw_enter(&accept_filter_lock, RW_WRITER);
    121   1.5      ad 	LIST_FOREACH(p, &accept_filtlsthd, accf_next) {
    122   1.1     tls 		if (strcmp(p->accf_name, filt->accf_name) == 0)  {
    123   1.5      ad 			rw_exit(&accept_filter_lock);
    124   1.5      ad 			return EEXIST;
    125   1.1     tls 		}
    126   1.5      ad 	}
    127   1.5      ad 	LIST_INSERT_HEAD(&accept_filtlsthd, filt, accf_next);
    128   1.5      ad 	rw_exit(&accept_filter_lock);
    129   1.5      ad 
    130   1.5      ad 	return 0;
    131   1.1     tls }
    132   1.1     tls 
    133   1.1     tls int
    134   1.5      ad accept_filt_del(struct accept_filter *p)
    135   1.1     tls {
    136   1.1     tls 
    137   1.5      ad 	rw_enter(&accept_filter_lock, RW_WRITER);
    138   1.5      ad 	if (p->accf_refcnt != 0) {
    139   1.5      ad 		rw_exit(&accept_filter_lock);
    140   1.5      ad 		return EBUSY;
    141   1.5      ad 	}
    142   1.5      ad 	LIST_REMOVE(p, accf_next);
    143   1.5      ad 	rw_exit(&accept_filter_lock);
    144   1.1     tls 
    145   1.5      ad 	return 0;
    146   1.1     tls }
    147   1.1     tls 
    148   1.1     tls struct accept_filter *
    149   1.1     tls accept_filt_get(char *name)
    150   1.1     tls {
    151   1.1     tls 	struct accept_filter *p;
    152   1.8      ad 	char buf[32];
    153   1.8      ad 	u_int gen;
    154   1.1     tls 
    155   1.8      ad 	do {
    156   1.8      ad 		rw_enter(&accept_filter_lock, RW_READER);
    157   1.8      ad 		LIST_FOREACH(p, &accept_filtlsthd, accf_next) {
    158   1.8      ad 			if (strcmp(p->accf_name, name) == 0) {
    159   1.8      ad 				atomic_inc_uint(&p->accf_refcnt);
    160   1.8      ad 				break;
    161   1.8      ad 			}
    162   1.8      ad 		}
    163   1.8      ad 		rw_exit(&accept_filter_lock);
    164   1.8      ad 		if (p != NULL) {
    165   1.1     tls 			break;
    166   1.5      ad 		}
    167   1.8      ad 		/* Try to autoload a module to satisfy the request. */
    168   1.8      ad 		strcpy(buf, "accf_");
    169   1.8      ad 		strlcat(buf, name, sizeof(buf));
    170   1.8      ad 		mutex_enter(&module_lock);
    171   1.8      ad 		gen = module_gen;
    172   1.8      ad 		(void)module_autoload(buf, MODULE_CLASS_ANY);
    173   1.8      ad 		mutex_exit(&module_lock);
    174   1.8      ad 	} while (gen != module_gen);
    175   1.1     tls 
    176   1.5      ad 	return p;
    177   1.1     tls }
    178   1.1     tls 
    179   1.1     tls /*
    180   1.1     tls  * Accept filter initialization routine.
    181   1.1     tls  * This should be called only once.
    182   1.1     tls  */
    183   1.1     tls 
    184   1.1     tls static int
    185   1.1     tls accept_filter_init0(void)
    186   1.1     tls {
    187   1.5      ad 
    188   1.5      ad 	rw_init(&accept_filter_lock);
    189  1.10   pooka 	sysctl_net_inet_accf_setup();
    190   1.1     tls 
    191   1.1     tls 	return 0;
    192   1.1     tls }
    193   1.1     tls 
    194   1.1     tls /*
    195   1.1     tls  * Initialization routine: This can also be replaced with
    196   1.1     tls  * accept_filt_generic_mod_event for attaching new accept filter.
    197   1.1     tls  */
    198   1.1     tls 
    199   1.1     tls void
    200   1.1     tls accept_filter_init(void)
    201   1.1     tls {
    202   1.1     tls 	static ONCE_DECL(accept_filter_init_once);
    203   1.1     tls 
    204   1.1     tls 	RUN_ONCE(&accept_filter_init_once, accept_filter_init0);
    205   1.1     tls }
    206   1.1     tls 
    207   1.1     tls int
    208   1.5      ad accept_filt_getopt(struct socket *so, struct sockopt *sopt)
    209   1.1     tls {
    210   1.2  plunky 	struct accept_filter_arg afa;
    211   1.1     tls 	int error;
    212   1.1     tls 
    213   1.5      ad 	KASSERT(solocked(so));
    214   1.5      ad 
    215   1.1     tls 	if ((so->so_options & SO_ACCEPTCONN) == 0) {
    216   1.1     tls 		error = EINVAL;
    217   1.1     tls 		goto out;
    218   1.1     tls 	}
    219   1.1     tls 	if ((so->so_options & SO_ACCEPTFILTER) == 0) {
    220   1.1     tls 		error = EINVAL;
    221   1.1     tls 		goto out;
    222   1.1     tls 	}
    223   1.2  plunky 
    224   1.2  plunky 	memset(&afa, 0, sizeof(afa));
    225   1.2  plunky 	strcpy(afa.af_name, so->so_accf->so_accept_filter->accf_name);
    226   1.1     tls 	if (so->so_accf->so_accept_filter_str != NULL)
    227   1.2  plunky 		strcpy(afa.af_arg, so->so_accf->so_accept_filter_str);
    228   1.2  plunky 	error = sockopt_set(sopt, &afa, sizeof(afa));
    229   1.1     tls out:
    230   1.5      ad 	return error;
    231   1.5      ad }
    232   1.5      ad 
    233   1.5      ad /*
    234   1.5      ad  * Simple delete case, with socket locked.
    235   1.5      ad  */
    236   1.5      ad int
    237   1.5      ad accept_filt_clear(struct socket *so)
    238   1.5      ad {
    239   1.5      ad 	struct accept_filter_arg afa;
    240   1.5      ad 	struct accept_filter *afp;
    241   1.6      ad 	struct socket *so2, *next;
    242   1.5      ad 	struct so_accf *af;
    243   1.5      ad 
    244   1.5      ad 	KASSERT(solocked(so));
    245   1.5      ad 
    246   1.5      ad 	if ((so->so_options & SO_ACCEPTCONN) == 0) {
    247   1.5      ad 		return EINVAL;
    248   1.5      ad 	}
    249   1.5      ad 	if (so->so_accf != NULL) {
    250   1.5      ad 		/* Break in-flight processing. */
    251   1.6      ad 		for (so2 = TAILQ_FIRST(&so->so_q0); so2 != NULL; so2 = next) {
    252   1.6      ad 			next = TAILQ_NEXT(so2, so_qe);
    253   1.5      ad 			if (so2->so_upcall == NULL) {
    254   1.5      ad 				continue;
    255   1.5      ad 			}
    256   1.5      ad 			so2->so_upcall = NULL;
    257   1.5      ad 			so2->so_upcallarg = NULL;
    258   1.6      ad 			so2->so_options &= ~SO_ACCEPTFILTER;
    259   1.5      ad 			so2->so_rcv.sb_flags &= ~SB_UPCALL;
    260   1.6      ad 			soisconnected(so2);
    261   1.5      ad 		}
    262   1.5      ad 		af = so->so_accf;
    263   1.5      ad 		afp = af->so_accept_filter;
    264   1.5      ad 		if (afp != NULL && afp->accf_destroy != NULL) {
    265   1.5      ad 			(*afp->accf_destroy)(so);
    266   1.5      ad 		}
    267   1.5      ad 		if (af->so_accept_filter_str != NULL) {
    268   1.5      ad 			kmem_free(af->so_accept_filter_str,
    269   1.5      ad 			    sizeof(afa.af_name));
    270   1.5      ad 		}
    271   1.5      ad 		kmem_free(af, sizeof(*af));
    272   1.5      ad 		so->so_accf = NULL;
    273   1.5      ad 		atomic_dec_uint(&afp->accf_refcnt);
    274   1.5      ad 	}
    275   1.5      ad 	so->so_options &= ~SO_ACCEPTFILTER;
    276   1.5      ad 	return 0;
    277   1.1     tls }
    278   1.1     tls 
    279   1.5      ad /*
    280   1.5      ad  * setsockopt() for accept filters.  Called with the socket unlocked,
    281   1.5      ad  * will always return it locked.
    282   1.5      ad  */
    283   1.1     tls int
    284   1.5      ad accept_filt_setopt(struct socket *so, const struct sockopt *sopt)
    285   1.1     tls {
    286   1.2  plunky 	struct accept_filter_arg afa;
    287   1.1     tls 	struct accept_filter *afp;
    288   1.1     tls 	struct so_accf *newaf;
    289   1.2  plunky 	int error;
    290   1.1     tls 
    291   1.2  plunky 	if (sopt == NULL || sopt->sopt_size == 0) {
    292   1.5      ad 		solock(so);
    293   1.5      ad 		return accept_filt_clear(so);
    294   1.1     tls 	}
    295   1.1     tls 
    296   1.1     tls 	/*
    297   1.1     tls 	 * Pre-allocate any memory we may need later to avoid blocking at
    298   1.1     tls 	 * untimely moments.  This does not optimize for invalid arguments.
    299   1.1     tls 	 */
    300   1.2  plunky 	error = sockopt_get(sopt, &afa, sizeof(afa));
    301   1.2  plunky 	if (error) {
    302   1.5      ad 		solock(so);
    303   1.5      ad 		return error;
    304   1.1     tls 	}
    305   1.2  plunky 	afa.af_name[sizeof(afa.af_name)-1] = '\0';
    306   1.2  plunky 	afa.af_arg[sizeof(afa.af_arg)-1] = '\0';
    307   1.2  plunky 	afp = accept_filt_get(afa.af_name);
    308   1.1     tls 	if (afp == NULL) {
    309   1.5      ad 		solock(so);
    310   1.5      ad 		return ENOENT;
    311   1.1     tls 	}
    312   1.1     tls 	/*
    313   1.1     tls 	 * Allocate the new accept filter instance storage.  We may
    314   1.1     tls 	 * have to free it again later if we fail to attach it.  If
    315   1.1     tls 	 * attached properly, 'newaf' is NULLed to avoid a free()
    316   1.1     tls 	 * while in use.
    317   1.1     tls 	 */
    318   1.5      ad 	newaf = kmem_zalloc(sizeof(*newaf), KM_SLEEP);
    319   1.2  plunky 	if (afp->accf_create != NULL && afa.af_name[0] != '\0') {
    320   1.4     tls 		/*
    321   1.4     tls 		 * FreeBSD did a variable-size allocation here
    322   1.4     tls 		 * with the actual string length from afa.af_name
    323   1.4     tls 		 * but it is so short, why bother tracking it?
    324   1.4     tls 		 * XXX as others have noted, this is an API mistake;
    325   1.4     tls 		 * XXX accept_filter_arg should have a mandatory namelen.
    326   1.4     tls 		 * XXX (but it's a bit too late to fix that now)
    327   1.4     tls 		 */
    328   1.4     tls 		newaf->so_accept_filter_str =
    329   1.5      ad 		    kmem_alloc(sizeof(afa.af_name), KM_SLEEP);
    330   1.2  plunky 		strcpy(newaf->so_accept_filter_str, afa.af_name);
    331   1.1     tls 	}
    332   1.1     tls 
    333   1.1     tls 	/*
    334   1.1     tls 	 * Require a listen socket; don't try to replace an existing filter
    335   1.1     tls 	 * without first removing it.
    336   1.1     tls 	 */
    337   1.5      ad 	solock(so);
    338   1.5      ad 	if ((so->so_options & SO_ACCEPTCONN) == 0 || so->so_accf != NULL) {
    339   1.1     tls 		error = EINVAL;
    340   1.1     tls 		goto out;
    341   1.1     tls 	}
    342   1.1     tls 
    343   1.1     tls 	/*
    344   1.1     tls 	 * Invoke the accf_create() method of the filter if required.  The
    345   1.5      ad 	 * socket lock is held over this call, so create methods for filters
    346   1.5      ad 	 * shouldn't block.
    347   1.1     tls 	 */
    348   1.1     tls 	if (afp->accf_create != NULL) {
    349   1.1     tls 		newaf->so_accept_filter_arg =
    350   1.5      ad 		    (*afp->accf_create)(so, afa.af_arg);
    351   1.1     tls 		if (newaf->so_accept_filter_arg == NULL) {
    352   1.1     tls 			error = EINVAL;
    353   1.1     tls 			goto out;
    354   1.1     tls 		}
    355   1.1     tls 	}
    356   1.1     tls 	newaf->so_accept_filter = afp;
    357   1.1     tls 	so->so_accf = newaf;
    358   1.1     tls 	so->so_options |= SO_ACCEPTFILTER;
    359   1.1     tls 	newaf = NULL;
    360   1.1     tls out:
    361   1.1     tls 	if (newaf != NULL) {
    362   1.1     tls 		if (newaf->so_accept_filter_str != NULL)
    363   1.4     tls 			kmem_free(newaf->so_accept_filter_str,
    364   1.5      ad 			    sizeof(afa.af_name));
    365   1.4     tls 		kmem_free(newaf, sizeof(*newaf));
    366   1.5      ad 		atomic_dec_uint(&afp->accf_refcnt);
    367   1.1     tls 	}
    368   1.5      ad 	return error;
    369   1.1     tls }
    370