1 1.16 riastrad /* $NetBSD: uipc_accf.c,v 1.16 2024/12/06 18:44:00 riastradh Exp $ */ 2 1.5 ad 3 1.5 ad /*- 4 1.5 ad * Copyright (c) 2008 The NetBSD Foundation, Inc. 5 1.5 ad * All rights reserved. 6 1.5 ad * 7 1.5 ad * This code is derived from software developed for The NetBSD Foundation 8 1.5 ad * by Andrew Doran. 9 1.5 ad * 10 1.5 ad * Redistribution and use in source and binary forms, with or without 11 1.5 ad * modification, are permitted provided that the following conditions 12 1.5 ad * are met: 13 1.5 ad * 1. Redistributions of source code must retain the above copyright 14 1.5 ad * notice, this list of conditions and the following disclaimer. 15 1.5 ad * 2. Redistributions in binary form must reproduce the above copyright 16 1.5 ad * notice, this list of conditions and the following disclaimer in the 17 1.5 ad * documentation and/or other materials provided with the distribution. 18 1.5 ad * 19 1.5 ad * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS 20 1.5 ad * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED 21 1.5 ad * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR 22 1.5 ad * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS 23 1.5 ad * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR 24 1.5 ad * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF 25 1.5 ad * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS 26 1.5 ad * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN 27 1.5 ad * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) 28 1.5 ad * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE 29 1.5 ad * POSSIBILITY OF SUCH DAMAGE. 30 1.5 ad */ 31 1.3 pooka 32 1.1 tls /*- 33 1.1 tls * Copyright (c) 2000 Paycounter, Inc. 34 1.1 tls * Copyright (c) 2005 Robert N. M. Watson 35 1.1 tls * Author: Alfred Perlstein <alfred (at) paycounter.com>, <alfred (at) FreeBSD.org> 36 1.1 tls * All rights reserved. 37 1.1 tls * 38 1.1 tls * Redistribution and use in source and binary forms, with or without 39 1.1 tls * modification, are permitted provided that the following conditions 40 1.1 tls * are met: 41 1.1 tls * 1. Redistributions of source code must retain the above copyright 42 1.1 tls * notice, this list of conditions and the following disclaimer. 43 1.1 tls * 2. Redistributions in binary form must reproduce the above copyright 44 1.1 tls * notice, this list of conditions and the following disclaimer in the 45 1.1 tls * documentation and/or other materials provided with the distribution. 46 1.1 tls * 47 1.1 tls * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 48 1.1 tls * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 49 1.1 tls * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 50 1.1 tls * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 51 1.1 tls * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 52 1.1 tls * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 53 1.1 tls * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 54 1.1 tls * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 55 1.1 tls * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 56 1.1 tls * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 57 1.1 tls * SUCH DAMAGE. 58 1.1 tls */ 59 1.1 tls 60 1.1 tls #include <sys/cdefs.h> 61 1.16 riastrad __KERNEL_RCSID(0, "$NetBSD: uipc_accf.c,v 1.16 2024/12/06 18:44:00 riastradh Exp $"); 62 1.1 tls 63 1.1 tls #define ACCEPT_FILTER_MOD 64 1.1 tls 65 1.1 tls #include <sys/param.h> 66 1.14 riastrad #include <sys/types.h> 67 1.14 riastrad 68 1.14 riastrad #include <sys/atomic.h> 69 1.1 tls #include <sys/domain.h> 70 1.1 tls #include <sys/kernel.h> 71 1.14 riastrad #include <sys/kmem.h> 72 1.1 tls #include <sys/lock.h> 73 1.1 tls #include <sys/mbuf.h> 74 1.14 riastrad #include <sys/module.h> 75 1.14 riastrad #include <sys/once.h> 76 1.14 riastrad #include <sys/protosw.h> 77 1.14 riastrad #include <sys/queue.h> 78 1.5 ad #include <sys/rwlock.h> 79 1.16 riastrad #include <sys/sdt.h> 80 1.1 tls #include <sys/socket.h> 81 1.1 tls #include <sys/socketvar.h> 82 1.14 riastrad #include <sys/sysctl.h> 83 1.14 riastrad #include <sys/systm.h> 84 1.1 tls 85 1.5 ad static krwlock_t accept_filter_lock; 86 1.1 tls 87 1.5 ad static LIST_HEAD(, accept_filter) accept_filtlsthd = 88 1.5 ad LIST_HEAD_INITIALIZER(&accept_filtlsthd); 89 1.1 tls 90 1.1 tls /* 91 1.1 tls * Names of Accept filter sysctl objects 92 1.1 tls */ 93 1.10 pooka static struct sysctllog *ctllog; 94 1.9 pooka static void 95 1.10 pooka sysctl_net_inet_accf_setup(void) 96 1.1 tls { 97 1.5 ad 98 1.10 pooka sysctl_createv(&ctllog, 0, NULL, NULL, 99 1.1 tls CTLFLAG_PERMANENT, 100 1.1 tls CTLTYPE_NODE, "inet", NULL, 101 1.1 tls NULL, 0, NULL, 0, 102 1.1 tls CTL_NET, PF_INET, CTL_EOL); 103 1.10 pooka sysctl_createv(&ctllog, 0, NULL, NULL, 104 1.1 tls CTLFLAG_PERMANENT, 105 1.1 tls CTLTYPE_NODE, "accf", 106 1.1 tls SYSCTL_DESCR("Accept filters"), 107 1.1 tls NULL, 0, NULL, 0, 108 1.1 tls CTL_NET, PF_INET, SO_ACCEPTFILTER, CTL_EOL); 109 1.1 tls } 110 1.1 tls 111 1.1 tls int 112 1.1 tls accept_filt_add(struct accept_filter *filt) 113 1.1 tls { 114 1.1 tls struct accept_filter *p; 115 1.1 tls 116 1.7 ad accept_filter_init(); 117 1.7 ad 118 1.5 ad rw_enter(&accept_filter_lock, RW_WRITER); 119 1.5 ad LIST_FOREACH(p, &accept_filtlsthd, accf_next) { 120 1.1 tls if (strcmp(p->accf_name, filt->accf_name) == 0) { 121 1.5 ad rw_exit(&accept_filter_lock); 122 1.16 riastrad return SET_ERROR(EEXIST); 123 1.1 tls } 124 1.15 riastrad } 125 1.5 ad LIST_INSERT_HEAD(&accept_filtlsthd, filt, accf_next); 126 1.5 ad rw_exit(&accept_filter_lock); 127 1.5 ad 128 1.5 ad return 0; 129 1.1 tls } 130 1.1 tls 131 1.1 tls int 132 1.5 ad accept_filt_del(struct accept_filter *p) 133 1.1 tls { 134 1.1 tls 135 1.5 ad rw_enter(&accept_filter_lock, RW_WRITER); 136 1.5 ad if (p->accf_refcnt != 0) { 137 1.5 ad rw_exit(&accept_filter_lock); 138 1.16 riastrad return SET_ERROR(EBUSY); 139 1.5 ad } 140 1.5 ad LIST_REMOVE(p, accf_next); 141 1.5 ad rw_exit(&accept_filter_lock); 142 1.1 tls 143 1.5 ad return 0; 144 1.1 tls } 145 1.1 tls 146 1.1 tls struct accept_filter * 147 1.1 tls accept_filt_get(char *name) 148 1.1 tls { 149 1.1 tls struct accept_filter *p; 150 1.8 ad char buf[32]; 151 1.8 ad u_int gen; 152 1.1 tls 153 1.8 ad do { 154 1.8 ad rw_enter(&accept_filter_lock, RW_READER); 155 1.8 ad LIST_FOREACH(p, &accept_filtlsthd, accf_next) { 156 1.8 ad if (strcmp(p->accf_name, name) == 0) { 157 1.8 ad atomic_inc_uint(&p->accf_refcnt); 158 1.8 ad break; 159 1.8 ad } 160 1.8 ad } 161 1.8 ad rw_exit(&accept_filter_lock); 162 1.8 ad if (p != NULL) { 163 1.1 tls break; 164 1.5 ad } 165 1.8 ad /* Try to autoload a module to satisfy the request. */ 166 1.8 ad strcpy(buf, "accf_"); 167 1.8 ad strlcat(buf, name, sizeof(buf)); 168 1.8 ad gen = module_gen; 169 1.8 ad (void)module_autoload(buf, MODULE_CLASS_ANY); 170 1.8 ad } while (gen != module_gen); 171 1.1 tls 172 1.5 ad return p; 173 1.1 tls } 174 1.1 tls 175 1.1 tls /* 176 1.1 tls * Accept filter initialization routine. 177 1.1 tls * This should be called only once. 178 1.1 tls */ 179 1.1 tls 180 1.1 tls static int 181 1.1 tls accept_filter_init0(void) 182 1.1 tls { 183 1.5 ad 184 1.5 ad rw_init(&accept_filter_lock); 185 1.10 pooka sysctl_net_inet_accf_setup(); 186 1.1 tls 187 1.1 tls return 0; 188 1.1 tls } 189 1.1 tls 190 1.1 tls /* 191 1.15 riastrad * Initialization routine: This can also be replaced with 192 1.1 tls * accept_filt_generic_mod_event for attaching new accept filter. 193 1.1 tls */ 194 1.1 tls 195 1.1 tls void 196 1.1 tls accept_filter_init(void) 197 1.1 tls { 198 1.1 tls static ONCE_DECL(accept_filter_init_once); 199 1.1 tls 200 1.1 tls RUN_ONCE(&accept_filter_init_once, accept_filter_init0); 201 1.1 tls } 202 1.1 tls 203 1.1 tls int 204 1.5 ad accept_filt_getopt(struct socket *so, struct sockopt *sopt) 205 1.1 tls { 206 1.2 plunky struct accept_filter_arg afa; 207 1.1 tls int error; 208 1.1 tls 209 1.5 ad KASSERT(solocked(so)); 210 1.5 ad 211 1.1 tls if ((so->so_options & SO_ACCEPTCONN) == 0) { 212 1.16 riastrad error = SET_ERROR(EINVAL); 213 1.1 tls goto out; 214 1.1 tls } 215 1.1 tls if ((so->so_options & SO_ACCEPTFILTER) == 0) { 216 1.16 riastrad error = SET_ERROR(EINVAL); 217 1.1 tls goto out; 218 1.1 tls } 219 1.2 plunky 220 1.2 plunky memset(&afa, 0, sizeof(afa)); 221 1.2 plunky strcpy(afa.af_name, so->so_accf->so_accept_filter->accf_name); 222 1.1 tls if (so->so_accf->so_accept_filter_str != NULL) 223 1.2 plunky strcpy(afa.af_arg, so->so_accf->so_accept_filter_str); 224 1.2 plunky error = sockopt_set(sopt, &afa, sizeof(afa)); 225 1.1 tls out: 226 1.5 ad return error; 227 1.5 ad } 228 1.5 ad 229 1.5 ad /* 230 1.5 ad * Simple delete case, with socket locked. 231 1.5 ad */ 232 1.5 ad int 233 1.5 ad accept_filt_clear(struct socket *so) 234 1.5 ad { 235 1.5 ad struct accept_filter_arg afa; 236 1.5 ad struct accept_filter *afp; 237 1.6 ad struct socket *so2, *next; 238 1.5 ad struct so_accf *af; 239 1.5 ad 240 1.5 ad KASSERT(solocked(so)); 241 1.5 ad 242 1.5 ad if ((so->so_options & SO_ACCEPTCONN) == 0) { 243 1.16 riastrad return SET_ERROR(EINVAL); 244 1.5 ad } 245 1.5 ad if (so->so_accf != NULL) { 246 1.5 ad /* Break in-flight processing. */ 247 1.6 ad for (so2 = TAILQ_FIRST(&so->so_q0); so2 != NULL; so2 = next) { 248 1.6 ad next = TAILQ_NEXT(so2, so_qe); 249 1.5 ad if (so2->so_upcall == NULL) { 250 1.5 ad continue; 251 1.5 ad } 252 1.5 ad so2->so_upcall = NULL; 253 1.5 ad so2->so_upcallarg = NULL; 254 1.6 ad so2->so_options &= ~SO_ACCEPTFILTER; 255 1.5 ad so2->so_rcv.sb_flags &= ~SB_UPCALL; 256 1.6 ad soisconnected(so2); 257 1.5 ad } 258 1.5 ad af = so->so_accf; 259 1.5 ad afp = af->so_accept_filter; 260 1.5 ad if (afp != NULL && afp->accf_destroy != NULL) { 261 1.5 ad (*afp->accf_destroy)(so); 262 1.5 ad } 263 1.5 ad if (af->so_accept_filter_str != NULL) { 264 1.5 ad kmem_free(af->so_accept_filter_str, 265 1.5 ad sizeof(afa.af_name)); 266 1.5 ad } 267 1.5 ad kmem_free(af, sizeof(*af)); 268 1.5 ad so->so_accf = NULL; 269 1.5 ad atomic_dec_uint(&afp->accf_refcnt); 270 1.5 ad } 271 1.5 ad so->so_options &= ~SO_ACCEPTFILTER; 272 1.5 ad return 0; 273 1.1 tls } 274 1.1 tls 275 1.5 ad /* 276 1.5 ad * setsockopt() for accept filters. Called with the socket unlocked, 277 1.5 ad * will always return it locked. 278 1.5 ad */ 279 1.1 tls int 280 1.5 ad accept_filt_setopt(struct socket *so, const struct sockopt *sopt) 281 1.1 tls { 282 1.2 plunky struct accept_filter_arg afa; 283 1.1 tls struct accept_filter *afp; 284 1.1 tls struct so_accf *newaf; 285 1.2 plunky int error; 286 1.1 tls 287 1.11 christos accept_filter_init(); 288 1.11 christos 289 1.2 plunky if (sopt == NULL || sopt->sopt_size == 0) { 290 1.5 ad solock(so); 291 1.5 ad return accept_filt_clear(so); 292 1.1 tls } 293 1.1 tls 294 1.1 tls /* 295 1.1 tls * Pre-allocate any memory we may need later to avoid blocking at 296 1.1 tls * untimely moments. This does not optimize for invalid arguments. 297 1.1 tls */ 298 1.2 plunky error = sockopt_get(sopt, &afa, sizeof(afa)); 299 1.2 plunky if (error) { 300 1.5 ad solock(so); 301 1.5 ad return error; 302 1.1 tls } 303 1.2 plunky afa.af_name[sizeof(afa.af_name)-1] = '\0'; 304 1.2 plunky afa.af_arg[sizeof(afa.af_arg)-1] = '\0'; 305 1.2 plunky afp = accept_filt_get(afa.af_name); 306 1.1 tls if (afp == NULL) { 307 1.5 ad solock(so); 308 1.16 riastrad return SET_ERROR(ENOENT); 309 1.1 tls } 310 1.1 tls /* 311 1.1 tls * Allocate the new accept filter instance storage. We may 312 1.1 tls * have to free it again later if we fail to attach it. If 313 1.1 tls * attached properly, 'newaf' is NULLed to avoid a free() 314 1.1 tls * while in use. 315 1.1 tls */ 316 1.5 ad newaf = kmem_zalloc(sizeof(*newaf), KM_SLEEP); 317 1.2 plunky if (afp->accf_create != NULL && afa.af_name[0] != '\0') { 318 1.4 tls /* 319 1.4 tls * FreeBSD did a variable-size allocation here 320 1.4 tls * with the actual string length from afa.af_name 321 1.4 tls * but it is so short, why bother tracking it? 322 1.4 tls * XXX as others have noted, this is an API mistake; 323 1.4 tls * XXX accept_filter_arg should have a mandatory namelen. 324 1.4 tls * XXX (but it's a bit too late to fix that now) 325 1.4 tls */ 326 1.4 tls newaf->so_accept_filter_str = 327 1.5 ad kmem_alloc(sizeof(afa.af_name), KM_SLEEP); 328 1.2 plunky strcpy(newaf->so_accept_filter_str, afa.af_name); 329 1.1 tls } 330 1.1 tls 331 1.1 tls /* 332 1.1 tls * Require a listen socket; don't try to replace an existing filter 333 1.1 tls * without first removing it. 334 1.1 tls */ 335 1.5 ad solock(so); 336 1.5 ad if ((so->so_options & SO_ACCEPTCONN) == 0 || so->so_accf != NULL) { 337 1.16 riastrad error = SET_ERROR(EINVAL); 338 1.1 tls goto out; 339 1.1 tls } 340 1.1 tls 341 1.1 tls /* 342 1.1 tls * Invoke the accf_create() method of the filter if required. The 343 1.5 ad * socket lock is held over this call, so create methods for filters 344 1.5 ad * shouldn't block. 345 1.1 tls */ 346 1.1 tls if (afp->accf_create != NULL) { 347 1.1 tls newaf->so_accept_filter_arg = 348 1.5 ad (*afp->accf_create)(so, afa.af_arg); 349 1.1 tls if (newaf->so_accept_filter_arg == NULL) { 350 1.16 riastrad error = SET_ERROR(EINVAL); 351 1.1 tls goto out; 352 1.1 tls } 353 1.1 tls } 354 1.1 tls newaf->so_accept_filter = afp; 355 1.1 tls so->so_accf = newaf; 356 1.1 tls so->so_options |= SO_ACCEPTFILTER; 357 1.1 tls newaf = NULL; 358 1.1 tls out: 359 1.1 tls if (newaf != NULL) { 360 1.1 tls if (newaf->so_accept_filter_str != NULL) 361 1.4 tls kmem_free(newaf->so_accept_filter_str, 362 1.5 ad sizeof(afa.af_name)); 363 1.4 tls kmem_free(newaf, sizeof(*newaf)); 364 1.5 ad atomic_dec_uint(&afp->accf_refcnt); 365 1.1 tls } 366 1.5 ad return error; 367 1.1 tls } 368