in_pcb.c revision 1.193 1 1.193 ozaki /* $NetBSD: in_pcb.c,v 1.193 2022/10/28 05:25:36 ozaki-r Exp $ */
2 1.59 itojun
3 1.59 itojun /*
4 1.59 itojun * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
5 1.59 itojun * All rights reserved.
6 1.78 itojun *
7 1.59 itojun * Redistribution and use in source and binary forms, with or without
8 1.59 itojun * modification, are permitted provided that the following conditions
9 1.59 itojun * are met:
10 1.59 itojun * 1. Redistributions of source code must retain the above copyright
11 1.59 itojun * notice, this list of conditions and the following disclaimer.
12 1.59 itojun * 2. Redistributions in binary form must reproduce the above copyright
13 1.59 itojun * notice, this list of conditions and the following disclaimer in the
14 1.59 itojun * documentation and/or other materials provided with the distribution.
15 1.59 itojun * 3. Neither the name of the project nor the names of its contributors
16 1.59 itojun * may be used to endorse or promote products derived from this software
17 1.59 itojun * without specific prior written permission.
18 1.78 itojun *
19 1.59 itojun * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
20 1.59 itojun * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21 1.59 itojun * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22 1.59 itojun * ARE DISCLAIMED. IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
23 1.59 itojun * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24 1.59 itojun * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25 1.59 itojun * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26 1.59 itojun * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27 1.59 itojun * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 1.59 itojun * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 1.59 itojun * SUCH DAMAGE.
30 1.59 itojun */
31 1.57 thorpej
32 1.57 thorpej /*-
33 1.138 dyoung * Copyright (c) 1998, 2011 The NetBSD Foundation, Inc.
34 1.57 thorpej * All rights reserved.
35 1.57 thorpej *
36 1.57 thorpej * This code is derived from software contributed to The NetBSD Foundation
37 1.138 dyoung * by Coyote Point Systems, Inc.
38 1.138 dyoung * This code is derived from software contributed to The NetBSD Foundation
39 1.57 thorpej * by Public Access Networks Corporation ("Panix"). It was developed under
40 1.57 thorpej * contract to Panix by Eric Haszlakiewicz and Thor Lancelot Simon.
41 1.57 thorpej *
42 1.57 thorpej * Redistribution and use in source and binary forms, with or without
43 1.57 thorpej * modification, are permitted provided that the following conditions
44 1.57 thorpej * are met:
45 1.57 thorpej * 1. Redistributions of source code must retain the above copyright
46 1.57 thorpej * notice, this list of conditions and the following disclaimer.
47 1.57 thorpej * 2. Redistributions in binary form must reproduce the above copyright
48 1.57 thorpej * notice, this list of conditions and the following disclaimer in the
49 1.57 thorpej * documentation and/or other materials provided with the distribution.
50 1.57 thorpej *
51 1.57 thorpej * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
52 1.57 thorpej * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
53 1.57 thorpej * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
54 1.57 thorpej * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
55 1.57 thorpej * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
56 1.57 thorpej * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
57 1.57 thorpej * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
58 1.57 thorpej * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
59 1.57 thorpej * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
60 1.57 thorpej * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
61 1.57 thorpej * POSSIBILITY OF SUCH DAMAGE.
62 1.57 thorpej */
63 1.11 cgd
64 1.1 cgd /*
65 1.44 thorpej * Copyright (c) 1982, 1986, 1991, 1993, 1995
66 1.10 mycroft * The Regents of the University of California. All rights reserved.
67 1.1 cgd *
68 1.1 cgd * Redistribution and use in source and binary forms, with or without
69 1.1 cgd * modification, are permitted provided that the following conditions
70 1.1 cgd * are met:
71 1.1 cgd * 1. Redistributions of source code must retain the above copyright
72 1.1 cgd * notice, this list of conditions and the following disclaimer.
73 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
74 1.1 cgd * notice, this list of conditions and the following disclaimer in the
75 1.1 cgd * documentation and/or other materials provided with the distribution.
76 1.86 agc * 3. Neither the name of the University nor the names of its contributors
77 1.1 cgd * may be used to endorse or promote products derived from this software
78 1.1 cgd * without specific prior written permission.
79 1.1 cgd *
80 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
81 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
82 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
83 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
84 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
85 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
86 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
87 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
88 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
89 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
90 1.1 cgd * SUCH DAMAGE.
91 1.1 cgd *
92 1.44 thorpej * @(#)in_pcb.c 8.4 (Berkeley) 5/24/95
93 1.1 cgd */
94 1.73 lukem
95 1.73 lukem #include <sys/cdefs.h>
96 1.193 ozaki __KERNEL_RCSID(0, "$NetBSD: in_pcb.c,v 1.193 2022/10/28 05:25:36 ozaki-r Exp $");
97 1.60 thorpej
98 1.162 pooka #ifdef _KERNEL_OPT
99 1.88 itojun #include "opt_inet.h"
100 1.60 thorpej #include "opt_ipsec.h"
101 1.162 pooka #endif
102 1.1 cgd
103 1.7 mycroft #include <sys/param.h>
104 1.7 mycroft #include <sys/systm.h>
105 1.7 mycroft #include <sys/mbuf.h>
106 1.7 mycroft #include <sys/socket.h>
107 1.7 mycroft #include <sys/socketvar.h>
108 1.7 mycroft #include <sys/ioctl.h>
109 1.10 mycroft #include <sys/errno.h>
110 1.10 mycroft #include <sys/time.h>
111 1.128 pooka #include <sys/once.h>
112 1.52 thorpej #include <sys/pool.h>
113 1.10 mycroft #include <sys/proc.h>
114 1.102 elad #include <sys/kauth.h>
115 1.129 pooka #include <sys/uidinfo.h>
116 1.132 elad #include <sys/domain.h>
117 1.1 cgd
118 1.7 mycroft #include <net/if.h>
119 1.7 mycroft #include <net/route.h>
120 1.1 cgd
121 1.7 mycroft #include <netinet/in.h>
122 1.7 mycroft #include <netinet/in_systm.h>
123 1.7 mycroft #include <netinet/ip.h>
124 1.7 mycroft #include <netinet/in_pcb.h>
125 1.7 mycroft #include <netinet/in_var.h>
126 1.7 mycroft #include <netinet/ip_var.h>
127 1.143 christos #include <netinet/portalgo.h>
128 1.1 cgd
129 1.88 itojun #ifdef INET6
130 1.88 itojun #include <netinet/ip6.h>
131 1.88 itojun #include <netinet6/ip6_var.h>
132 1.88 itojun #include <netinet6/in6_pcb.h>
133 1.88 itojun #endif
134 1.88 itojun
135 1.145 christos #ifdef IPSEC
136 1.87 jonathan #include <netipsec/ipsec.h>
137 1.87 jonathan #include <netipsec/key.h>
138 1.59 itojun #endif /* IPSEC */
139 1.59 itojun
140 1.138 dyoung #include <netinet/tcp_vtw.h>
141 1.138 dyoung
/* All-zero IPv4 address; used below to clear a PCB's foreign address. */
struct in_addr zeroin_addr;

/*
 * Bucket selectors for the three PCB hash tables.  Each macro yields a
 * pointer to the list head chosen by masking a sum of the host-order
 * address(es) and port(s) with the table's hash mask.  Addresses and
 * ports are passed in network byte order.
 *
 * The whole expansion is parenthesized so that a result can safely be
 * followed by a postfix operator ([], ->) at the call site.
 */
#define	INPCBHASH_PORT(table, lport) \
	(&(table)->inpt_porthashtbl[ntohs(lport) & (table)->inpt_porthash])
#define	INPCBHASH_BIND(table, laddr, lport) \
	(&(table)->inpt_bindhashtbl[ \
	    ((ntohl((laddr).s_addr) + ntohs(lport))) & (table)->inpt_bindhash])
#define	INPCBHASH_CONNECT(table, faddr, fport, laddr, lport) \
	(&(table)->inpt_connecthashtbl[ \
	    ((ntohl((faddr).s_addr) + ntohs(fport)) + \
	     (ntohl((laddr).s_addr) + ntohs(lport))) & (table)->inpt_connecthash])
153 1.33 mycroft
154 1.43 lukem int anonportmin = IPPORT_ANONMIN;
155 1.43 lukem int anonportmax = IPPORT_ANONMAX;
156 1.67 tron int lowportmin = IPPORT_RESERVEDMIN;
157 1.67 tron int lowportmax = IPPORT_RESERVEDMAX;
158 1.43 lukem
159 1.193 ozaki static struct pool in4pcb_pool;
160 1.193 ozaki static struct pool in6pcb_pool;
161 1.128 pooka
162 1.128 pooka static int
163 1.128 pooka inpcb_poolinit(void)
164 1.128 pooka {
165 1.128 pooka
166 1.193 ozaki pool_init(&in4pcb_pool, sizeof(struct in4pcb), 0, 0, 0, "in4pcbpl", NULL,
167 1.193 ozaki IPL_NET);
168 1.193 ozaki pool_init(&in6pcb_pool, sizeof(struct in6pcb), 0, 0, 0, "in6pcbpl", NULL,
169 1.128 pooka IPL_NET);
170 1.128 pooka return 0;
171 1.128 pooka }
172 1.52 thorpej
173 1.18 mycroft void
174 1.98 perry in_pcbinit(struct inpcbtable *table, int bindhashsize, int connecthashsize)
175 1.18 mycroft {
176 1.128 pooka static ONCE_DECL(control);
177 1.18 mycroft
178 1.146 christos TAILQ_INIT(&table->inpt_queue);
179 1.125 ad table->inpt_porthashtbl = hashinit(bindhashsize, HASH_LIST, true,
180 1.125 ad &table->inpt_porthash);
181 1.125 ad table->inpt_bindhashtbl = hashinit(bindhashsize, HASH_LIST, true,
182 1.125 ad &table->inpt_bindhash);
183 1.125 ad table->inpt_connecthashtbl = hashinit(connecthashsize, HASH_LIST, true,
184 1.125 ad &table->inpt_connecthash);
185 1.47 lukem table->inpt_lastlow = IPPORT_RESERVEDMAX;
186 1.47 lukem table->inpt_lastport = (u_int16_t)anonportmax;
187 1.128 pooka
188 1.128 pooka RUN_ONCE(&control, inpcb_poolinit);
189 1.18 mycroft }
190 1.18 mycroft
191 1.10 mycroft int
192 1.98 perry in_pcballoc(struct socket *so, void *v)
193 1.1 cgd {
194 1.25 christos struct inpcbtable *table = v;
195 1.64 augustss struct inpcb *inp;
196 1.24 mycroft int s;
197 1.1 cgd
198 1.192 ozaki KASSERT(soaf(so) == AF_INET || soaf(so) == AF_INET6);
199 1.177 ozaki
200 1.193 ozaki if (soaf(so) == AF_INET)
201 1.193 ozaki inp = pool_get(&in4pcb_pool, PR_NOWAIT|PR_ZERO);
202 1.193 ozaki else
203 1.193 ozaki inp = pool_get(&in6pcb_pool, PR_NOWAIT|PR_ZERO);
204 1.10 mycroft if (inp == NULL)
205 1.1 cgd return (ENOBUFS);
206 1.192 ozaki inp->inp_af = soaf(so);
207 1.18 mycroft inp->inp_table = table;
208 1.1 cgd inp->inp_socket = so;
209 1.143 christos inp->inp_portalgo = PORTALGO_DEFAULT;
210 1.139 christos inp->inp_bindportonsend = false;
211 1.184 riastrad inp->inp_overudp_cb = NULL;
212 1.184 riastrad inp->inp_overudp_arg = NULL;
213 1.193 ozaki
214 1.193 ozaki if (inp->inp_af == AF_INET) {
215 1.193 ozaki in4p_errormtu(inp) = -1;
216 1.193 ozaki in4p_prefsrcip(inp).s_addr = INADDR_ANY;
217 1.193 ozaki }
218 1.192 ozaki #ifdef INET6
219 1.193 ozaki else {
220 1.193 ozaki in6p_hops6(inp) = -1; /* use kernel default */
221 1.193 ozaki if (ip6_v6only)
222 1.193 ozaki inp->inp_flags |= IN6P_IPV6_V6ONLY;
223 1.193 ozaki }
224 1.192 ozaki #endif
225 1.145 christos #if defined(IPSEC)
226 1.148 christos if (ipsec_enabled) {
227 1.148 christos int error = ipsec_init_pcbpolicy(so, &inp->inp_sp);
228 1.148 christos if (error != 0) {
229 1.193 ozaki if (inp->inp_af == AF_INET)
230 1.193 ozaki pool_put(&in4pcb_pool, inp);
231 1.193 ozaki else
232 1.193 ozaki pool_put(&in6pcb_pool, inp);
233 1.148 christos return error;
234 1.148 christos }
235 1.192 ozaki inp->inp_sp->sp_inp = inp;
236 1.70 itojun }
237 1.70 itojun #endif
238 1.33 mycroft so->so_pcb = inp;
239 1.175 ozaki s = splsoftnet();
240 1.192 ozaki TAILQ_INSERT_HEAD(&table->inpt_queue, inp, inp_queue);
241 1.192 ozaki LIST_INSERT_HEAD(INPCBHASH_PORT(table, inp->inp_lport), inp,
242 1.192 ozaki inp_lhash);
243 1.33 mycroft in_pcbstate(inp, INP_ATTACHED);
244 1.24 mycroft splx(s);
245 1.1 cgd return (0);
246 1.1 cgd }
247 1.8 mycroft
248 1.132 elad static int
249 1.134 elad in_pcbsetport(struct sockaddr_in *sin, struct inpcb *inp, kauth_cred_t cred)
250 1.1 cgd {
251 1.132 elad struct inpcbtable *table = inp->inp_table;
252 1.64 augustss struct socket *so = inp->inp_socket;
253 1.132 elad u_int16_t *lastport;
254 1.13 cgd u_int16_t lport = 0;
255 1.134 elad enum kauth_network_req req;
256 1.134 elad int error;
257 1.1 cgd
258 1.132 elad if (inp->inp_flags & INP_LOWPORT) {
259 1.132 elad #ifndef IPNOPRIVPORTS
260 1.134 elad req = KAUTH_REQ_NETWORK_BIND_PRIVPORT;
261 1.134 elad #else
262 1.134 elad req = KAUTH_REQ_NETWORK_BIND_PORT;
263 1.132 elad #endif
264 1.134 elad
265 1.132 elad lastport = &table->inpt_lastlow;
266 1.132 elad } else {
267 1.134 elad req = KAUTH_REQ_NETWORK_BIND_PORT;
268 1.134 elad
269 1.132 elad lastport = &table->inpt_lastport;
270 1.132 elad }
271 1.134 elad
272 1.134 elad /* XXX-kauth: KAUTH_REQ_NETWORK_BIND_AUTOASSIGN_{,PRIV}PORT */
273 1.134 elad error = kauth_authorize_network(cred, KAUTH_NETWORK_BIND, req, so, sin,
274 1.134 elad NULL);
275 1.134 elad if (error)
276 1.137 elad return (EACCES);
277 1.134 elad
278 1.139 christos /*
279 1.139 christos * Use RFC6056 randomized port selection
280 1.139 christos */
281 1.192 ozaki error = portalgo_randport(&lport, inp, cred);
282 1.139 christos if (error)
283 1.139 christos return error;
284 1.132 elad
285 1.132 elad inp->inp_flags |= INP_ANONPORT;
286 1.132 elad *lastport = lport;
287 1.132 elad lport = htons(lport);
288 1.132 elad inp->inp_lport = lport;
289 1.132 elad in_pcbstate(inp, INP_BOUND);
290 1.132 elad
291 1.132 elad return (0);
292 1.132 elad }
293 1.88 itojun
294 1.179 ryo int
295 1.185 christos in_pcbbindableaddr(const struct inpcb *inp, struct sockaddr_in *sin,
296 1.185 christos kauth_cred_t cred)
297 1.132 elad {
298 1.168 ozaki int error = EADDRNOTAVAIL;
299 1.168 ozaki struct ifaddr *ifa = NULL;
300 1.168 ozaki int s;
301 1.168 ozaki
302 1.28 mycroft if (sin->sin_family != AF_INET)
303 1.28 mycroft return (EAFNOSUPPORT);
304 1.132 elad
305 1.168 ozaki s = pserialize_read_enter();
306 1.136 elad if (IN_MULTICAST(sin->sin_addr.s_addr)) {
307 1.136 elad /* Always succeed; port reuse handled in in_pcbbind_port(). */
308 1.136 elad } else if (!in_nullhost(sin->sin_addr)) {
309 1.168 ozaki struct in_ifaddr *ia;
310 1.132 elad
311 1.166 ozaki ia = in_get_ia(sin->sin_addr);
312 1.132 elad /* check for broadcast addresses */
313 1.168 ozaki if (ia == NULL) {
314 1.168 ozaki ifa = ifa_ifwithaddr(sintosa(sin));
315 1.168 ozaki if (ifa != NULL)
316 1.168 ozaki ia = ifatoia(ifa);
317 1.185 christos else if ((inp->inp_flags & INP_BINDANY) != 0) {
318 1.185 christos error = 0;
319 1.185 christos goto error;
320 1.185 christos }
321 1.168 ozaki }
322 1.132 elad if (ia == NULL)
323 1.168 ozaki goto error;
324 1.170 roy if (ia->ia4_flags & IN_IFF_DUPLICATED)
325 1.168 ozaki goto error;
326 1.132 elad }
327 1.179 ryo error = 0;
328 1.179 ryo error:
329 1.168 ozaki pserialize_read_exit(s);
330 1.179 ryo return error;
331 1.179 ryo }
332 1.132 elad
333 1.179 ryo static int
334 1.179 ryo in_pcbbind_addr(struct inpcb *inp, struct sockaddr_in *sin, kauth_cred_t cred)
335 1.179 ryo {
336 1.179 ryo int error;
337 1.132 elad
338 1.185 christos error = in_pcbbindableaddr(inp, sin, cred);
339 1.179 ryo if (error == 0)
340 1.193 ozaki in4p_laddr(inp) = sin->sin_addr;
341 1.168 ozaki return error;
342 1.132 elad }
343 1.132 elad
344 1.132 elad static int
345 1.132 elad in_pcbbind_port(struct inpcb *inp, struct sockaddr_in *sin, kauth_cred_t cred)
346 1.132 elad {
347 1.132 elad struct inpcbtable *table = inp->inp_table;
348 1.132 elad struct socket *so = inp->inp_socket;
349 1.132 elad int reuseport = (so->so_options & SO_REUSEPORT);
350 1.133 elad int wild = 0, error;
351 1.132 elad
352 1.28 mycroft if (IN_MULTICAST(sin->sin_addr.s_addr)) {
353 1.10 mycroft /*
354 1.28 mycroft * Treat SO_REUSEADDR as SO_REUSEPORT for multicast;
355 1.28 mycroft * allow complete duplication of binding if
356 1.28 mycroft * SO_REUSEPORT is set, or if SO_REUSEADDR is set
357 1.28 mycroft * and a multicast address is bound on both
358 1.28 mycroft * new and duplicated sockets.
359 1.10 mycroft */
360 1.155 seanb if (so->so_options & (SO_REUSEADDR | SO_REUSEPORT))
361 1.28 mycroft reuseport = SO_REUSEADDR|SO_REUSEPORT;
362 1.132 elad }
363 1.132 elad
364 1.132 elad if (sin->sin_port == 0) {
365 1.134 elad error = in_pcbsetport(sin, inp, cred);
366 1.132 elad if (error)
367 1.132 elad return (error);
368 1.132 elad } else {
369 1.28 mycroft struct inpcb *t;
370 1.138 dyoung vestigial_inpcb_t vestige;
371 1.88 itojun #ifdef INET6
372 1.192 ozaki struct inpcb *t6;
373 1.88 itojun struct in6_addr mapped;
374 1.88 itojun #endif
375 1.133 elad enum kauth_network_req req;
376 1.132 elad
377 1.132 elad if ((so->so_options & (SO_REUSEADDR|SO_REUSEPORT)) == 0)
378 1.132 elad wild = 1;
379 1.132 elad
380 1.31 perry #ifndef IPNOPRIVPORTS
381 1.133 elad if (ntohs(sin->sin_port) < IPPORT_RESERVED)
382 1.133 elad req = KAUTH_REQ_NETWORK_BIND_PRIVPORT;
383 1.133 elad else
384 1.133 elad #endif /* !IPNOPRIVPORTS */
385 1.133 elad req = KAUTH_REQ_NETWORK_BIND_PORT;
386 1.133 elad
387 1.133 elad error = kauth_authorize_network(cred, KAUTH_NETWORK_BIND, req,
388 1.133 elad so, sin, NULL);
389 1.133 elad if (error)
390 1.137 elad return (EACCES);
391 1.133 elad
392 1.88 itojun #ifdef INET6
393 1.163 rtr in6_in_2_v4mapin6(&sin->sin_addr, &mapped);
394 1.138 dyoung t6 = in6_pcblookup_port(table, &mapped, sin->sin_port, wild, &vestige);
395 1.192 ozaki if (t6 && (reuseport & t6->inp_socket->so_options) == 0)
396 1.88 itojun return (EADDRINUSE);
397 1.138 dyoung if (!t6 && vestige.valid) {
398 1.138 dyoung if (!!reuseport != !!vestige.reuse_port) {
399 1.138 dyoung return EADDRINUSE;
400 1.138 dyoung }
401 1.138 dyoung }
402 1.88 itojun #endif
403 1.133 elad
404 1.133 elad /* XXX-kauth */
405 1.99 christos if (so->so_uidinfo->ui_uid && !IN_MULTICAST(sin->sin_addr.s_addr)) {
406 1.138 dyoung t = in_pcblookup_port(table, sin->sin_addr, sin->sin_port, 1, &vestige);
407 1.133 elad /*
408 1.133 elad * XXX: investigate ramifications of loosening this
409 1.133 elad * restriction so that as long as both ports have
410 1.133 elad * SO_REUSEPORT allow the bind
411 1.133 elad */
412 1.58 lukem if (t &&
413 1.58 lukem (!in_nullhost(sin->sin_addr) ||
414 1.193 ozaki !in_nullhost(in4p_laddr(t)) ||
415 1.58 lukem (t->inp_socket->so_options & SO_REUSEPORT) == 0)
416 1.99 christos && (so->so_uidinfo->ui_uid != t->inp_socket->so_uidinfo->ui_uid)) {
417 1.58 lukem return (EADDRINUSE);
418 1.58 lukem }
419 1.138 dyoung if (!t && vestige.valid) {
420 1.138 dyoung if ((!in_nullhost(sin->sin_addr)
421 1.138 dyoung || !in_nullhost(vestige.laddr.v4)
422 1.138 dyoung || !vestige.reuse_port)
423 1.138 dyoung && so->so_uidinfo->ui_uid != vestige.uid) {
424 1.138 dyoung return EADDRINUSE;
425 1.138 dyoung }
426 1.138 dyoung }
427 1.58 lukem }
428 1.138 dyoung t = in_pcblookup_port(table, sin->sin_addr, sin->sin_port, wild, &vestige);
429 1.28 mycroft if (t && (reuseport & t->inp_socket->so_options) == 0)
430 1.28 mycroft return (EADDRINUSE);
431 1.138 dyoung if (!t
432 1.138 dyoung && vestige.valid
433 1.138 dyoung && !(reuseport && vestige.reuse_port))
434 1.138 dyoung return EADDRINUSE;
435 1.132 elad
436 1.132 elad inp->inp_lport = sin->sin_port;
437 1.132 elad in_pcbstate(inp, INP_BOUND);
438 1.1 cgd }
439 1.45 lukem
440 1.192 ozaki LIST_REMOVE(inp, inp_lhash);
441 1.192 ozaki LIST_INSERT_HEAD(INPCBHASH_PORT(table, inp->inp_lport), inp,
442 1.192 ozaki inp_lhash);
443 1.132 elad
444 1.132 elad return (0);
445 1.132 elad }
446 1.132 elad
447 1.132 elad int
448 1.156 rtr in_pcbbind(void *v, struct sockaddr_in *sin, struct lwp *l)
449 1.132 elad {
450 1.132 elad struct inpcb *inp = v;
451 1.134 elad struct sockaddr_in lsin;
452 1.132 elad int error;
453 1.132 elad
454 1.132 elad if (inp->inp_af != AF_INET)
455 1.132 elad return (EINVAL);
456 1.132 elad
457 1.193 ozaki if (inp->inp_lport || !in_nullhost(in4p_laddr(inp)))
458 1.132 elad return (EINVAL);
459 1.132 elad
460 1.156 rtr if (NULL != sin) {
461 1.156 rtr if (sin->sin_len != sizeof(*sin))
462 1.132 elad return (EINVAL);
463 1.132 elad } else {
464 1.134 elad lsin = *((const struct sockaddr_in *)
465 1.134 elad inp->inp_socket->so_proto->pr_domain->dom_sa_any);
466 1.134 elad sin = &lsin;
467 1.132 elad }
468 1.132 elad
469 1.132 elad /* Bind address. */
470 1.151 rtr error = in_pcbbind_addr(inp, sin, l->l_cred);
471 1.132 elad if (error)
472 1.132 elad return (error);
473 1.132 elad
474 1.132 elad /* Bind port. */
475 1.151 rtr error = in_pcbbind_port(inp, sin, l->l_cred);
476 1.132 elad if (error) {
477 1.193 ozaki in4p_laddr(inp).s_addr = INADDR_ANY;
478 1.132 elad
479 1.132 elad return (error);
480 1.132 elad }
481 1.132 elad
482 1.1 cgd return (0);
483 1.1 cgd }
484 1.1 cgd
485 1.1 cgd /*
486 1.1 cgd * Connect from a socket to a specified address.
487 1.1 cgd * Both address and port must be specified in argument sin.
488 1.1 cgd * If don't have a local address for this socket yet,
489 1.1 cgd * then pick one.
490 1.1 cgd */
491 1.10 mycroft int
492 1.160 rtr in_pcbconnect(void *v, struct sockaddr_in *sin, struct lwp *l)
493 1.1 cgd {
494 1.64 augustss struct inpcb *inp = v;
495 1.138 dyoung vestigial_inpcb_t vestige;
496 1.40 thorpej int error;
497 1.167 ozaki struct in_addr laddr;
498 1.1 cgd
499 1.88 itojun if (inp->inp_af != AF_INET)
500 1.88 itojun return (EINVAL);
501 1.88 itojun
502 1.158 rtr if (sin->sin_len != sizeof (*sin))
503 1.158 rtr return (EINVAL);
504 1.1 cgd if (sin->sin_family != AF_INET)
505 1.1 cgd return (EAFNOSUPPORT);
506 1.1 cgd if (sin->sin_port == 0)
507 1.1 cgd return (EADDRNOTAVAIL);
508 1.144 christos
509 1.144 christos if (IN_MULTICAST(sin->sin_addr.s_addr) &&
510 1.144 christos inp->inp_socket->so_type == SOCK_STREAM)
511 1.144 christos return EADDRNOTAVAIL;
512 1.144 christos
513 1.165 ozaki if (!IN_ADDRLIST_READER_EMPTY()) {
514 1.1 cgd /*
515 1.1 cgd * If the destination address is INADDR_ANY,
516 1.49 tls * use any local address (likely loopback).
517 1.1 cgd * If the supplied address is INADDR_BROADCAST,
518 1.49 tls * use the broadcast address of an interface
519 1.49 tls * which supports broadcast. (loopback does not)
520 1.1 cgd */
521 1.49 tls
522 1.72 matt if (in_nullhost(sin->sin_addr)) {
523 1.165 ozaki /* XXX racy */
524 1.72 matt sin->sin_addr =
525 1.165 ozaki IN_ADDRLIST_READER_FIRST()->ia_addr.sin_addr;
526 1.72 matt } else if (sin->sin_addr.s_addr == INADDR_BROADCAST) {
527 1.167 ozaki struct in_ifaddr *ia;
528 1.168 ozaki int s = pserialize_read_enter();
529 1.165 ozaki IN_ADDRLIST_READER_FOREACH(ia) {
530 1.72 matt if (ia->ia_ifp->if_flags & IFF_BROADCAST) {
531 1.72 matt sin->sin_addr =
532 1.72 matt ia->ia_broadaddr.sin_addr;
533 1.72 matt break;
534 1.72 matt }
535 1.49 tls }
536 1.168 ozaki pserialize_read_exit(s);
537 1.72 matt }
538 1.1 cgd }
539 1.32 mycroft /*
540 1.32 mycroft * If we haven't bound which network number to use as ours,
541 1.32 mycroft * we will use the number of the outgoing interface.
542 1.32 mycroft * This depends on having done a routing lookup, which
543 1.32 mycroft * we will probably have to do anyway, so we might
544 1.32 mycroft * as well do it now. On the other hand if we are
545 1.32 mycroft * sending to multiple destinations we may have already
546 1.32 mycroft * done the lookup, so see if we can use the route
547 1.32 mycroft * from before. In any case, we only
548 1.32 mycroft * chose a port number once, even if sending to multiple
549 1.32 mycroft * destinations.
550 1.32 mycroft */
551 1.193 ozaki if (in_nullhost(in4p_laddr(inp))) {
552 1.100 christos int xerror;
553 1.168 ozaki struct in_ifaddr *ia, *_ia;
554 1.168 ozaki int s;
555 1.168 ozaki struct psref psref;
556 1.168 ozaki int bound;
557 1.168 ozaki
558 1.168 ozaki bound = curlwp_bind();
559 1.168 ozaki ia = in_selectsrc(sin, &inp->inp_route,
560 1.168 ozaki inp->inp_socket->so_options, inp->inp_moptions, &xerror,
561 1.168 ozaki &psref);
562 1.168 ozaki if (ia == NULL) {
563 1.168 ozaki curlwp_bindx(bound);
564 1.100 christos if (xerror == 0)
565 1.100 christos xerror = EADDRNOTAVAIL;
566 1.100 christos return xerror;
567 1.59 itojun }
568 1.168 ozaki s = pserialize_read_enter();
569 1.168 ozaki _ia = in_get_ia(IA_SIN(ia)->sin_addr);
570 1.185 christos if (_ia == NULL && (inp->inp_flags & INP_BINDANY) == 0) {
571 1.168 ozaki pserialize_read_exit(s);
572 1.168 ozaki ia4_release(ia, &psref);
573 1.168 ozaki curlwp_bindx(bound);
574 1.83 itojun return (EADDRNOTAVAIL);
575 1.168 ozaki }
576 1.168 ozaki pserialize_read_exit(s);
577 1.168 ozaki laddr = IA_SIN(ia)->sin_addr;
578 1.168 ozaki ia4_release(ia, &psref);
579 1.168 ozaki curlwp_bindx(bound);
580 1.167 ozaki } else
581 1.193 ozaki laddr = in4p_laddr(inp);
582 1.33 mycroft if (in_pcblookup_connect(inp->inp_table, sin->sin_addr, sin->sin_port,
583 1.168 ozaki laddr, inp->inp_lport, &vestige) != NULL ||
584 1.168 ozaki vestige.valid) {
585 1.1 cgd return (EADDRINUSE);
586 1.168 ozaki }
587 1.193 ozaki if (in_nullhost(in4p_laddr(inp))) {
588 1.40 thorpej if (inp->inp_lport == 0) {
589 1.151 rtr error = in_pcbbind(inp, NULL, l);
590 1.40 thorpej /*
591 1.40 thorpej * This used to ignore the return value
592 1.40 thorpej * completely, but we need to check for
593 1.40 thorpej * ephemeral port shortage.
594 1.101 dsl * And attempts to request low ports if not root.
595 1.40 thorpej */
596 1.101 dsl if (error != 0)
597 1.40 thorpej return (error);
598 1.40 thorpej }
599 1.193 ozaki in4p_laddr(inp) = laddr;
600 1.1 cgd }
601 1.193 ozaki in4p_faddr(inp) = sin->sin_addr;
602 1.1 cgd inp->inp_fport = sin->sin_port;
603 1.139 christos
604 1.139 christos /* Late bind, if needed */
605 1.139 christos if (inp->inp_bindportonsend) {
606 1.139 christos struct sockaddr_in lsin = *((const struct sockaddr_in *)
607 1.139 christos inp->inp_socket->so_proto->pr_domain->dom_sa_any);
608 1.193 ozaki lsin.sin_addr = in4p_laddr(inp);
609 1.139 christos lsin.sin_port = 0;
610 1.139 christos
611 1.185 christos if ((error = in_pcbbind_port(inp, &lsin, l->l_cred)) != 0)
612 1.139 christos return error;
613 1.139 christos }
614 1.139 christos
615 1.33 mycroft in_pcbstate(inp, INP_CONNECTED);
616 1.145 christos #if defined(IPSEC)
617 1.148 christos if (ipsec_enabled && inp->inp_socket->so_type == SOCK_STREAM)
618 1.71 itojun ipsec_pcbconn(inp->inp_sp);
619 1.71 itojun #endif
620 1.1 cgd return (0);
621 1.1 cgd }
622 1.1 cgd
623 1.25 christos void
624 1.98 perry in_pcbdisconnect(void *v)
625 1.1 cgd {
626 1.25 christos struct inpcb *inp = v;
627 1.1 cgd
628 1.88 itojun if (inp->inp_af != AF_INET)
629 1.88 itojun return;
630 1.88 itojun
631 1.193 ozaki in4p_faddr(inp) = zeroin_addr;
632 1.1 cgd inp->inp_fport = 0;
633 1.33 mycroft in_pcbstate(inp, INP_BOUND);
634 1.145 christos #if defined(IPSEC)
635 1.148 christos if (ipsec_enabled)
636 1.148 christos ipsec_pcbdisconn(inp->inp_sp);
637 1.71 itojun #endif
638 1.93 itojun if (inp->inp_socket->so_state & SS_NOFDREF)
639 1.93 itojun in_pcbdetach(inp);
640 1.1 cgd }
641 1.1 cgd
642 1.25 christos void
643 1.98 perry in_pcbdetach(void *v)
644 1.1 cgd {
645 1.25 christos struct inpcb *inp = v;
646 1.1 cgd struct socket *so = inp->inp_socket;
647 1.24 mycroft int s;
648 1.1 cgd
649 1.192 ozaki KASSERT(inp->inp_af == AF_INET || inp->inp_af == AF_INET6);
650 1.88 itojun
651 1.145 christos #if defined(IPSEC)
652 1.148 christos if (ipsec_enabled)
653 1.182 maxv ipsec_delete_pcbpolicy(inp);
654 1.150 rmind #endif
655 1.150 rmind so->so_pcb = NULL;
656 1.150 rmind
657 1.175 ozaki s = splsoftnet();
658 1.33 mycroft in_pcbstate(inp, INP_ATTACHED);
659 1.192 ozaki LIST_REMOVE(inp, inp_lhash);
660 1.192 ozaki TAILQ_REMOVE(&inp->inp_table->inpt_queue, inp, inp_queue);
661 1.24 mycroft splx(s);
662 1.150 rmind
663 1.150 rmind if (inp->inp_options) {
664 1.150 rmind m_free(inp->inp_options);
665 1.150 rmind }
666 1.150 rmind rtcache_free(&inp->inp_route);
667 1.152 rmind ip_freemoptions(inp->inp_moptions);
668 1.193 ozaki if (inp->inp_af == AF_INET6) {
669 1.193 ozaki if (in6p_outputopts(inp) != NULL) {
670 1.193 ozaki ip6_clearpktopts(in6p_outputopts(inp), -1);
671 1.193 ozaki free(in6p_outputopts(inp), M_IP6OPT);
672 1.193 ozaki }
673 1.193 ozaki ip6_freemoptions(in6p_moptions(inp));
674 1.193 ozaki }
675 1.127 spz sofree(so); /* drops the socket's lock */
676 1.150 rmind
677 1.193 ozaki if (inp->inp_af == AF_INET)
678 1.193 ozaki pool_put(&in4pcb_pool, inp);
679 1.193 ozaki else
680 1.193 ozaki pool_put(&in6pcb_pool, inp);
681 1.126 matt mutex_enter(softnet_lock); /* reacquire the softnet_lock */
682 1.1 cgd }
683 1.1 cgd
684 1.25 christos void
685 1.157 rtr in_setsockaddr(struct inpcb *inp, struct sockaddr_in *sin)
686 1.1 cgd {
687 1.78 itojun
688 1.88 itojun if (inp->inp_af != AF_INET)
689 1.88 itojun return;
690 1.88 itojun
691 1.193 ozaki sockaddr_in_init(sin, &in4p_laddr(inp), inp->inp_lport);
692 1.1 cgd }
693 1.1 cgd
694 1.25 christos void
695 1.157 rtr in_setpeeraddr(struct inpcb *inp, struct sockaddr_in *sin)
696 1.1 cgd {
697 1.78 itojun
698 1.88 itojun if (inp->inp_af != AF_INET)
699 1.88 itojun return;
700 1.88 itojun
701 1.193 ozaki sockaddr_in_init(sin, &in4p_faddr(inp), inp->inp_fport);
702 1.1 cgd }
703 1.1 cgd
704 1.1 cgd /*
705 1.1 cgd * Pass some notification to all connections of a protocol
706 1.1 cgd * associated with address dst. The local address and/or port numbers
707 1.1 cgd * may be specified to limit the search. The "usual action" will be
708 1.1 cgd * taken, depending on the ctlinput cmd. The caller must filter any
709 1.1 cgd * cmds that are uninteresting (e.g., no error in the map).
710 1.1 cgd * Call the protocol specific routine (if any) to report
711 1.1 cgd * any errors for each matching socket.
712 1.1 cgd *
713 1.22 mycroft * Must be called at splsoftnet.
714 1.1 cgd */
715 1.37 thorpej int
716 1.98 perry in_pcbnotify(struct inpcbtable *table, struct in_addr faddr, u_int fport_arg,
717 1.98 perry struct in_addr laddr, u_int lport_arg, int errno,
718 1.98 perry void (*notify)(struct inpcb *, int))
719 1.1 cgd {
720 1.33 mycroft struct inpcbhead *head;
721 1.188 knakahar struct inpcb *inp;
722 1.13 cgd u_int16_t fport = fport_arg, lport = lport_arg;
723 1.37 thorpej int nmatch;
724 1.1 cgd
725 1.33 mycroft if (in_nullhost(faddr) || notify == 0)
726 1.37 thorpej return (0);
727 1.1 cgd
728 1.37 thorpej nmatch = 0;
729 1.33 mycroft head = INPCBHASH_CONNECT(table, faddr, fport, laddr, lport);
730 1.192 ozaki LIST_FOREACH(inp, head, inp_hash) {
731 1.88 itojun if (inp->inp_af != AF_INET)
732 1.88 itojun continue;
733 1.188 knakahar
734 1.193 ozaki if (in_hosteq(in4p_faddr(inp), faddr) &&
735 1.33 mycroft inp->inp_fport == fport &&
736 1.33 mycroft inp->inp_lport == lport &&
737 1.193 ozaki in_hosteq(in4p_laddr(inp), laddr)) {
738 1.33 mycroft (*notify)(inp, errno);
739 1.37 thorpej nmatch++;
740 1.37 thorpej }
741 1.1 cgd }
742 1.37 thorpej return (nmatch);
743 1.18 mycroft }
744 1.18 mycroft
745 1.20 mycroft void
746 1.98 perry in_pcbnotifyall(struct inpcbtable *table, struct in_addr faddr, int errno,
747 1.98 perry void (*notify)(struct inpcb *, int))
748 1.18 mycroft {
749 1.192 ozaki struct inpcb *inp;
750 1.18 mycroft
751 1.33 mycroft if (in_nullhost(faddr) || notify == 0)
752 1.18 mycroft return;
753 1.18 mycroft
754 1.192 ozaki TAILQ_FOREACH(inp, &table->inpt_queue, inp_queue) {
755 1.88 itojun if (inp->inp_af != AF_INET)
756 1.88 itojun continue;
757 1.193 ozaki if (in_hosteq(in4p_faddr(inp), faddr))
758 1.33 mycroft (*notify)(inp, errno);
759 1.63 thorpej }
760 1.63 thorpej }
761 1.63 thorpej
/*
 * in_purgeifmcast: remove every reference to interface ifp from the
 * multicast options imo.
 *
 * ifp must not be NULL (asserted).  A NULL imo is accepted and makes the
 * call a no-op.  The selected outgoing interface index is reset to 0 if
 * it refers to ifp, and every membership joined through ifp is handed to
 * in_delmulti() and removed from the membership array.
 */
762 1.63 thorpej void
763 1.154 seanb in_purgeifmcast(struct ip_moptions *imo, struct ifnet *ifp)
764 1.154 seanb {
765 1.154 seanb int i, gap;
766 1.154 seanb
767 1.176 ozaki /* The owner of imo should be protected by solock */
768 1.164 ozaki KASSERT(ifp != NULL);
769 1.164 ozaki
770 1.154 seanb if (imo == NULL)
771 1.154 seanb return;
772 1.154 seanb
773 1.154 seanb /*
774 1.154 seanb * Unselect the outgoing interface if it is being
775 1.154 seanb * detached.
776 1.154 seanb */
777 1.164 ozaki if (imo->imo_multicast_if_index == ifp->if_index)
778 1.164 ozaki imo->imo_multicast_if_index = 0;
779 1.154 seanb
780 1.154 seanb /*
781 1.154 seanb * Drop multicast group membership if we joined
782 1.154 seanb * through the interface being detached.
783 1.154 seanb */
/*
 * In-place compaction: gap counts the entries dropped so far, and each
 * surviving entry is moved down by that many slots so the kept
 * memberships stay contiguous and in their original order.
 */
784 1.154 seanb for (i = 0, gap = 0; i < imo->imo_num_memberships; i++) {
785 1.154 seanb if (imo->imo_membership[i]->inm_ifp == ifp) {
786 1.154 seanb in_delmulti(imo->imo_membership[i]);
787 1.154 seanb gap++;
788 1.154 seanb } else if (gap != 0)
789 1.154 seanb imo->imo_membership[i - gap] = imo->imo_membership[i];
790 1.154 seanb }
/* Slots past the new count are left as they were; only the count shrinks. */
791 1.154 seanb imo->imo_num_memberships -= gap;
792 1.154 seanb }
793 1.154 seanb
/*
 * in_pcbpurgeif0: for every AF_INET PCB in the table, purge references to
 * interface ifp from its multicast options via in_purgeifmcast().
 *
 * Each PCB is processed with its lock held: the lock is taken here only
 * when inp_locked() reports it is not already held, and only a lock taken
 * here is released again.
 */
794 1.154 seanb void
795 1.98 perry in_pcbpurgeif0(struct inpcbtable *table, struct ifnet *ifp)
796 1.63 thorpej {
797 1.192 ozaki struct inpcb *inp;
798 1.63 thorpej
799 1.192 ozaki TAILQ_FOREACH(inp, &table->inpt_queue, inp_queue) {
/* Tracks whether this iteration acquired the lock itself. */
800 1.176 ozaki bool need_unlock = false;
801 1.176 ozaki
802 1.88 itojun if (inp->inp_af != AF_INET)
803 1.88 itojun continue;
804 1.176 ozaki
805 1.176 ozaki /* The caller holds either one of inps' lock */
806 1.176 ozaki if (!inp_locked(inp)) {
807 1.176 ozaki inp_lock(inp);
808 1.176 ozaki need_unlock = true;
809 1.176 ozaki }
810 1.176 ozaki
/* inp_moptions may be NULL; in_purgeifmcast() returns early in that case. */
811 1.154 seanb in_purgeifmcast(inp->inp_moptions, ifp);
812 1.176 ozaki
813 1.176 ozaki if (need_unlock)
814 1.176 ozaki inp_unlock(inp);
815 1.69 itojun }
816 1.69 itojun }
817 1.69 itojun
/*
 * in_pcbpurgeif: for every AF_INET PCB in the table, drop its cached
 * route if that route goes out through interface ifp.
 *
 * The cached route is obtained with rtcache_validate() and the reference
 * is released with rtcache_unref() on both paths; the cache is flushed
 * through in_rtchange(inp, 0) only when the route uses ifp.
 */
818 1.69 itojun void
819 1.98 perry in_pcbpurgeif(struct inpcbtable *table, struct ifnet *ifp)
820 1.69 itojun {
821 1.121 dyoung struct rtentry *rt;
822 1.192 ozaki struct inpcb *inp;
823 1.69 itojun
824 1.192 ozaki TAILQ_FOREACH(inp, &table->inpt_queue, inp_queue) {
825 1.88 itojun if (inp->inp_af != AF_INET)
826 1.88 itojun continue;
827 1.122 dyoung if ((rt = rtcache_validate(&inp->inp_route)) != NULL &&
828 1.171 ozaki rt->rt_ifp == ifp) {
/* Release the reference before the cache entry is freed. */
829 1.171 ozaki rtcache_unref(rt, &inp->inp_route);
830 1.69 itojun in_rtchange(inp, 0);
831 1.171 ozaki } else
/*
 * NOTE(review): rt can be NULL on this path (no valid cached route);
 * presumably rtcache_unref() tolerates NULL - confirm.
 */
832 1.171 ozaki rtcache_unref(rt, &inp->inp_route);
833 1.1 cgd }
834 1.1 cgd }
835 1.1 cgd
836 1.1 cgd /*
837 1.1 cgd * Check for alternatives when higher level complains
838 1.1 cgd * about service problems. For now, invalidate cached
839 1.1 cgd * routing information. If the route was created dynamically
840 1.1 cgd * (by a redirect), time to try a default gateway again.
841 1.1 cgd */
/*
 * Does nothing for non-AF_INET PCBs or when the PCB has no valid cached
 * route.  Otherwise an RTM_LOSING message describing the cached route is
 * emitted, a route flagged RTF_DYNAMIC is additionally deleted from the
 * routing table, and the route cache of the PCB is freed.
 */
842 1.25 christos void
843 1.98 perry in_losing(struct inpcb *inp)
844 1.1 cgd {
845 1.64 augustss struct rtentry *rt;
846 1.10 mycroft struct rt_addrinfo info;
847 1.1 cgd
848 1.88 itojun if (inp->inp_af != AF_INET)
849 1.88 itojun return;
850 1.88 itojun
851 1.122 dyoung if ((rt = rtcache_validate(&inp->inp_route)) == NULL)
852 1.122 dyoung return;
853 1.122 dyoung
/* Describe the route (destination, gateway, netmask) for the message. */
854 1.122 dyoung memset(&info, 0, sizeof(info));
855 1.122 dyoung info.rti_info[RTAX_DST] = rtcache_getdst(&inp->inp_route);
856 1.122 dyoung info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
857 1.122 dyoung info.rti_info[RTAX_NETMASK] = rt_mask(rt);
858 1.122 dyoung rt_missmsg(RTM_LOSING, &info, rt->rt_flags, 0);
859 1.171 ozaki if (rt->rt_flags & RTF_DYNAMIC) {
860 1.171 ozaki int error;
861 1.171 ozaki struct rtentry *nrt;
862 1.171 ozaki
/* rt is still referenced while its key, gateway and mask are read. */
863 1.171 ozaki error = rtrequest(RTM_DELETE, rt_getkey(rt),
864 1.171 ozaki rt->rt_gateway, rt_mask(rt), rt->rt_flags, &nrt);
865 1.171 ozaki rtcache_unref(rt, &inp->inp_route);
/* nrt is only used, and freed, when the delete request succeeded. */
866 1.190 knakahar if (error == 0) {
867 1.190 knakahar rt_newmsg_dynamic(RTM_DELETE, nrt);
868 1.172 ozaki rt_free(nrt);
869 1.190 knakahar }
870 1.171 ozaki } else
871 1.171 ozaki rtcache_unref(rt, &inp->inp_route);
872 1.122 dyoung /*
873 1.122 dyoung * A new route can be allocated
874 1.122 dyoung * the next time output is attempted.
875 1.122 dyoung */
876 1.122 dyoung rtcache_free(&inp->inp_route);
877 1.1 cgd }
878 1.1 cgd
879 1.1 cgd /*
880 1.111 dyoung * After a routing change, flush old routing. A new route can be
881 1.111 dyoung * allocated the next time output is attempted.
882 1.1 cgd */
/*
 * Only AF_INET PCBs are handled; any other family returns untouched.
 * The errno argument is not read by this function.
 */
883 1.10 mycroft void
884 1.109 christos in_rtchange(struct inpcb *inp, int errno)
885 1.1 cgd {
886 1.32 mycroft
887 1.88 itojun if (inp->inp_af != AF_INET)
888 1.88 itojun return;
889 1.88 itojun
890 1.112 joerg rtcache_free(&inp->inp_route);
891 1.112 joerg
892 1.49 tls /* XXX SHOULD NOTIFY HIGHER-LEVEL PROTOCOLS */
893 1.1 cgd }
894 1.1 cgd
/*
 * in_pcblookup_port: find the AF_INET PCB bound to local port lport_arg
 * that best matches local address laddr.
 *
 * Candidates are scored by their number of wildcard components (0 - 2)
 * and the lowest score wins; a score of 0 ends the search at once.  When
 * lookup_wildcard is zero, only candidates with a score of 0 are accepted.
 *
 * If vp is non-NULL, vp->valid is cleared on entry.  If vp is non-NULL and
 * the table has a vestige hook, vestigial entries are scored the same way
 * whenever no exact live match was found.  When a vestigial entry scores
 * strictly better than the best live PCB, it is copied to *vp and 0 is
 * returned instead of the live PCB.
 *
 * Returns the best live PCB, or 0 when there is none or a vestigial entry
 * was preferred.
 */
895 1.1 cgd struct inpcb *
896 1.98 perry in_pcblookup_port(struct inpcbtable *table, struct in_addr laddr,
897 1.138 dyoung u_int lport_arg, int lookup_wildcard, vestigial_inpcb_t *vp)
898 1.1 cgd {
899 1.90 provos struct inpcbhead *head;
900 1.192 ozaki struct inpcb *inp;
901 1.142 yamt struct inpcb *match = NULL;
/* 3 is above the highest possible score (2), so any candidate beats it. */
902 1.142 yamt int matchwild = 3;
903 1.142 yamt int wildcard;
904 1.33 mycroft u_int16_t lport = lport_arg;
905 1.1 cgd
906 1.138 dyoung if (vp)
907 1.138 dyoung vp->valid = 0;
908 1.138 dyoung
909 1.90 provos head = INPCBHASH_PORT(table, lport);
910 1.192 ozaki LIST_FOREACH(inp, head, inp_lhash) {
911 1.88 itojun if (inp->inp_af != AF_INET)
912 1.88 itojun continue;
913 1.1 cgd if (inp->inp_lport != lport)
914 1.1 cgd continue;
915 1.142 yamt /*
916 1.142 yamt * check if inp's faddr and laddr match with ours.
917 1.142 yamt * our faddr is considered null.
918 1.142 yamt * count the number of wildcard matches. (0 - 2)
919 1.142 yamt *
920 1.142 yamt * null null match
921 1.142 yamt * A null wildcard match
922 1.142 yamt * null B wildcard match
923 1.142 yamt * A B non match
924 1.142 yamt * A A match
925 1.142 yamt */
926 1.1 cgd wildcard = 0;
927 1.193 ozaki if (!in_nullhost(in4p_faddr(inp)))
928 1.33 mycroft wildcard++;
929 1.193 ozaki if (in_nullhost(in4p_laddr(inp))) {
930 1.32 mycroft if (!in_nullhost(laddr))
931 1.1 cgd wildcard++;
932 1.1 cgd } else {
933 1.32 mycroft if (in_nullhost(laddr))
934 1.1 cgd wildcard++;
935 1.32 mycroft else {
936 1.193 ozaki if (!in_hosteq(in4p_laddr(inp), laddr))
937 1.32 mycroft continue;
938 1.32 mycroft }
939 1.1 cgd }
940 1.54 lukem if (wildcard && !lookup_wildcard)
941 1.1 cgd continue;
942 1.142 yamt /*
943 1.142 yamt * prefer an address with less wildcards.
944 1.142 yamt */
945 1.1 cgd if (wildcard < matchwild) {
946 1.1 cgd match = inp;
947 1.1 cgd matchwild = wildcard;
948 1.1 cgd if (matchwild == 0)
949 1.1 cgd break;
950 1.1 cgd }
951 1.1 cgd }
/* An exact live match cannot be beaten; skip the vestigial search. */
952 1.138 dyoung if (match && matchwild == 0)
953 1.138 dyoung return match;
954 1.138 dyoung
955 1.138 dyoung if (vp && table->vestige) {
956 1.138 dyoung void *state = (*table->vestige->init_ports4)(laddr, lport_arg, lookup_wildcard);
957 1.138 dyoung vestigial_inpcb_t better;
958 1.191 ryo bool has_better = false;
959 1.138 dyoung
/*
 * Each call to next_port4 writes the next candidate into *vp, so the
 * best one seen is saved in better and copied back after the loop.
 * matchwild carries over from the live search, so a vestigial entry
 * must score strictly lower than the best live PCB to be chosen.
 */
960 1.138 dyoung while (table->vestige
961 1.138 dyoung && (*table->vestige->next_port4)(state, vp)) {
962 1.138 dyoung
963 1.138 dyoung if (vp->lport != lport)
964 1.138 dyoung continue;
965 1.138 dyoung wildcard = 0;
966 1.138 dyoung if (!in_nullhost(vp->faddr.v4))
967 1.138 dyoung wildcard++;
968 1.138 dyoung if (in_nullhost(vp->laddr.v4)) {
969 1.138 dyoung if (!in_nullhost(laddr))
970 1.138 dyoung wildcard++;
971 1.138 dyoung } else {
972 1.138 dyoung if (in_nullhost(laddr))
973 1.138 dyoung wildcard++;
974 1.138 dyoung else {
975 1.138 dyoung if (!in_hosteq(vp->laddr.v4, laddr))
976 1.138 dyoung continue;
977 1.138 dyoung }
978 1.138 dyoung }
979 1.138 dyoung if (wildcard && !lookup_wildcard)
980 1.138 dyoung continue;
981 1.138 dyoung if (wildcard < matchwild) {
982 1.138 dyoung better = *vp;
983 1.191 ryo has_better = true;
984 1.138 dyoung
985 1.138 dyoung matchwild = wildcard;
986 1.138 dyoung if (matchwild == 0)
987 1.138 dyoung break;
988 1.138 dyoung }
989 1.138 dyoung }
990 1.138 dyoung
/* The vestigial entry wins: report it through *vp and return no PCB. */
991 1.191 ryo if (has_better) {
992 1.191 ryo *vp = better;
993 1.191 ryo return 0;
994 1.138 dyoung }
995 1.138 dyoung }
996 1.138 dyoung
997 1.1 cgd return (match);
998 1.24 mycroft }
999 1.24 mycroft
/*
 * Debugging switch, present only in DIAGNOSTIC builds: when non-zero,
 * in_pcblookup_connect() and in_pcblookup_bind() print the key of every
 * lookup that finds no PCB.
 */
1000 1.24 mycroft #ifdef DIAGNOSTIC
1001 1.24 mycroft int in_pcbnotifymiss = 0;
1002 1.24 mycroft #endif
1003 1.24 mycroft
/*
 * in_pcblookup_connect: find the AF_INET PCB whose foreign address,
 * foreign port, local address and local port all match the arguments.
 *
 * fport_arg and lport_arg are narrowed to u_int16_t for the hash and the
 * comparison.  If vp is non-NULL, vp->valid is cleared on entry.
 *
 * On a hit the PCB is moved to the front of its hash chain and returned.
 * On a miss, if vp is non-NULL and the table has a vestige hook, lookup4
 * is consulted; a non-zero result from it ends the lookup with 0
 * (presumably with *vp filled in by the hook - confirm).  Otherwise 0 is
 * returned, after an optional DIAGNOSTIC message.
 */
1004 1.24 mycroft struct inpcb *
1005 1.98 perry in_pcblookup_connect(struct inpcbtable *table,
1006 1.98 perry struct in_addr faddr, u_int fport_arg,
1007 1.138 dyoung struct in_addr laddr, u_int lport_arg,
1008 1.138 dyoung vestigial_inpcb_t *vp)
1009 1.24 mycroft {
1010 1.24 mycroft struct inpcbhead *head;
1011 1.64 augustss struct inpcb *inp;
1012 1.24 mycroft u_int16_t fport = fport_arg, lport = lport_arg;
1013 1.24 mycroft
1014 1.138 dyoung if (vp)
1015 1.138 dyoung vp->valid = 0;
1016 1.138 dyoung
1017 1.33 mycroft head = INPCBHASH_CONNECT(table, faddr, fport, laddr, lport);
1018 1.192 ozaki LIST_FOREACH(inp, head, inp_hash) {
1019 1.88 itojun if (inp->inp_af != AF_INET)
1020 1.88 itojun continue;
1021 1.88 itojun
1022 1.193 ozaki if (in_hosteq(in4p_faddr(inp), faddr) &&
1023 1.33 mycroft inp->inp_fport == fport &&
1024 1.33 mycroft inp->inp_lport == lport &&
1025 1.193 ozaki in_hosteq(in4p_laddr(inp), laddr))
1026 1.33 mycroft goto out;
1027 1.24 mycroft }
/* No live PCB matched; the hook receives the unnarrowed port arguments. */
1028 1.138 dyoung if (vp && table->vestige) {
1029 1.138 dyoung if ((*table->vestige->lookup4)(faddr, fport_arg,
1030 1.138 dyoung laddr, lport_arg, vp))
1031 1.138 dyoung return 0;
1032 1.138 dyoung }
1033 1.138 dyoung
1034 1.24 mycroft #ifdef DIAGNOSTIC
1035 1.33 mycroft if (in_pcbnotifymiss) {
1036 1.35 christos printf("in_pcblookup_connect: faddr=%08x fport=%d laddr=%08x lport=%d\n",
1037 1.24 mycroft ntohl(faddr.s_addr), ntohs(fport),
1038 1.24 mycroft ntohl(laddr.s_addr), ntohs(lport));
1039 1.24 mycroft }
1040 1.24 mycroft #endif
1041 1.33 mycroft return (0);
1042 1.33 mycroft
1043 1.33 mycroft out:
1044 1.33 mycroft /* Move this PCB to the head of hash chain. */
1045 1.192 ozaki if (inp != LIST_FIRST(head)) {
1046 1.192 ozaki LIST_REMOVE(inp, inp_hash);
1047 1.192 ozaki LIST_INSERT_HEAD(head, inp, inp_hash);
1048 1.33 mycroft }
1049 1.33 mycroft return (inp);
1050 1.33 mycroft }
1051 1.33 mycroft
/*
 * in_pcblookup_bind: find an AF_INET PCB in the bind hash for local port
 * lport_arg (narrowed to u_int16_t).
 *
 * Two passes are made: first the chain for (laddr, lport), accepting a
 * PCB whose local address equals laddr; then the chain for
 * (zeroin_addr, lport), accepting a PCB whose local address is
 * zeroin_addr.
 *
 * On a hit the PCB is moved to the front of the chain it was found on and
 * returned.  On a miss 0 is returned, after an optional DIAGNOSTIC
 * message.
 */
1052 1.33 mycroft struct inpcb *
1053 1.98 perry in_pcblookup_bind(struct inpcbtable *table,
1054 1.98 perry struct in_addr laddr, u_int lport_arg)
1055 1.33 mycroft {
1056 1.33 mycroft struct inpcbhead *head;
1057 1.64 augustss struct inpcb *inp;
1058 1.33 mycroft u_int16_t lport = lport_arg;
1059 1.33 mycroft
/* Pass 1: exact local address. */
1060 1.33 mycroft head = INPCBHASH_BIND(table, laddr, lport);
1061 1.192 ozaki LIST_FOREACH(inp, head, inp_hash) {
1062 1.88 itojun if (inp->inp_af != AF_INET)
1063 1.88 itojun continue;
1064 1.88 itojun
1065 1.33 mycroft if (inp->inp_lport == lport &&
1066 1.193 ozaki in_hosteq(in4p_laddr(inp), laddr))
1067 1.33 mycroft goto out;
1068 1.33 mycroft }
/*
 * Pass 2: PCBs bound to zeroin_addr.  head is reassigned, so the
 * move-to-front at out: acts on whichever chain produced the hit.
 */
1069 1.33 mycroft head = INPCBHASH_BIND(table, zeroin_addr, lport);
1070 1.192 ozaki LIST_FOREACH(inp, head, inp_hash) {
1071 1.88 itojun if (inp->inp_af != AF_INET)
1072 1.88 itojun continue;
1073 1.88 itojun
1074 1.33 mycroft if (inp->inp_lport == lport &&
1075 1.193 ozaki in_hosteq(in4p_laddr(inp), zeroin_addr))
1076 1.33 mycroft goto out;
1077 1.33 mycroft }
1078 1.33 mycroft #ifdef DIAGNOSTIC
1079 1.33 mycroft if (in_pcbnotifymiss) {
1080 1.35 christos printf("in_pcblookup_bind: laddr=%08x lport=%d\n",
1081 1.33 mycroft ntohl(laddr.s_addr), ntohs(lport));
1082 1.33 mycroft }
1083 1.33 mycroft #endif
1084 1.33 mycroft return (0);
1085 1.33 mycroft
1086 1.33 mycroft out:
1087 1.33 mycroft /* Move this PCB to the head of hash chain. */
1088 1.192 ozaki if (inp != LIST_FIRST(head)) {
1089 1.192 ozaki LIST_REMOVE(inp, inp_hash);
1090 1.192 ozaki LIST_INSERT_HEAD(head, inp, inp_hash);
1091 1.33 mycroft }
1092 1.24 mycroft return (inp);
1093 1.33 mycroft }
1094 1.33 mycroft
/*
 * in_pcbstate: move a PCB to a new state and rehash it accordingly.
 *
 * AF_INET6 PCBs are handed to in6_pcbstate() and nothing else is done
 * here.  Otherwise the PCB is taken off its current hash chain if its
 * present state is above INP_ATTACHED, then inserted into the bind hash
 * (INP_BOUND) or the connect hash (INP_CONNECTED); for any other target
 * state it is left off the hash chains.  inp_state is then set to state.
 */
1095 1.33 mycroft void
1096 1.98 perry in_pcbstate(struct inpcb *inp, int state)
1097 1.33 mycroft {
1098 1.33 mycroft
1099 1.192 ozaki if (inp->inp_af == AF_INET6) {
1100 1.192 ozaki in6_pcbstate(inp, state);
1101 1.88 itojun return;
1102 1.192 ozaki }
1103 1.88 itojun
/* Unhash first, using the old state, before the keys are hashed again. */
1104 1.33 mycroft if (inp->inp_state > INP_ATTACHED)
1105 1.192 ozaki LIST_REMOVE(inp, inp_hash);
1106 1.33 mycroft
1107 1.33 mycroft switch (state) {
1108 1.33 mycroft case INP_BOUND:
1109 1.33 mycroft LIST_INSERT_HEAD(INPCBHASH_BIND(inp->inp_table,
1110 1.193 ozaki in4p_laddr(inp), inp->inp_lport), inp,
1111 1.192 ozaki inp_hash);
1112 1.33 mycroft break;
1113 1.33 mycroft case INP_CONNECTED:
1114 1.33 mycroft LIST_INSERT_HEAD(INPCBHASH_CONNECT(inp->inp_table,
1115 1.193 ozaki in4p_faddr(inp), inp->inp_fport,
1116 1.193 ozaki in4p_laddr(inp), inp->inp_lport), inp,
1117 1.192 ozaki inp_hash);
1118 1.33 mycroft break;
1119 1.33 mycroft }
1120 1.33 mycroft
1121 1.33 mycroft inp->inp_state = state;
1122 1.38 thorpej }
1123 1.38 thorpej
/*
 * in_pcbrtentry: look up the route to the foreign address of the PCB
 * through the route cache of the PCB.
 *
 * AF_INET6 PCBs are delegated to in6_pcbrtentry(); any family other than
 * AF_INET or AF_INET6 yields NULL.  For AF_INET the result of
 * rtcache_lookup() is returned as is.  This file pairs the lookup with
 * in_pcbrtentry_unref() for releasing the returned entry.
 */
1124 1.38 thorpej struct rtentry *
1125 1.98 perry in_pcbrtentry(struct inpcb *inp)
1126 1.38 thorpej {
1127 1.38 thorpej struct route *ro;
/* Lets the sockaddr_in built below be passed as a generic sockaddr. */
1128 1.117 dyoung union {
1129 1.117 dyoung struct sockaddr dst;
1130 1.117 dyoung struct sockaddr_in dst4;
1131 1.117 dyoung } u;
1132 1.88 itojun
1133 1.192 ozaki if (inp->inp_af == AF_INET6)
1134 1.192 ozaki return in6_pcbrtentry(inp);
1135 1.88 itojun if (inp->inp_af != AF_INET)
1136 1.88 itojun return (NULL);
1137 1.38 thorpej
1138 1.38 thorpej ro = &inp->inp_route;
1139 1.38 thorpej
/* Destination key: the foreign address, with 0 as the final argument. */
1140 1.193 ozaki sockaddr_in_init(&u.dst4, &in4p_faddr(inp), 0);
1141 1.117 dyoung return rtcache_lookup(ro, &u.dst);
1142 1.59 itojun }
1143 1.171 ozaki
/*
 * in_pcbrtentry_unref: release a route entry rt against the route cache
 * of the PCB by forwarding to rtcache_unref().
 */
1144 1.171 ozaki void
1145 1.171 ozaki in_pcbrtentry_unref(struct rtentry *rt, struct inpcb *inp)
1146 1.171 ozaki {
1147 1.171 ozaki
1148 1.171 ozaki rtcache_unref(rt, &inp->inp_route);
1149 1.171 ozaki }
1150