in_pcb.c revision 1.180 1 1.180 ozaki /* $NetBSD: in_pcb.c,v 1.180 2017/12/15 04:03:46 ozaki-r Exp $ */
2 1.59 itojun
3 1.59 itojun /*
4 1.59 itojun * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
5 1.59 itojun * All rights reserved.
6 1.78 itojun *
7 1.59 itojun * Redistribution and use in source and binary forms, with or without
8 1.59 itojun * modification, are permitted provided that the following conditions
9 1.59 itojun * are met:
10 1.59 itojun * 1. Redistributions of source code must retain the above copyright
11 1.59 itojun * notice, this list of conditions and the following disclaimer.
12 1.59 itojun * 2. Redistributions in binary form must reproduce the above copyright
13 1.59 itojun * notice, this list of conditions and the following disclaimer in the
14 1.59 itojun * documentation and/or other materials provided with the distribution.
15 1.59 itojun * 3. Neither the name of the project nor the names of its contributors
16 1.59 itojun * may be used to endorse or promote products derived from this software
17 1.59 itojun * without specific prior written permission.
18 1.78 itojun *
19 1.59 itojun * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
20 1.59 itojun * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21 1.59 itojun * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22 1.59 itojun * ARE DISCLAIMED. IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
23 1.59 itojun * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24 1.59 itojun * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25 1.59 itojun * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26 1.59 itojun * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27 1.59 itojun * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 1.59 itojun * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 1.59 itojun * SUCH DAMAGE.
30 1.59 itojun */
31 1.57 thorpej
32 1.57 thorpej /*-
33 1.138 dyoung * Copyright (c) 1998, 2011 The NetBSD Foundation, Inc.
34 1.57 thorpej * All rights reserved.
35 1.57 thorpej *
36 1.57 thorpej * This code is derived from software contributed to The NetBSD Foundation
37 1.138 dyoung * by Coyote Point Systems, Inc.
38 1.138 dyoung * This code is derived from software contributed to The NetBSD Foundation
39 1.57 thorpej * by Public Access Networks Corporation ("Panix"). It was developed under
40 1.57 thorpej * contract to Panix by Eric Haszlakiewicz and Thor Lancelot Simon.
41 1.57 thorpej *
42 1.57 thorpej * Redistribution and use in source and binary forms, with or without
43 1.57 thorpej * modification, are permitted provided that the following conditions
44 1.57 thorpej * are met:
45 1.57 thorpej * 1. Redistributions of source code must retain the above copyright
46 1.57 thorpej * notice, this list of conditions and the following disclaimer.
47 1.57 thorpej * 2. Redistributions in binary form must reproduce the above copyright
48 1.57 thorpej * notice, this list of conditions and the following disclaimer in the
49 1.57 thorpej * documentation and/or other materials provided with the distribution.
50 1.57 thorpej *
51 1.57 thorpej * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
52 1.57 thorpej * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
53 1.57 thorpej * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
54 1.57 thorpej * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
55 1.57 thorpej * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
56 1.57 thorpej * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
57 1.57 thorpej * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
58 1.57 thorpej * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
59 1.57 thorpej * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
60 1.57 thorpej * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
61 1.57 thorpej * POSSIBILITY OF SUCH DAMAGE.
62 1.57 thorpej */
63 1.11 cgd
64 1.1 cgd /*
65 1.44 thorpej * Copyright (c) 1982, 1986, 1991, 1993, 1995
66 1.10 mycroft * The Regents of the University of California. All rights reserved.
67 1.1 cgd *
68 1.1 cgd * Redistribution and use in source and binary forms, with or without
69 1.1 cgd * modification, are permitted provided that the following conditions
70 1.1 cgd * are met:
71 1.1 cgd * 1. Redistributions of source code must retain the above copyright
72 1.1 cgd * notice, this list of conditions and the following disclaimer.
73 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
74 1.1 cgd * notice, this list of conditions and the following disclaimer in the
75 1.1 cgd * documentation and/or other materials provided with the distribution.
76 1.86 agc * 3. Neither the name of the University nor the names of its contributors
77 1.1 cgd * may be used to endorse or promote products derived from this software
78 1.1 cgd * without specific prior written permission.
79 1.1 cgd *
80 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
81 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
82 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
83 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
84 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
85 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
86 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
87 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
88 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
89 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
90 1.1 cgd * SUCH DAMAGE.
91 1.1 cgd *
92 1.44 thorpej * @(#)in_pcb.c 8.4 (Berkeley) 5/24/95
93 1.1 cgd */
94 1.73 lukem
95 1.73 lukem #include <sys/cdefs.h>
96 1.180 ozaki __KERNEL_RCSID(0, "$NetBSD: in_pcb.c,v 1.180 2017/12/15 04:03:46 ozaki-r Exp $");
97 1.60 thorpej
98 1.162 pooka #ifdef _KERNEL_OPT
99 1.88 itojun #include "opt_inet.h"
100 1.60 thorpej #include "opt_ipsec.h"
101 1.162 pooka #endif
102 1.1 cgd
103 1.7 mycroft #include <sys/param.h>
104 1.7 mycroft #include <sys/systm.h>
105 1.7 mycroft #include <sys/mbuf.h>
106 1.7 mycroft #include <sys/socket.h>
107 1.7 mycroft #include <sys/socketvar.h>
108 1.7 mycroft #include <sys/ioctl.h>
109 1.10 mycroft #include <sys/errno.h>
110 1.10 mycroft #include <sys/time.h>
111 1.128 pooka #include <sys/once.h>
112 1.52 thorpej #include <sys/pool.h>
113 1.10 mycroft #include <sys/proc.h>
114 1.102 elad #include <sys/kauth.h>
115 1.129 pooka #include <sys/uidinfo.h>
116 1.132 elad #include <sys/domain.h>
117 1.1 cgd
118 1.7 mycroft #include <net/if.h>
119 1.7 mycroft #include <net/route.h>
120 1.1 cgd
121 1.7 mycroft #include <netinet/in.h>
122 1.7 mycroft #include <netinet/in_systm.h>
123 1.7 mycroft #include <netinet/ip.h>
124 1.7 mycroft #include <netinet/in_pcb.h>
125 1.7 mycroft #include <netinet/in_var.h>
126 1.7 mycroft #include <netinet/ip_var.h>
127 1.143 christos #include <netinet/portalgo.h>
128 1.1 cgd
129 1.88 itojun #ifdef INET6
130 1.88 itojun #include <netinet/ip6.h>
131 1.88 itojun #include <netinet6/ip6_var.h>
132 1.88 itojun #include <netinet6/in6_pcb.h>
133 1.88 itojun #endif
134 1.88 itojun
135 1.145 christos #ifdef IPSEC
136 1.87 jonathan #include <netipsec/ipsec.h>
137 1.87 jonathan #include <netipsec/key.h>
138 1.59 itojun #endif /* IPSEC */
139 1.59 itojun
140 1.138 dyoung #include <netinet/tcp_vtw.h>
141 1.138 dyoung
/*
 * All-zero IPv4 address (file-scope object without an initializer);
 * in_pcbdisconnect() assigns it to a PCB's foreign address.
 */
struct in_addr zeroin_addr;

/*
 * Hash bucket selectors for the port, bind and connect hash tables of an
 * inpcbtable.  Ports and addresses are taken in network byte order and
 * converted with ntohs()/ntohl() before being masked with the table's
 * hash mask.
 *
 * Every expansion is wrapped in parentheses so the result behaves as a
 * single expression; without them a use such as
 * INPCBHASH_PORT(t, p)->field would bind "->" to the array element
 * instead of to the bucket pointer.
 */
#define	INPCBHASH_PORT(table, lport) \
	(&(table)->inpt_porthashtbl[ntohs(lport) & (table)->inpt_porthash])
#define	INPCBHASH_BIND(table, laddr, lport) \
	(&(table)->inpt_bindhashtbl[ \
	    ((ntohl((laddr).s_addr) + ntohs(lport))) & (table)->inpt_bindhash])
#define	INPCBHASH_CONNECT(table, faddr, fport, laddr, lport) \
	(&(table)->inpt_connecthashtbl[ \
	    ((ntohl((faddr).s_addr) + ntohs(fport)) + \
	    (ntohl((laddr).s_addr) + ntohs(lport))) & (table)->inpt_connecthash])
153 1.33 mycroft
154 1.43 lukem int anonportmin = IPPORT_ANONMIN;
155 1.43 lukem int anonportmax = IPPORT_ANONMAX;
156 1.67 tron int lowportmin = IPPORT_RESERVEDMIN;
157 1.67 tron int lowportmax = IPPORT_RESERVEDMAX;
158 1.43 lukem
159 1.128 pooka static struct pool inpcb_pool;
160 1.128 pooka
161 1.128 pooka static int
162 1.128 pooka inpcb_poolinit(void)
163 1.128 pooka {
164 1.128 pooka
165 1.128 pooka pool_init(&inpcb_pool, sizeof(struct inpcb), 0, 0, 0, "inpcbpl", NULL,
166 1.128 pooka IPL_NET);
167 1.128 pooka return 0;
168 1.128 pooka }
169 1.52 thorpej
170 1.18 mycroft void
171 1.98 perry in_pcbinit(struct inpcbtable *table, int bindhashsize, int connecthashsize)
172 1.18 mycroft {
173 1.128 pooka static ONCE_DECL(control);
174 1.18 mycroft
175 1.146 christos TAILQ_INIT(&table->inpt_queue);
176 1.125 ad table->inpt_porthashtbl = hashinit(bindhashsize, HASH_LIST, true,
177 1.125 ad &table->inpt_porthash);
178 1.125 ad table->inpt_bindhashtbl = hashinit(bindhashsize, HASH_LIST, true,
179 1.125 ad &table->inpt_bindhash);
180 1.125 ad table->inpt_connecthashtbl = hashinit(connecthashsize, HASH_LIST, true,
181 1.125 ad &table->inpt_connecthash);
182 1.47 lukem table->inpt_lastlow = IPPORT_RESERVEDMAX;
183 1.47 lukem table->inpt_lastport = (u_int16_t)anonportmax;
184 1.128 pooka
185 1.128 pooka RUN_ONCE(&control, inpcb_poolinit);
186 1.18 mycroft }
187 1.18 mycroft
188 1.10 mycroft int
189 1.98 perry in_pcballoc(struct socket *so, void *v)
190 1.1 cgd {
191 1.25 christos struct inpcbtable *table = v;
192 1.64 augustss struct inpcb *inp;
193 1.24 mycroft int s;
194 1.1 cgd
195 1.177 ozaki KASSERT(so->so_proto->pr_domain->dom_family == AF_INET);
196 1.177 ozaki
197 1.52 thorpej inp = pool_get(&inpcb_pool, PR_NOWAIT);
198 1.10 mycroft if (inp == NULL)
199 1.1 cgd return (ENOBUFS);
200 1.139 christos memset(inp, 0, sizeof(*inp));
201 1.88 itojun inp->inp_af = AF_INET;
202 1.18 mycroft inp->inp_table = table;
203 1.1 cgd inp->inp_socket = so;
204 1.39 matt inp->inp_errormtu = -1;
205 1.143 christos inp->inp_portalgo = PORTALGO_DEFAULT;
206 1.139 christos inp->inp_bindportonsend = false;
207 1.145 christos #if defined(IPSEC)
208 1.148 christos if (ipsec_enabled) {
209 1.148 christos int error = ipsec_init_pcbpolicy(so, &inp->inp_sp);
210 1.148 christos if (error != 0) {
211 1.148 christos pool_put(&inpcb_pool, inp);
212 1.148 christos return error;
213 1.148 christos }
214 1.178 ozaki inp->inp_sp->sp_inph = (struct inpcb_hdr *)inp;
215 1.70 itojun }
216 1.70 itojun #endif
217 1.33 mycroft so->so_pcb = inp;
218 1.175 ozaki s = splsoftnet();
219 1.146 christos TAILQ_INSERT_HEAD(&table->inpt_queue, &inp->inp_head, inph_queue);
220 1.90 provos LIST_INSERT_HEAD(INPCBHASH_PORT(table, inp->inp_lport), &inp->inp_head,
221 1.90 provos inph_lhash);
222 1.33 mycroft in_pcbstate(inp, INP_ATTACHED);
223 1.24 mycroft splx(s);
224 1.1 cgd return (0);
225 1.1 cgd }
226 1.8 mycroft
227 1.132 elad static int
228 1.134 elad in_pcbsetport(struct sockaddr_in *sin, struct inpcb *inp, kauth_cred_t cred)
229 1.1 cgd {
230 1.132 elad struct inpcbtable *table = inp->inp_table;
231 1.64 augustss struct socket *so = inp->inp_socket;
232 1.132 elad u_int16_t *lastport;
233 1.13 cgd u_int16_t lport = 0;
234 1.134 elad enum kauth_network_req req;
235 1.134 elad int error;
236 1.1 cgd
237 1.132 elad if (inp->inp_flags & INP_LOWPORT) {
238 1.132 elad #ifndef IPNOPRIVPORTS
239 1.134 elad req = KAUTH_REQ_NETWORK_BIND_PRIVPORT;
240 1.134 elad #else
241 1.134 elad req = KAUTH_REQ_NETWORK_BIND_PORT;
242 1.132 elad #endif
243 1.134 elad
244 1.132 elad lastport = &table->inpt_lastlow;
245 1.132 elad } else {
246 1.134 elad req = KAUTH_REQ_NETWORK_BIND_PORT;
247 1.134 elad
248 1.132 elad lastport = &table->inpt_lastport;
249 1.132 elad }
250 1.134 elad
251 1.134 elad /* XXX-kauth: KAUTH_REQ_NETWORK_BIND_AUTOASSIGN_{,PRIV}PORT */
252 1.134 elad error = kauth_authorize_network(cred, KAUTH_NETWORK_BIND, req, so, sin,
253 1.134 elad NULL);
254 1.134 elad if (error)
255 1.137 elad return (EACCES);
256 1.134 elad
257 1.139 christos /*
258 1.139 christos * Use RFC6056 randomized port selection
259 1.139 christos */
260 1.143 christos error = portalgo_randport(&lport, &inp->inp_head, cred);
261 1.139 christos if (error)
262 1.139 christos return error;
263 1.132 elad
264 1.132 elad inp->inp_flags |= INP_ANONPORT;
265 1.132 elad *lastport = lport;
266 1.132 elad lport = htons(lport);
267 1.132 elad inp->inp_lport = lport;
268 1.132 elad in_pcbstate(inp, INP_BOUND);
269 1.132 elad
270 1.132 elad return (0);
271 1.132 elad }
272 1.88 itojun
273 1.179 ryo int
274 1.179 ryo in_pcbbindableaddr(struct sockaddr_in *sin, kauth_cred_t cred)
275 1.132 elad {
276 1.168 ozaki int error = EADDRNOTAVAIL;
277 1.168 ozaki struct ifaddr *ifa = NULL;
278 1.168 ozaki int s;
279 1.168 ozaki
280 1.28 mycroft if (sin->sin_family != AF_INET)
281 1.28 mycroft return (EAFNOSUPPORT);
282 1.132 elad
283 1.168 ozaki s = pserialize_read_enter();
284 1.136 elad if (IN_MULTICAST(sin->sin_addr.s_addr)) {
285 1.136 elad /* Always succeed; port reuse handled in in_pcbbind_port(). */
286 1.136 elad } else if (!in_nullhost(sin->sin_addr)) {
287 1.168 ozaki struct in_ifaddr *ia;
288 1.132 elad
289 1.166 ozaki ia = in_get_ia(sin->sin_addr);
290 1.132 elad /* check for broadcast addresses */
291 1.168 ozaki if (ia == NULL) {
292 1.168 ozaki ifa = ifa_ifwithaddr(sintosa(sin));
293 1.168 ozaki if (ifa != NULL)
294 1.168 ozaki ia = ifatoia(ifa);
295 1.168 ozaki }
296 1.132 elad if (ia == NULL)
297 1.168 ozaki goto error;
298 1.170 roy if (ia->ia4_flags & IN_IFF_DUPLICATED)
299 1.168 ozaki goto error;
300 1.132 elad }
301 1.179 ryo error = 0;
302 1.179 ryo error:
303 1.168 ozaki pserialize_read_exit(s);
304 1.179 ryo return error;
305 1.179 ryo }
306 1.132 elad
307 1.179 ryo static int
308 1.179 ryo in_pcbbind_addr(struct inpcb *inp, struct sockaddr_in *sin, kauth_cred_t cred)
309 1.179 ryo {
310 1.179 ryo int error;
311 1.132 elad
312 1.179 ryo error = in_pcbbindableaddr(sin, cred);
313 1.179 ryo if (error == 0)
314 1.179 ryo inp->inp_laddr = sin->sin_addr;
315 1.168 ozaki return error;
316 1.132 elad }
317 1.132 elad
318 1.132 elad static int
319 1.132 elad in_pcbbind_port(struct inpcb *inp, struct sockaddr_in *sin, kauth_cred_t cred)
320 1.132 elad {
321 1.132 elad struct inpcbtable *table = inp->inp_table;
322 1.132 elad struct socket *so = inp->inp_socket;
323 1.132 elad int reuseport = (so->so_options & SO_REUSEPORT);
324 1.133 elad int wild = 0, error;
325 1.132 elad
326 1.28 mycroft if (IN_MULTICAST(sin->sin_addr.s_addr)) {
327 1.10 mycroft /*
328 1.28 mycroft * Treat SO_REUSEADDR as SO_REUSEPORT for multicast;
329 1.28 mycroft * allow complete duplication of binding if
330 1.28 mycroft * SO_REUSEPORT is set, or if SO_REUSEADDR is set
331 1.28 mycroft * and a multicast address is bound on both
332 1.28 mycroft * new and duplicated sockets.
333 1.10 mycroft */
334 1.155 seanb if (so->so_options & (SO_REUSEADDR | SO_REUSEPORT))
335 1.28 mycroft reuseport = SO_REUSEADDR|SO_REUSEPORT;
336 1.132 elad }
337 1.132 elad
338 1.132 elad if (sin->sin_port == 0) {
339 1.134 elad error = in_pcbsetport(sin, inp, cred);
340 1.132 elad if (error)
341 1.132 elad return (error);
342 1.132 elad } else {
343 1.28 mycroft struct inpcb *t;
344 1.138 dyoung vestigial_inpcb_t vestige;
345 1.88 itojun #ifdef INET6
346 1.88 itojun struct in6pcb *t6;
347 1.88 itojun struct in6_addr mapped;
348 1.88 itojun #endif
349 1.133 elad enum kauth_network_req req;
350 1.132 elad
351 1.132 elad if ((so->so_options & (SO_REUSEADDR|SO_REUSEPORT)) == 0)
352 1.132 elad wild = 1;
353 1.132 elad
354 1.31 perry #ifndef IPNOPRIVPORTS
355 1.133 elad if (ntohs(sin->sin_port) < IPPORT_RESERVED)
356 1.133 elad req = KAUTH_REQ_NETWORK_BIND_PRIVPORT;
357 1.133 elad else
358 1.133 elad #endif /* !IPNOPRIVPORTS */
359 1.133 elad req = KAUTH_REQ_NETWORK_BIND_PORT;
360 1.133 elad
361 1.133 elad error = kauth_authorize_network(cred, KAUTH_NETWORK_BIND, req,
362 1.133 elad so, sin, NULL);
363 1.133 elad if (error)
364 1.137 elad return (EACCES);
365 1.133 elad
366 1.88 itojun #ifdef INET6
367 1.163 rtr in6_in_2_v4mapin6(&sin->sin_addr, &mapped);
368 1.138 dyoung t6 = in6_pcblookup_port(table, &mapped, sin->sin_port, wild, &vestige);
369 1.88 itojun if (t6 && (reuseport & t6->in6p_socket->so_options) == 0)
370 1.88 itojun return (EADDRINUSE);
371 1.138 dyoung if (!t6 && vestige.valid) {
372 1.138 dyoung if (!!reuseport != !!vestige.reuse_port) {
373 1.138 dyoung return EADDRINUSE;
374 1.138 dyoung }
375 1.138 dyoung }
376 1.88 itojun #endif
377 1.133 elad
378 1.133 elad /* XXX-kauth */
379 1.99 christos if (so->so_uidinfo->ui_uid && !IN_MULTICAST(sin->sin_addr.s_addr)) {
380 1.138 dyoung t = in_pcblookup_port(table, sin->sin_addr, sin->sin_port, 1, &vestige);
381 1.133 elad /*
382 1.133 elad * XXX: investigate ramifications of loosening this
383 1.133 elad * restriction so that as long as both ports have
384 1.133 elad * SO_REUSEPORT allow the bind
385 1.133 elad */
386 1.58 lukem if (t &&
387 1.58 lukem (!in_nullhost(sin->sin_addr) ||
388 1.58 lukem !in_nullhost(t->inp_laddr) ||
389 1.58 lukem (t->inp_socket->so_options & SO_REUSEPORT) == 0)
390 1.99 christos && (so->so_uidinfo->ui_uid != t->inp_socket->so_uidinfo->ui_uid)) {
391 1.58 lukem return (EADDRINUSE);
392 1.58 lukem }
393 1.138 dyoung if (!t && vestige.valid) {
394 1.138 dyoung if ((!in_nullhost(sin->sin_addr)
395 1.138 dyoung || !in_nullhost(vestige.laddr.v4)
396 1.138 dyoung || !vestige.reuse_port)
397 1.138 dyoung && so->so_uidinfo->ui_uid != vestige.uid) {
398 1.138 dyoung return EADDRINUSE;
399 1.138 dyoung }
400 1.138 dyoung }
401 1.58 lukem }
402 1.138 dyoung t = in_pcblookup_port(table, sin->sin_addr, sin->sin_port, wild, &vestige);
403 1.28 mycroft if (t && (reuseport & t->inp_socket->so_options) == 0)
404 1.28 mycroft return (EADDRINUSE);
405 1.138 dyoung if (!t
406 1.138 dyoung && vestige.valid
407 1.138 dyoung && !(reuseport && vestige.reuse_port))
408 1.138 dyoung return EADDRINUSE;
409 1.132 elad
410 1.132 elad inp->inp_lport = sin->sin_port;
411 1.132 elad in_pcbstate(inp, INP_BOUND);
412 1.1 cgd }
413 1.45 lukem
414 1.90 provos LIST_REMOVE(&inp->inp_head, inph_lhash);
415 1.90 provos LIST_INSERT_HEAD(INPCBHASH_PORT(table, inp->inp_lport), &inp->inp_head,
416 1.90 provos inph_lhash);
417 1.132 elad
418 1.132 elad return (0);
419 1.132 elad }
420 1.132 elad
421 1.132 elad int
422 1.156 rtr in_pcbbind(void *v, struct sockaddr_in *sin, struct lwp *l)
423 1.132 elad {
424 1.132 elad struct inpcb *inp = v;
425 1.134 elad struct sockaddr_in lsin;
426 1.132 elad int error;
427 1.132 elad
428 1.132 elad if (inp->inp_af != AF_INET)
429 1.132 elad return (EINVAL);
430 1.132 elad
431 1.165 ozaki if (IN_ADDRLIST_READER_EMPTY())
432 1.132 elad return (EADDRNOTAVAIL);
433 1.132 elad if (inp->inp_lport || !in_nullhost(inp->inp_laddr))
434 1.132 elad return (EINVAL);
435 1.132 elad
436 1.156 rtr if (NULL != sin) {
437 1.156 rtr if (sin->sin_len != sizeof(*sin))
438 1.132 elad return (EINVAL);
439 1.132 elad } else {
440 1.134 elad lsin = *((const struct sockaddr_in *)
441 1.134 elad inp->inp_socket->so_proto->pr_domain->dom_sa_any);
442 1.134 elad sin = &lsin;
443 1.132 elad }
444 1.132 elad
445 1.132 elad /* Bind address. */
446 1.151 rtr error = in_pcbbind_addr(inp, sin, l->l_cred);
447 1.132 elad if (error)
448 1.132 elad return (error);
449 1.132 elad
450 1.132 elad /* Bind port. */
451 1.151 rtr error = in_pcbbind_port(inp, sin, l->l_cred);
452 1.132 elad if (error) {
453 1.132 elad inp->inp_laddr.s_addr = INADDR_ANY;
454 1.132 elad
455 1.132 elad return (error);
456 1.132 elad }
457 1.132 elad
458 1.1 cgd return (0);
459 1.1 cgd }
460 1.1 cgd
461 1.1 cgd /*
462 1.1 cgd * Connect from a socket to a specified address.
463 1.1 cgd * Both address and port must be specified in argument sin.
464 1.1 cgd * If don't have a local address for this socket yet,
465 1.1 cgd * then pick one.
466 1.1 cgd */
467 1.10 mycroft int
468 1.160 rtr in_pcbconnect(void *v, struct sockaddr_in *sin, struct lwp *l)
469 1.1 cgd {
470 1.64 augustss struct inpcb *inp = v;
471 1.138 dyoung vestigial_inpcb_t vestige;
472 1.40 thorpej int error;
473 1.167 ozaki struct in_addr laddr;
474 1.1 cgd
475 1.88 itojun if (inp->inp_af != AF_INET)
476 1.88 itojun return (EINVAL);
477 1.88 itojun
478 1.158 rtr if (sin->sin_len != sizeof (*sin))
479 1.158 rtr return (EINVAL);
480 1.1 cgd if (sin->sin_family != AF_INET)
481 1.1 cgd return (EAFNOSUPPORT);
482 1.1 cgd if (sin->sin_port == 0)
483 1.1 cgd return (EADDRNOTAVAIL);
484 1.144 christos
485 1.144 christos if (IN_MULTICAST(sin->sin_addr.s_addr) &&
486 1.144 christos inp->inp_socket->so_type == SOCK_STREAM)
487 1.144 christos return EADDRNOTAVAIL;
488 1.144 christos
489 1.165 ozaki if (!IN_ADDRLIST_READER_EMPTY()) {
490 1.1 cgd /*
491 1.1 cgd * If the destination address is INADDR_ANY,
492 1.49 tls * use any local address (likely loopback).
493 1.1 cgd * If the supplied address is INADDR_BROADCAST,
494 1.49 tls * use the broadcast address of an interface
495 1.49 tls * which supports broadcast. (loopback does not)
496 1.1 cgd */
497 1.49 tls
498 1.72 matt if (in_nullhost(sin->sin_addr)) {
499 1.165 ozaki /* XXX racy */
500 1.72 matt sin->sin_addr =
501 1.165 ozaki IN_ADDRLIST_READER_FIRST()->ia_addr.sin_addr;
502 1.72 matt } else if (sin->sin_addr.s_addr == INADDR_BROADCAST) {
503 1.167 ozaki struct in_ifaddr *ia;
504 1.168 ozaki int s = pserialize_read_enter();
505 1.165 ozaki IN_ADDRLIST_READER_FOREACH(ia) {
506 1.72 matt if (ia->ia_ifp->if_flags & IFF_BROADCAST) {
507 1.72 matt sin->sin_addr =
508 1.72 matt ia->ia_broadaddr.sin_addr;
509 1.72 matt break;
510 1.72 matt }
511 1.49 tls }
512 1.168 ozaki pserialize_read_exit(s);
513 1.72 matt }
514 1.1 cgd }
515 1.32 mycroft /*
516 1.32 mycroft * If we haven't bound which network number to use as ours,
517 1.32 mycroft * we will use the number of the outgoing interface.
518 1.32 mycroft * This depends on having done a routing lookup, which
519 1.32 mycroft * we will probably have to do anyway, so we might
520 1.32 mycroft * as well do it now. On the other hand if we are
521 1.32 mycroft * sending to multiple destinations we may have already
522 1.32 mycroft * done the lookup, so see if we can use the route
523 1.32 mycroft * from before. In any case, we only
524 1.32 mycroft * chose a port number once, even if sending to multiple
525 1.32 mycroft * destinations.
526 1.32 mycroft */
527 1.32 mycroft if (in_nullhost(inp->inp_laddr)) {
528 1.100 christos int xerror;
529 1.168 ozaki struct in_ifaddr *ia, *_ia;
530 1.168 ozaki int s;
531 1.168 ozaki struct psref psref;
532 1.168 ozaki int bound;
533 1.168 ozaki
534 1.168 ozaki bound = curlwp_bind();
535 1.168 ozaki ia = in_selectsrc(sin, &inp->inp_route,
536 1.168 ozaki inp->inp_socket->so_options, inp->inp_moptions, &xerror,
537 1.168 ozaki &psref);
538 1.168 ozaki if (ia == NULL) {
539 1.168 ozaki curlwp_bindx(bound);
540 1.100 christos if (xerror == 0)
541 1.100 christos xerror = EADDRNOTAVAIL;
542 1.100 christos return xerror;
543 1.59 itojun }
544 1.168 ozaki s = pserialize_read_enter();
545 1.168 ozaki _ia = in_get_ia(IA_SIN(ia)->sin_addr);
546 1.168 ozaki if (_ia == NULL) {
547 1.168 ozaki pserialize_read_exit(s);
548 1.168 ozaki ia4_release(ia, &psref);
549 1.168 ozaki curlwp_bindx(bound);
550 1.83 itojun return (EADDRNOTAVAIL);
551 1.168 ozaki }
552 1.168 ozaki pserialize_read_exit(s);
553 1.168 ozaki laddr = IA_SIN(ia)->sin_addr;
554 1.168 ozaki ia4_release(ia, &psref);
555 1.168 ozaki curlwp_bindx(bound);
556 1.167 ozaki } else
557 1.167 ozaki laddr = inp->inp_laddr;
558 1.33 mycroft if (in_pcblookup_connect(inp->inp_table, sin->sin_addr, sin->sin_port,
559 1.168 ozaki laddr, inp->inp_lport, &vestige) != NULL ||
560 1.168 ozaki vestige.valid) {
561 1.1 cgd return (EADDRINUSE);
562 1.168 ozaki }
563 1.32 mycroft if (in_nullhost(inp->inp_laddr)) {
564 1.40 thorpej if (inp->inp_lport == 0) {
565 1.151 rtr error = in_pcbbind(inp, NULL, l);
566 1.40 thorpej /*
567 1.40 thorpej * This used to ignore the return value
568 1.40 thorpej * completely, but we need to check for
569 1.40 thorpej * ephemeral port shortage.
570 1.101 dsl * And attempts to request low ports if not root.
571 1.40 thorpej */
572 1.101 dsl if (error != 0)
573 1.40 thorpej return (error);
574 1.40 thorpej }
575 1.167 ozaki inp->inp_laddr = laddr;
576 1.1 cgd }
577 1.1 cgd inp->inp_faddr = sin->sin_addr;
578 1.1 cgd inp->inp_fport = sin->sin_port;
579 1.139 christos
580 1.139 christos /* Late bind, if needed */
581 1.139 christos if (inp->inp_bindportonsend) {
582 1.139 christos struct sockaddr_in lsin = *((const struct sockaddr_in *)
583 1.139 christos inp->inp_socket->so_proto->pr_domain->dom_sa_any);
584 1.139 christos lsin.sin_addr = inp->inp_laddr;
585 1.139 christos lsin.sin_port = 0;
586 1.139 christos
587 1.139 christos if ((error = in_pcbbind_port(inp, &lsin, l->l_cred)) != 0)
588 1.139 christos return error;
589 1.139 christos }
590 1.139 christos
591 1.33 mycroft in_pcbstate(inp, INP_CONNECTED);
592 1.145 christos #if defined(IPSEC)
593 1.148 christos if (ipsec_enabled && inp->inp_socket->so_type == SOCK_STREAM)
594 1.71 itojun ipsec_pcbconn(inp->inp_sp);
595 1.71 itojun #endif
596 1.1 cgd return (0);
597 1.1 cgd }
598 1.1 cgd
599 1.25 christos void
600 1.98 perry in_pcbdisconnect(void *v)
601 1.1 cgd {
602 1.25 christos struct inpcb *inp = v;
603 1.1 cgd
604 1.88 itojun if (inp->inp_af != AF_INET)
605 1.88 itojun return;
606 1.88 itojun
607 1.32 mycroft inp->inp_faddr = zeroin_addr;
608 1.1 cgd inp->inp_fport = 0;
609 1.33 mycroft in_pcbstate(inp, INP_BOUND);
610 1.145 christos #if defined(IPSEC)
611 1.148 christos if (ipsec_enabled)
612 1.148 christos ipsec_pcbdisconn(inp->inp_sp);
613 1.71 itojun #endif
614 1.93 itojun if (inp->inp_socket->so_state & SS_NOFDREF)
615 1.93 itojun in_pcbdetach(inp);
616 1.1 cgd }
617 1.1 cgd
618 1.25 christos void
619 1.98 perry in_pcbdetach(void *v)
620 1.1 cgd {
621 1.25 christos struct inpcb *inp = v;
622 1.1 cgd struct socket *so = inp->inp_socket;
623 1.24 mycroft int s;
624 1.1 cgd
625 1.88 itojun if (inp->inp_af != AF_INET)
626 1.88 itojun return;
627 1.88 itojun
628 1.145 christos #if defined(IPSEC)
629 1.148 christos if (ipsec_enabled)
630 1.148 christos ipsec4_delete_pcbpolicy(inp);
631 1.150 rmind #endif
632 1.150 rmind so->so_pcb = NULL;
633 1.150 rmind
634 1.175 ozaki s = splsoftnet();
635 1.33 mycroft in_pcbstate(inp, INP_ATTACHED);
636 1.90 provos LIST_REMOVE(&inp->inp_head, inph_lhash);
637 1.146 christos TAILQ_REMOVE(&inp->inp_table->inpt_queue, &inp->inp_head, inph_queue);
638 1.24 mycroft splx(s);
639 1.150 rmind
640 1.150 rmind if (inp->inp_options) {
641 1.150 rmind m_free(inp->inp_options);
642 1.150 rmind }
643 1.150 rmind rtcache_free(&inp->inp_route);
644 1.152 rmind ip_freemoptions(inp->inp_moptions);
645 1.127 spz sofree(so); /* drops the socket's lock */
646 1.150 rmind
647 1.150 rmind pool_put(&inpcb_pool, inp);
648 1.126 matt mutex_enter(softnet_lock); /* reacquire the softnet_lock */
649 1.1 cgd }
650 1.1 cgd
651 1.25 christos void
652 1.157 rtr in_setsockaddr(struct inpcb *inp, struct sockaddr_in *sin)
653 1.1 cgd {
654 1.78 itojun
655 1.88 itojun if (inp->inp_af != AF_INET)
656 1.88 itojun return;
657 1.88 itojun
658 1.119 dyoung sockaddr_in_init(sin, &inp->inp_laddr, inp->inp_lport);
659 1.1 cgd }
660 1.1 cgd
661 1.25 christos void
662 1.157 rtr in_setpeeraddr(struct inpcb *inp, struct sockaddr_in *sin)
663 1.1 cgd {
664 1.78 itojun
665 1.88 itojun if (inp->inp_af != AF_INET)
666 1.88 itojun return;
667 1.88 itojun
668 1.119 dyoung sockaddr_in_init(sin, &inp->inp_faddr, inp->inp_fport);
669 1.1 cgd }
670 1.1 cgd
671 1.1 cgd /*
672 1.1 cgd * Pass some notification to all connections of a protocol
673 1.1 cgd * associated with address dst. The local address and/or port numbers
674 1.1 cgd * may be specified to limit the search. The "usual action" will be
675 1.1 cgd * taken, depending on the ctlinput cmd. The caller must filter any
676 1.1 cgd * cmds that are uninteresting (e.g., no error in the map).
677 1.1 cgd * Call the protocol specific routine (if any) to report
678 1.1 cgd * any errors for each matching socket.
679 1.1 cgd *
680 1.22 mycroft * Must be called at splsoftnet.
681 1.1 cgd */
682 1.37 thorpej int
683 1.98 perry in_pcbnotify(struct inpcbtable *table, struct in_addr faddr, u_int fport_arg,
684 1.98 perry struct in_addr laddr, u_int lport_arg, int errno,
685 1.98 perry void (*notify)(struct inpcb *, int))
686 1.1 cgd {
687 1.33 mycroft struct inpcbhead *head;
688 1.64 augustss struct inpcb *inp, *ninp;
689 1.13 cgd u_int16_t fport = fport_arg, lport = lport_arg;
690 1.37 thorpej int nmatch;
691 1.1 cgd
692 1.33 mycroft if (in_nullhost(faddr) || notify == 0)
693 1.37 thorpej return (0);
694 1.1 cgd
695 1.37 thorpej nmatch = 0;
696 1.33 mycroft head = INPCBHASH_CONNECT(table, faddr, fport, laddr, lport);
697 1.88 itojun for (inp = (struct inpcb *)LIST_FIRST(head); inp != NULL; inp = ninp) {
698 1.88 itojun ninp = (struct inpcb *)LIST_NEXT(inp, inp_hash);
699 1.88 itojun if (inp->inp_af != AF_INET)
700 1.88 itojun continue;
701 1.33 mycroft if (in_hosteq(inp->inp_faddr, faddr) &&
702 1.33 mycroft inp->inp_fport == fport &&
703 1.33 mycroft inp->inp_lport == lport &&
704 1.37 thorpej in_hosteq(inp->inp_laddr, laddr)) {
705 1.33 mycroft (*notify)(inp, errno);
706 1.37 thorpej nmatch++;
707 1.37 thorpej }
708 1.1 cgd }
709 1.37 thorpej return (nmatch);
710 1.18 mycroft }
711 1.18 mycroft
712 1.20 mycroft void
713 1.98 perry in_pcbnotifyall(struct inpcbtable *table, struct in_addr faddr, int errno,
714 1.98 perry void (*notify)(struct inpcb *, int))
715 1.18 mycroft {
716 1.146 christos struct inpcb_hdr *inph, *ninph;
717 1.18 mycroft
718 1.33 mycroft if (in_nullhost(faddr) || notify == 0)
719 1.18 mycroft return;
720 1.18 mycroft
721 1.146 christos TAILQ_FOREACH_SAFE(inph, &table->inpt_queue, inph_queue, ninph) {
722 1.146 christos struct inpcb *inp = (struct inpcb *)inph;
723 1.88 itojun if (inp->inp_af != AF_INET)
724 1.88 itojun continue;
725 1.33 mycroft if (in_hosteq(inp->inp_faddr, faddr))
726 1.33 mycroft (*notify)(inp, errno);
727 1.63 thorpej }
728 1.63 thorpej }
729 1.63 thorpej
730 1.63 thorpej void
731 1.154 seanb in_purgeifmcast(struct ip_moptions *imo, struct ifnet *ifp)
732 1.154 seanb {
733 1.154 seanb int i, gap;
734 1.154 seanb
735 1.176 ozaki /* The owner of imo should be protected by solock */
736 1.164 ozaki KASSERT(ifp != NULL);
737 1.164 ozaki
738 1.154 seanb if (imo == NULL)
739 1.154 seanb return;
740 1.154 seanb
741 1.154 seanb /*
742 1.154 seanb * Unselect the outgoing interface if it is being
743 1.154 seanb * detached.
744 1.154 seanb */
745 1.164 ozaki if (imo->imo_multicast_if_index == ifp->if_index)
746 1.164 ozaki imo->imo_multicast_if_index = 0;
747 1.154 seanb
748 1.154 seanb /*
749 1.154 seanb * Drop multicast group membership if we joined
750 1.154 seanb * through the interface being detached.
751 1.154 seanb */
752 1.154 seanb for (i = 0, gap = 0; i < imo->imo_num_memberships; i++) {
753 1.154 seanb if (imo->imo_membership[i]->inm_ifp == ifp) {
754 1.154 seanb in_delmulti(imo->imo_membership[i]);
755 1.154 seanb gap++;
756 1.154 seanb } else if (gap != 0)
757 1.154 seanb imo->imo_membership[i - gap] = imo->imo_membership[i];
758 1.154 seanb }
759 1.154 seanb imo->imo_num_memberships -= gap;
760 1.154 seanb }
761 1.154 seanb
762 1.154 seanb void
763 1.98 perry in_pcbpurgeif0(struct inpcbtable *table, struct ifnet *ifp)
764 1.63 thorpej {
765 1.146 christos struct inpcb_hdr *inph, *ninph;
766 1.63 thorpej
767 1.146 christos TAILQ_FOREACH_SAFE(inph, &table->inpt_queue, inph_queue, ninph) {
768 1.146 christos struct inpcb *inp = (struct inpcb *)inph;
769 1.176 ozaki bool need_unlock = false;
770 1.176 ozaki
771 1.88 itojun if (inp->inp_af != AF_INET)
772 1.88 itojun continue;
773 1.176 ozaki
774 1.176 ozaki /* The caller holds either one of inps' lock */
775 1.176 ozaki if (!inp_locked(inp)) {
776 1.176 ozaki inp_lock(inp);
777 1.176 ozaki need_unlock = true;
778 1.176 ozaki }
779 1.176 ozaki
780 1.180 ozaki /* IFNET_LOCK must be taken after solock */
781 1.180 ozaki IFNET_LOCK(ifp);
782 1.154 seanb in_purgeifmcast(inp->inp_moptions, ifp);
783 1.180 ozaki IFNET_UNLOCK(ifp);
784 1.176 ozaki
785 1.176 ozaki if (need_unlock)
786 1.176 ozaki inp_unlock(inp);
787 1.69 itojun }
788 1.69 itojun }
789 1.69 itojun
790 1.69 itojun void
791 1.98 perry in_pcbpurgeif(struct inpcbtable *table, struct ifnet *ifp)
792 1.69 itojun {
793 1.121 dyoung struct rtentry *rt;
794 1.146 christos struct inpcb_hdr *inph, *ninph;
795 1.69 itojun
796 1.146 christos TAILQ_FOREACH_SAFE(inph, &table->inpt_queue, inph_queue, ninph) {
797 1.146 christos struct inpcb *inp = (struct inpcb *)inph;
798 1.88 itojun if (inp->inp_af != AF_INET)
799 1.88 itojun continue;
800 1.122 dyoung if ((rt = rtcache_validate(&inp->inp_route)) != NULL &&
801 1.171 ozaki rt->rt_ifp == ifp) {
802 1.171 ozaki rtcache_unref(rt, &inp->inp_route);
803 1.69 itojun in_rtchange(inp, 0);
804 1.171 ozaki } else
805 1.171 ozaki rtcache_unref(rt, &inp->inp_route);
806 1.1 cgd }
807 1.1 cgd }
808 1.1 cgd
809 1.1 cgd /*
810 1.1 cgd * Check for alternatives when higher level complains
811 1.1 cgd * about service problems. For now, invalidate cached
812 1.1 cgd * routing information. If the route was created dynamically
813 1.1 cgd * (by a redirect), time to try a default gateway again.
814 1.1 cgd */
815 1.25 christos void
816 1.98 perry in_losing(struct inpcb *inp)
817 1.1 cgd {
818 1.64 augustss struct rtentry *rt;
819 1.10 mycroft struct rt_addrinfo info;
820 1.1 cgd
821 1.88 itojun if (inp->inp_af != AF_INET)
822 1.88 itojun return;
823 1.88 itojun
824 1.122 dyoung if ((rt = rtcache_validate(&inp->inp_route)) == NULL)
825 1.122 dyoung return;
826 1.122 dyoung
827 1.122 dyoung memset(&info, 0, sizeof(info));
828 1.122 dyoung info.rti_info[RTAX_DST] = rtcache_getdst(&inp->inp_route);
829 1.122 dyoung info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
830 1.122 dyoung info.rti_info[RTAX_NETMASK] = rt_mask(rt);
831 1.122 dyoung rt_missmsg(RTM_LOSING, &info, rt->rt_flags, 0);
832 1.171 ozaki if (rt->rt_flags & RTF_DYNAMIC) {
833 1.171 ozaki int error;
834 1.171 ozaki struct rtentry *nrt;
835 1.171 ozaki
836 1.171 ozaki error = rtrequest(RTM_DELETE, rt_getkey(rt),
837 1.171 ozaki rt->rt_gateway, rt_mask(rt), rt->rt_flags, &nrt);
838 1.171 ozaki rtcache_unref(rt, &inp->inp_route);
839 1.171 ozaki if (error == 0)
840 1.172 ozaki rt_free(nrt);
841 1.171 ozaki } else
842 1.171 ozaki rtcache_unref(rt, &inp->inp_route);
843 1.122 dyoung /*
844 1.122 dyoung * A new route can be allocated
845 1.122 dyoung * the next time output is attempted.
846 1.122 dyoung */
847 1.122 dyoung rtcache_free(&inp->inp_route);
848 1.1 cgd }
849 1.1 cgd
850 1.1 cgd /*
851 1.111 dyoung * After a routing change, flush old routing. A new route can be
852 1.111 dyoung * allocated the next time output is attempted.
853 1.1 cgd */
854 1.10 mycroft void
855 1.109 christos in_rtchange(struct inpcb *inp, int errno)
856 1.1 cgd {
857 1.32 mycroft
858 1.88 itojun if (inp->inp_af != AF_INET)
859 1.88 itojun return;
860 1.88 itojun
861 1.112 joerg rtcache_free(&inp->inp_route);
862 1.112 joerg
863 1.49 tls /* XXX SHOULD NOTIFY HIGHER-LEVEL PROTOCOLS */
864 1.1 cgd }
865 1.1 cgd
866 1.1 cgd struct inpcb *
867 1.98 perry in_pcblookup_port(struct inpcbtable *table, struct in_addr laddr,
868 1.138 dyoung u_int lport_arg, int lookup_wildcard, vestigial_inpcb_t *vp)
869 1.1 cgd {
870 1.90 provos struct inpcbhead *head;
871 1.88 itojun struct inpcb_hdr *inph;
872 1.142 yamt struct inpcb *match = NULL;
873 1.142 yamt int matchwild = 3;
874 1.142 yamt int wildcard;
875 1.33 mycroft u_int16_t lport = lport_arg;
876 1.1 cgd
877 1.138 dyoung if (vp)
878 1.138 dyoung vp->valid = 0;
879 1.138 dyoung
880 1.90 provos head = INPCBHASH_PORT(table, lport);
881 1.90 provos LIST_FOREACH(inph, head, inph_lhash) {
882 1.142 yamt struct inpcb * const inp = (struct inpcb *)inph;
883 1.142 yamt
884 1.88 itojun if (inp->inp_af != AF_INET)
885 1.88 itojun continue;
886 1.1 cgd if (inp->inp_lport != lport)
887 1.1 cgd continue;
888 1.142 yamt /*
889 1.142 yamt * check if inp's faddr and laddr match with ours.
890 1.142 yamt * our faddr is considered null.
891 1.142 yamt * count the number of wildcard matches. (0 - 2)
892 1.142 yamt *
893 1.142 yamt * null null match
894 1.142 yamt * A null wildcard match
895 1.142 yamt * null B wildcard match
896 1.142 yamt * A B non match
897 1.142 yamt * A A match
898 1.142 yamt */
899 1.1 cgd wildcard = 0;
900 1.33 mycroft if (!in_nullhost(inp->inp_faddr))
901 1.33 mycroft wildcard++;
902 1.32 mycroft if (in_nullhost(inp->inp_laddr)) {
903 1.32 mycroft if (!in_nullhost(laddr))
904 1.1 cgd wildcard++;
905 1.1 cgd } else {
906 1.32 mycroft if (in_nullhost(laddr))
907 1.1 cgd wildcard++;
908 1.32 mycroft else {
909 1.32 mycroft if (!in_hosteq(inp->inp_laddr, laddr))
910 1.32 mycroft continue;
911 1.32 mycroft }
912 1.1 cgd }
913 1.54 lukem if (wildcard && !lookup_wildcard)
914 1.1 cgd continue;
915 1.142 yamt /*
916 1.142 yamt * prefer an address with less wildcards.
917 1.142 yamt */
918 1.1 cgd if (wildcard < matchwild) {
919 1.1 cgd match = inp;
920 1.1 cgd matchwild = wildcard;
921 1.1 cgd if (matchwild == 0)
922 1.1 cgd break;
923 1.1 cgd }
924 1.1 cgd }
925 1.138 dyoung if (match && matchwild == 0)
926 1.138 dyoung return match;
927 1.138 dyoung
928 1.138 dyoung if (vp && table->vestige) {
929 1.138 dyoung void *state = (*table->vestige->init_ports4)(laddr, lport_arg, lookup_wildcard);
930 1.138 dyoung vestigial_inpcb_t better;
931 1.138 dyoung
932 1.138 dyoung while (table->vestige
933 1.138 dyoung && (*table->vestige->next_port4)(state, vp)) {
934 1.138 dyoung
935 1.138 dyoung if (vp->lport != lport)
936 1.138 dyoung continue;
937 1.138 dyoung wildcard = 0;
938 1.138 dyoung if (!in_nullhost(vp->faddr.v4))
939 1.138 dyoung wildcard++;
940 1.138 dyoung if (in_nullhost(vp->laddr.v4)) {
941 1.138 dyoung if (!in_nullhost(laddr))
942 1.138 dyoung wildcard++;
943 1.138 dyoung } else {
944 1.138 dyoung if (in_nullhost(laddr))
945 1.138 dyoung wildcard++;
946 1.138 dyoung else {
947 1.138 dyoung if (!in_hosteq(vp->laddr.v4, laddr))
948 1.138 dyoung continue;
949 1.138 dyoung }
950 1.138 dyoung }
951 1.138 dyoung if (wildcard && !lookup_wildcard)
952 1.138 dyoung continue;
953 1.138 dyoung if (wildcard < matchwild) {
954 1.138 dyoung better = *vp;
955 1.138 dyoung match = (void*)&better;
956 1.138 dyoung
957 1.138 dyoung matchwild = wildcard;
958 1.138 dyoung if (matchwild == 0)
959 1.138 dyoung break;
960 1.138 dyoung }
961 1.138 dyoung }
962 1.138 dyoung
963 1.138 dyoung if (match) {
964 1.138 dyoung if (match != (void*)&better)
965 1.138 dyoung return match;
966 1.138 dyoung else {
967 1.138 dyoung *vp = better;
968 1.138 dyoung return 0;
969 1.138 dyoung }
970 1.138 dyoung }
971 1.138 dyoung }
972 1.138 dyoung
973 1.1 cgd return (match);
974 1.24 mycroft }
975 1.24 mycroft
#if defined(DIAGNOSTIC)
/*
 * When non-zero, in_pcblookup_connect() and in_pcblookup_bind() print
 * the lookup key of every lookup that finds no PCB.
 */
int in_pcbnotifymiss = 0;
#endif
979 1.24 mycroft
980 1.24 mycroft struct inpcb *
981 1.98 perry in_pcblookup_connect(struct inpcbtable *table,
982 1.98 perry struct in_addr faddr, u_int fport_arg,
983 1.138 dyoung struct in_addr laddr, u_int lport_arg,
984 1.138 dyoung vestigial_inpcb_t *vp)
985 1.24 mycroft {
986 1.24 mycroft struct inpcbhead *head;
987 1.88 itojun struct inpcb_hdr *inph;
988 1.64 augustss struct inpcb *inp;
989 1.24 mycroft u_int16_t fport = fport_arg, lport = lport_arg;
990 1.24 mycroft
991 1.138 dyoung if (vp)
992 1.138 dyoung vp->valid = 0;
993 1.138 dyoung
994 1.33 mycroft head = INPCBHASH_CONNECT(table, faddr, fport, laddr, lport);
995 1.88 itojun LIST_FOREACH(inph, head, inph_hash) {
996 1.88 itojun inp = (struct inpcb *)inph;
997 1.88 itojun if (inp->inp_af != AF_INET)
998 1.88 itojun continue;
999 1.88 itojun
1000 1.33 mycroft if (in_hosteq(inp->inp_faddr, faddr) &&
1001 1.33 mycroft inp->inp_fport == fport &&
1002 1.33 mycroft inp->inp_lport == lport &&
1003 1.33 mycroft in_hosteq(inp->inp_laddr, laddr))
1004 1.33 mycroft goto out;
1005 1.24 mycroft }
1006 1.138 dyoung if (vp && table->vestige) {
1007 1.138 dyoung if ((*table->vestige->lookup4)(faddr, fport_arg,
1008 1.138 dyoung laddr, lport_arg, vp))
1009 1.138 dyoung return 0;
1010 1.138 dyoung }
1011 1.138 dyoung
1012 1.24 mycroft #ifdef DIAGNOSTIC
1013 1.33 mycroft if (in_pcbnotifymiss) {
1014 1.35 christos printf("in_pcblookup_connect: faddr=%08x fport=%d laddr=%08x lport=%d\n",
1015 1.24 mycroft ntohl(faddr.s_addr), ntohs(fport),
1016 1.24 mycroft ntohl(laddr.s_addr), ntohs(lport));
1017 1.24 mycroft }
1018 1.24 mycroft #endif
1019 1.33 mycroft return (0);
1020 1.33 mycroft
1021 1.33 mycroft out:
1022 1.33 mycroft /* Move this PCB to the head of hash chain. */
1023 1.88 itojun inph = &inp->inp_head;
1024 1.88 itojun if (inph != LIST_FIRST(head)) {
1025 1.88 itojun LIST_REMOVE(inph, inph_hash);
1026 1.88 itojun LIST_INSERT_HEAD(head, inph, inph_hash);
1027 1.33 mycroft }
1028 1.33 mycroft return (inp);
1029 1.33 mycroft }
1030 1.33 mycroft
1031 1.33 mycroft struct inpcb *
1032 1.98 perry in_pcblookup_bind(struct inpcbtable *table,
1033 1.98 perry struct in_addr laddr, u_int lport_arg)
1034 1.33 mycroft {
1035 1.33 mycroft struct inpcbhead *head;
1036 1.88 itojun struct inpcb_hdr *inph;
1037 1.64 augustss struct inpcb *inp;
1038 1.33 mycroft u_int16_t lport = lport_arg;
1039 1.33 mycroft
1040 1.33 mycroft head = INPCBHASH_BIND(table, laddr, lport);
1041 1.88 itojun LIST_FOREACH(inph, head, inph_hash) {
1042 1.88 itojun inp = (struct inpcb *)inph;
1043 1.88 itojun if (inp->inp_af != AF_INET)
1044 1.88 itojun continue;
1045 1.88 itojun
1046 1.33 mycroft if (inp->inp_lport == lport &&
1047 1.33 mycroft in_hosteq(inp->inp_laddr, laddr))
1048 1.33 mycroft goto out;
1049 1.33 mycroft }
1050 1.33 mycroft head = INPCBHASH_BIND(table, zeroin_addr, lport);
1051 1.88 itojun LIST_FOREACH(inph, head, inph_hash) {
1052 1.88 itojun inp = (struct inpcb *)inph;
1053 1.88 itojun if (inp->inp_af != AF_INET)
1054 1.88 itojun continue;
1055 1.88 itojun
1056 1.33 mycroft if (inp->inp_lport == lport &&
1057 1.33 mycroft in_hosteq(inp->inp_laddr, zeroin_addr))
1058 1.33 mycroft goto out;
1059 1.33 mycroft }
1060 1.33 mycroft #ifdef DIAGNOSTIC
1061 1.33 mycroft if (in_pcbnotifymiss) {
1062 1.35 christos printf("in_pcblookup_bind: laddr=%08x lport=%d\n",
1063 1.33 mycroft ntohl(laddr.s_addr), ntohs(lport));
1064 1.33 mycroft }
1065 1.33 mycroft #endif
1066 1.33 mycroft return (0);
1067 1.33 mycroft
1068 1.33 mycroft out:
1069 1.33 mycroft /* Move this PCB to the head of hash chain. */
1070 1.88 itojun inph = &inp->inp_head;
1071 1.88 itojun if (inph != LIST_FIRST(head)) {
1072 1.88 itojun LIST_REMOVE(inph, inph_hash);
1073 1.88 itojun LIST_INSERT_HEAD(head, inph, inph_hash);
1074 1.33 mycroft }
1075 1.24 mycroft return (inp);
1076 1.33 mycroft }
1077 1.33 mycroft
1078 1.33 mycroft void
1079 1.98 perry in_pcbstate(struct inpcb *inp, int state)
1080 1.33 mycroft {
1081 1.33 mycroft
1082 1.88 itojun if (inp->inp_af != AF_INET)
1083 1.88 itojun return;
1084 1.88 itojun
1085 1.33 mycroft if (inp->inp_state > INP_ATTACHED)
1086 1.88 itojun LIST_REMOVE(&inp->inp_head, inph_hash);
1087 1.33 mycroft
1088 1.33 mycroft switch (state) {
1089 1.33 mycroft case INP_BOUND:
1090 1.33 mycroft LIST_INSERT_HEAD(INPCBHASH_BIND(inp->inp_table,
1091 1.88 itojun inp->inp_laddr, inp->inp_lport), &inp->inp_head,
1092 1.88 itojun inph_hash);
1093 1.33 mycroft break;
1094 1.33 mycroft case INP_CONNECTED:
1095 1.33 mycroft LIST_INSERT_HEAD(INPCBHASH_CONNECT(inp->inp_table,
1096 1.33 mycroft inp->inp_faddr, inp->inp_fport,
1097 1.88 itojun inp->inp_laddr, inp->inp_lport), &inp->inp_head,
1098 1.88 itojun inph_hash);
1099 1.33 mycroft break;
1100 1.33 mycroft }
1101 1.33 mycroft
1102 1.33 mycroft inp->inp_state = state;
1103 1.38 thorpej }
1104 1.38 thorpej
1105 1.38 thorpej struct rtentry *
1106 1.98 perry in_pcbrtentry(struct inpcb *inp)
1107 1.38 thorpej {
1108 1.38 thorpej struct route *ro;
1109 1.117 dyoung union {
1110 1.117 dyoung struct sockaddr dst;
1111 1.117 dyoung struct sockaddr_in dst4;
1112 1.117 dyoung } u;
1113 1.88 itojun
1114 1.88 itojun if (inp->inp_af != AF_INET)
1115 1.88 itojun return (NULL);
1116 1.38 thorpej
1117 1.38 thorpej ro = &inp->inp_route;
1118 1.38 thorpej
1119 1.117 dyoung sockaddr_in_init(&u.dst4, &inp->inp_faddr, 0);
1120 1.117 dyoung return rtcache_lookup(ro, &u.dst);
1121 1.59 itojun }
1122 1.171 ozaki
1123 1.171 ozaki void
1124 1.171 ozaki in_pcbrtentry_unref(struct rtentry *rt, struct inpcb *inp)
1125 1.171 ozaki {
1126 1.171 ozaki
1127 1.171 ozaki rtcache_unref(rt, &inp->inp_route);
1128 1.171 ozaki }
1129