ip_input.c revision 1.82.2.2.2.1 1 1.82.2.2.2.1 thorpej /* $NetBSD: ip_input.c,v 1.82.2.2.2.1 1999/06/21 01:27:49 thorpej Exp $ */
2 1.76 thorpej
3 1.76 thorpej /*-
4 1.76 thorpej * Copyright (c) 1998 The NetBSD Foundation, Inc.
5 1.76 thorpej * All rights reserved.
6 1.76 thorpej *
7 1.76 thorpej * This code is derived from software contributed to The NetBSD Foundation
8 1.76 thorpej * by Public Access Networks Corporation ("Panix"). It was developed under
9 1.76 thorpej * contract to Panix by Eric Haszlakiewicz and Thor Lancelot Simon.
10 1.76 thorpej *
11 1.76 thorpej * Redistribution and use in source and binary forms, with or without
12 1.76 thorpej * modification, are permitted provided that the following conditions
13 1.76 thorpej * are met:
14 1.76 thorpej * 1. Redistributions of source code must retain the above copyright
15 1.76 thorpej * notice, this list of conditions and the following disclaimer.
16 1.76 thorpej * 2. Redistributions in binary form must reproduce the above copyright
17 1.76 thorpej * notice, this list of conditions and the following disclaimer in the
18 1.76 thorpej * documentation and/or other materials provided with the distribution.
19 1.76 thorpej * 3. All advertising materials mentioning features or use of this software
20 1.76 thorpej * must display the following acknowledgement:
21 1.76 thorpej * This product includes software developed by the NetBSD
22 1.76 thorpej * Foundation, Inc. and its contributors.
23 1.76 thorpej * 4. Neither the name of The NetBSD Foundation nor the names of its
24 1.76 thorpej * contributors may be used to endorse or promote products derived
25 1.76 thorpej * from this software without specific prior written permission.
26 1.76 thorpej *
27 1.76 thorpej * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
28 1.76 thorpej * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
29 1.76 thorpej * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
30 1.76 thorpej * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
31 1.76 thorpej * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
32 1.76 thorpej * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
33 1.76 thorpej * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
34 1.76 thorpej * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
35 1.76 thorpej * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
36 1.76 thorpej * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
37 1.76 thorpej * POSSIBILITY OF SUCH DAMAGE.
38 1.76 thorpej */
39 1.14 cgd
40 1.1 cgd /*
41 1.13 mycroft * Copyright (c) 1982, 1986, 1988, 1993
42 1.13 mycroft * The Regents of the University of California. All rights reserved.
43 1.1 cgd *
44 1.1 cgd * Redistribution and use in source and binary forms, with or without
45 1.1 cgd * modification, are permitted provided that the following conditions
46 1.1 cgd * are met:
47 1.1 cgd * 1. Redistributions of source code must retain the above copyright
48 1.1 cgd * notice, this list of conditions and the following disclaimer.
49 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
50 1.1 cgd * notice, this list of conditions and the following disclaimer in the
51 1.1 cgd * documentation and/or other materials provided with the distribution.
52 1.1 cgd * 3. All advertising materials mentioning features or use of this software
53 1.1 cgd * must display the following acknowledgement:
54 1.1 cgd * This product includes software developed by the University of
55 1.1 cgd * California, Berkeley and its contributors.
56 1.1 cgd * 4. Neither the name of the University nor the names of its contributors
57 1.1 cgd * may be used to endorse or promote products derived from this software
58 1.1 cgd * without specific prior written permission.
59 1.1 cgd *
60 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
61 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
62 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
63 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
64 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
65 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
66 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
67 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
68 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
69 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
70 1.1 cgd * SUCH DAMAGE.
71 1.1 cgd *
72 1.14 cgd * @(#)ip_input.c 8.2 (Berkeley) 1/4/94
73 1.1 cgd */
74 1.55 scottr
75 1.62 matt #include "opt_gateway.h"
76 1.69 mrg #include "opt_pfil_hooks.h"
77 1.55 scottr #include "opt_mrouting.h"
78 1.1 cgd
79 1.5 mycroft #include <sys/param.h>
80 1.5 mycroft #include <sys/systm.h>
81 1.5 mycroft #include <sys/malloc.h>
82 1.5 mycroft #include <sys/mbuf.h>
83 1.5 mycroft #include <sys/domain.h>
84 1.5 mycroft #include <sys/protosw.h>
85 1.5 mycroft #include <sys/socket.h>
86 1.44 thorpej #include <sys/socketvar.h>
87 1.5 mycroft #include <sys/errno.h>
88 1.5 mycroft #include <sys/time.h>
89 1.5 mycroft #include <sys/kernel.h>
90 1.28 christos #include <sys/proc.h>
91 1.72 thorpej #include <sys/pool.h>
92 1.28 christos
93 1.28 christos #include <vm/vm.h>
94 1.28 christos #include <sys/sysctl.h>
95 1.1 cgd
96 1.5 mycroft #include <net/if.h>
97 1.44 thorpej #include <net/if_dl.h>
98 1.5 mycroft #include <net/route.h>
99 1.45 mrg #include <net/pfil.h>
100 1.1 cgd
101 1.5 mycroft #include <netinet/in.h>
102 1.5 mycroft #include <netinet/in_systm.h>
103 1.5 mycroft #include <netinet/ip.h>
104 1.5 mycroft #include <netinet/in_pcb.h>
105 1.5 mycroft #include <netinet/in_var.h>
106 1.5 mycroft #include <netinet/ip_var.h>
107 1.5 mycroft #include <netinet/ip_icmp.h>
108 1.44 thorpej
/*
 * Compile-time defaults for the IP configuration variables defined
 * below.  Every value may be overridden by defining the macro before
 * this point (e.g. from a kernel option header).
 */
#if !defined(IPFORWARDING)
#if defined(GATEWAY)
#define	IPFORWARDING	1	/* forward IP packets not for us */
#else
#define	IPFORWARDING	0	/* don't forward IP packets not for us */
#endif /* GATEWAY */
#endif /* !IPFORWARDING */

#if !defined(IPSENDREDIRECTS)
#define	IPSENDREDIRECTS	1
#endif

#if !defined(IPFORWSRCRT)
#define	IPFORWSRCRT	1	/* forward source-routed packets */
#endif

#if !defined(IPALLOWSRCRT)
#define	IPALLOWSRCRT	1	/* allow source-routed packets */
#endif

#if !defined(IPMTUDISC)
#define	IPMTUDISC	0
#endif

#if !defined(IPMTUDISCTIMEOUT)
#define	IPMTUDISCTIMEOUT (10 * 60)	/* as per RFC 1191 */
#endif

/*
 * Note: DIRECTED_BROADCAST is handled this way so that previous
 * configuration using this option will Just Work.
 */
#if !defined(IPDIRECTEDBCAST)
#if defined(DIRECTED_BROADCAST)
#define	IPDIRECTEDBCAST	1
#else
#define	IPDIRECTEDBCAST	0
#endif /* DIRECTED_BROADCAST */
#endif /* !IPDIRECTEDBCAST */
143 1.1 cgd int ipforwarding = IPFORWARDING;
144 1.1 cgd int ipsendredirects = IPSENDREDIRECTS;
145 1.13 mycroft int ip_defttl = IPDEFTTL;
146 1.26 thorpej int ip_forwsrcrt = IPFORWSRCRT;
147 1.27 thorpej int ip_directedbcast = IPDIRECTEDBCAST;
148 1.47 cjs int ip_allowsrcrt = IPALLOWSRCRT;
149 1.53 kml int ip_mtudisc = IPMTUDISC;
150 1.60 kml u_int ip_mtudisc_timeout = IPMTUDISCTIMEOUT;
151 1.1 cgd #ifdef DIAGNOSTIC
152 1.1 cgd int ipprintfs = 0;
153 1.1 cgd #endif
154 1.1 cgd
155 1.60 kml struct rttimer_queue *ip_mtudisc_timeout_q = NULL;
156 1.60 kml
157 1.1 cgd extern struct domain inetdomain;
158 1.1 cgd extern struct protosw inetsw[];
159 1.1 cgd u_char ip_protox[IPPROTO_MAX];
160 1.1 cgd int ipqmaxlen = IFQ_MAXLEN;
161 1.22 mycroft struct in_ifaddrhead in_ifaddr;
162 1.57 tls struct in_ifaddrhashhead *in_ifaddrhashtbl;
163 1.13 mycroft struct ifqueue ipintrq;
164 1.63 matt struct ipstat ipstat;
165 1.63 matt u_int16_t ip_id;
166 1.63 matt int ip_defttl;
167 1.75 thorpej
168 1.63 matt struct ipqhead ipq;
169 1.75 thorpej int ipq_locked;
170 1.75 thorpej
171 1.75 thorpej static __inline int ipq_lock_try __P((void));
172 1.75 thorpej static __inline void ipq_unlock __P((void));
173 1.75 thorpej
174 1.75 thorpej static __inline int
175 1.75 thorpej ipq_lock_try()
176 1.75 thorpej {
177 1.75 thorpej int s;
178 1.75 thorpej
179 1.75 thorpej s = splimp();
180 1.75 thorpej if (ipq_locked) {
181 1.75 thorpej splx(s);
182 1.75 thorpej return (0);
183 1.75 thorpej }
184 1.75 thorpej ipq_locked = 1;
185 1.75 thorpej splx(s);
186 1.75 thorpej return (1);
187 1.75 thorpej }
188 1.75 thorpej
189 1.75 thorpej static __inline void
190 1.75 thorpej ipq_unlock()
191 1.75 thorpej {
192 1.75 thorpej int s;
193 1.75 thorpej
194 1.75 thorpej s = splimp();
195 1.75 thorpej ipq_locked = 0;
196 1.75 thorpej splx(s);
197 1.75 thorpej }
198 1.75 thorpej
/*
 * Reassembly-queue locking wrappers.  With DIAGNOSTIC, taking a lock
 * that is already held, or running a checked path without the lock,
 * prints the source location and panics.  Without DIAGNOSTIC the
 * result of ipq_lock_try() is ignored and the check expands to nothing.
 */
#if defined(DIAGNOSTIC)
#define	IPQ_LOCK()							\
do {									\
	if (!ipq_lock_try()) {						\
		printf("%s:%d: ipq already locked\n", __FILE__, __LINE__); \
		panic("ipq_lock");					\
	}								\
} while (0)
#define	IPQ_LOCK_CHECK()						\
do {									\
	if (!ipq_locked) {						\
		printf("%s:%d: ipq lock not held\n", __FILE__, __LINE__); \
		panic("ipq lock check");				\
	}								\
} while (0)
#else /* !DIAGNOSTIC */
#define	IPQ_LOCK()		(void) ipq_lock_try()
#define	IPQ_LOCK_CHECK()	/* nothing */
#endif /* DIAGNOSTIC */

#define	IPQ_UNLOCK()		ipq_unlock()
220 1.1 cgd
221 1.72 thorpej struct pool ipqent_pool;
222 1.72 thorpej
223 1.1 cgd /*
224 1.1 cgd * We need to save the IP options in case a protocol wants to respond
225 1.1 cgd * to an incoming packet over the same route if the packet got here
226 1.1 cgd * using IP source routing. This allows connection establishment and
227 1.1 cgd * maintenance when the remote end is on a network that is not known
228 1.1 cgd * to us.
229 1.1 cgd */
230 1.1 cgd int ip_nhops = 0;
231 1.1 cgd static struct ip_srcrt {
232 1.1 cgd struct in_addr dst; /* final destination */
233 1.1 cgd char nop; /* one NOP to align */
234 1.1 cgd char srcopt[IPOPT_OFFSET + 1]; /* OPTVAL, OLEN and OFFSET */
235 1.1 cgd struct in_addr route[MAX_IPOPTLEN/sizeof(struct in_addr)];
236 1.1 cgd } ip_srcrt;
237 1.1 cgd
238 1.13 mycroft static void save_rte __P((u_char *, struct in_addr));
239 1.35 mycroft
240 1.1 cgd /*
241 1.1 cgd * IP initialization: fill in IP protocol switch table.
242 1.1 cgd * All protocols not implemented in kernel go to raw IP protocol handler.
243 1.1 cgd */
244 1.8 mycroft void
245 1.1 cgd ip_init()
246 1.1 cgd {
247 1.1 cgd register struct protosw *pr;
248 1.1 cgd register int i;
249 1.1 cgd
250 1.72 thorpej pool_init(&ipqent_pool, sizeof(struct ipqent), 0, 0, 0, "ipqepl",
251 1.72 thorpej 0, NULL, NULL, M_IPQ);
252 1.72 thorpej
253 1.1 cgd pr = pffindproto(PF_INET, IPPROTO_RAW, SOCK_RAW);
254 1.1 cgd if (pr == 0)
255 1.1 cgd panic("ip_init");
256 1.1 cgd for (i = 0; i < IPPROTO_MAX; i++)
257 1.1 cgd ip_protox[i] = pr - inetsw;
258 1.1 cgd for (pr = inetdomain.dom_protosw;
259 1.1 cgd pr < inetdomain.dom_protoswNPROTOSW; pr++)
260 1.1 cgd if (pr->pr_domain->dom_family == PF_INET &&
261 1.1 cgd pr->pr_protocol && pr->pr_protocol != IPPROTO_RAW)
262 1.1 cgd ip_protox[pr->pr_protocol] = pr - inetsw;
263 1.25 cgd LIST_INIT(&ipq);
264 1.1 cgd ip_id = time.tv_sec & 0xffff;
265 1.1 cgd ipintrq.ifq_maxlen = ipqmaxlen;
266 1.22 mycroft TAILQ_INIT(&in_ifaddr);
267 1.57 tls in_ifaddrhashtbl =
268 1.57 tls hashinit(IN_IFADDR_HASH_SIZE, M_IFADDR, M_WAITOK, &in_ifaddrhash);
269 1.60 kml if (ip_mtudisc != 0)
270 1.60 kml ip_mtudisc_timeout_q =
271 1.60 kml rt_timer_queue_create(ip_mtudisc_timeout);
272 1.73 thorpej #ifdef GATEWAY
273 1.73 thorpej ipflow_init();
274 1.73 thorpej #endif
275 1.1 cgd }
276 1.1 cgd
277 1.1 cgd struct sockaddr_in ipaddr = { sizeof(ipaddr), AF_INET };
278 1.1 cgd struct route ipforward_rt;
279 1.1 cgd
280 1.1 cgd /*
281 1.1 cgd * Ip input routine. Checksum and byte swap header. If fragmented
282 1.1 cgd * try to reassemble. Process options. Pass to next level.
283 1.1 cgd */
284 1.8 mycroft void
285 1.1 cgd ipintr()
286 1.1 cgd {
287 1.33 mrg register struct ip *ip = NULL;
288 1.1 cgd register struct mbuf *m;
289 1.1 cgd register struct ipq *fp;
290 1.1 cgd register struct in_ifaddr *ia;
291 1.57 tls register struct ifaddr *ifa;
292 1.25 cgd struct ipqent *ipqe;
293 1.35 mycroft int hlen = 0, mff, len, s;
294 1.36 mrg #ifdef PFIL_HOOKS
295 1.33 mrg struct packet_filter_hook *pfh;
296 1.33 mrg struct mbuf *m0;
297 1.43 mrg int rv;
298 1.36 mrg #endif /* PFIL_HOOKS */
299 1.1 cgd
300 1.1 cgd next:
301 1.1 cgd /*
302 1.1 cgd * Get next datagram off input queue and get IP header
303 1.1 cgd * in first mbuf.
304 1.1 cgd */
305 1.1 cgd s = splimp();
306 1.1 cgd IF_DEQUEUE(&ipintrq, m);
307 1.1 cgd splx(s);
308 1.13 mycroft if (m == 0)
309 1.1 cgd return;
310 1.1 cgd #ifdef DIAGNOSTIC
311 1.1 cgd if ((m->m_flags & M_PKTHDR) == 0)
312 1.1 cgd panic("ipintr no HDR");
313 1.1 cgd #endif
314 1.1 cgd /*
315 1.1 cgd * If no IP addresses have been set yet but the interfaces
316 1.1 cgd * are receiving, can't do anything with incoming packets yet.
317 1.1 cgd */
318 1.22 mycroft if (in_ifaddr.tqh_first == 0)
319 1.1 cgd goto bad;
320 1.1 cgd ipstat.ips_total++;
321 1.1 cgd if (m->m_len < sizeof (struct ip) &&
322 1.1 cgd (m = m_pullup(m, sizeof (struct ip))) == 0) {
323 1.1 cgd ipstat.ips_toosmall++;
324 1.1 cgd goto next;
325 1.1 cgd }
326 1.1 cgd ip = mtod(m, struct ip *);
327 1.13 mycroft if (ip->ip_v != IPVERSION) {
328 1.13 mycroft ipstat.ips_badvers++;
329 1.13 mycroft goto bad;
330 1.13 mycroft }
331 1.1 cgd hlen = ip->ip_hl << 2;
332 1.1 cgd if (hlen < sizeof(struct ip)) { /* minimum header length */
333 1.1 cgd ipstat.ips_badhlen++;
334 1.1 cgd goto bad;
335 1.1 cgd }
336 1.1 cgd if (hlen > m->m_len) {
337 1.1 cgd if ((m = m_pullup(m, hlen)) == 0) {
338 1.1 cgd ipstat.ips_badhlen++;
339 1.1 cgd goto next;
340 1.1 cgd }
341 1.1 cgd ip = mtod(m, struct ip *);
342 1.1 cgd }
343 1.82.2.2.2.1 thorpej /*
344 1.82.2.2.2.1 thorpej * we drop packets that have a multicast address as source
345 1.82.2.2.2.1 thorpej * as wanted by rfc 1112
346 1.82.2.2.2.1 thorpej */
347 1.82.2.2.2.1 thorpej if (IN_MULTICAST(ip->ip_src.s_addr)) {
348 1.82.2.2.2.1 thorpej goto bad;
349 1.82.2.2.2.1 thorpej }
350 1.82.2.2.2.1 thorpej
351 1.78 mycroft if (in_cksum(m, hlen) != 0) {
352 1.1 cgd ipstat.ips_badsum++;
353 1.1 cgd goto bad;
354 1.1 cgd }
355 1.1 cgd
356 1.1 cgd /*
357 1.1 cgd * Convert fields to host representation.
358 1.1 cgd */
359 1.1 cgd NTOHS(ip->ip_len);
360 1.1 cgd NTOHS(ip->ip_off);
361 1.35 mycroft len = ip->ip_len;
362 1.81 proff
363 1.81 proff /*
364 1.81 proff * Check for additional length bogosity
365 1.81 proff */
366 1.82.2.2.2.1 thorpej if (len < hlen) {
367 1.81 proff ipstat.ips_badlen++;
368 1.81 proff goto bad;
369 1.81 proff }
370 1.1 cgd
371 1.1 cgd /*
372 1.1 cgd * Check that the amount of data in the buffers
373 1.1 cgd * is as at least much as the IP header would have us expect.
374 1.1 cgd * Trim mbufs if longer than we expect.
375 1.1 cgd * Drop packet if shorter than we expect.
376 1.1 cgd */
377 1.35 mycroft if (m->m_pkthdr.len < len) {
378 1.1 cgd ipstat.ips_tooshort++;
379 1.1 cgd goto bad;
380 1.1 cgd }
381 1.35 mycroft if (m->m_pkthdr.len > len) {
382 1.1 cgd if (m->m_len == m->m_pkthdr.len) {
383 1.35 mycroft m->m_len = len;
384 1.35 mycroft m->m_pkthdr.len = len;
385 1.1 cgd } else
386 1.35 mycroft m_adj(m, len - m->m_pkthdr.len);
387 1.1 cgd }
388 1.1 cgd
389 1.64 thorpej /*
390 1.64 thorpej * Assume that we can create a fast-forward IP flow entry
391 1.64 thorpej * based on this packet.
392 1.64 thorpej */
393 1.64 thorpej m->m_flags |= M_CANFASTFWD;
394 1.64 thorpej
395 1.36 mrg #ifdef PFIL_HOOKS
396 1.33 mrg /*
397 1.64 thorpej * Run through list of hooks for input packets. If there are any
398 1.64 thorpej * filters which require that additional packets in the flow are
399 1.64 thorpej * not fast-forwarded, they must clear the M_CANFASTFWD flag.
400 1.64 thorpej * Note that filters must _never_ set this flag, as another filter
401 1.64 thorpej * in the list may have previously cleared it.
402 1.33 mrg */
403 1.33 mrg m0 = m;
404 1.59 mrg for (pfh = pfil_hook_get(PFIL_IN); pfh; pfh = pfh->pfil_link.tqe_next)
405 1.33 mrg if (pfh->pfil_func) {
406 1.43 mrg rv = pfh->pfil_func(ip, hlen, m->m_pkthdr.rcvif, 0, &m0);
407 1.43 mrg if (rv)
408 1.40 veego goto next;
409 1.68 sommerfe m = m0;
410 1.68 sommerfe if (m == NULL)
411 1.68 sommerfe goto next;
412 1.68 sommerfe ip = mtod(m, struct ip *);
413 1.33 mrg }
414 1.36 mrg #endif /* PFIL_HOOKS */
415 1.33 mrg
416 1.1 cgd /*
417 1.1 cgd * Process options and, if not destined for us,
418 1.1 cgd * ship it on. ip_dooptions returns 1 when an
419 1.1 cgd * error was detected (causing an icmp message
420 1.1 cgd * to be sent and the original packet to be freed).
421 1.1 cgd */
422 1.1 cgd ip_nhops = 0; /* for source routed packets */
423 1.1 cgd if (hlen > sizeof (struct ip) && ip_dooptions(m))
424 1.1 cgd goto next;
425 1.1 cgd
426 1.1 cgd /*
427 1.1 cgd * Check our list of addresses, to see if the packet is for us.
428 1.1 cgd */
429 1.57 tls INADDR_TO_IA(ip->ip_dst, ia);
430 1.82.2.2 perry if (ia != NULL)
431 1.82.2.2 perry goto ours;
432 1.57 tls if (m->m_pkthdr.rcvif->if_flags & IFF_BROADCAST) {
433 1.57 tls for (ifa = m->m_pkthdr.rcvif->if_addrlist.tqh_first;
434 1.57 tls ifa != NULL; ifa = ifa->ifa_list.tqe_next) {
435 1.57 tls if (ifa->ifa_addr->sa_family != AF_INET) continue;
436 1.57 tls ia = ifatoia(ifa);
437 1.35 mycroft if (in_hosteq(ip->ip_dst, ia->ia_broadaddr.sin_addr) ||
438 1.35 mycroft in_hosteq(ip->ip_dst, ia->ia_netbroadcast) ||
439 1.20 mycroft /*
440 1.20 mycroft * Look for all-0's host part (old broadcast addr),
441 1.20 mycroft * either for subnet or net.
442 1.20 mycroft */
443 1.20 mycroft ip->ip_dst.s_addr == ia->ia_subnet ||
444 1.18 mycroft ip->ip_dst.s_addr == ia->ia_net)
445 1.1 cgd goto ours;
446 1.57 tls /*
447 1.57 tls * An interface with IP address zero accepts
448 1.57 tls * all packets that arrive on that interface.
449 1.57 tls */
450 1.57 tls if (in_nullhost(ia->ia_addr.sin_addr))
451 1.57 tls goto ours;
452 1.1 cgd }
453 1.1 cgd }
454 1.18 mycroft if (IN_MULTICAST(ip->ip_dst.s_addr)) {
455 1.4 hpeyerl struct in_multi *inm;
456 1.4 hpeyerl #ifdef MROUTING
457 1.4 hpeyerl extern struct socket *ip_mrouter;
458 1.10 brezak
459 1.10 brezak if (m->m_flags & M_EXT) {
460 1.10 brezak if ((m = m_pullup(m, hlen)) == 0) {
461 1.10 brezak ipstat.ips_toosmall++;
462 1.10 brezak goto next;
463 1.10 brezak }
464 1.10 brezak ip = mtod(m, struct ip *);
465 1.10 brezak }
466 1.4 hpeyerl
467 1.4 hpeyerl if (ip_mrouter) {
468 1.4 hpeyerl /*
469 1.4 hpeyerl * If we are acting as a multicast router, all
470 1.4 hpeyerl * incoming multicast packets are passed to the
471 1.4 hpeyerl * kernel-level multicast forwarding function.
472 1.4 hpeyerl * The packet is returned (relatively) intact; if
473 1.4 hpeyerl * ip_mforward() returns a non-zero value, the packet
474 1.4 hpeyerl * must be discarded, else it may be accepted below.
475 1.4 hpeyerl *
476 1.4 hpeyerl * (The IP ident field is put in the same byte order
477 1.4 hpeyerl * as expected when ip_mforward() is called from
478 1.4 hpeyerl * ip_output().)
479 1.4 hpeyerl */
480 1.13 mycroft if (ip_mforward(m, m->m_pkthdr.rcvif) != 0) {
481 1.13 mycroft ipstat.ips_cantforward++;
482 1.4 hpeyerl m_freem(m);
483 1.4 hpeyerl goto next;
484 1.4 hpeyerl }
485 1.4 hpeyerl
486 1.4 hpeyerl /*
487 1.4 hpeyerl * The process-level routing demon needs to receive
488 1.4 hpeyerl * all multicast IGMP packets, whether or not this
489 1.4 hpeyerl * host belongs to their destination groups.
490 1.4 hpeyerl */
491 1.4 hpeyerl if (ip->ip_p == IPPROTO_IGMP)
492 1.4 hpeyerl goto ours;
493 1.13 mycroft ipstat.ips_forward++;
494 1.4 hpeyerl }
495 1.4 hpeyerl #endif
496 1.4 hpeyerl /*
497 1.4 hpeyerl * See if we belong to the destination multicast group on the
498 1.4 hpeyerl * arrival interface.
499 1.4 hpeyerl */
500 1.4 hpeyerl IN_LOOKUP_MULTI(ip->ip_dst, m->m_pkthdr.rcvif, inm);
501 1.4 hpeyerl if (inm == NULL) {
502 1.13 mycroft ipstat.ips_cantforward++;
503 1.4 hpeyerl m_freem(m);
504 1.4 hpeyerl goto next;
505 1.4 hpeyerl }
506 1.4 hpeyerl goto ours;
507 1.4 hpeyerl }
508 1.19 mycroft if (ip->ip_dst.s_addr == INADDR_BROADCAST ||
509 1.35 mycroft in_nullhost(ip->ip_dst))
510 1.1 cgd goto ours;
511 1.1 cgd
512 1.1 cgd /*
513 1.1 cgd * Not for us; forward if possible and desirable.
514 1.1 cgd */
515 1.1 cgd if (ipforwarding == 0) {
516 1.1 cgd ipstat.ips_cantforward++;
517 1.1 cgd m_freem(m);
518 1.1 cgd } else
519 1.1 cgd ip_forward(m, 0);
520 1.1 cgd goto next;
521 1.1 cgd
522 1.1 cgd ours:
523 1.1 cgd /*
524 1.1 cgd * If offset or IP_MF are set, must reassemble.
525 1.1 cgd * Otherwise, nothing need be done.
526 1.1 cgd * (We could look in the reassembly queue to see
527 1.1 cgd * if the packet was previously fragmented,
528 1.1 cgd * but it's not worth the time; just let them time out.)
529 1.1 cgd */
530 1.37 perry if (ip->ip_off & ~(IP_DF|IP_RF)) {
531 1.1 cgd /*
532 1.1 cgd * Look for queue of fragments
533 1.1 cgd * of this datagram.
534 1.1 cgd */
535 1.75 thorpej IPQ_LOCK();
536 1.25 cgd for (fp = ipq.lh_first; fp != NULL; fp = fp->ipq_q.le_next)
537 1.1 cgd if (ip->ip_id == fp->ipq_id &&
538 1.35 mycroft in_hosteq(ip->ip_src, fp->ipq_src) &&
539 1.35 mycroft in_hosteq(ip->ip_dst, fp->ipq_dst) &&
540 1.1 cgd ip->ip_p == fp->ipq_p)
541 1.1 cgd goto found;
542 1.1 cgd fp = 0;
543 1.1 cgd found:
544 1.1 cgd
545 1.1 cgd /*
546 1.1 cgd * Adjust ip_len to not reflect header,
547 1.25 cgd * set ipqe_mff if more fragments are expected,
548 1.1 cgd * convert offset of this to bytes.
549 1.1 cgd */
550 1.1 cgd ip->ip_len -= hlen;
551 1.25 cgd mff = (ip->ip_off & IP_MF) != 0;
552 1.25 cgd if (mff) {
553 1.16 cgd /*
554 1.16 cgd * Make sure that fragments have a data length
555 1.16 cgd * that's a non-zero multiple of 8 bytes.
556 1.16 cgd */
557 1.17 cgd if (ip->ip_len == 0 || (ip->ip_len & 0x7) != 0) {
558 1.16 cgd ipstat.ips_badfrags++;
559 1.75 thorpej IPQ_UNLOCK();
560 1.16 cgd goto bad;
561 1.16 cgd }
562 1.16 cgd }
563 1.1 cgd ip->ip_off <<= 3;
564 1.1 cgd
565 1.1 cgd /*
566 1.1 cgd * If datagram marked as having more fragments
567 1.1 cgd * or if this is not the first fragment,
568 1.1 cgd * attempt reassembly; if it succeeds, proceed.
569 1.1 cgd */
570 1.25 cgd if (mff || ip->ip_off) {
571 1.1 cgd ipstat.ips_fragments++;
572 1.72 thorpej ipqe = pool_get(&ipqent_pool, PR_NOWAIT);
573 1.25 cgd if (ipqe == NULL) {
574 1.25 cgd ipstat.ips_rcvmemdrop++;
575 1.75 thorpej IPQ_UNLOCK();
576 1.25 cgd goto bad;
577 1.25 cgd }
578 1.25 cgd ipqe->ipqe_mff = mff;
579 1.50 thorpej ipqe->ipqe_m = m;
580 1.25 cgd ipqe->ipqe_ip = ip;
581 1.50 thorpej m = ip_reass(ipqe, fp);
582 1.75 thorpej if (m == 0) {
583 1.75 thorpej IPQ_UNLOCK();
584 1.1 cgd goto next;
585 1.75 thorpej }
586 1.13 mycroft ipstat.ips_reassembled++;
587 1.50 thorpej ip = mtod(m, struct ip *);
588 1.74 thorpej hlen = ip->ip_hl << 2;
589 1.79 mycroft ip->ip_len += hlen;
590 1.1 cgd } else
591 1.1 cgd if (fp)
592 1.1 cgd ip_freef(fp);
593 1.75 thorpej IPQ_UNLOCK();
594 1.79 mycroft }
595 1.1 cgd
596 1.1 cgd /*
597 1.1 cgd * Switch out to protocol's input routine.
598 1.1 cgd */
599 1.82 aidan #if IFA_STATS
600 1.82 aidan ia->ia_ifa.ifa_data.ifad_inbytes += ip->ip_len;
601 1.82 aidan #endif
602 1.1 cgd ipstat.ips_delivered++;
603 1.1 cgd (*inetsw[ip_protox[ip->ip_p]].pr_input)(m, hlen);
604 1.1 cgd goto next;
605 1.1 cgd bad:
606 1.1 cgd m_freem(m);
607 1.1 cgd goto next;
608 1.1 cgd }
609 1.1 cgd
610 1.1 cgd /*
611 1.1 cgd * Take incoming datagram fragment and try to
612 1.1 cgd * reassemble it into whole datagram. If a chain for
613 1.1 cgd * reassembly of this datagram already exists, then it
614 1.1 cgd * is given as fp; otherwise have to make a chain.
615 1.1 cgd */
616 1.50 thorpej struct mbuf *
617 1.25 cgd ip_reass(ipqe, fp)
618 1.25 cgd register struct ipqent *ipqe;
619 1.1 cgd register struct ipq *fp;
620 1.1 cgd {
621 1.50 thorpej register struct mbuf *m = ipqe->ipqe_m;
622 1.25 cgd register struct ipqent *nq, *p, *q;
623 1.25 cgd struct ip *ip;
624 1.1 cgd struct mbuf *t;
625 1.25 cgd int hlen = ipqe->ipqe_ip->ip_hl << 2;
626 1.1 cgd int i, next;
627 1.1 cgd
628 1.75 thorpej IPQ_LOCK_CHECK();
629 1.75 thorpej
630 1.1 cgd /*
631 1.1 cgd * Presence of header sizes in mbufs
632 1.1 cgd * would confuse code below.
633 1.1 cgd */
634 1.1 cgd m->m_data += hlen;
635 1.1 cgd m->m_len -= hlen;
636 1.1 cgd
637 1.1 cgd /*
638 1.1 cgd * If first fragment to arrive, create a reassembly queue.
639 1.1 cgd */
640 1.1 cgd if (fp == 0) {
641 1.50 thorpej MALLOC(fp, struct ipq *, sizeof (struct ipq),
642 1.50 thorpej M_FTABLE, M_NOWAIT);
643 1.50 thorpej if (fp == NULL)
644 1.1 cgd goto dropfrag;
645 1.25 cgd LIST_INSERT_HEAD(&ipq, fp, ipq_q);
646 1.1 cgd fp->ipq_ttl = IPFRAGTTL;
647 1.25 cgd fp->ipq_p = ipqe->ipqe_ip->ip_p;
648 1.25 cgd fp->ipq_id = ipqe->ipqe_ip->ip_id;
649 1.25 cgd LIST_INIT(&fp->ipq_fragq);
650 1.25 cgd fp->ipq_src = ipqe->ipqe_ip->ip_src;
651 1.25 cgd fp->ipq_dst = ipqe->ipqe_ip->ip_dst;
652 1.25 cgd p = NULL;
653 1.1 cgd goto insert;
654 1.1 cgd }
655 1.1 cgd
656 1.1 cgd /*
657 1.1 cgd * Find a segment which begins after this one does.
658 1.1 cgd */
659 1.25 cgd for (p = NULL, q = fp->ipq_fragq.lh_first; q != NULL;
660 1.25 cgd p = q, q = q->ipqe_q.le_next)
661 1.25 cgd if (q->ipqe_ip->ip_off > ipqe->ipqe_ip->ip_off)
662 1.1 cgd break;
663 1.1 cgd
664 1.1 cgd /*
665 1.1 cgd * If there is a preceding segment, it may provide some of
666 1.1 cgd * our data already. If so, drop the data from the incoming
667 1.1 cgd * segment. If it provides all of our data, drop us.
668 1.1 cgd */
669 1.25 cgd if (p != NULL) {
670 1.25 cgd i = p->ipqe_ip->ip_off + p->ipqe_ip->ip_len -
671 1.25 cgd ipqe->ipqe_ip->ip_off;
672 1.1 cgd if (i > 0) {
673 1.25 cgd if (i >= ipqe->ipqe_ip->ip_len)
674 1.1 cgd goto dropfrag;
675 1.50 thorpej m_adj(ipqe->ipqe_m, i);
676 1.25 cgd ipqe->ipqe_ip->ip_off += i;
677 1.25 cgd ipqe->ipqe_ip->ip_len -= i;
678 1.1 cgd }
679 1.1 cgd }
680 1.1 cgd
681 1.1 cgd /*
682 1.1 cgd * While we overlap succeeding segments trim them or,
683 1.1 cgd * if they are completely covered, dequeue them.
684 1.1 cgd */
685 1.25 cgd for (; q != NULL && ipqe->ipqe_ip->ip_off + ipqe->ipqe_ip->ip_len >
686 1.25 cgd q->ipqe_ip->ip_off; q = nq) {
687 1.25 cgd i = (ipqe->ipqe_ip->ip_off + ipqe->ipqe_ip->ip_len) -
688 1.25 cgd q->ipqe_ip->ip_off;
689 1.25 cgd if (i < q->ipqe_ip->ip_len) {
690 1.25 cgd q->ipqe_ip->ip_len -= i;
691 1.25 cgd q->ipqe_ip->ip_off += i;
692 1.50 thorpej m_adj(q->ipqe_m, i);
693 1.1 cgd break;
694 1.1 cgd }
695 1.25 cgd nq = q->ipqe_q.le_next;
696 1.50 thorpej m_freem(q->ipqe_m);
697 1.25 cgd LIST_REMOVE(q, ipqe_q);
698 1.72 thorpej pool_put(&ipqent_pool, q);
699 1.1 cgd }
700 1.1 cgd
701 1.1 cgd insert:
702 1.1 cgd /*
703 1.1 cgd * Stick new segment in its place;
704 1.1 cgd * check for complete reassembly.
705 1.1 cgd */
706 1.25 cgd if (p == NULL) {
707 1.25 cgd LIST_INSERT_HEAD(&fp->ipq_fragq, ipqe, ipqe_q);
708 1.25 cgd } else {
709 1.25 cgd LIST_INSERT_AFTER(p, ipqe, ipqe_q);
710 1.25 cgd }
711 1.1 cgd next = 0;
712 1.25 cgd for (p = NULL, q = fp->ipq_fragq.lh_first; q != NULL;
713 1.25 cgd p = q, q = q->ipqe_q.le_next) {
714 1.25 cgd if (q->ipqe_ip->ip_off != next)
715 1.1 cgd return (0);
716 1.25 cgd next += q->ipqe_ip->ip_len;
717 1.1 cgd }
718 1.25 cgd if (p->ipqe_mff)
719 1.1 cgd return (0);
720 1.1 cgd
721 1.1 cgd /*
722 1.41 thorpej * Reassembly is complete. Check for a bogus message size and
723 1.41 thorpej * concatenate fragments.
724 1.1 cgd */
725 1.25 cgd q = fp->ipq_fragq.lh_first;
726 1.25 cgd ip = q->ipqe_ip;
727 1.41 thorpej if ((next + (ip->ip_hl << 2)) > IP_MAXPACKET) {
728 1.41 thorpej ipstat.ips_toolong++;
729 1.41 thorpej ip_freef(fp);
730 1.41 thorpej return (0);
731 1.41 thorpej }
732 1.50 thorpej m = q->ipqe_m;
733 1.1 cgd t = m->m_next;
734 1.1 cgd m->m_next = 0;
735 1.1 cgd m_cat(m, t);
736 1.25 cgd nq = q->ipqe_q.le_next;
737 1.72 thorpej pool_put(&ipqent_pool, q);
738 1.25 cgd for (q = nq; q != NULL; q = nq) {
739 1.50 thorpej t = q->ipqe_m;
740 1.25 cgd nq = q->ipqe_q.le_next;
741 1.72 thorpej pool_put(&ipqent_pool, q);
742 1.1 cgd m_cat(m, t);
743 1.1 cgd }
744 1.1 cgd
745 1.1 cgd /*
746 1.1 cgd * Create header for new ip packet by
747 1.1 cgd * modifying header of first packet;
748 1.1 cgd * dequeue and discard fragment reassembly header.
749 1.1 cgd * Make header visible.
750 1.1 cgd */
751 1.1 cgd ip->ip_len = next;
752 1.25 cgd ip->ip_src = fp->ipq_src;
753 1.25 cgd ip->ip_dst = fp->ipq_dst;
754 1.25 cgd LIST_REMOVE(fp, ipq_q);
755 1.50 thorpej FREE(fp, M_FTABLE);
756 1.1 cgd m->m_len += (ip->ip_hl << 2);
757 1.1 cgd m->m_data -= (ip->ip_hl << 2);
758 1.1 cgd /* some debugging cruft by sklower, below, will go away soon */
759 1.1 cgd if (m->m_flags & M_PKTHDR) { /* XXX this should be done elsewhere */
760 1.1 cgd register int plen = 0;
761 1.50 thorpej for (t = m; t; t = t->m_next)
762 1.50 thorpej plen += t->m_len;
763 1.50 thorpej m->m_pkthdr.len = plen;
764 1.1 cgd }
765 1.50 thorpej return (m);
766 1.1 cgd
767 1.1 cgd dropfrag:
768 1.1 cgd ipstat.ips_fragdropped++;
769 1.1 cgd m_freem(m);
770 1.72 thorpej pool_put(&ipqent_pool, ipqe);
771 1.1 cgd return (0);
772 1.1 cgd }
773 1.1 cgd
774 1.1 cgd /*
775 1.1 cgd * Free a fragment reassembly header and all
776 1.1 cgd * associated datagrams.
777 1.1 cgd */
778 1.8 mycroft void
779 1.1 cgd ip_freef(fp)
780 1.1 cgd struct ipq *fp;
781 1.1 cgd {
782 1.25 cgd register struct ipqent *q, *p;
783 1.1 cgd
784 1.75 thorpej IPQ_LOCK_CHECK();
785 1.75 thorpej
786 1.25 cgd for (q = fp->ipq_fragq.lh_first; q != NULL; q = p) {
787 1.25 cgd p = q->ipqe_q.le_next;
788 1.50 thorpej m_freem(q->ipqe_m);
789 1.25 cgd LIST_REMOVE(q, ipqe_q);
790 1.72 thorpej pool_put(&ipqent_pool, q);
791 1.1 cgd }
792 1.25 cgd LIST_REMOVE(fp, ipq_q);
793 1.50 thorpej FREE(fp, M_FTABLE);
794 1.1 cgd }
795 1.1 cgd
796 1.1 cgd /*
797 1.1 cgd * IP timer processing;
798 1.1 cgd * if a timer expires on a reassembly
799 1.1 cgd * queue, discard it.
800 1.1 cgd */
801 1.8 mycroft void
802 1.1 cgd ip_slowtimo()
803 1.1 cgd {
804 1.25 cgd register struct ipq *fp, *nfp;
805 1.24 mycroft int s = splsoftnet();
806 1.1 cgd
807 1.75 thorpej IPQ_LOCK();
808 1.25 cgd for (fp = ipq.lh_first; fp != NULL; fp = nfp) {
809 1.25 cgd nfp = fp->ipq_q.le_next;
810 1.25 cgd if (--fp->ipq_ttl == 0) {
811 1.1 cgd ipstat.ips_fragtimeout++;
812 1.25 cgd ip_freef(fp);
813 1.1 cgd }
814 1.1 cgd }
815 1.75 thorpej IPQ_UNLOCK();
816 1.63 matt #ifdef GATEWAY
817 1.63 matt ipflow_slowtimo();
818 1.63 matt #endif
819 1.1 cgd splx(s);
820 1.1 cgd }
821 1.1 cgd
822 1.1 cgd /*
823 1.1 cgd * Drain off all datagram fragments.
824 1.1 cgd */
825 1.8 mycroft void
826 1.1 cgd ip_drain()
827 1.1 cgd {
828 1.1 cgd
829 1.75 thorpej /*
830 1.75 thorpej * We may be called from a device's interrupt context. If
831 1.75 thorpej * the ipq is already busy, just bail out now.
832 1.75 thorpej */
833 1.75 thorpej if (ipq_lock_try() == 0)
834 1.75 thorpej return;
835 1.75 thorpej
836 1.25 cgd while (ipq.lh_first != NULL) {
837 1.1 cgd ipstat.ips_fragdropped++;
838 1.25 cgd ip_freef(ipq.lh_first);
839 1.1 cgd }
840 1.75 thorpej
841 1.75 thorpej IPQ_UNLOCK();
842 1.1 cgd }
843 1.1 cgd
844 1.1 cgd /*
845 1.1 cgd * Do option processing on a datagram,
846 1.1 cgd * possibly discarding it if bad options are encountered,
847 1.1 cgd * or forwarding it if source-routed.
848 1.1 cgd * Returns 1 if packet has been forwarded/freed,
849 1.1 cgd * 0 if the packet should be processed further.
850 1.1 cgd */
851 1.8 mycroft int
852 1.1 cgd ip_dooptions(m)
853 1.1 cgd struct mbuf *m;
854 1.1 cgd {
855 1.1 cgd register struct ip *ip = mtod(m, struct ip *);
856 1.1 cgd register u_char *cp;
857 1.1 cgd register struct ip_timestamp *ipt;
858 1.1 cgd register struct in_ifaddr *ia;
859 1.1 cgd int opt, optlen, cnt, off, code, type = ICMP_PARAMPROB, forward = 0;
860 1.13 mycroft struct in_addr *sin, dst;
861 1.1 cgd n_time ntime;
862 1.1 cgd
863 1.13 mycroft dst = ip->ip_dst;
864 1.1 cgd cp = (u_char *)(ip + 1);
865 1.1 cgd cnt = (ip->ip_hl << 2) - sizeof (struct ip);
866 1.1 cgd for (; cnt > 0; cnt -= optlen, cp += optlen) {
867 1.1 cgd opt = cp[IPOPT_OPTVAL];
868 1.1 cgd if (opt == IPOPT_EOL)
869 1.1 cgd break;
870 1.1 cgd if (opt == IPOPT_NOP)
871 1.1 cgd optlen = 1;
872 1.1 cgd else {
873 1.1 cgd optlen = cp[IPOPT_OLEN];
874 1.1 cgd if (optlen <= 0 || optlen > cnt) {
875 1.1 cgd code = &cp[IPOPT_OLEN] - (u_char *)ip;
876 1.1 cgd goto bad;
877 1.1 cgd }
878 1.1 cgd }
879 1.1 cgd switch (opt) {
880 1.1 cgd
881 1.1 cgd default:
882 1.1 cgd break;
883 1.1 cgd
884 1.1 cgd /*
885 1.1 cgd * Source routing with record.
886 1.1 cgd * Find interface with current destination address.
887 1.1 cgd * If none on this machine then drop if strictly routed,
888 1.1 cgd * or do nothing if loosely routed.
889 1.1 cgd * Record interface address and bring up next address
890 1.1 cgd * component. If strictly routed make sure next
891 1.1 cgd * address is on directly accessible net.
892 1.1 cgd */
893 1.1 cgd case IPOPT_LSRR:
894 1.1 cgd case IPOPT_SSRR:
895 1.47 cjs if (ip_allowsrcrt == 0) {
896 1.47 cjs type = ICMP_UNREACH;
897 1.47 cjs code = ICMP_UNREACH_NET_PROHIB;
898 1.47 cjs goto bad;
899 1.47 cjs }
900 1.1 cgd if ((off = cp[IPOPT_OFFSET]) < IPOPT_MINOFF) {
901 1.1 cgd code = &cp[IPOPT_OFFSET] - (u_char *)ip;
902 1.1 cgd goto bad;
903 1.1 cgd }
904 1.1 cgd ipaddr.sin_addr = ip->ip_dst;
905 1.19 mycroft ia = ifatoia(ifa_ifwithaddr(sintosa(&ipaddr)));
906 1.1 cgd if (ia == 0) {
907 1.1 cgd if (opt == IPOPT_SSRR) {
908 1.1 cgd type = ICMP_UNREACH;
909 1.1 cgd code = ICMP_UNREACH_SRCFAIL;
910 1.1 cgd goto bad;
911 1.1 cgd }
912 1.1 cgd /*
913 1.1 cgd * Loose routing, and not at next destination
914 1.1 cgd * yet; nothing to do except forward.
915 1.1 cgd */
916 1.1 cgd break;
917 1.1 cgd }
918 1.1 cgd off--; /* 0 origin */
919 1.1 cgd if (off > optlen - sizeof(struct in_addr)) {
920 1.1 cgd /*
921 1.1 cgd * End of source route. Should be for us.
922 1.1 cgd */
923 1.1 cgd save_rte(cp, ip->ip_src);
924 1.1 cgd break;
925 1.1 cgd }
926 1.1 cgd /*
927 1.1 cgd * locate outgoing interface
928 1.1 cgd */
929 1.1 cgd bcopy((caddr_t)(cp + off), (caddr_t)&ipaddr.sin_addr,
930 1.1 cgd sizeof(ipaddr.sin_addr));
931 1.1 cgd if (opt == IPOPT_SSRR) {
932 1.1 cgd #define INA struct in_ifaddr *
933 1.1 cgd #define SA struct sockaddr *
934 1.29 mrg ia = (INA)ifa_ifwithladdr((SA)&ipaddr);
935 1.1 cgd } else
936 1.1 cgd ia = ip_rtaddr(ipaddr.sin_addr);
937 1.1 cgd if (ia == 0) {
938 1.1 cgd type = ICMP_UNREACH;
939 1.1 cgd code = ICMP_UNREACH_SRCFAIL;
940 1.1 cgd goto bad;
941 1.1 cgd }
942 1.1 cgd ip->ip_dst = ipaddr.sin_addr;
943 1.20 mycroft bcopy((caddr_t)&ia->ia_addr.sin_addr,
944 1.1 cgd (caddr_t)(cp + off), sizeof(struct in_addr));
945 1.1 cgd cp[IPOPT_OFFSET] += sizeof(struct in_addr);
946 1.13 mycroft /*
947 1.13 mycroft * Let ip_intr's mcast routing check handle mcast pkts
948 1.13 mycroft */
949 1.18 mycroft forward = !IN_MULTICAST(ip->ip_dst.s_addr);
950 1.1 cgd break;
951 1.1 cgd
952 1.1 cgd case IPOPT_RR:
953 1.1 cgd if ((off = cp[IPOPT_OFFSET]) < IPOPT_MINOFF) {
954 1.1 cgd code = &cp[IPOPT_OFFSET] - (u_char *)ip;
955 1.1 cgd goto bad;
956 1.1 cgd }
957 1.1 cgd /*
958 1.1 cgd * If no space remains, ignore.
959 1.1 cgd */
960 1.1 cgd off--; /* 0 origin */
961 1.1 cgd if (off > optlen - sizeof(struct in_addr))
962 1.1 cgd break;
963 1.1 cgd bcopy((caddr_t)(&ip->ip_dst), (caddr_t)&ipaddr.sin_addr,
964 1.1 cgd sizeof(ipaddr.sin_addr));
965 1.1 cgd /*
966 1.1 cgd * locate outgoing interface; if we're the destination,
967 1.1 cgd * use the incoming interface (should be same).
968 1.1 cgd */
969 1.1 cgd if ((ia = (INA)ifa_ifwithaddr((SA)&ipaddr)) == 0 &&
970 1.1 cgd (ia = ip_rtaddr(ipaddr.sin_addr)) == 0) {
971 1.1 cgd type = ICMP_UNREACH;
972 1.1 cgd code = ICMP_UNREACH_HOST;
973 1.1 cgd goto bad;
974 1.1 cgd }
975 1.20 mycroft bcopy((caddr_t)&ia->ia_addr.sin_addr,
976 1.1 cgd (caddr_t)(cp + off), sizeof(struct in_addr));
977 1.1 cgd cp[IPOPT_OFFSET] += sizeof(struct in_addr);
978 1.1 cgd break;
979 1.1 cgd
980 1.1 cgd case IPOPT_TS:
981 1.1 cgd code = cp - (u_char *)ip;
982 1.1 cgd ipt = (struct ip_timestamp *)cp;
983 1.1 cgd if (ipt->ipt_len < 5)
984 1.1 cgd goto bad;
985 1.15 cgd if (ipt->ipt_ptr > ipt->ipt_len - sizeof (int32_t)) {
986 1.1 cgd if (++ipt->ipt_oflw == 0)
987 1.1 cgd goto bad;
988 1.1 cgd break;
989 1.1 cgd }
990 1.1 cgd sin = (struct in_addr *)(cp + ipt->ipt_ptr - 1);
991 1.1 cgd switch (ipt->ipt_flg) {
992 1.1 cgd
993 1.1 cgd case IPOPT_TS_TSONLY:
994 1.1 cgd break;
995 1.1 cgd
996 1.1 cgd case IPOPT_TS_TSANDADDR:
997 1.66 thorpej if (ipt->ipt_ptr - 1 + sizeof(n_time) +
998 1.1 cgd sizeof(struct in_addr) > ipt->ipt_len)
999 1.1 cgd goto bad;
1000 1.13 mycroft ipaddr.sin_addr = dst;
1001 1.13 mycroft ia = (INA)ifaof_ifpforaddr((SA)&ipaddr,
1002 1.13 mycroft m->m_pkthdr.rcvif);
1003 1.13 mycroft if (ia == 0)
1004 1.13 mycroft continue;
1005 1.20 mycroft bcopy((caddr_t)&ia->ia_addr.sin_addr,
1006 1.1 cgd (caddr_t)sin, sizeof(struct in_addr));
1007 1.1 cgd ipt->ipt_ptr += sizeof(struct in_addr);
1008 1.1 cgd break;
1009 1.1 cgd
1010 1.1 cgd case IPOPT_TS_PRESPEC:
1011 1.66 thorpej if (ipt->ipt_ptr - 1 + sizeof(n_time) +
1012 1.1 cgd sizeof(struct in_addr) > ipt->ipt_len)
1013 1.1 cgd goto bad;
1014 1.1 cgd bcopy((caddr_t)sin, (caddr_t)&ipaddr.sin_addr,
1015 1.1 cgd sizeof(struct in_addr));
1016 1.1 cgd if (ifa_ifwithaddr((SA)&ipaddr) == 0)
1017 1.1 cgd continue;
1018 1.1 cgd ipt->ipt_ptr += sizeof(struct in_addr);
1019 1.1 cgd break;
1020 1.1 cgd
1021 1.1 cgd default:
1022 1.1 cgd goto bad;
1023 1.1 cgd }
1024 1.1 cgd ntime = iptime();
1025 1.1 cgd bcopy((caddr_t)&ntime, (caddr_t)cp + ipt->ipt_ptr - 1,
1026 1.1 cgd sizeof(n_time));
1027 1.1 cgd ipt->ipt_ptr += sizeof(n_time);
1028 1.1 cgd }
1029 1.1 cgd }
1030 1.1 cgd if (forward) {
1031 1.26 thorpej if (ip_forwsrcrt == 0) {
1032 1.26 thorpej type = ICMP_UNREACH;
1033 1.26 thorpej code = ICMP_UNREACH_SRCFAIL;
1034 1.26 thorpej goto bad;
1035 1.26 thorpej }
1036 1.1 cgd ip_forward(m, 1);
1037 1.1 cgd return (1);
1038 1.13 mycroft }
1039 1.13 mycroft return (0);
1040 1.1 cgd bad:
1041 1.13 mycroft icmp_error(m, type, code, 0, 0);
1042 1.13 mycroft ipstat.ips_badoptions++;
1043 1.1 cgd return (1);
1044 1.1 cgd }
1045 1.1 cgd
1046 1.1 cgd /*
1047 1.1 cgd * Given address of next destination (final or next hop),
1048 1.1 cgd * return internet address info of interface to be used to get there.
1049 1.1 cgd */
1050 1.1 cgd struct in_ifaddr *
1051 1.1 cgd ip_rtaddr(dst)
1052 1.1 cgd struct in_addr dst;
1053 1.1 cgd {
1054 1.1 cgd register struct sockaddr_in *sin;
1055 1.1 cgd
1056 1.19 mycroft sin = satosin(&ipforward_rt.ro_dst);
1057 1.1 cgd
1058 1.35 mycroft if (ipforward_rt.ro_rt == 0 || !in_hosteq(dst, sin->sin_addr)) {
1059 1.1 cgd if (ipforward_rt.ro_rt) {
1060 1.1 cgd RTFREE(ipforward_rt.ro_rt);
1061 1.1 cgd ipforward_rt.ro_rt = 0;
1062 1.1 cgd }
1063 1.1 cgd sin->sin_family = AF_INET;
1064 1.1 cgd sin->sin_len = sizeof(*sin);
1065 1.1 cgd sin->sin_addr = dst;
1066 1.1 cgd
1067 1.1 cgd rtalloc(&ipforward_rt);
1068 1.1 cgd }
1069 1.1 cgd if (ipforward_rt.ro_rt == 0)
1070 1.1 cgd return ((struct in_ifaddr *)0);
1071 1.19 mycroft return (ifatoia(ipforward_rt.ro_rt->rt_ifa));
1072 1.1 cgd }
1073 1.1 cgd
1074 1.1 cgd /*
1075 1.1 cgd * Save incoming source route for use in replies,
1076 1.1 cgd * to be picked up later by ip_srcroute if the receiver is interested.
1077 1.1 cgd */
1078 1.13 mycroft void
1079 1.1 cgd save_rte(option, dst)
1080 1.1 cgd u_char *option;
1081 1.1 cgd struct in_addr dst;
1082 1.1 cgd {
1083 1.1 cgd unsigned olen;
1084 1.1 cgd
1085 1.1 cgd olen = option[IPOPT_OLEN];
1086 1.1 cgd #ifdef DIAGNOSTIC
1087 1.1 cgd if (ipprintfs)
1088 1.39 christos printf("save_rte: olen %d\n", olen);
1089 1.1 cgd #endif
1090 1.1 cgd if (olen > sizeof(ip_srcrt) - (1 + sizeof(dst)))
1091 1.1 cgd return;
1092 1.1 cgd bcopy((caddr_t)option, (caddr_t)ip_srcrt.srcopt, olen);
1093 1.1 cgd ip_nhops = (olen - IPOPT_OFFSET - 1) / sizeof(struct in_addr);
1094 1.1 cgd ip_srcrt.dst = dst;
1095 1.1 cgd }
1096 1.1 cgd
1097 1.1 cgd /*
1098 1.1 cgd * Retrieve incoming source route for use in replies,
1099 1.1 cgd * in the same form used by setsockopt.
1100 1.1 cgd * The first hop is placed before the options, will be removed later.
1101 1.1 cgd */
1102 1.1 cgd struct mbuf *
1103 1.1 cgd ip_srcroute()
1104 1.1 cgd {
1105 1.1 cgd register struct in_addr *p, *q;
1106 1.1 cgd register struct mbuf *m;
1107 1.1 cgd
1108 1.1 cgd if (ip_nhops == 0)
1109 1.1 cgd return ((struct mbuf *)0);
1110 1.1 cgd m = m_get(M_DONTWAIT, MT_SOOPTS);
1111 1.1 cgd if (m == 0)
1112 1.1 cgd return ((struct mbuf *)0);
1113 1.1 cgd
1114 1.13 mycroft #define OPTSIZ (sizeof(ip_srcrt.nop) + sizeof(ip_srcrt.srcopt))
1115 1.1 cgd
1116 1.1 cgd /* length is (nhops+1)*sizeof(addr) + sizeof(nop + srcrt header) */
1117 1.1 cgd m->m_len = ip_nhops * sizeof(struct in_addr) + sizeof(struct in_addr) +
1118 1.1 cgd OPTSIZ;
1119 1.1 cgd #ifdef DIAGNOSTIC
1120 1.1 cgd if (ipprintfs)
1121 1.39 christos printf("ip_srcroute: nhops %d mlen %d", ip_nhops, m->m_len);
1122 1.1 cgd #endif
1123 1.1 cgd
1124 1.1 cgd /*
1125 1.1 cgd * First save first hop for return route
1126 1.1 cgd */
1127 1.1 cgd p = &ip_srcrt.route[ip_nhops - 1];
1128 1.1 cgd *(mtod(m, struct in_addr *)) = *p--;
1129 1.1 cgd #ifdef DIAGNOSTIC
1130 1.1 cgd if (ipprintfs)
1131 1.39 christos printf(" hops %x", ntohl(mtod(m, struct in_addr *)->s_addr));
1132 1.1 cgd #endif
1133 1.1 cgd
1134 1.1 cgd /*
1135 1.1 cgd * Copy option fields and padding (nop) to mbuf.
1136 1.1 cgd */
1137 1.1 cgd ip_srcrt.nop = IPOPT_NOP;
1138 1.1 cgd ip_srcrt.srcopt[IPOPT_OFFSET] = IPOPT_MINOFF;
1139 1.1 cgd bcopy((caddr_t)&ip_srcrt.nop,
1140 1.1 cgd mtod(m, caddr_t) + sizeof(struct in_addr), OPTSIZ);
1141 1.1 cgd q = (struct in_addr *)(mtod(m, caddr_t) +
1142 1.1 cgd sizeof(struct in_addr) + OPTSIZ);
1143 1.1 cgd #undef OPTSIZ
1144 1.1 cgd /*
1145 1.1 cgd * Record return path as an IP source route,
1146 1.1 cgd * reversing the path (pointers are now aligned).
1147 1.1 cgd */
1148 1.1 cgd while (p >= ip_srcrt.route) {
1149 1.1 cgd #ifdef DIAGNOSTIC
1150 1.1 cgd if (ipprintfs)
1151 1.39 christos printf(" %x", ntohl(q->s_addr));
1152 1.1 cgd #endif
1153 1.1 cgd *q++ = *p--;
1154 1.1 cgd }
1155 1.1 cgd /*
1156 1.1 cgd * Last hop goes to final destination.
1157 1.1 cgd */
1158 1.1 cgd *q = ip_srcrt.dst;
1159 1.1 cgd #ifdef DIAGNOSTIC
1160 1.1 cgd if (ipprintfs)
1161 1.39 christos printf(" %x\n", ntohl(q->s_addr));
1162 1.1 cgd #endif
1163 1.1 cgd return (m);
1164 1.1 cgd }
1165 1.1 cgd
1166 1.1 cgd /*
1167 1.1 cgd * Strip out IP options, at higher
1168 1.1 cgd * level protocol in the kernel.
1169 1.1 cgd * Second argument is buffer to which options
1170 1.1 cgd * will be moved, and return value is their length.
1171 1.1 cgd * XXX should be deleted; last arg currently ignored.
1172 1.1 cgd */
1173 1.8 mycroft void
1174 1.1 cgd ip_stripoptions(m, mopt)
1175 1.1 cgd register struct mbuf *m;
1176 1.1 cgd struct mbuf *mopt;
1177 1.1 cgd {
1178 1.1 cgd register int i;
1179 1.1 cgd struct ip *ip = mtod(m, struct ip *);
1180 1.1 cgd register caddr_t opts;
1181 1.1 cgd int olen;
1182 1.1 cgd
1183 1.79 mycroft olen = (ip->ip_hl << 2) - sizeof (struct ip);
1184 1.1 cgd opts = (caddr_t)(ip + 1);
1185 1.1 cgd i = m->m_len - (sizeof (struct ip) + olen);
1186 1.1 cgd bcopy(opts + olen, opts, (unsigned)i);
1187 1.1 cgd m->m_len -= olen;
1188 1.1 cgd if (m->m_flags & M_PKTHDR)
1189 1.1 cgd m->m_pkthdr.len -= olen;
1190 1.79 mycroft ip->ip_len -= olen;
1191 1.79 mycroft ip->ip_hl = sizeof (struct ip) >> 2;
1192 1.1 cgd }
1193 1.1 cgd
1194 1.23 mycroft int inetctlerrmap[PRC_NCMDS] = {
1195 1.1 cgd 0, 0, 0, 0,
1196 1.1 cgd 0, EMSGSIZE, EHOSTDOWN, EHOSTUNREACH,
1197 1.1 cgd EHOSTUNREACH, EHOSTUNREACH, ECONNREFUSED, ECONNREFUSED,
1198 1.1 cgd EMSGSIZE, EHOSTUNREACH, 0, 0,
1199 1.1 cgd 0, 0, 0, 0,
1200 1.1 cgd ENOPROTOOPT
1201 1.1 cgd };
1202 1.1 cgd
1203 1.1 cgd /*
1204 1.1 cgd * Forward a packet. If some error occurs return the sender
1205 1.1 cgd * an icmp packet. Note we can't always generate a meaningful
1206 1.1 cgd * icmp message because icmp doesn't have a large enough repertoire
1207 1.1 cgd * of codes and types.
1208 1.1 cgd *
1209 1.1 cgd * If not forwarding, just drop the packet. This could be confusing
1210 1.1 cgd * if ipforwarding was zero but some routing protocol was advancing
1211 1.1 cgd * us as a gateway to somewhere. However, we must let the routing
1212 1.1 cgd * protocol deal with that.
1213 1.1 cgd *
1214 1.1 cgd * The srcrt parameter indicates whether the packet is being forwarded
1215 1.1 cgd * via a source route.
1216 1.1 cgd */
1217 1.13 mycroft void
1218 1.1 cgd ip_forward(m, srcrt)
1219 1.1 cgd struct mbuf *m;
1220 1.1 cgd int srcrt;
1221 1.1 cgd {
1222 1.1 cgd register struct ip *ip = mtod(m, struct ip *);
1223 1.1 cgd register struct sockaddr_in *sin;
1224 1.1 cgd register struct rtentry *rt;
1225 1.28 christos int error, type = 0, code = 0;
1226 1.1 cgd struct mbuf *mcopy;
1227 1.13 mycroft n_long dest;
1228 1.13 mycroft struct ifnet *destifp;
1229 1.1 cgd
1230 1.13 mycroft dest = 0;
1231 1.1 cgd #ifdef DIAGNOSTIC
1232 1.1 cgd if (ipprintfs)
1233 1.70 thorpej printf("forward: src %2.2x dst %2.2x ttl %x\n",
1234 1.70 thorpej ntohl(ip->ip_src.s_addr),
1235 1.70 thorpej ntohl(ip->ip_dst.s_addr), ip->ip_ttl);
1236 1.1 cgd #endif
1237 1.1 cgd if (m->m_flags & M_BCAST || in_canforward(ip->ip_dst) == 0) {
1238 1.1 cgd ipstat.ips_cantforward++;
1239 1.1 cgd m_freem(m);
1240 1.1 cgd return;
1241 1.1 cgd }
1242 1.1 cgd if (ip->ip_ttl <= IPTTLDEC) {
1243 1.13 mycroft icmp_error(m, ICMP_TIMXCEED, ICMP_TIMXCEED_INTRANS, dest, 0);
1244 1.1 cgd return;
1245 1.1 cgd }
1246 1.1 cgd ip->ip_ttl -= IPTTLDEC;
1247 1.1 cgd
1248 1.19 mycroft sin = satosin(&ipforward_rt.ro_dst);
1249 1.1 cgd if ((rt = ipforward_rt.ro_rt) == 0 ||
1250 1.35 mycroft !in_hosteq(ip->ip_dst, sin->sin_addr)) {
1251 1.1 cgd if (ipforward_rt.ro_rt) {
1252 1.1 cgd RTFREE(ipforward_rt.ro_rt);
1253 1.1 cgd ipforward_rt.ro_rt = 0;
1254 1.1 cgd }
1255 1.1 cgd sin->sin_family = AF_INET;
1256 1.35 mycroft sin->sin_len = sizeof(struct sockaddr_in);
1257 1.1 cgd sin->sin_addr = ip->ip_dst;
1258 1.1 cgd
1259 1.1 cgd rtalloc(&ipforward_rt);
1260 1.1 cgd if (ipforward_rt.ro_rt == 0) {
1261 1.13 mycroft icmp_error(m, ICMP_UNREACH, ICMP_UNREACH_HOST, dest, 0);
1262 1.1 cgd return;
1263 1.1 cgd }
1264 1.1 cgd rt = ipforward_rt.ro_rt;
1265 1.1 cgd }
1266 1.1 cgd
1267 1.1 cgd /*
1268 1.34 mycroft * Save at most 68 bytes of the packet in case
1269 1.1 cgd * we need to generate an ICMP message to the src.
1270 1.1 cgd */
1271 1.34 mycroft mcopy = m_copy(m, 0, imin((int)ip->ip_len, 68));
1272 1.1 cgd
1273 1.1 cgd /*
1274 1.1 cgd * If forwarding packet using same interface that it came in on,
1275 1.1 cgd * perhaps should send a redirect to sender to shortcut a hop.
1276 1.1 cgd * Only send redirect if source is sending directly to us,
1277 1.1 cgd * and if packet was not source routed (or has any options).
1278 1.1 cgd * Also, don't send redirect if forwarding using a default route
1279 1.1 cgd * or a route modified by a redirect.
1280 1.1 cgd */
1281 1.1 cgd if (rt->rt_ifp == m->m_pkthdr.rcvif &&
1282 1.1 cgd (rt->rt_flags & (RTF_DYNAMIC|RTF_MODIFIED)) == 0 &&
1283 1.35 mycroft !in_nullhost(satosin(rt_key(rt))->sin_addr) &&
1284 1.1 cgd ipsendredirects && !srcrt) {
1285 1.19 mycroft if (rt->rt_ifa &&
1286 1.19 mycroft (ip->ip_src.s_addr & ifatoia(rt->rt_ifa)->ia_subnetmask) ==
1287 1.19 mycroft ifatoia(rt->rt_ifa)->ia_subnet) {
1288 1.77 thorpej if (rt->rt_flags & RTF_GATEWAY)
1289 1.77 thorpej dest = satosin(rt->rt_gateway)->sin_addr.s_addr;
1290 1.77 thorpej else
1291 1.77 thorpej dest = ip->ip_dst.s_addr;
1292 1.77 thorpej /*
1293 1.77 thorpej * Router requirements says to only send host
1294 1.77 thorpej * redirects.
1295 1.77 thorpej */
1296 1.77 thorpej type = ICMP_REDIRECT;
1297 1.77 thorpej code = ICMP_REDIRECT_HOST;
1298 1.1 cgd #ifdef DIAGNOSTIC
1299 1.77 thorpej if (ipprintfs)
1300 1.77 thorpej printf("redirect (%d) to %x\n", code,
1301 1.77 thorpej (u_int32_t)dest);
1302 1.1 cgd #endif
1303 1.1 cgd }
1304 1.1 cgd }
1305 1.1 cgd
1306 1.27 thorpej error = ip_output(m, (struct mbuf *)0, &ipforward_rt,
1307 1.27 thorpej (IP_FORWARDING | (ip_directedbcast ? IP_ALLOWBROADCAST : 0)), 0);
1308 1.1 cgd if (error)
1309 1.1 cgd ipstat.ips_cantforward++;
1310 1.1 cgd else {
1311 1.1 cgd ipstat.ips_forward++;
1312 1.1 cgd if (type)
1313 1.1 cgd ipstat.ips_redirectsent++;
1314 1.1 cgd else {
1315 1.63 matt if (mcopy) {
1316 1.63 matt #ifdef GATEWAY
1317 1.64 thorpej if (mcopy->m_flags & M_CANFASTFWD)
1318 1.64 thorpej ipflow_create(&ipforward_rt, mcopy);
1319 1.63 matt #endif
1320 1.1 cgd m_freem(mcopy);
1321 1.63 matt }
1322 1.1 cgd return;
1323 1.1 cgd }
1324 1.1 cgd }
1325 1.1 cgd if (mcopy == NULL)
1326 1.1 cgd return;
1327 1.13 mycroft destifp = NULL;
1328 1.13 mycroft
1329 1.1 cgd switch (error) {
1330 1.1 cgd
1331 1.1 cgd case 0: /* forwarded, but need redirect */
1332 1.1 cgd /* type, code set above */
1333 1.1 cgd break;
1334 1.1 cgd
1335 1.1 cgd case ENETUNREACH: /* shouldn't happen, checked above */
1336 1.1 cgd case EHOSTUNREACH:
1337 1.1 cgd case ENETDOWN:
1338 1.1 cgd case EHOSTDOWN:
1339 1.1 cgd default:
1340 1.1 cgd type = ICMP_UNREACH;
1341 1.1 cgd code = ICMP_UNREACH_HOST;
1342 1.1 cgd break;
1343 1.1 cgd
1344 1.1 cgd case EMSGSIZE:
1345 1.1 cgd type = ICMP_UNREACH;
1346 1.1 cgd code = ICMP_UNREACH_NEEDFRAG;
1347 1.13 mycroft if (ipforward_rt.ro_rt)
1348 1.13 mycroft destifp = ipforward_rt.ro_rt->rt_ifp;
1349 1.1 cgd ipstat.ips_cantfrag++;
1350 1.1 cgd break;
1351 1.1 cgd
1352 1.1 cgd case ENOBUFS:
1353 1.1 cgd type = ICMP_SOURCEQUENCH;
1354 1.1 cgd code = 0;
1355 1.1 cgd break;
1356 1.1 cgd }
1357 1.13 mycroft icmp_error(mcopy, type, code, dest, destifp);
1358 1.44 thorpej }
1359 1.44 thorpej
1360 1.44 thorpej void
1361 1.44 thorpej ip_savecontrol(inp, mp, ip, m)
1362 1.44 thorpej register struct inpcb *inp;
1363 1.44 thorpej register struct mbuf **mp;
1364 1.44 thorpej register struct ip *ip;
1365 1.44 thorpej register struct mbuf *m;
1366 1.44 thorpej {
1367 1.44 thorpej
1368 1.44 thorpej if (inp->inp_socket->so_options & SO_TIMESTAMP) {
1369 1.44 thorpej struct timeval tv;
1370 1.44 thorpej
1371 1.44 thorpej microtime(&tv);
1372 1.44 thorpej *mp = sbcreatecontrol((caddr_t) &tv, sizeof(tv),
1373 1.44 thorpej SCM_TIMESTAMP, SOL_SOCKET);
1374 1.44 thorpej if (*mp)
1375 1.44 thorpej mp = &(*mp)->m_next;
1376 1.44 thorpej }
1377 1.44 thorpej if (inp->inp_flags & INP_RECVDSTADDR) {
1378 1.44 thorpej *mp = sbcreatecontrol((caddr_t) &ip->ip_dst,
1379 1.44 thorpej sizeof(struct in_addr), IP_RECVDSTADDR, IPPROTO_IP);
1380 1.44 thorpej if (*mp)
1381 1.44 thorpej mp = &(*mp)->m_next;
1382 1.44 thorpej }
1383 1.44 thorpej #ifdef notyet
1384 1.44 thorpej /*
1385 1.44 thorpej * XXX
1386 1.44 thorpej * Moving these out of udp_input() made them even more broken
1387 1.44 thorpej * than they already were.
1388 1.44 thorpej * - fenner (at) parc.xerox.com
1389 1.44 thorpej */
1390 1.44 thorpej /* options were tossed already */
1391 1.44 thorpej if (inp->inp_flags & INP_RECVOPTS) {
1392 1.44 thorpej *mp = sbcreatecontrol((caddr_t) opts_deleted_above,
1393 1.44 thorpej sizeof(struct in_addr), IP_RECVOPTS, IPPROTO_IP);
1394 1.44 thorpej if (*mp)
1395 1.44 thorpej mp = &(*mp)->m_next;
1396 1.44 thorpej }
1397 1.44 thorpej /* ip_srcroute doesn't do what we want here, need to fix */
1398 1.44 thorpej if (inp->inp_flags & INP_RECVRETOPTS) {
1399 1.44 thorpej *mp = sbcreatecontrol((caddr_t) ip_srcroute(),
1400 1.44 thorpej sizeof(struct in_addr), IP_RECVRETOPTS, IPPROTO_IP);
1401 1.44 thorpej if (*mp)
1402 1.44 thorpej mp = &(*mp)->m_next;
1403 1.44 thorpej }
1404 1.44 thorpej #endif
1405 1.44 thorpej if (inp->inp_flags & INP_RECVIF) {
1406 1.44 thorpej struct sockaddr_dl sdl;
1407 1.44 thorpej
1408 1.44 thorpej sdl.sdl_len = offsetof(struct sockaddr_dl, sdl_data[0]);
1409 1.44 thorpej sdl.sdl_family = AF_LINK;
1410 1.44 thorpej sdl.sdl_index = m->m_pkthdr.rcvif ?
1411 1.44 thorpej m->m_pkthdr.rcvif->if_index : 0;
1412 1.44 thorpej sdl.sdl_nlen = sdl.sdl_alen = sdl.sdl_slen = 0;
1413 1.44 thorpej *mp = sbcreatecontrol((caddr_t) &sdl, sdl.sdl_len,
1414 1.44 thorpej IP_RECVIF, IPPROTO_IP);
1415 1.44 thorpej if (*mp)
1416 1.44 thorpej mp = &(*mp)->m_next;
1417 1.44 thorpej }
1418 1.13 mycroft }
1419 1.13 mycroft
1420 1.13 mycroft int
1421 1.13 mycroft ip_sysctl(name, namelen, oldp, oldlenp, newp, newlen)
1422 1.13 mycroft int *name;
1423 1.13 mycroft u_int namelen;
1424 1.13 mycroft void *oldp;
1425 1.13 mycroft size_t *oldlenp;
1426 1.13 mycroft void *newp;
1427 1.13 mycroft size_t newlen;
1428 1.13 mycroft {
1429 1.52 thorpej extern int subnetsarelocal;
1430 1.52 thorpej
1431 1.54 lukem int error, old;
1432 1.54 lukem
1433 1.13 mycroft /* All sysctl names at this level are terminal. */
1434 1.13 mycroft if (namelen != 1)
1435 1.13 mycroft return (ENOTDIR);
1436 1.13 mycroft
1437 1.13 mycroft switch (name[0]) {
1438 1.13 mycroft case IPCTL_FORWARDING:
1439 1.13 mycroft return (sysctl_int(oldp, oldlenp, newp, newlen, &ipforwarding));
1440 1.13 mycroft case IPCTL_SENDREDIRECTS:
1441 1.13 mycroft return (sysctl_int(oldp, oldlenp, newp, newlen,
1442 1.13 mycroft &ipsendredirects));
1443 1.13 mycroft case IPCTL_DEFTTL:
1444 1.13 mycroft return (sysctl_int(oldp, oldlenp, newp, newlen, &ip_defttl));
1445 1.13 mycroft #ifdef notyet
1446 1.13 mycroft case IPCTL_DEFMTU:
1447 1.13 mycroft return (sysctl_int(oldp, oldlenp, newp, newlen, &ip_mtu));
1448 1.13 mycroft #endif
1449 1.26 thorpej case IPCTL_FORWSRCRT:
1450 1.47 cjs /* Don't allow this to change in a secure environment. */
1451 1.26 thorpej if (securelevel > 0)
1452 1.46 cjs return (sysctl_rdint(oldp, oldlenp, newp,
1453 1.46 cjs ip_forwsrcrt));
1454 1.46 cjs else
1455 1.46 cjs return (sysctl_int(oldp, oldlenp, newp, newlen,
1456 1.46 cjs &ip_forwsrcrt));
1457 1.27 thorpej case IPCTL_DIRECTEDBCAST:
1458 1.27 thorpej return (sysctl_int(oldp, oldlenp, newp, newlen,
1459 1.27 thorpej &ip_directedbcast));
1460 1.47 cjs case IPCTL_ALLOWSRCRT:
1461 1.47 cjs return (sysctl_int(oldp, oldlenp, newp, newlen,
1462 1.47 cjs &ip_allowsrcrt));
1463 1.52 thorpej case IPCTL_SUBNETSARELOCAL:
1464 1.52 thorpej return (sysctl_int(oldp, oldlenp, newp, newlen,
1465 1.52 thorpej &subnetsarelocal));
1466 1.53 kml case IPCTL_MTUDISC:
1467 1.60 kml error = sysctl_int(oldp, oldlenp, newp, newlen,
1468 1.60 kml &ip_mtudisc);
1469 1.60 kml if (ip_mtudisc != 0 && ip_mtudisc_timeout_q == NULL) {
1470 1.60 kml ip_mtudisc_timeout_q =
1471 1.60 kml rt_timer_queue_create(ip_mtudisc_timeout);
1472 1.60 kml } else if (ip_mtudisc == 0 && ip_mtudisc_timeout_q != NULL) {
1473 1.60 kml rt_timer_queue_destroy(ip_mtudisc_timeout_q, TRUE);
1474 1.60 kml ip_mtudisc_timeout_q = NULL;
1475 1.60 kml }
1476 1.60 kml return error;
1477 1.54 lukem case IPCTL_ANONPORTMIN:
1478 1.54 lukem old = anonportmin;
1479 1.54 lukem error = sysctl_int(oldp, oldlenp, newp, newlen, &anonportmin);
1480 1.54 lukem if (anonportmin >= anonportmax || anonportmin > 65535
1481 1.54 lukem #ifndef IPNOPRIVPORTS
1482 1.54 lukem || anonportmin < IPPORT_RESERVED
1483 1.54 lukem #endif
1484 1.54 lukem ) {
1485 1.54 lukem anonportmin = old;
1486 1.54 lukem return (EINVAL);
1487 1.54 lukem }
1488 1.54 lukem return (error);
1489 1.54 lukem case IPCTL_ANONPORTMAX:
1490 1.54 lukem old = anonportmax;
1491 1.54 lukem error = sysctl_int(oldp, oldlenp, newp, newlen, &anonportmax);
1492 1.54 lukem if (anonportmin >= anonportmax || anonportmax > 65535
1493 1.54 lukem #ifndef IPNOPRIVPORTS
1494 1.54 lukem || anonportmax < IPPORT_RESERVED
1495 1.54 lukem #endif
1496 1.54 lukem ) {
1497 1.54 lukem anonportmax = old;
1498 1.54 lukem return (EINVAL);
1499 1.54 lukem }
1500 1.60 kml return (error);
1501 1.60 kml case IPCTL_MTUDISCTIMEOUT:
1502 1.60 kml error = sysctl_int(oldp, oldlenp, newp, newlen,
1503 1.60 kml &ip_mtudisc_timeout);
1504 1.60 kml if (ip_mtudisc_timeout_q != NULL)
1505 1.60 kml rt_timer_queue_change(ip_mtudisc_timeout_q,
1506 1.60 kml ip_mtudisc_timeout);
1507 1.54 lukem return (error);
1508 1.65 matt #ifdef GATEWAY
1509 1.65 matt case IPCTL_MAXFLOWS:
1510 1.67 thorpej {
1511 1.67 thorpej int s;
1512 1.67 thorpej
1513 1.65 matt error = sysctl_int(oldp, oldlenp, newp, newlen,
1514 1.65 matt &ip_maxflows);
1515 1.67 thorpej s = splsoftnet();
1516 1.65 matt ipflow_reap(0);
1517 1.67 thorpej splx(s);
1518 1.65 matt return (error);
1519 1.67 thorpej }
1520 1.65 matt #endif
1521 1.13 mycroft default:
1522 1.13 mycroft return (EOPNOTSUPP);
1523 1.13 mycroft }
1524 1.13 mycroft /* NOTREACHED */
1525 1.1 cgd }
1526