ip_icmp.c revision 1.37 1 1.37 itojun /* $NetBSD: ip_icmp.c,v 1.37 1999/07/01 08:12:50 itojun Exp $ */
2 1.37 itojun
3 1.37 itojun /*
4 1.37 itojun * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
5 1.37 itojun * All rights reserved.
6 1.37 itojun *
7 1.37 itojun * Redistribution and use in source and binary forms, with or without
8 1.37 itojun * modification, are permitted provided that the following conditions
9 1.37 itojun * are met:
10 1.37 itojun * 1. Redistributions of source code must retain the above copyright
11 1.37 itojun * notice, this list of conditions and the following disclaimer.
12 1.37 itojun * 2. Redistributions in binary form must reproduce the above copyright
13 1.37 itojun * notice, this list of conditions and the following disclaimer in the
14 1.37 itojun * documentation and/or other materials provided with the distribution.
15 1.37 itojun * 3. Neither the name of the project nor the names of its contributors
16 1.37 itojun * may be used to endorse or promote products derived from this software
17 1.37 itojun * without specific prior written permission.
18 1.37 itojun *
19 1.37 itojun * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
20 1.37 itojun * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21 1.37 itojun * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22 1.37 itojun * ARE DISCLAIMED. IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
23 1.37 itojun * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24 1.37 itojun * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25 1.37 itojun * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26 1.37 itojun * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27 1.37 itojun * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 1.37 itojun * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 1.37 itojun * SUCH DAMAGE.
30 1.37 itojun */
31 1.10 cgd
32 1.31 thorpej /*-
33 1.31 thorpej * Copyright (c) 1998 The NetBSD Foundation, Inc.
34 1.31 thorpej * All rights reserved.
35 1.31 thorpej *
36 1.31 thorpej * This code is derived from software contributed to The NetBSD Foundation
37 1.31 thorpej * by Public Access Networks Corporation ("Panix"). It was developed under
38 1.31 thorpej * contract to Panix by Eric Haszlakiewicz and Thor Lancelot Simon.
39 1.31 thorpej *
40 1.31 thorpej * Redistribution and use in source and binary forms, with or without
41 1.31 thorpej * modification, are permitted provided that the following conditions
42 1.31 thorpej * are met:
43 1.31 thorpej * 1. Redistributions of source code must retain the above copyright
44 1.31 thorpej * notice, this list of conditions and the following disclaimer.
45 1.31 thorpej * 2. Redistributions in binary form must reproduce the above copyright
46 1.31 thorpej * notice, this list of conditions and the following disclaimer in the
47 1.31 thorpej * documentation and/or other materials provided with the distribution.
48 1.31 thorpej * 3. All advertising materials mentioning features or use of this software
49 1.31 thorpej * must display the following acknowledgement:
50 1.31 thorpej * This product includes software developed by the NetBSD
51 1.31 thorpej * Foundation, Inc. and its contributors.
52 1.31 thorpej * 4. Neither the name of The NetBSD Foundation nor the names of its
53 1.31 thorpej * contributors may be used to endorse or promote products derived
54 1.31 thorpej * from this software without specific prior written permission.
55 1.31 thorpej *
56 1.31 thorpej * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
57 1.31 thorpej * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
58 1.31 thorpej * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
59 1.31 thorpej * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
60 1.31 thorpej * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
61 1.31 thorpej * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
62 1.31 thorpej * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
63 1.31 thorpej * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
64 1.31 thorpej * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
65 1.31 thorpej * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
66 1.31 thorpej * POSSIBILITY OF SUCH DAMAGE.
67 1.31 thorpej */
68 1.31 thorpej
69 1.1 cgd /*
70 1.9 mycroft * Copyright (c) 1982, 1986, 1988, 1993
71 1.9 mycroft * The Regents of the University of California. All rights reserved.
72 1.1 cgd *
73 1.1 cgd * Redistribution and use in source and binary forms, with or without
74 1.1 cgd * modification, are permitted provided that the following conditions
75 1.1 cgd * are met:
76 1.1 cgd * 1. Redistributions of source code must retain the above copyright
77 1.1 cgd * notice, this list of conditions and the following disclaimer.
78 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
79 1.1 cgd * notice, this list of conditions and the following disclaimer in the
80 1.1 cgd * documentation and/or other materials provided with the distribution.
81 1.1 cgd * 3. All advertising materials mentioning features or use of this software
82 1.1 cgd * must display the following acknowledgement:
83 1.1 cgd * This product includes software developed by the University of
84 1.1 cgd * California, Berkeley and its contributors.
85 1.1 cgd * 4. Neither the name of the University nor the names of its contributors
86 1.1 cgd * may be used to endorse or promote products derived from this software
87 1.1 cgd * without specific prior written permission.
88 1.1 cgd *
89 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
90 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
91 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
92 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
93 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
94 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
95 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
96 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
97 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
98 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
99 1.1 cgd * SUCH DAMAGE.
100 1.1 cgd *
101 1.10 cgd * @(#)ip_icmp.c 8.2 (Berkeley) 1/4/94
102 1.1 cgd */
103 1.1 cgd
104 1.4 mycroft #include <sys/param.h>
105 1.4 mycroft #include <sys/systm.h>
106 1.4 mycroft #include <sys/malloc.h>
107 1.4 mycroft #include <sys/mbuf.h>
108 1.4 mycroft #include <sys/protosw.h>
109 1.4 mycroft #include <sys/socket.h>
110 1.4 mycroft #include <sys/time.h>
111 1.4 mycroft #include <sys/kernel.h>
112 1.19 christos #include <sys/proc.h>
113 1.19 christos
114 1.19 christos #include <vm/vm.h>
115 1.19 christos #include <sys/sysctl.h>
116 1.1 cgd
117 1.9 mycroft #include <net/if.h>
118 1.4 mycroft #include <net/route.h>
119 1.1 cgd
120 1.4 mycroft #include <netinet/in.h>
121 1.4 mycroft #include <netinet/in_systm.h>
122 1.4 mycroft #include <netinet/in_var.h>
123 1.4 mycroft #include <netinet/ip.h>
124 1.4 mycroft #include <netinet/ip_icmp.h>
125 1.19 christos #include <netinet/ip_var.h>
126 1.4 mycroft #include <netinet/icmp_var.h>
127 1.1 cgd
128 1.37 itojun #ifdef IPSEC
129 1.37 itojun #include <netinet6/ipsec.h>
130 1.37 itojun #include <netkey/key.h>
131 1.37 itojun #include <netkey/key_debug.h>
132 1.37 itojun #endif
133 1.37 itojun
134 1.19 christos #include <machine/stdarg.h>
135 1.19 christos
136 1.1 cgd /*
137 1.1 cgd * ICMP routines: error generation, receive packet processing, and
138 1.1 cgd * routines to turnaround packets back to the originator, and
139 1.1 cgd * host table maintenance routines.
140 1.1 cgd */
141 1.9 mycroft
142 1.9 mycroft int icmpmaskrepl = 0;
143 1.1 cgd #ifdef ICMPPRINTFS
144 1.1 cgd int icmpprintfs = 0;
145 1.1 cgd #endif
146 1.1 cgd
147 1.37 itojun #if 0
148 1.37 itojun static int ip_next_mtu __P((int, int));
149 1.37 itojun #else
150 1.37 itojun /*static*/ int ip_next_mtu __P((int, int));
151 1.37 itojun #endif
152 1.37 itojun
153 1.1 cgd extern struct protosw inetsw[];
154 1.1 cgd
155 1.24 kml static void icmp_mtudisc __P((struct icmp *));
156 1.29 kml static void icmp_mtudisc_timeout __P((struct rtentry *, struct rttimer *));
157 1.24 kml
158 1.1 cgd /*
159 1.1 cgd * Generate an error packet of type error
160 1.1 cgd * in response to bad packet ip.
161 1.1 cgd */
162 1.6 mycroft void
163 1.9 mycroft icmp_error(n, type, code, dest, destifp)
164 1.1 cgd struct mbuf *n;
165 1.1 cgd int type, code;
166 1.9 mycroft n_long dest;
167 1.9 mycroft struct ifnet *destifp;
168 1.1 cgd {
169 1.1 cgd register struct ip *oip = mtod(n, struct ip *), *nip;
170 1.1 cgd register unsigned oiplen = oip->ip_hl << 2;
171 1.1 cgd register struct icmp *icp;
172 1.1 cgd register struct mbuf *m;
173 1.1 cgd unsigned icmplen;
174 1.1 cgd
175 1.1 cgd #ifdef ICMPPRINTFS
176 1.1 cgd if (icmpprintfs)
177 1.22 christos printf("icmp_error(%x, %d, %d)\n", oip, type, code);
178 1.1 cgd #endif
179 1.1 cgd if (type != ICMP_REDIRECT)
180 1.1 cgd icmpstat.icps_error++;
181 1.1 cgd /*
182 1.1 cgd * Don't send error if not the first fragment of message.
183 1.1 cgd * Don't error if the old packet protocol was ICMP
184 1.1 cgd * error message, only known informational types.
185 1.1 cgd */
186 1.1 cgd if (oip->ip_off &~ (IP_MF|IP_DF))
187 1.1 cgd goto freeit;
188 1.1 cgd if (oip->ip_p == IPPROTO_ICMP && type != ICMP_REDIRECT &&
189 1.1 cgd n->m_len >= oiplen + ICMP_MINLEN &&
190 1.1 cgd !ICMP_INFOTYPE(((struct icmp *)((caddr_t)oip + oiplen))->icmp_type)) {
191 1.1 cgd icmpstat.icps_oldicmp++;
192 1.1 cgd goto freeit;
193 1.1 cgd }
194 1.3 hpeyerl /* Don't send error in response to a multicast or broadcast packet */
195 1.9 mycroft if (n->m_flags & (M_BCAST|M_MCAST))
196 1.3 hpeyerl goto freeit;
197 1.1 cgd /*
198 1.1 cgd * First, formulate icmp message
199 1.1 cgd */
200 1.1 cgd m = m_gethdr(M_DONTWAIT, MT_HEADER);
201 1.1 cgd if (m == NULL)
202 1.1 cgd goto freeit;
203 1.32 thorpej icmplen = oiplen + min(8, oip->ip_len - oiplen);
204 1.1 cgd m->m_len = icmplen + ICMP_MINLEN;
205 1.1 cgd MH_ALIGN(m, m->m_len);
206 1.1 cgd icp = mtod(m, struct icmp *);
207 1.1 cgd if ((u_int)type > ICMP_MAXTYPE)
208 1.1 cgd panic("icmp_error");
209 1.1 cgd icmpstat.icps_outhist[type]++;
210 1.1 cgd icp->icmp_type = type;
211 1.1 cgd if (type == ICMP_REDIRECT)
212 1.9 mycroft icp->icmp_gwaddr.s_addr = dest;
213 1.9 mycroft else {
214 1.1 cgd icp->icmp_void = 0;
215 1.9 mycroft /*
216 1.9 mycroft * The following assignments assume an overlay with the
217 1.9 mycroft * zeroed icmp_void field.
218 1.9 mycroft */
219 1.9 mycroft if (type == ICMP_PARAMPROB) {
220 1.9 mycroft icp->icmp_pptr = code;
221 1.9 mycroft code = 0;
222 1.9 mycroft } else if (type == ICMP_UNREACH &&
223 1.12 cgd code == ICMP_UNREACH_NEEDFRAG && destifp)
224 1.9 mycroft icp->icmp_nextmtu = htons(destifp->if_mtu);
225 1.1 cgd }
226 1.9 mycroft
227 1.32 thorpej HTONS(oip->ip_off);
228 1.32 thorpej HTONS(oip->ip_len);
229 1.1 cgd icp->icmp_code = code;
230 1.1 cgd bcopy((caddr_t)oip, (caddr_t)&icp->icmp_ip, icmplen);
231 1.1 cgd nip = &icp->icmp_ip;
232 1.1 cgd
233 1.1 cgd /*
234 1.1 cgd * Now, copy old ip header (without options)
235 1.1 cgd * in front of icmp message.
236 1.1 cgd */
237 1.1 cgd if (m->m_data - sizeof(struct ip) < m->m_pktdat)
238 1.1 cgd panic("icmp len");
239 1.1 cgd m->m_data -= sizeof(struct ip);
240 1.1 cgd m->m_len += sizeof(struct ip);
241 1.1 cgd m->m_pkthdr.len = m->m_len;
242 1.1 cgd m->m_pkthdr.rcvif = n->m_pkthdr.rcvif;
243 1.1 cgd nip = mtod(m, struct ip *);
244 1.9 mycroft bcopy((caddr_t)oip, (caddr_t)nip, sizeof(struct ip));
245 1.1 cgd nip->ip_len = m->m_len;
246 1.1 cgd nip->ip_hl = sizeof(struct ip) >> 2;
247 1.1 cgd nip->ip_p = IPPROTO_ICMP;
248 1.9 mycroft nip->ip_tos = 0;
249 1.1 cgd icmp_reflect(m);
250 1.1 cgd
251 1.1 cgd freeit:
252 1.1 cgd m_freem(n);
253 1.1 cgd }
254 1.1 cgd
255 1.1 cgd static struct sockaddr_in icmpsrc = { sizeof (struct sockaddr_in), AF_INET };
256 1.1 cgd static struct sockaddr_in icmpdst = { sizeof (struct sockaddr_in), AF_INET };
257 1.1 cgd static struct sockaddr_in icmpgw = { sizeof (struct sockaddr_in), AF_INET };
258 1.1 cgd struct sockaddr_in icmpmask = { 8, 0 };
259 1.1 cgd
260 1.1 cgd /*
261 1.1 cgd * Process a received ICMP message.
262 1.1 cgd */
263 1.6 mycroft void
264 1.19 christos #if __STDC__
265 1.19 christos icmp_input(struct mbuf *m, ...)
266 1.19 christos #else
267 1.19 christos icmp_input(m, va_alist)
268 1.19 christos struct mbuf *m;
269 1.19 christos va_dcl
270 1.19 christos #endif
271 1.1 cgd {
272 1.37 itojun int proto;
273 1.1 cgd register struct icmp *icp;
274 1.1 cgd register struct ip *ip = mtod(m, struct ip *);
275 1.34 mycroft int icmplen;
276 1.1 cgd register int i;
277 1.1 cgd struct in_ifaddr *ia;
278 1.19 christos void *(*ctlfunc) __P((int, struct sockaddr *, void *));
279 1.9 mycroft int code;
280 1.1 cgd extern u_char ip_protox[];
281 1.19 christos int hlen;
282 1.19 christos va_list ap;
283 1.19 christos
284 1.19 christos va_start(ap, m);
285 1.19 christos hlen = va_arg(ap, int);
286 1.37 itojun proto = va_arg(ap, int);
287 1.19 christos va_end(ap);
288 1.1 cgd
289 1.1 cgd /*
290 1.1 cgd * Locate icmp structure in mbuf, and check
291 1.1 cgd * that not corrupted and of at least minimum length.
292 1.1 cgd */
293 1.34 mycroft icmplen = ip->ip_len - hlen;
294 1.1 cgd #ifdef ICMPPRINTFS
295 1.1 cgd if (icmpprintfs)
296 1.22 christos printf("icmp_input from %x to %x, len %d\n",
297 1.20 mycroft ntohl(ip->ip_src.s_addr), ntohl(ip->ip_dst.s_addr),
298 1.20 mycroft icmplen);
299 1.1 cgd #endif
300 1.1 cgd if (icmplen < ICMP_MINLEN) {
301 1.1 cgd icmpstat.icps_tooshort++;
302 1.1 cgd goto freeit;
303 1.1 cgd }
304 1.9 mycroft i = hlen + min(icmplen, ICMP_ADVLENMIN);
305 1.20 mycroft if (m->m_len < i && (m = m_pullup(m, i)) == 0) {
306 1.1 cgd icmpstat.icps_tooshort++;
307 1.1 cgd return;
308 1.1 cgd }
309 1.5 mycroft ip = mtod(m, struct ip *);
310 1.1 cgd m->m_len -= hlen;
311 1.1 cgd m->m_data += hlen;
312 1.1 cgd icp = mtod(m, struct icmp *);
313 1.1 cgd if (in_cksum(m, icmplen)) {
314 1.1 cgd icmpstat.icps_checksum++;
315 1.1 cgd goto freeit;
316 1.1 cgd }
317 1.1 cgd m->m_len += hlen;
318 1.1 cgd m->m_data -= hlen;
319 1.1 cgd
320 1.1 cgd #ifdef ICMPPRINTFS
321 1.1 cgd /*
322 1.1 cgd * Message type specific processing.
323 1.1 cgd */
324 1.1 cgd if (icmpprintfs)
325 1.22 christos printf("icmp_input, type %d code %d\n", icp->icmp_type,
326 1.1 cgd icp->icmp_code);
327 1.1 cgd #endif
328 1.37 itojun #ifdef IPSEC
329 1.37 itojun /* drop it if it does not match the policy */
330 1.37 itojun if (ipsec4_in_reject(m, NULL)) {
331 1.37 itojun ipsecstat.in_polvio++;
332 1.37 itojun goto freeit;
333 1.37 itojun }
334 1.37 itojun #endif
335 1.1 cgd if (icp->icmp_type > ICMP_MAXTYPE)
336 1.1 cgd goto raw;
337 1.1 cgd icmpstat.icps_inhist[icp->icmp_type]++;
338 1.1 cgd code = icp->icmp_code;
339 1.1 cgd switch (icp->icmp_type) {
340 1.1 cgd
341 1.1 cgd case ICMP_UNREACH:
342 1.9 mycroft switch (code) {
343 1.9 mycroft case ICMP_UNREACH_NET:
344 1.9 mycroft case ICMP_UNREACH_HOST:
345 1.9 mycroft case ICMP_UNREACH_PROTOCOL:
346 1.9 mycroft case ICMP_UNREACH_PORT:
347 1.9 mycroft case ICMP_UNREACH_SRCFAIL:
348 1.9 mycroft code += PRC_UNREACH_NET;
349 1.9 mycroft break;
350 1.9 mycroft
351 1.9 mycroft case ICMP_UNREACH_NEEDFRAG:
352 1.9 mycroft code = PRC_MSGSIZE;
353 1.9 mycroft break;
354 1.9 mycroft
355 1.9 mycroft case ICMP_UNREACH_NET_UNKNOWN:
356 1.9 mycroft case ICMP_UNREACH_NET_PROHIB:
357 1.9 mycroft case ICMP_UNREACH_TOSNET:
358 1.9 mycroft code = PRC_UNREACH_NET;
359 1.9 mycroft break;
360 1.9 mycroft
361 1.9 mycroft case ICMP_UNREACH_HOST_UNKNOWN:
362 1.9 mycroft case ICMP_UNREACH_ISOLATED:
363 1.9 mycroft case ICMP_UNREACH_HOST_PROHIB:
364 1.9 mycroft case ICMP_UNREACH_TOSHOST:
365 1.9 mycroft code = PRC_UNREACH_HOST;
366 1.9 mycroft break;
367 1.9 mycroft
368 1.9 mycroft default:
369 1.9 mycroft goto badcode;
370 1.9 mycroft }
371 1.1 cgd goto deliver;
372 1.1 cgd
373 1.1 cgd case ICMP_TIMXCEED:
374 1.1 cgd if (code > 1)
375 1.1 cgd goto badcode;
376 1.1 cgd code += PRC_TIMXCEED_INTRANS;
377 1.1 cgd goto deliver;
378 1.1 cgd
379 1.1 cgd case ICMP_PARAMPROB:
380 1.9 mycroft if (code > 1)
381 1.1 cgd goto badcode;
382 1.1 cgd code = PRC_PARAMPROB;
383 1.1 cgd goto deliver;
384 1.1 cgd
385 1.1 cgd case ICMP_SOURCEQUENCH:
386 1.1 cgd if (code)
387 1.1 cgd goto badcode;
388 1.1 cgd code = PRC_QUENCH;
389 1.20 mycroft goto deliver;
390 1.20 mycroft
391 1.1 cgd deliver:
392 1.1 cgd /*
393 1.1 cgd * Problem with datagram; advise higher level routines.
394 1.1 cgd */
395 1.1 cgd if (icmplen < ICMP_ADVLENMIN || icmplen < ICMP_ADVLEN(icp) ||
396 1.1 cgd icp->icmp_ip.ip_hl < (sizeof(struct ip) >> 2)) {
397 1.1 cgd icmpstat.icps_badlen++;
398 1.1 cgd goto freeit;
399 1.1 cgd }
400 1.14 mycroft if (IN_MULTICAST(icp->icmp_ip.ip_dst.s_addr))
401 1.13 mycroft goto badcode;
402 1.1 cgd NTOHS(icp->icmp_ip.ip_len);
403 1.1 cgd #ifdef ICMPPRINTFS
404 1.1 cgd if (icmpprintfs)
405 1.22 christos printf("deliver to protocol %d\n", icp->icmp_ip.ip_p);
406 1.1 cgd #endif
407 1.1 cgd icmpsrc.sin_addr = icp->icmp_ip.ip_dst;
408 1.25 kml if (code == PRC_MSGSIZE && ip_mtudisc)
409 1.24 kml icmp_mtudisc(icp);
410 1.37 itojun /*
411 1.37 itojun * XXX if the packet contains [IPv4 AH TCP], we can't make a
412 1.37 itojun * notification to TCP layer.
413 1.37 itojun */
414 1.19 christos ctlfunc = inetsw[ip_protox[icp->icmp_ip.ip_p]].pr_ctlinput;
415 1.19 christos if (ctlfunc)
416 1.16 mycroft (*ctlfunc)(code, sintosa(&icmpsrc), &icp->icmp_ip);
417 1.1 cgd break;
418 1.1 cgd
419 1.1 cgd badcode:
420 1.1 cgd icmpstat.icps_badcode++;
421 1.1 cgd break;
422 1.1 cgd
423 1.1 cgd case ICMP_ECHO:
424 1.1 cgd icp->icmp_type = ICMP_ECHOREPLY;
425 1.1 cgd goto reflect;
426 1.1 cgd
427 1.1 cgd case ICMP_TSTAMP:
428 1.1 cgd if (icmplen < ICMP_TSLEN) {
429 1.1 cgd icmpstat.icps_badlen++;
430 1.1 cgd break;
431 1.1 cgd }
432 1.1 cgd icp->icmp_type = ICMP_TSTAMPREPLY;
433 1.1 cgd icp->icmp_rtime = iptime();
434 1.1 cgd icp->icmp_ttime = icp->icmp_rtime; /* bogus, do later! */
435 1.1 cgd goto reflect;
436 1.9 mycroft
437 1.9 mycroft case ICMP_MASKREQ:
438 1.9 mycroft if (icmpmaskrepl == 0)
439 1.9 mycroft break;
440 1.9 mycroft /*
441 1.9 mycroft * We are not able to respond with all ones broadcast
442 1.9 mycroft * unless we receive it over a point-to-point interface.
443 1.9 mycroft */
444 1.23 thorpej if (icmplen < ICMP_MASKLEN) {
445 1.23 thorpej icmpstat.icps_badlen++;
446 1.9 mycroft break;
447 1.23 thorpej }
448 1.15 mycroft if (ip->ip_dst.s_addr == INADDR_BROADCAST ||
449 1.20 mycroft in_nullhost(ip->ip_dst))
450 1.9 mycroft icmpdst.sin_addr = ip->ip_src;
451 1.15 mycroft else
452 1.9 mycroft icmpdst.sin_addr = ip->ip_dst;
453 1.16 mycroft ia = ifatoia(ifaof_ifpforaddr(sintosa(&icmpdst),
454 1.16 mycroft m->m_pkthdr.rcvif));
455 1.9 mycroft if (ia == 0)
456 1.1 cgd break;
457 1.1 cgd icp->icmp_type = ICMP_MASKREPLY;
458 1.1 cgd icp->icmp_mask = ia->ia_sockmask.sin_addr.s_addr;
459 1.20 mycroft if (in_nullhost(ip->ip_src)) {
460 1.1 cgd if (ia->ia_ifp->if_flags & IFF_BROADCAST)
461 1.17 mycroft ip->ip_src = ia->ia_broadaddr.sin_addr;
462 1.1 cgd else if (ia->ia_ifp->if_flags & IFF_POINTOPOINT)
463 1.17 mycroft ip->ip_src = ia->ia_dstaddr.sin_addr;
464 1.1 cgd }
465 1.1 cgd reflect:
466 1.1 cgd icmpstat.icps_reflect++;
467 1.1 cgd icmpstat.icps_outhist[icp->icmp_type]++;
468 1.1 cgd icmp_reflect(m);
469 1.1 cgd return;
470 1.1 cgd
471 1.1 cgd case ICMP_REDIRECT:
472 1.9 mycroft if (code > 3)
473 1.9 mycroft goto badcode;
474 1.9 mycroft if (icmplen < ICMP_ADVLENMIN || icmplen < ICMP_ADVLEN(icp) ||
475 1.9 mycroft icp->icmp_ip.ip_hl < (sizeof(struct ip) >> 2)) {
476 1.1 cgd icmpstat.icps_badlen++;
477 1.1 cgd break;
478 1.1 cgd }
479 1.1 cgd /*
480 1.1 cgd * Short circuit routing redirects to force
481 1.1 cgd * immediate change in the kernel's routing
482 1.1 cgd * tables. The message is also handed to anyone
483 1.1 cgd * listening on a raw socket (e.g. the routing
484 1.1 cgd * daemon for use in updating its tables).
485 1.1 cgd */
486 1.1 cgd icmpgw.sin_addr = ip->ip_src;
487 1.1 cgd icmpdst.sin_addr = icp->icmp_gwaddr;
488 1.1 cgd #ifdef ICMPPRINTFS
489 1.1 cgd if (icmpprintfs)
490 1.22 christos printf("redirect dst %x to %x\n", icp->icmp_ip.ip_dst,
491 1.20 mycroft icp->icmp_gwaddr);
492 1.1 cgd #endif
493 1.9 mycroft icmpsrc.sin_addr = icp->icmp_ip.ip_dst;
494 1.16 mycroft rtredirect(sintosa(&icmpsrc), sintosa(&icmpdst),
495 1.12 cgd (struct sockaddr *)0, RTF_GATEWAY | RTF_HOST,
496 1.16 mycroft sintosa(&icmpgw), (struct rtentry **)0);
497 1.16 mycroft pfctlinput(PRC_REDIRECT_HOST, sintosa(&icmpsrc));
498 1.37 itojun #ifdef IPSEC
499 1.37 itojun key_sa_routechange((struct sockaddr *)&icmpsrc);
500 1.37 itojun #endif
501 1.1 cgd break;
502 1.1 cgd
503 1.1 cgd /*
504 1.1 cgd * No kernel processing for the following;
505 1.1 cgd * just fall through to send to raw listener.
506 1.1 cgd */
507 1.1 cgd case ICMP_ECHOREPLY:
508 1.9 mycroft case ICMP_ROUTERADVERT:
509 1.9 mycroft case ICMP_ROUTERSOLICIT:
510 1.1 cgd case ICMP_TSTAMPREPLY:
511 1.1 cgd case ICMP_IREQREPLY:
512 1.1 cgd case ICMP_MASKREPLY:
513 1.1 cgd default:
514 1.1 cgd break;
515 1.1 cgd }
516 1.1 cgd
517 1.1 cgd raw:
518 1.37 itojun rip_input(m, hlen, proto);
519 1.1 cgd return;
520 1.1 cgd
521 1.1 cgd freeit:
522 1.1 cgd m_freem(m);
523 1.37 itojun return;
524 1.1 cgd }
525 1.1 cgd
526 1.1 cgd /*
527 1.1 cgd * Reflect the ip packet back to the source
528 1.1 cgd */
529 1.6 mycroft void
530 1.1 cgd icmp_reflect(m)
531 1.1 cgd struct mbuf *m;
532 1.1 cgd {
533 1.1 cgd register struct ip *ip = mtod(m, struct ip *);
534 1.1 cgd register struct in_ifaddr *ia;
535 1.27 tls register struct ifaddr *ifa;
536 1.1 cgd struct in_addr t;
537 1.19 christos struct mbuf *opts = 0;
538 1.1 cgd int optlen = (ip->ip_hl << 2) - sizeof(struct ip);
539 1.1 cgd
540 1.9 mycroft if (!in_canforward(ip->ip_src) &&
541 1.14 mycroft ((ip->ip_src.s_addr & IN_CLASSA_NET) !=
542 1.14 mycroft htonl(IN_LOOPBACKNET << IN_CLASSA_NSHIFT))) {
543 1.9 mycroft m_freem(m); /* Bad return address */
544 1.12 cgd goto done; /* ip_output() will check for broadcast */
545 1.9 mycroft }
546 1.1 cgd t = ip->ip_dst;
547 1.1 cgd ip->ip_dst = ip->ip_src;
548 1.1 cgd /*
549 1.1 cgd * If the incoming packet was addressed directly to us,
550 1.1 cgd * use dst as the src for the reply. Otherwise (broadcast
551 1.1 cgd * or anonymous), use the address which corresponds
552 1.1 cgd * to the incoming interface.
553 1.1 cgd */
554 1.27 tls INADDR_TO_IA(t, ia);
555 1.27 tls if (ia == NULL && (m->m_pkthdr.rcvif->if_flags & IFF_BROADCAST)) {
556 1.27 tls for (ifa = m->m_pkthdr.rcvif->if_addrlist.tqh_first;
557 1.27 tls ifa != NULL; ifa = ifa->ifa_list.tqe_next) {
558 1.27 tls if (ifa->ifa_addr->sa_family != AF_INET)
559 1.27 tls continue;
560 1.27 tls ia = ifatoia(ifa);
561 1.27 tls if (in_hosteq(t, ia->ia_broadaddr.sin_addr))
562 1.27 tls break;
563 1.27 tls }
564 1.1 cgd }
565 1.27 tls
566 1.9 mycroft icmpdst.sin_addr = t;
567 1.1 cgd if (ia == (struct in_ifaddr *)0)
568 1.16 mycroft ia = ifatoia(ifaof_ifpforaddr(sintosa(&icmpdst),
569 1.16 mycroft m->m_pkthdr.rcvif));
570 1.9 mycroft /*
571 1.9 mycroft * The following happens if the packet was not addressed to us,
572 1.27 tls * and was received on an interface with no IP address:
573 1.27 tls * We find the first AF_INET address on the first non-loopback
574 1.27 tls * interface.
575 1.9 mycroft */
576 1.1 cgd if (ia == (struct in_ifaddr *)0)
577 1.27 tls for (ia = in_ifaddr.tqh_first; ia != NULL;
578 1.27 tls ia = ia->ia_list.tqe_next) {
579 1.27 tls if (ia->ia_ifp->if_flags & IFF_LOOPBACK)
580 1.27 tls continue;
581 1.27 tls break;
582 1.27 tls }
583 1.36 mycroft /*
584 1.36 mycroft * If we still didn't find an address, punt. We could have an
585 1.36 mycroft * interface up (and receiving packets) with no address.
586 1.36 mycroft */
587 1.36 mycroft if (ia == (struct in_ifaddr *)0) {
588 1.36 mycroft m_freem(m);
589 1.36 mycroft goto done;
590 1.36 mycroft }
591 1.36 mycroft
592 1.17 mycroft t = ia->ia_addr.sin_addr;
593 1.1 cgd ip->ip_src = t;
594 1.1 cgd ip->ip_ttl = MAXTTL;
595 1.1 cgd
596 1.1 cgd if (optlen > 0) {
597 1.1 cgd register u_char *cp;
598 1.1 cgd int opt, cnt;
599 1.1 cgd u_int len;
600 1.1 cgd
601 1.1 cgd /*
602 1.1 cgd * Retrieve any source routing from the incoming packet;
603 1.1 cgd * add on any record-route or timestamp options.
604 1.1 cgd */
605 1.1 cgd cp = (u_char *) (ip + 1);
606 1.1 cgd if ((opts = ip_srcroute()) == 0 &&
607 1.1 cgd (opts = m_gethdr(M_DONTWAIT, MT_HEADER))) {
608 1.1 cgd opts->m_len = sizeof(struct in_addr);
609 1.20 mycroft *mtod(opts, struct in_addr *) = zeroin_addr;
610 1.1 cgd }
611 1.1 cgd if (opts) {
612 1.1 cgd #ifdef ICMPPRINTFS
613 1.1 cgd if (icmpprintfs)
614 1.22 christos printf("icmp_reflect optlen %d rt %d => ",
615 1.1 cgd optlen, opts->m_len);
616 1.1 cgd #endif
617 1.1 cgd for (cnt = optlen; cnt > 0; cnt -= len, cp += len) {
618 1.1 cgd opt = cp[IPOPT_OPTVAL];
619 1.1 cgd if (opt == IPOPT_EOL)
620 1.1 cgd break;
621 1.1 cgd if (opt == IPOPT_NOP)
622 1.1 cgd len = 1;
623 1.1 cgd else {
624 1.1 cgd len = cp[IPOPT_OLEN];
625 1.1 cgd if (len <= 0 || len > cnt)
626 1.1 cgd break;
627 1.1 cgd }
628 1.1 cgd /*
629 1.9 mycroft * Should check for overflow, but it "can't happen"
630 1.1 cgd */
631 1.9 mycroft if (opt == IPOPT_RR || opt == IPOPT_TS ||
632 1.9 mycroft opt == IPOPT_SECURITY) {
633 1.1 cgd bcopy((caddr_t)cp,
634 1.1 cgd mtod(opts, caddr_t) + opts->m_len, len);
635 1.1 cgd opts->m_len += len;
636 1.1 cgd }
637 1.1 cgd }
638 1.9 mycroft /* Terminate & pad, if necessary */
639 1.19 christos if ((cnt = opts->m_len % 4) != 0) {
640 1.9 mycroft for (; cnt < 4; cnt++) {
641 1.9 mycroft *(mtod(opts, caddr_t) + opts->m_len) =
642 1.9 mycroft IPOPT_EOL;
643 1.9 mycroft opts->m_len++;
644 1.9 mycroft }
645 1.1 cgd }
646 1.1 cgd #ifdef ICMPPRINTFS
647 1.1 cgd if (icmpprintfs)
648 1.22 christos printf("%d\n", opts->m_len);
649 1.1 cgd #endif
650 1.1 cgd }
651 1.1 cgd /*
652 1.1 cgd * Now strip out original options by copying rest of first
653 1.1 cgd * mbuf's data back, and adjust the IP length.
654 1.1 cgd */
655 1.1 cgd ip->ip_len -= optlen;
656 1.1 cgd ip->ip_hl = sizeof(struct ip) >> 2;
657 1.1 cgd m->m_len -= optlen;
658 1.1 cgd if (m->m_flags & M_PKTHDR)
659 1.1 cgd m->m_pkthdr.len -= optlen;
660 1.1 cgd optlen += sizeof(struct ip);
661 1.1 cgd bcopy((caddr_t)ip + optlen, (caddr_t)(ip + 1),
662 1.1 cgd (unsigned)(m->m_len - sizeof(struct ip)));
663 1.1 cgd }
664 1.3 hpeyerl m->m_flags &= ~(M_BCAST|M_MCAST);
665 1.1 cgd icmp_send(m, opts);
666 1.9 mycroft done:
667 1.1 cgd if (opts)
668 1.1 cgd (void)m_free(opts);
669 1.1 cgd }
670 1.1 cgd
671 1.1 cgd /*
672 1.1 cgd * Send an icmp packet back to the ip level,
673 1.1 cgd * after supplying a checksum.
674 1.1 cgd */
675 1.6 mycroft void
676 1.1 cgd icmp_send(m, opts)
677 1.1 cgd register struct mbuf *m;
678 1.1 cgd struct mbuf *opts;
679 1.1 cgd {
680 1.1 cgd register struct ip *ip = mtod(m, struct ip *);
681 1.1 cgd register int hlen;
682 1.1 cgd register struct icmp *icp;
683 1.1 cgd
684 1.1 cgd hlen = ip->ip_hl << 2;
685 1.1 cgd m->m_data += hlen;
686 1.1 cgd m->m_len -= hlen;
687 1.1 cgd icp = mtod(m, struct icmp *);
688 1.1 cgd icp->icmp_cksum = 0;
689 1.1 cgd icp->icmp_cksum = in_cksum(m, ip->ip_len - hlen);
690 1.1 cgd m->m_data -= hlen;
691 1.1 cgd m->m_len += hlen;
692 1.1 cgd #ifdef ICMPPRINTFS
693 1.1 cgd if (icmpprintfs)
694 1.22 christos printf("icmp_send dst %x src %x\n", ip->ip_dst, ip->ip_src);
695 1.1 cgd #endif
696 1.37 itojun #ifdef IPSEC
697 1.37 itojun m->m_pkthdr.rcvif = NULL;
698 1.37 itojun #endif /*IPSEC*/
699 1.7 mycroft (void) ip_output(m, opts, NULL, 0, NULL);
700 1.1 cgd }
701 1.1 cgd
702 1.1 cgd n_time
703 1.1 cgd iptime()
704 1.1 cgd {
705 1.1 cgd struct timeval atv;
706 1.1 cgd u_long t;
707 1.1 cgd
708 1.1 cgd microtime(&atv);
709 1.1 cgd t = (atv.tv_sec % (24*60*60)) * 1000 + atv.tv_usec / 1000;
710 1.1 cgd return (htonl(t));
711 1.9 mycroft }
712 1.9 mycroft
713 1.9 mycroft int
714 1.9 mycroft icmp_sysctl(name, namelen, oldp, oldlenp, newp, newlen)
715 1.9 mycroft int *name;
716 1.9 mycroft u_int namelen;
717 1.9 mycroft void *oldp;
718 1.9 mycroft size_t *oldlenp;
719 1.9 mycroft void *newp;
720 1.9 mycroft size_t newlen;
721 1.9 mycroft {
722 1.9 mycroft
723 1.9 mycroft /* All sysctl names at this level are terminal. */
724 1.9 mycroft if (namelen != 1)
725 1.9 mycroft return (ENOTDIR);
726 1.9 mycroft
727 1.9 mycroft switch (name[0]) {
728 1.9 mycroft case ICMPCTL_MASKREPL:
729 1.9 mycroft return (sysctl_int(oldp, oldlenp, newp, newlen, &icmpmaskrepl));
730 1.9 mycroft default:
731 1.9 mycroft return (ENOPROTOOPT);
732 1.9 mycroft }
733 1.9 mycroft /* NOTREACHED */
734 1.24 kml }
735 1.24 kml
736 1.24 kml static void
737 1.24 kml icmp_mtudisc(icp)
738 1.24 kml struct icmp *icp;
739 1.24 kml {
740 1.24 kml struct rtentry *rt;
741 1.24 kml struct sockaddr *dst = sintosa(&icmpsrc);
742 1.26 kml u_long mtu = ntohs(icp->icmp_nextmtu); /* Why a long? IPv6 */
743 1.29 kml int error;
744 1.24 kml
745 1.24 kml /* Table of common MTUs: */
746 1.24 kml
747 1.24 kml static u_long mtu_table[] = {65535, 65280, 32000, 17914, 9180, 8166,
748 1.24 kml 4352, 2002, 1492, 1006, 508, 296, 68, 0};
749 1.24 kml
750 1.24 kml rt = rtalloc1(dst, 1);
751 1.24 kml if (rt == 0)
752 1.24 kml return;
753 1.24 kml
754 1.24 kml /* If we didn't get a host route, allocate one */
755 1.24 kml
756 1.24 kml if ((rt->rt_flags & RTF_HOST) == 0) {
757 1.24 kml struct rtentry *nrt;
758 1.24 kml
759 1.24 kml error = rtrequest((int) RTM_ADD, dst,
760 1.24 kml (struct sockaddr *) rt->rt_gateway,
761 1.24 kml (struct sockaddr *) 0,
762 1.24 kml RTF_GATEWAY | RTF_HOST | RTF_DYNAMIC, &nrt);
763 1.24 kml if (error) {
764 1.24 kml rtfree(rt);
765 1.24 kml rtfree(nrt);
766 1.24 kml return;
767 1.24 kml }
768 1.24 kml nrt->rt_rmx = rt->rt_rmx;
769 1.24 kml rtfree(rt);
770 1.24 kml rt = nrt;
771 1.24 kml }
772 1.29 kml error = rt_timer_add(rt, icmp_mtudisc_timeout, ip_mtudisc_timeout_q);
773 1.29 kml if (error) {
774 1.29 kml rtfree(rt);
775 1.29 kml return;
776 1.29 kml }
777 1.24 kml
778 1.24 kml if (mtu == 0) {
779 1.24 kml int i = 0;
780 1.24 kml
781 1.26 kml mtu = icp->icmp_ip.ip_len; /* NTOHS happened in deliver: */
782 1.24 kml /* Some 4.2BSD-based routers incorrectly adjust the ip_len */
783 1.24 kml if (mtu > rt->rt_rmx.rmx_mtu && rt->rt_rmx.rmx_mtu != 0)
784 1.24 kml mtu -= (icp->icmp_ip.ip_hl << 2);
785 1.24 kml
786 1.26 kml /* If we still can't guess a value, try the route */
787 1.26 kml
788 1.26 kml if (mtu == 0) {
789 1.24 kml mtu = rt->rt_rmx.rmx_mtu;
790 1.24 kml
791 1.26 kml /* If no route mtu, default to the interface mtu */
792 1.26 kml
793 1.26 kml if (mtu == 0)
794 1.26 kml mtu = rt->rt_ifp->if_mtu;
795 1.26 kml }
796 1.26 kml
797 1.24 kml for (i = 0; i < sizeof(mtu_table) / sizeof(mtu_table[0]); i++)
798 1.26 kml if (mtu > mtu_table[i]) {
799 1.26 kml mtu = mtu_table[i];
800 1.24 kml break;
801 1.26 kml }
802 1.24 kml }
803 1.24 kml
804 1.29 kml /*
805 1.29 kml * XXX: RTV_MTU is overloaded, since the admin can set it
806 1.29 kml * to turn off PMTU for a route, and the kernel can
807 1.29 kml * set it to indicate a serious problem with PMTU
808 1.29 kml * on a route. We should be using a separate flag
809 1.29 kml * for the kernel to indicate this.
810 1.29 kml */
811 1.29 kml
812 1.24 kml if ((rt->rt_rmx.rmx_locks & RTV_MTU) == 0) {
813 1.26 kml if (mtu < 296 || mtu > rt->rt_ifp->if_mtu)
814 1.24 kml rt->rt_rmx.rmx_locks |= RTV_MTU;
815 1.24 kml else if (rt->rt_rmx.rmx_mtu > mtu ||
816 1.24 kml rt->rt_rmx.rmx_mtu == 0)
817 1.24 kml rt->rt_rmx.rmx_mtu = mtu;
818 1.24 kml }
819 1.26 kml
820 1.24 kml if (rt)
821 1.24 kml rtfree(rt);
822 1.37 itojun }
823 1.37 itojun
/*
 * Return the next larger or smaller MTU plateau (table from RFC 1191)
 * given current value MTU.  If DIR is less than zero, a larger plateau
 * is returned; otherwise, a smaller value is returned.
 *
 * 0 is returned when there is no plateau in the requested direction
 * (MTU at or above the largest entry when going up, at or below the
 * smallest when going down) and also when MTU is negative.
 */
int
ip_next_mtu(mtu, dir)	/* XXX */
	int mtu;
	int dir;
{
	static int mtutab[] = {
		65535, 32000, 17914, 8166, 4352, 2002, 1492, 1006, 508, 296,
		68, 0
	};
	int nent = (sizeof mtutab) / (sizeof mtutab[0]);
	int i;

	/* Find the first (largest) plateau that does not exceed mtu. */
	for (i = 0; i < nent; i++) {
		if (mtu >= mtutab[i])
			break;
	}

	/*
	 * A negative mtu matches nothing, not even the terminating 0;
	 * do not index past the end of the table.
	 */
	if (i == nent)
		return 0;

	if (dir < 0) {
		if (i == 0) {
			return 0;
		} else {
			return mtutab[i - 1];
		}
	} else {
		if (mtutab[i] == 0) {
			return 0;
		} else if (mtu > mtutab[i]) {
			/* mtu lies between two plateaus */
			return mtutab[i];
		} else {
			/* mtu is exactly a plateau; step to the next one */
			return mtutab[i + 1];
		}
	}
}
861 1.29 kml
862 1.29 kml
863 1.29 kml static void
864 1.29 kml icmp_mtudisc_timeout(rt, r)
865 1.29 kml struct rtentry *rt;
866 1.29 kml struct rttimer *r;
867 1.29 kml {
868 1.29 kml if (rt == NULL)
869 1.29 kml panic("icmp_mtudisc_timeout: bad route to timeout");
870 1.29 kml if ((rt->rt_flags & (RTF_DYNAMIC | RTF_HOST)) ==
871 1.29 kml (RTF_DYNAMIC | RTF_HOST)) {
872 1.29 kml rtrequest((int) RTM_DELETE, (struct sockaddr *)rt_key(rt),
873 1.29 kml rt->rt_gateway, rt_mask(rt), rt->rt_flags, 0);
874 1.29 kml } else {
875 1.29 kml if ((rt->rt_rmx.rmx_locks & RTV_MTU) == 0) {
876 1.29 kml rt->rt_rmx.rmx_mtu = 0;
877 1.29 kml }
878 1.29 kml }
879 1.1 cgd }
880