ip_input.c revision 1.25 1 1.25 cgd /* $NetBSD: ip_input.c,v 1.25 1995/11/21 01:07:34 cgd Exp $ */
2 1.14 cgd
3 1.1 cgd /*
4 1.13 mycroft * Copyright (c) 1982, 1986, 1988, 1993
5 1.13 mycroft * The Regents of the University of California. All rights reserved.
6 1.1 cgd *
7 1.1 cgd * Redistribution and use in source and binary forms, with or without
8 1.1 cgd * modification, are permitted provided that the following conditions
9 1.1 cgd * are met:
10 1.1 cgd * 1. Redistributions of source code must retain the above copyright
11 1.1 cgd * notice, this list of conditions and the following disclaimer.
12 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
13 1.1 cgd * notice, this list of conditions and the following disclaimer in the
14 1.1 cgd * documentation and/or other materials provided with the distribution.
15 1.1 cgd * 3. All advertising materials mentioning features or use of this software
16 1.1 cgd * must display the following acknowledgement:
17 1.1 cgd * This product includes software developed by the University of
18 1.1 cgd * California, Berkeley and its contributors.
19 1.1 cgd * 4. Neither the name of the University nor the names of its contributors
20 1.1 cgd * may be used to endorse or promote products derived from this software
21 1.1 cgd * without specific prior written permission.
22 1.1 cgd *
23 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
24 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
27 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33 1.1 cgd * SUCH DAMAGE.
34 1.1 cgd *
35 1.14 cgd * @(#)ip_input.c 8.2 (Berkeley) 1/4/94
36 1.1 cgd */
37 1.1 cgd
38 1.5 mycroft #include <sys/param.h>
39 1.5 mycroft #include <sys/systm.h>
40 1.5 mycroft #include <sys/malloc.h>
41 1.5 mycroft #include <sys/mbuf.h>
42 1.5 mycroft #include <sys/domain.h>
43 1.5 mycroft #include <sys/protosw.h>
44 1.5 mycroft #include <sys/socket.h>
45 1.5 mycroft #include <sys/errno.h>
46 1.5 mycroft #include <sys/time.h>
47 1.5 mycroft #include <sys/kernel.h>
48 1.1 cgd
49 1.5 mycroft #include <net/if.h>
50 1.5 mycroft #include <net/route.h>
51 1.1 cgd
52 1.5 mycroft #include <netinet/in.h>
53 1.5 mycroft #include <netinet/in_systm.h>
54 1.5 mycroft #include <netinet/ip.h>
55 1.5 mycroft #include <netinet/in_pcb.h>
56 1.5 mycroft #include <netinet/in_var.h>
57 1.5 mycroft #include <netinet/ip_var.h>
58 1.5 mycroft #include <netinet/ip_icmp.h>
59 1.1 cgd
60 1.1 cgd #ifndef IPFORWARDING
61 1.1 cgd #ifdef GATEWAY
62 1.1 cgd #define IPFORWARDING 1 /* forward IP packets not for us */
63 1.1 cgd #else /* GATEWAY */
64 1.1 cgd #define IPFORWARDING 0 /* don't forward IP packets not for us */
65 1.1 cgd #endif /* GATEWAY */
66 1.1 cgd #endif /* IPFORWARDING */
67 1.1 cgd #ifndef IPSENDREDIRECTS
68 1.1 cgd #define IPSENDREDIRECTS 1
69 1.1 cgd #endif
70 1.1 cgd int ipforwarding = IPFORWARDING;
71 1.1 cgd int ipsendredirects = IPSENDREDIRECTS;
72 1.13 mycroft int ip_defttl = IPDEFTTL;
73 1.1 cgd #ifdef DIAGNOSTIC
74 1.1 cgd int ipprintfs = 0;
75 1.1 cgd #endif
76 1.1 cgd
77 1.1 cgd extern struct domain inetdomain;
78 1.1 cgd extern struct protosw inetsw[];
79 1.1 cgd u_char ip_protox[IPPROTO_MAX];
80 1.1 cgd int ipqmaxlen = IFQ_MAXLEN;
81 1.22 mycroft struct in_ifaddrhead in_ifaddr;
82 1.13 mycroft struct ifqueue ipintrq;
83 1.1 cgd
84 1.1 cgd /*
85 1.1 cgd * We need to save the IP options in case a protocol wants to respond
86 1.1 cgd * to an incoming packet over the same route if the packet got here
87 1.1 cgd * using IP source routing. This allows connection establishment and
88 1.1 cgd * maintenance when the remote end is on a network that is not known
89 1.1 cgd * to us.
90 1.1 cgd */
91 1.1 cgd int ip_nhops = 0;
92 1.1 cgd static struct ip_srcrt {
93 1.1 cgd struct in_addr dst; /* final destination */
94 1.1 cgd char nop; /* one NOP to align */
95 1.1 cgd char srcopt[IPOPT_OFFSET + 1]; /* OPTVAL, OLEN and OFFSET */
96 1.1 cgd struct in_addr route[MAX_IPOPTLEN/sizeof(struct in_addr)];
97 1.1 cgd } ip_srcrt;
98 1.1 cgd
99 1.13 mycroft static void save_rte __P((u_char *, struct in_addr));
100 1.1 cgd /*
101 1.1 cgd * IP initialization: fill in IP protocol switch table.
102 1.1 cgd * All protocols not implemented in kernel go to raw IP protocol handler.
103 1.1 cgd */
104 1.8 mycroft void
105 1.1 cgd ip_init()
106 1.1 cgd {
107 1.1 cgd register struct protosw *pr;
108 1.1 cgd register int i;
109 1.1 cgd
110 1.1 cgd pr = pffindproto(PF_INET, IPPROTO_RAW, SOCK_RAW);
111 1.1 cgd if (pr == 0)
112 1.1 cgd panic("ip_init");
113 1.1 cgd for (i = 0; i < IPPROTO_MAX; i++)
114 1.1 cgd ip_protox[i] = pr - inetsw;
115 1.1 cgd for (pr = inetdomain.dom_protosw;
116 1.1 cgd pr < inetdomain.dom_protoswNPROTOSW; pr++)
117 1.1 cgd if (pr->pr_domain->dom_family == PF_INET &&
118 1.1 cgd pr->pr_protocol && pr->pr_protocol != IPPROTO_RAW)
119 1.1 cgd ip_protox[pr->pr_protocol] = pr - inetsw;
120 1.25 cgd LIST_INIT(&ipq);
121 1.1 cgd ip_id = time.tv_sec & 0xffff;
122 1.1 cgd ipintrq.ifq_maxlen = ipqmaxlen;
123 1.22 mycroft TAILQ_INIT(&in_ifaddr);
124 1.1 cgd }
125 1.1 cgd
126 1.1 cgd struct sockaddr_in ipaddr = { sizeof(ipaddr), AF_INET };
127 1.1 cgd struct route ipforward_rt;
128 1.1 cgd
129 1.1 cgd /*
130 1.1 cgd * Ip input routine. Checksum and byte swap header. If fragmented
131 1.1 cgd * try to reassemble. Process options. Pass to next level.
132 1.1 cgd */
133 1.8 mycroft void
134 1.1 cgd ipintr()
135 1.1 cgd {
136 1.1 cgd register struct ip *ip;
137 1.1 cgd register struct mbuf *m;
138 1.1 cgd register struct ipq *fp;
139 1.1 cgd register struct in_ifaddr *ia;
140 1.25 cgd struct ipqent *ipqe;
141 1.25 cgd int hlen, mff, s;
142 1.1 cgd
143 1.1 cgd next:
144 1.1 cgd /*
145 1.1 cgd * Get next datagram off input queue and get IP header
146 1.1 cgd * in first mbuf.
147 1.1 cgd */
148 1.1 cgd s = splimp();
149 1.1 cgd IF_DEQUEUE(&ipintrq, m);
150 1.1 cgd splx(s);
151 1.13 mycroft if (m == 0)
152 1.1 cgd return;
153 1.1 cgd #ifdef DIAGNOSTIC
154 1.1 cgd if ((m->m_flags & M_PKTHDR) == 0)
155 1.1 cgd panic("ipintr no HDR");
156 1.1 cgd #endif
157 1.1 cgd /*
158 1.1 cgd * If no IP addresses have been set yet but the interfaces
159 1.1 cgd * are receiving, can't do anything with incoming packets yet.
160 1.1 cgd */
161 1.22 mycroft if (in_ifaddr.tqh_first == 0)
162 1.1 cgd goto bad;
163 1.1 cgd ipstat.ips_total++;
164 1.1 cgd if (m->m_len < sizeof (struct ip) &&
165 1.1 cgd (m = m_pullup(m, sizeof (struct ip))) == 0) {
166 1.1 cgd ipstat.ips_toosmall++;
167 1.1 cgd goto next;
168 1.1 cgd }
169 1.1 cgd ip = mtod(m, struct ip *);
170 1.13 mycroft if (ip->ip_v != IPVERSION) {
171 1.13 mycroft ipstat.ips_badvers++;
172 1.13 mycroft goto bad;
173 1.13 mycroft }
174 1.1 cgd hlen = ip->ip_hl << 2;
175 1.1 cgd if (hlen < sizeof(struct ip)) { /* minimum header length */
176 1.1 cgd ipstat.ips_badhlen++;
177 1.1 cgd goto bad;
178 1.1 cgd }
179 1.1 cgd if (hlen > m->m_len) {
180 1.1 cgd if ((m = m_pullup(m, hlen)) == 0) {
181 1.1 cgd ipstat.ips_badhlen++;
182 1.1 cgd goto next;
183 1.1 cgd }
184 1.1 cgd ip = mtod(m, struct ip *);
185 1.1 cgd }
186 1.1 cgd if (ip->ip_sum = in_cksum(m, hlen)) {
187 1.1 cgd ipstat.ips_badsum++;
188 1.1 cgd goto bad;
189 1.1 cgd }
190 1.1 cgd
191 1.1 cgd /*
192 1.1 cgd * Convert fields to host representation.
193 1.1 cgd */
194 1.1 cgd NTOHS(ip->ip_len);
195 1.1 cgd if (ip->ip_len < hlen) {
196 1.1 cgd ipstat.ips_badlen++;
197 1.1 cgd goto bad;
198 1.1 cgd }
199 1.1 cgd NTOHS(ip->ip_id);
200 1.1 cgd NTOHS(ip->ip_off);
201 1.1 cgd
202 1.1 cgd /*
203 1.1 cgd * Check that the amount of data in the buffers
204 1.1 cgd * is as at least much as the IP header would have us expect.
205 1.1 cgd * Trim mbufs if longer than we expect.
206 1.1 cgd * Drop packet if shorter than we expect.
207 1.1 cgd */
208 1.1 cgd if (m->m_pkthdr.len < ip->ip_len) {
209 1.1 cgd ipstat.ips_tooshort++;
210 1.1 cgd goto bad;
211 1.1 cgd }
212 1.1 cgd if (m->m_pkthdr.len > ip->ip_len) {
213 1.1 cgd if (m->m_len == m->m_pkthdr.len) {
214 1.1 cgd m->m_len = ip->ip_len;
215 1.1 cgd m->m_pkthdr.len = ip->ip_len;
216 1.1 cgd } else
217 1.1 cgd m_adj(m, ip->ip_len - m->m_pkthdr.len);
218 1.1 cgd }
219 1.1 cgd
220 1.1 cgd /*
221 1.1 cgd * Process options and, if not destined for us,
222 1.1 cgd * ship it on. ip_dooptions returns 1 when an
223 1.1 cgd * error was detected (causing an icmp message
224 1.1 cgd * to be sent and the original packet to be freed).
225 1.1 cgd */
226 1.1 cgd ip_nhops = 0; /* for source routed packets */
227 1.1 cgd if (hlen > sizeof (struct ip) && ip_dooptions(m))
228 1.1 cgd goto next;
229 1.1 cgd
230 1.1 cgd /*
231 1.1 cgd * Check our list of addresses, to see if the packet is for us.
232 1.1 cgd */
233 1.22 mycroft for (ia = in_ifaddr.tqh_first; ia; ia = ia->ia_list.tqe_next) {
234 1.20 mycroft if (ip->ip_dst.s_addr == ia->ia_addr.sin_addr.s_addr)
235 1.1 cgd goto ours;
236 1.1 cgd if (
237 1.1 cgd #ifdef DIRECTED_BROADCAST
238 1.1 cgd ia->ia_ifp == m->m_pkthdr.rcvif &&
239 1.1 cgd #endif
240 1.1 cgd (ia->ia_ifp->if_flags & IFF_BROADCAST)) {
241 1.20 mycroft if (ip->ip_dst.s_addr == ia->ia_broadaddr.sin_addr.s_addr ||
242 1.20 mycroft ip->ip_dst.s_addr == ia->ia_netbroadcast.s_addr ||
243 1.20 mycroft /*
244 1.20 mycroft * Look for all-0's host part (old broadcast addr),
245 1.20 mycroft * either for subnet or net.
246 1.20 mycroft */
247 1.20 mycroft ip->ip_dst.s_addr == ia->ia_subnet ||
248 1.18 mycroft ip->ip_dst.s_addr == ia->ia_net)
249 1.1 cgd goto ours;
250 1.1 cgd }
251 1.1 cgd }
252 1.18 mycroft if (IN_MULTICAST(ip->ip_dst.s_addr)) {
253 1.4 hpeyerl struct in_multi *inm;
254 1.4 hpeyerl #ifdef MROUTING
255 1.4 hpeyerl extern struct socket *ip_mrouter;
256 1.10 brezak
257 1.10 brezak if (m->m_flags & M_EXT) {
258 1.10 brezak if ((m = m_pullup(m, hlen)) == 0) {
259 1.10 brezak ipstat.ips_toosmall++;
260 1.10 brezak goto next;
261 1.10 brezak }
262 1.10 brezak ip = mtod(m, struct ip *);
263 1.10 brezak }
264 1.4 hpeyerl
265 1.4 hpeyerl if (ip_mrouter) {
266 1.4 hpeyerl /*
267 1.4 hpeyerl * If we are acting as a multicast router, all
268 1.4 hpeyerl * incoming multicast packets are passed to the
269 1.4 hpeyerl * kernel-level multicast forwarding function.
270 1.4 hpeyerl * The packet is returned (relatively) intact; if
271 1.4 hpeyerl * ip_mforward() returns a non-zero value, the packet
272 1.4 hpeyerl * must be discarded, else it may be accepted below.
273 1.4 hpeyerl *
274 1.4 hpeyerl * (The IP ident field is put in the same byte order
275 1.4 hpeyerl * as expected when ip_mforward() is called from
276 1.4 hpeyerl * ip_output().)
277 1.4 hpeyerl */
278 1.4 hpeyerl ip->ip_id = htons(ip->ip_id);
279 1.13 mycroft if (ip_mforward(m, m->m_pkthdr.rcvif) != 0) {
280 1.13 mycroft ipstat.ips_cantforward++;
281 1.4 hpeyerl m_freem(m);
282 1.4 hpeyerl goto next;
283 1.4 hpeyerl }
284 1.4 hpeyerl ip->ip_id = ntohs(ip->ip_id);
285 1.4 hpeyerl
286 1.4 hpeyerl /*
287 1.4 hpeyerl * The process-level routing demon needs to receive
288 1.4 hpeyerl * all multicast IGMP packets, whether or not this
289 1.4 hpeyerl * host belongs to their destination groups.
290 1.4 hpeyerl */
291 1.4 hpeyerl if (ip->ip_p == IPPROTO_IGMP)
292 1.4 hpeyerl goto ours;
293 1.13 mycroft ipstat.ips_forward++;
294 1.4 hpeyerl }
295 1.4 hpeyerl #endif
296 1.4 hpeyerl /*
297 1.4 hpeyerl * See if we belong to the destination multicast group on the
298 1.4 hpeyerl * arrival interface.
299 1.4 hpeyerl */
300 1.4 hpeyerl IN_LOOKUP_MULTI(ip->ip_dst, m->m_pkthdr.rcvif, inm);
301 1.4 hpeyerl if (inm == NULL) {
302 1.13 mycroft ipstat.ips_cantforward++;
303 1.4 hpeyerl m_freem(m);
304 1.4 hpeyerl goto next;
305 1.4 hpeyerl }
306 1.4 hpeyerl goto ours;
307 1.4 hpeyerl }
308 1.19 mycroft if (ip->ip_dst.s_addr == INADDR_BROADCAST ||
309 1.19 mycroft ip->ip_dst.s_addr == INADDR_ANY)
310 1.1 cgd goto ours;
311 1.1 cgd
312 1.1 cgd /*
313 1.1 cgd * Not for us; forward if possible and desirable.
314 1.1 cgd */
315 1.1 cgd if (ipforwarding == 0) {
316 1.1 cgd ipstat.ips_cantforward++;
317 1.1 cgd m_freem(m);
318 1.1 cgd } else
319 1.1 cgd ip_forward(m, 0);
320 1.1 cgd goto next;
321 1.1 cgd
322 1.1 cgd ours:
323 1.1 cgd /*
324 1.1 cgd * If offset or IP_MF are set, must reassemble.
325 1.1 cgd * Otherwise, nothing need be done.
326 1.1 cgd * (We could look in the reassembly queue to see
327 1.1 cgd * if the packet was previously fragmented,
328 1.1 cgd * but it's not worth the time; just let them time out.)
329 1.1 cgd */
330 1.1 cgd if (ip->ip_off &~ IP_DF) {
331 1.1 cgd if (m->m_flags & M_EXT) { /* XXX */
332 1.1 cgd if ((m = m_pullup(m, sizeof (struct ip))) == 0) {
333 1.1 cgd ipstat.ips_toosmall++;
334 1.1 cgd goto next;
335 1.1 cgd }
336 1.1 cgd ip = mtod(m, struct ip *);
337 1.1 cgd }
338 1.1 cgd /*
339 1.1 cgd * Look for queue of fragments
340 1.1 cgd * of this datagram.
341 1.1 cgd */
342 1.25 cgd for (fp = ipq.lh_first; fp != NULL; fp = fp->ipq_q.le_next)
343 1.1 cgd if (ip->ip_id == fp->ipq_id &&
344 1.1 cgd ip->ip_src.s_addr == fp->ipq_src.s_addr &&
345 1.1 cgd ip->ip_dst.s_addr == fp->ipq_dst.s_addr &&
346 1.1 cgd ip->ip_p == fp->ipq_p)
347 1.1 cgd goto found;
348 1.1 cgd fp = 0;
349 1.1 cgd found:
350 1.1 cgd
351 1.1 cgd /*
352 1.1 cgd * Adjust ip_len to not reflect header,
353 1.25 cgd * set ipqe_mff if more fragments are expected,
354 1.1 cgd * convert offset of this to bytes.
355 1.1 cgd */
356 1.1 cgd ip->ip_len -= hlen;
357 1.25 cgd mff = (ip->ip_off & IP_MF) != 0;
358 1.25 cgd if (mff) {
359 1.16 cgd /*
360 1.16 cgd * Make sure that fragments have a data length
361 1.16 cgd * that's a non-zero multiple of 8 bytes.
362 1.16 cgd */
363 1.17 cgd if (ip->ip_len == 0 || (ip->ip_len & 0x7) != 0) {
364 1.16 cgd ipstat.ips_badfrags++;
365 1.16 cgd goto bad;
366 1.16 cgd }
367 1.16 cgd }
368 1.1 cgd ip->ip_off <<= 3;
369 1.1 cgd
370 1.1 cgd /*
371 1.1 cgd * If datagram marked as having more fragments
372 1.1 cgd * or if this is not the first fragment,
373 1.1 cgd * attempt reassembly; if it succeeds, proceed.
374 1.1 cgd */
375 1.25 cgd if (mff || ip->ip_off) {
376 1.1 cgd ipstat.ips_fragments++;
377 1.25 cgd MALLOC(ipqe, struct ipqent *, sizeof (struct ipqent),
378 1.25 cgd M_IPQ, M_NOWAIT);
379 1.25 cgd if (ipqe == NULL) {
380 1.25 cgd ipstat.ips_rcvmemdrop++;
381 1.25 cgd goto bad;
382 1.25 cgd }
383 1.25 cgd ipqe->ipqe_mff = mff;
384 1.25 cgd ipqe->ipqe_ip = ip;
385 1.25 cgd ip = ip_reass(ipqe, fp);
386 1.1 cgd if (ip == 0)
387 1.1 cgd goto next;
388 1.13 mycroft ipstat.ips_reassembled++;
389 1.1 cgd m = dtom(ip);
390 1.1 cgd } else
391 1.1 cgd if (fp)
392 1.1 cgd ip_freef(fp);
393 1.1 cgd } else
394 1.1 cgd ip->ip_len -= hlen;
395 1.1 cgd
396 1.1 cgd /*
397 1.1 cgd * Switch out to protocol's input routine.
398 1.1 cgd */
399 1.1 cgd ipstat.ips_delivered++;
400 1.1 cgd (*inetsw[ip_protox[ip->ip_p]].pr_input)(m, hlen);
401 1.1 cgd goto next;
402 1.1 cgd bad:
403 1.1 cgd m_freem(m);
404 1.1 cgd goto next;
405 1.1 cgd }
406 1.1 cgd
407 1.1 cgd /*
408 1.1 cgd * Take incoming datagram fragment and try to
409 1.1 cgd * reassemble it into whole datagram. If a chain for
410 1.1 cgd * reassembly of this datagram already exists, then it
411 1.1 cgd * is given as fp; otherwise have to make a chain.
412 1.1 cgd */
413 1.1 cgd struct ip *
414 1.25 cgd ip_reass(ipqe, fp)
415 1.25 cgd register struct ipqent *ipqe;
416 1.1 cgd register struct ipq *fp;
417 1.1 cgd {
418 1.25 cgd register struct mbuf *m = dtom(ipqe->ipqe_ip);
419 1.25 cgd register struct ipqent *nq, *p, *q;
420 1.25 cgd struct ip *ip;
421 1.1 cgd struct mbuf *t;
422 1.25 cgd int hlen = ipqe->ipqe_ip->ip_hl << 2;
423 1.1 cgd int i, next;
424 1.1 cgd
425 1.1 cgd /*
426 1.1 cgd * Presence of header sizes in mbufs
427 1.1 cgd * would confuse code below.
428 1.1 cgd */
429 1.1 cgd m->m_data += hlen;
430 1.1 cgd m->m_len -= hlen;
431 1.1 cgd
432 1.1 cgd /*
433 1.1 cgd * If first fragment to arrive, create a reassembly queue.
434 1.1 cgd */
435 1.1 cgd if (fp == 0) {
436 1.1 cgd if ((t = m_get(M_DONTWAIT, MT_FTABLE)) == NULL)
437 1.1 cgd goto dropfrag;
438 1.1 cgd fp = mtod(t, struct ipq *);
439 1.25 cgd LIST_INSERT_HEAD(&ipq, fp, ipq_q);
440 1.1 cgd fp->ipq_ttl = IPFRAGTTL;
441 1.25 cgd fp->ipq_p = ipqe->ipqe_ip->ip_p;
442 1.25 cgd fp->ipq_id = ipqe->ipqe_ip->ip_id;
443 1.25 cgd LIST_INIT(&fp->ipq_fragq);
444 1.25 cgd fp->ipq_src = ipqe->ipqe_ip->ip_src;
445 1.25 cgd fp->ipq_dst = ipqe->ipqe_ip->ip_dst;
446 1.25 cgd p = NULL;
447 1.1 cgd goto insert;
448 1.1 cgd }
449 1.1 cgd
450 1.1 cgd /*
451 1.1 cgd * Find a segment which begins after this one does.
452 1.1 cgd */
453 1.25 cgd for (p = NULL, q = fp->ipq_fragq.lh_first; q != NULL;
454 1.25 cgd p = q, q = q->ipqe_q.le_next)
455 1.25 cgd if (q->ipqe_ip->ip_off > ipqe->ipqe_ip->ip_off)
456 1.1 cgd break;
457 1.1 cgd
458 1.1 cgd /*
459 1.1 cgd * If there is a preceding segment, it may provide some of
460 1.1 cgd * our data already. If so, drop the data from the incoming
461 1.1 cgd * segment. If it provides all of our data, drop us.
462 1.1 cgd */
463 1.25 cgd if (p != NULL) {
464 1.25 cgd i = p->ipqe_ip->ip_off + p->ipqe_ip->ip_len -
465 1.25 cgd ipqe->ipqe_ip->ip_off;
466 1.1 cgd if (i > 0) {
467 1.25 cgd if (i >= ipqe->ipqe_ip->ip_len)
468 1.1 cgd goto dropfrag;
469 1.25 cgd m_adj(dtom(ipqe->ipqe_ip), i);
470 1.25 cgd ipqe->ipqe_ip->ip_off += i;
471 1.25 cgd ipqe->ipqe_ip->ip_len -= i;
472 1.1 cgd }
473 1.1 cgd }
474 1.1 cgd
475 1.1 cgd /*
476 1.1 cgd * While we overlap succeeding segments trim them or,
477 1.1 cgd * if they are completely covered, dequeue them.
478 1.1 cgd */
479 1.25 cgd for (; q != NULL && ipqe->ipqe_ip->ip_off + ipqe->ipqe_ip->ip_len >
480 1.25 cgd q->ipqe_ip->ip_off; q = nq) {
481 1.25 cgd i = (ipqe->ipqe_ip->ip_off + ipqe->ipqe_ip->ip_len) -
482 1.25 cgd q->ipqe_ip->ip_off;
483 1.25 cgd if (i < q->ipqe_ip->ip_len) {
484 1.25 cgd q->ipqe_ip->ip_len -= i;
485 1.25 cgd q->ipqe_ip->ip_off += i;
486 1.25 cgd m_adj(dtom(q->ipqe_ip), i);
487 1.1 cgd break;
488 1.1 cgd }
489 1.25 cgd nq = q->ipqe_q.le_next;
490 1.25 cgd m_freem(dtom(q->ipqe_ip));
491 1.25 cgd LIST_REMOVE(q, ipqe_q);
492 1.25 cgd FREE(q, M_IPQ);
493 1.1 cgd }
494 1.1 cgd
495 1.1 cgd insert:
496 1.1 cgd /*
497 1.1 cgd * Stick new segment in its place;
498 1.1 cgd * check for complete reassembly.
499 1.1 cgd */
500 1.25 cgd if (p == NULL) {
501 1.25 cgd LIST_INSERT_HEAD(&fp->ipq_fragq, ipqe, ipqe_q);
502 1.25 cgd } else {
503 1.25 cgd LIST_INSERT_AFTER(p, ipqe, ipqe_q);
504 1.25 cgd }
505 1.1 cgd next = 0;
506 1.25 cgd for (p = NULL, q = fp->ipq_fragq.lh_first; q != NULL;
507 1.25 cgd p = q, q = q->ipqe_q.le_next) {
508 1.25 cgd if (q->ipqe_ip->ip_off != next)
509 1.1 cgd return (0);
510 1.25 cgd next += q->ipqe_ip->ip_len;
511 1.1 cgd }
512 1.25 cgd if (p->ipqe_mff)
513 1.1 cgd return (0);
514 1.1 cgd
515 1.1 cgd /*
516 1.1 cgd * Reassembly is complete; concatenate fragments.
517 1.1 cgd */
518 1.25 cgd q = fp->ipq_fragq.lh_first;
519 1.25 cgd ip = q->ipqe_ip;
520 1.25 cgd m = dtom(q->ipqe_ip);
521 1.1 cgd t = m->m_next;
522 1.1 cgd m->m_next = 0;
523 1.1 cgd m_cat(m, t);
524 1.25 cgd nq = q->ipqe_q.le_next;
525 1.25 cgd FREE(q, M_IPQ);
526 1.25 cgd for (q = nq; q != NULL; q = nq) {
527 1.25 cgd t = dtom(q->ipqe_ip);
528 1.25 cgd nq = q->ipqe_q.le_next;
529 1.25 cgd FREE(q, M_IPQ);
530 1.1 cgd m_cat(m, t);
531 1.1 cgd }
532 1.1 cgd
533 1.1 cgd /*
534 1.1 cgd * Create header for new ip packet by
535 1.1 cgd * modifying header of first packet;
536 1.1 cgd * dequeue and discard fragment reassembly header.
537 1.1 cgd * Make header visible.
538 1.1 cgd */
539 1.1 cgd ip->ip_len = next;
540 1.25 cgd ip->ip_src = fp->ipq_src;
541 1.25 cgd ip->ip_dst = fp->ipq_dst;
542 1.25 cgd LIST_REMOVE(fp, ipq_q);
543 1.1 cgd (void) m_free(dtom(fp));
544 1.1 cgd m->m_len += (ip->ip_hl << 2);
545 1.1 cgd m->m_data -= (ip->ip_hl << 2);
546 1.1 cgd /* some debugging cruft by sklower, below, will go away soon */
547 1.1 cgd if (m->m_flags & M_PKTHDR) { /* XXX this should be done elsewhere */
548 1.1 cgd register int plen = 0;
549 1.1 cgd for (t = m; m; m = m->m_next)
550 1.1 cgd plen += m->m_len;
551 1.1 cgd t->m_pkthdr.len = plen;
552 1.1 cgd }
553 1.25 cgd return (ip);
554 1.1 cgd
555 1.1 cgd dropfrag:
556 1.1 cgd ipstat.ips_fragdropped++;
557 1.1 cgd m_freem(m);
558 1.25 cgd FREE(ipqe, M_IPQ);
559 1.1 cgd return (0);
560 1.1 cgd }
561 1.1 cgd
562 1.1 cgd /*
563 1.1 cgd * Free a fragment reassembly header and all
564 1.1 cgd * associated datagrams.
565 1.1 cgd */
566 1.8 mycroft void
567 1.1 cgd ip_freef(fp)
568 1.1 cgd struct ipq *fp;
569 1.1 cgd {
570 1.25 cgd register struct ipqent *q, *p;
571 1.1 cgd
572 1.25 cgd for (q = fp->ipq_fragq.lh_first; q != NULL; q = p) {
573 1.25 cgd p = q->ipqe_q.le_next;
574 1.25 cgd m_freem(dtom(q->ipqe_ip));
575 1.25 cgd LIST_REMOVE(q, ipqe_q);
576 1.25 cgd FREE(q, M_IPQ);
577 1.1 cgd }
578 1.25 cgd LIST_REMOVE(fp, ipq_q);
579 1.1 cgd (void) m_free(dtom(fp));
580 1.1 cgd }
581 1.1 cgd
582 1.1 cgd /*
583 1.1 cgd * IP timer processing;
584 1.1 cgd * if a timer expires on a reassembly
585 1.1 cgd * queue, discard it.
586 1.1 cgd */
587 1.8 mycroft void
588 1.1 cgd ip_slowtimo()
589 1.1 cgd {
590 1.25 cgd register struct ipq *fp, *nfp;
591 1.24 mycroft int s = splsoftnet();
592 1.1 cgd
593 1.25 cgd for (fp = ipq.lh_first; fp != NULL; fp = nfp) {
594 1.25 cgd nfp = fp->ipq_q.le_next;
595 1.25 cgd if (--fp->ipq_ttl == 0) {
596 1.1 cgd ipstat.ips_fragtimeout++;
597 1.25 cgd ip_freef(fp);
598 1.1 cgd }
599 1.1 cgd }
600 1.1 cgd splx(s);
601 1.1 cgd }
602 1.1 cgd
603 1.1 cgd /*
604 1.1 cgd * Drain off all datagram fragments.
605 1.1 cgd */
606 1.8 mycroft void
607 1.1 cgd ip_drain()
608 1.1 cgd {
609 1.1 cgd
610 1.25 cgd while (ipq.lh_first != NULL) {
611 1.1 cgd ipstat.ips_fragdropped++;
612 1.25 cgd ip_freef(ipq.lh_first);
613 1.1 cgd }
614 1.1 cgd }
615 1.1 cgd
616 1.1 cgd /*
617 1.1 cgd * Do option processing on a datagram,
618 1.1 cgd * possibly discarding it if bad options are encountered,
619 1.1 cgd * or forwarding it if source-routed.
620 1.1 cgd * Returns 1 if packet has been forwarded/freed,
621 1.1 cgd * 0 if the packet should be processed further.
622 1.1 cgd */
623 1.8 mycroft int
624 1.1 cgd ip_dooptions(m)
625 1.1 cgd struct mbuf *m;
626 1.1 cgd {
627 1.1 cgd register struct ip *ip = mtod(m, struct ip *);
628 1.1 cgd register u_char *cp;
629 1.1 cgd register struct ip_timestamp *ipt;
630 1.1 cgd register struct in_ifaddr *ia;
631 1.1 cgd int opt, optlen, cnt, off, code, type = ICMP_PARAMPROB, forward = 0;
632 1.13 mycroft struct in_addr *sin, dst;
633 1.1 cgd n_time ntime;
634 1.1 cgd
635 1.13 mycroft dst = ip->ip_dst;
636 1.1 cgd cp = (u_char *)(ip + 1);
637 1.1 cgd cnt = (ip->ip_hl << 2) - sizeof (struct ip);
638 1.1 cgd for (; cnt > 0; cnt -= optlen, cp += optlen) {
639 1.1 cgd opt = cp[IPOPT_OPTVAL];
640 1.1 cgd if (opt == IPOPT_EOL)
641 1.1 cgd break;
642 1.1 cgd if (opt == IPOPT_NOP)
643 1.1 cgd optlen = 1;
644 1.1 cgd else {
645 1.1 cgd optlen = cp[IPOPT_OLEN];
646 1.1 cgd if (optlen <= 0 || optlen > cnt) {
647 1.1 cgd code = &cp[IPOPT_OLEN] - (u_char *)ip;
648 1.1 cgd goto bad;
649 1.1 cgd }
650 1.1 cgd }
651 1.1 cgd switch (opt) {
652 1.1 cgd
653 1.1 cgd default:
654 1.1 cgd break;
655 1.1 cgd
656 1.1 cgd /*
657 1.1 cgd * Source routing with record.
658 1.1 cgd * Find interface with current destination address.
659 1.1 cgd * If none on this machine then drop if strictly routed,
660 1.1 cgd * or do nothing if loosely routed.
661 1.1 cgd * Record interface address and bring up next address
662 1.1 cgd * component. If strictly routed make sure next
663 1.1 cgd * address is on directly accessible net.
664 1.1 cgd */
665 1.1 cgd case IPOPT_LSRR:
666 1.1 cgd case IPOPT_SSRR:
667 1.1 cgd if ((off = cp[IPOPT_OFFSET]) < IPOPT_MINOFF) {
668 1.1 cgd code = &cp[IPOPT_OFFSET] - (u_char *)ip;
669 1.1 cgd goto bad;
670 1.1 cgd }
671 1.1 cgd ipaddr.sin_addr = ip->ip_dst;
672 1.19 mycroft ia = ifatoia(ifa_ifwithaddr(sintosa(&ipaddr)));
673 1.1 cgd if (ia == 0) {
674 1.1 cgd if (opt == IPOPT_SSRR) {
675 1.1 cgd type = ICMP_UNREACH;
676 1.1 cgd code = ICMP_UNREACH_SRCFAIL;
677 1.1 cgd goto bad;
678 1.1 cgd }
679 1.1 cgd /*
680 1.1 cgd * Loose routing, and not at next destination
681 1.1 cgd * yet; nothing to do except forward.
682 1.1 cgd */
683 1.1 cgd break;
684 1.1 cgd }
685 1.1 cgd off--; /* 0 origin */
686 1.1 cgd if (off > optlen - sizeof(struct in_addr)) {
687 1.1 cgd /*
688 1.1 cgd * End of source route. Should be for us.
689 1.1 cgd */
690 1.1 cgd save_rte(cp, ip->ip_src);
691 1.1 cgd break;
692 1.1 cgd }
693 1.1 cgd /*
694 1.1 cgd * locate outgoing interface
695 1.1 cgd */
696 1.1 cgd bcopy((caddr_t)(cp + off), (caddr_t)&ipaddr.sin_addr,
697 1.1 cgd sizeof(ipaddr.sin_addr));
698 1.1 cgd if (opt == IPOPT_SSRR) {
699 1.1 cgd #define INA struct in_ifaddr *
700 1.1 cgd #define SA struct sockaddr *
701 1.1 cgd if ((ia = (INA)ifa_ifwithdstaddr((SA)&ipaddr)) == 0)
702 1.13 mycroft ia = (INA)ifa_ifwithnet((SA)&ipaddr);
703 1.1 cgd } else
704 1.1 cgd ia = ip_rtaddr(ipaddr.sin_addr);
705 1.1 cgd if (ia == 0) {
706 1.1 cgd type = ICMP_UNREACH;
707 1.1 cgd code = ICMP_UNREACH_SRCFAIL;
708 1.1 cgd goto bad;
709 1.1 cgd }
710 1.1 cgd ip->ip_dst = ipaddr.sin_addr;
711 1.20 mycroft bcopy((caddr_t)&ia->ia_addr.sin_addr,
712 1.1 cgd (caddr_t)(cp + off), sizeof(struct in_addr));
713 1.1 cgd cp[IPOPT_OFFSET] += sizeof(struct in_addr);
714 1.13 mycroft /*
715 1.13 mycroft * Let ip_intr's mcast routing check handle mcast pkts
716 1.13 mycroft */
717 1.18 mycroft forward = !IN_MULTICAST(ip->ip_dst.s_addr);
718 1.1 cgd break;
719 1.1 cgd
720 1.1 cgd case IPOPT_RR:
721 1.1 cgd if ((off = cp[IPOPT_OFFSET]) < IPOPT_MINOFF) {
722 1.1 cgd code = &cp[IPOPT_OFFSET] - (u_char *)ip;
723 1.1 cgd goto bad;
724 1.1 cgd }
725 1.1 cgd /*
726 1.1 cgd * If no space remains, ignore.
727 1.1 cgd */
728 1.1 cgd off--; /* 0 origin */
729 1.1 cgd if (off > optlen - sizeof(struct in_addr))
730 1.1 cgd break;
731 1.1 cgd bcopy((caddr_t)(&ip->ip_dst), (caddr_t)&ipaddr.sin_addr,
732 1.1 cgd sizeof(ipaddr.sin_addr));
733 1.1 cgd /*
734 1.1 cgd * locate outgoing interface; if we're the destination,
735 1.1 cgd * use the incoming interface (should be same).
736 1.1 cgd */
737 1.1 cgd if ((ia = (INA)ifa_ifwithaddr((SA)&ipaddr)) == 0 &&
738 1.1 cgd (ia = ip_rtaddr(ipaddr.sin_addr)) == 0) {
739 1.1 cgd type = ICMP_UNREACH;
740 1.1 cgd code = ICMP_UNREACH_HOST;
741 1.1 cgd goto bad;
742 1.1 cgd }
743 1.20 mycroft bcopy((caddr_t)&ia->ia_addr.sin_addr,
744 1.1 cgd (caddr_t)(cp + off), sizeof(struct in_addr));
745 1.1 cgd cp[IPOPT_OFFSET] += sizeof(struct in_addr);
746 1.1 cgd break;
747 1.1 cgd
748 1.1 cgd case IPOPT_TS:
749 1.1 cgd code = cp - (u_char *)ip;
750 1.1 cgd ipt = (struct ip_timestamp *)cp;
751 1.1 cgd if (ipt->ipt_len < 5)
752 1.1 cgd goto bad;
753 1.15 cgd if (ipt->ipt_ptr > ipt->ipt_len - sizeof (int32_t)) {
754 1.1 cgd if (++ipt->ipt_oflw == 0)
755 1.1 cgd goto bad;
756 1.1 cgd break;
757 1.1 cgd }
758 1.1 cgd sin = (struct in_addr *)(cp + ipt->ipt_ptr - 1);
759 1.1 cgd switch (ipt->ipt_flg) {
760 1.1 cgd
761 1.1 cgd case IPOPT_TS_TSONLY:
762 1.1 cgd break;
763 1.1 cgd
764 1.1 cgd case IPOPT_TS_TSANDADDR:
765 1.1 cgd if (ipt->ipt_ptr + sizeof(n_time) +
766 1.1 cgd sizeof(struct in_addr) > ipt->ipt_len)
767 1.1 cgd goto bad;
768 1.13 mycroft ipaddr.sin_addr = dst;
769 1.13 mycroft ia = (INA)ifaof_ifpforaddr((SA)&ipaddr,
770 1.13 mycroft m->m_pkthdr.rcvif);
771 1.13 mycroft if (ia == 0)
772 1.13 mycroft continue;
773 1.20 mycroft bcopy((caddr_t)&ia->ia_addr.sin_addr,
774 1.1 cgd (caddr_t)sin, sizeof(struct in_addr));
775 1.1 cgd ipt->ipt_ptr += sizeof(struct in_addr);
776 1.1 cgd break;
777 1.1 cgd
778 1.1 cgd case IPOPT_TS_PRESPEC:
779 1.1 cgd if (ipt->ipt_ptr + sizeof(n_time) +
780 1.1 cgd sizeof(struct in_addr) > ipt->ipt_len)
781 1.1 cgd goto bad;
782 1.1 cgd bcopy((caddr_t)sin, (caddr_t)&ipaddr.sin_addr,
783 1.1 cgd sizeof(struct in_addr));
784 1.1 cgd if (ifa_ifwithaddr((SA)&ipaddr) == 0)
785 1.1 cgd continue;
786 1.1 cgd ipt->ipt_ptr += sizeof(struct in_addr);
787 1.1 cgd break;
788 1.1 cgd
789 1.1 cgd default:
790 1.1 cgd goto bad;
791 1.1 cgd }
792 1.1 cgd ntime = iptime();
793 1.1 cgd bcopy((caddr_t)&ntime, (caddr_t)cp + ipt->ipt_ptr - 1,
794 1.1 cgd sizeof(n_time));
795 1.1 cgd ipt->ipt_ptr += sizeof(n_time);
796 1.1 cgd }
797 1.1 cgd }
798 1.1 cgd if (forward) {
799 1.1 cgd ip_forward(m, 1);
800 1.1 cgd return (1);
801 1.13 mycroft }
802 1.13 mycroft return (0);
803 1.1 cgd bad:
804 1.13 mycroft ip->ip_len -= ip->ip_hl << 2; /* XXX icmp_error adds in hdr length */
805 1.13 mycroft icmp_error(m, type, code, 0, 0);
806 1.13 mycroft ipstat.ips_badoptions++;
807 1.1 cgd return (1);
808 1.1 cgd }
809 1.1 cgd
810 1.1 cgd /*
811 1.1 cgd * Given address of next destination (final or next hop),
812 1.1 cgd * return internet address info of interface to be used to get there.
813 1.1 cgd */
814 1.1 cgd struct in_ifaddr *
815 1.1 cgd ip_rtaddr(dst)
816 1.1 cgd struct in_addr dst;
817 1.1 cgd {
818 1.1 cgd register struct sockaddr_in *sin;
819 1.1 cgd
820 1.19 mycroft sin = satosin(&ipforward_rt.ro_dst);
821 1.1 cgd
822 1.1 cgd if (ipforward_rt.ro_rt == 0 || dst.s_addr != sin->sin_addr.s_addr) {
823 1.1 cgd if (ipforward_rt.ro_rt) {
824 1.1 cgd RTFREE(ipforward_rt.ro_rt);
825 1.1 cgd ipforward_rt.ro_rt = 0;
826 1.1 cgd }
827 1.1 cgd sin->sin_family = AF_INET;
828 1.1 cgd sin->sin_len = sizeof(*sin);
829 1.1 cgd sin->sin_addr = dst;
830 1.1 cgd
831 1.1 cgd rtalloc(&ipforward_rt);
832 1.1 cgd }
833 1.1 cgd if (ipforward_rt.ro_rt == 0)
834 1.1 cgd return ((struct in_ifaddr *)0);
835 1.19 mycroft return (ifatoia(ipforward_rt.ro_rt->rt_ifa));
836 1.1 cgd }
837 1.1 cgd
838 1.1 cgd /*
839 1.1 cgd * Save incoming source route for use in replies,
840 1.1 cgd * to be picked up later by ip_srcroute if the receiver is interested.
841 1.1 cgd */
842 1.13 mycroft void
843 1.1 cgd save_rte(option, dst)
844 1.1 cgd u_char *option;
845 1.1 cgd struct in_addr dst;
846 1.1 cgd {
847 1.1 cgd unsigned olen;
848 1.1 cgd
849 1.1 cgd olen = option[IPOPT_OLEN];
850 1.1 cgd #ifdef DIAGNOSTIC
851 1.1 cgd if (ipprintfs)
852 1.1 cgd printf("save_rte: olen %d\n", olen);
853 1.1 cgd #endif
854 1.1 cgd if (olen > sizeof(ip_srcrt) - (1 + sizeof(dst)))
855 1.1 cgd return;
856 1.1 cgd bcopy((caddr_t)option, (caddr_t)ip_srcrt.srcopt, olen);
857 1.1 cgd ip_nhops = (olen - IPOPT_OFFSET - 1) / sizeof(struct in_addr);
858 1.1 cgd ip_srcrt.dst = dst;
859 1.1 cgd }
860 1.1 cgd
861 1.1 cgd /*
862 1.1 cgd * Retrieve incoming source route for use in replies,
863 1.1 cgd * in the same form used by setsockopt.
864 1.1 cgd * The first hop is placed before the options, will be removed later.
865 1.1 cgd */
866 1.1 cgd struct mbuf *
867 1.1 cgd ip_srcroute()
868 1.1 cgd {
869 1.1 cgd register struct in_addr *p, *q;
870 1.1 cgd register struct mbuf *m;
871 1.1 cgd
872 1.1 cgd if (ip_nhops == 0)
873 1.1 cgd return ((struct mbuf *)0);
874 1.1 cgd m = m_get(M_DONTWAIT, MT_SOOPTS);
875 1.1 cgd if (m == 0)
876 1.1 cgd return ((struct mbuf *)0);
877 1.1 cgd
878 1.13 mycroft #define OPTSIZ (sizeof(ip_srcrt.nop) + sizeof(ip_srcrt.srcopt))
879 1.1 cgd
880 1.1 cgd /* length is (nhops+1)*sizeof(addr) + sizeof(nop + srcrt header) */
881 1.1 cgd m->m_len = ip_nhops * sizeof(struct in_addr) + sizeof(struct in_addr) +
882 1.1 cgd OPTSIZ;
883 1.1 cgd #ifdef DIAGNOSTIC
884 1.1 cgd if (ipprintfs)
885 1.1 cgd printf("ip_srcroute: nhops %d mlen %d", ip_nhops, m->m_len);
886 1.1 cgd #endif
887 1.1 cgd
888 1.1 cgd /*
889 1.1 cgd * First save first hop for return route
890 1.1 cgd */
891 1.1 cgd p = &ip_srcrt.route[ip_nhops - 1];
892 1.1 cgd *(mtod(m, struct in_addr *)) = *p--;
893 1.1 cgd #ifdef DIAGNOSTIC
894 1.1 cgd if (ipprintfs)
895 1.1 cgd printf(" hops %lx", ntohl(mtod(m, struct in_addr *)->s_addr));
896 1.1 cgd #endif
897 1.1 cgd
898 1.1 cgd /*
899 1.1 cgd * Copy option fields and padding (nop) to mbuf.
900 1.1 cgd */
901 1.1 cgd ip_srcrt.nop = IPOPT_NOP;
902 1.1 cgd ip_srcrt.srcopt[IPOPT_OFFSET] = IPOPT_MINOFF;
903 1.1 cgd bcopy((caddr_t)&ip_srcrt.nop,
904 1.1 cgd mtod(m, caddr_t) + sizeof(struct in_addr), OPTSIZ);
905 1.1 cgd q = (struct in_addr *)(mtod(m, caddr_t) +
906 1.1 cgd sizeof(struct in_addr) + OPTSIZ);
907 1.1 cgd #undef OPTSIZ
908 1.1 cgd /*
909 1.1 cgd * Record return path as an IP source route,
910 1.1 cgd * reversing the path (pointers are now aligned).
911 1.1 cgd */
912 1.1 cgd while (p >= ip_srcrt.route) {
913 1.1 cgd #ifdef DIAGNOSTIC
914 1.1 cgd if (ipprintfs)
915 1.1 cgd printf(" %lx", ntohl(q->s_addr));
916 1.1 cgd #endif
917 1.1 cgd *q++ = *p--;
918 1.1 cgd }
919 1.1 cgd /*
920 1.1 cgd * Last hop goes to final destination.
921 1.1 cgd */
922 1.1 cgd *q = ip_srcrt.dst;
923 1.1 cgd #ifdef DIAGNOSTIC
924 1.1 cgd if (ipprintfs)
925 1.1 cgd printf(" %lx\n", ntohl(q->s_addr));
926 1.1 cgd #endif
927 1.1 cgd return (m);
928 1.1 cgd }
929 1.1 cgd
930 1.1 cgd /*
931 1.1 cgd * Strip out IP options, at higher
932 1.1 cgd * level protocol in the kernel.
933 1.1 cgd * Second argument is buffer to which options
934 1.1 cgd * will be moved, and return value is their length.
935 1.1 cgd * XXX should be deleted; last arg currently ignored.
936 1.1 cgd */
937 1.8 mycroft void
938 1.1 cgd ip_stripoptions(m, mopt)
939 1.1 cgd register struct mbuf *m;
940 1.1 cgd struct mbuf *mopt;
941 1.1 cgd {
942 1.1 cgd register int i;
943 1.1 cgd struct ip *ip = mtod(m, struct ip *);
944 1.1 cgd register caddr_t opts;
945 1.1 cgd int olen;
946 1.1 cgd
947 1.1 cgd olen = (ip->ip_hl<<2) - sizeof (struct ip);
948 1.1 cgd opts = (caddr_t)(ip + 1);
949 1.1 cgd i = m->m_len - (sizeof (struct ip) + olen);
950 1.1 cgd bcopy(opts + olen, opts, (unsigned)i);
951 1.1 cgd m->m_len -= olen;
952 1.1 cgd if (m->m_flags & M_PKTHDR)
953 1.1 cgd m->m_pkthdr.len -= olen;
954 1.1 cgd ip->ip_hl = sizeof(struct ip) >> 2;
955 1.1 cgd }
956 1.1 cgd
/*
 * Errno value for each control command, indexed by command number
 * (the table has PRC_NCMDS slots; slots past the last initializer are
 * zero-filled by the language).
 * NOTE(review): the PRC_* name that goes with each index is defined
 * outside this chunk -- confirm before relying on a particular slot.
 */
int inetctlerrmap[PRC_NCMDS] = {
	0,			/*  0 */
	0,			/*  1 */
	0,			/*  2 */
	0,			/*  3 */
	0,			/*  4 */
	EMSGSIZE,		/*  5 */
	EHOSTDOWN,		/*  6 */
	EHOSTUNREACH,		/*  7 */
	EHOSTUNREACH,		/*  8 */
	EHOSTUNREACH,		/*  9 */
	ECONNREFUSED,		/* 10 */
	ECONNREFUSED,		/* 11 */
	EMSGSIZE,		/* 12 */
	EHOSTUNREACH,		/* 13 */
	0,			/* 14 */
	0,			/* 15 */
	0,			/* 16 */
	0,			/* 17 */
	0,			/* 18 */
	0,			/* 19 */
	ENOPROTOOPT		/* 20 */
};
965 1.1 cgd
966 1.1 cgd /*
967 1.1 cgd * Forward a packet. If some error occurs return the sender
968 1.1 cgd * an icmp packet. Note we can't always generate a meaningful
969 1.1 cgd * icmp message because icmp doesn't have a large enough repertoire
970 1.1 cgd * of codes and types.
971 1.1 cgd *
972 1.1 cgd * If not forwarding, just drop the packet. This could be confusing
973 1.1 cgd * if ipforwarding was zero but some routing protocol was advancing
974 1.1 cgd * us as a gateway to somewhere. However, we must let the routing
975 1.1 cgd * protocol deal with that.
976 1.1 cgd *
977 1.1 cgd * The srcrt parameter indicates whether the packet is being forwarded
978 1.1 cgd * via a source route.
979 1.1 cgd */
980 1.13 mycroft void
981 1.1 cgd ip_forward(m, srcrt)
982 1.1 cgd struct mbuf *m;
983 1.1 cgd int srcrt;
984 1.1 cgd {
985 1.1 cgd register struct ip *ip = mtod(m, struct ip *);
986 1.1 cgd register struct sockaddr_in *sin;
987 1.1 cgd register struct rtentry *rt;
988 1.1 cgd int error, type = 0, code;
989 1.1 cgd struct mbuf *mcopy;
990 1.13 mycroft n_long dest;
991 1.13 mycroft struct ifnet *destifp;
992 1.1 cgd
993 1.13 mycroft dest = 0;
994 1.1 cgd #ifdef DIAGNOSTIC
995 1.1 cgd if (ipprintfs)
996 1.1 cgd printf("forward: src %x dst %x ttl %x\n", ip->ip_src,
997 1.1 cgd ip->ip_dst, ip->ip_ttl);
998 1.1 cgd #endif
999 1.1 cgd if (m->m_flags & M_BCAST || in_canforward(ip->ip_dst) == 0) {
1000 1.1 cgd ipstat.ips_cantforward++;
1001 1.1 cgd m_freem(m);
1002 1.1 cgd return;
1003 1.1 cgd }
1004 1.1 cgd HTONS(ip->ip_id);
1005 1.1 cgd if (ip->ip_ttl <= IPTTLDEC) {
1006 1.13 mycroft icmp_error(m, ICMP_TIMXCEED, ICMP_TIMXCEED_INTRANS, dest, 0);
1007 1.1 cgd return;
1008 1.1 cgd }
1009 1.1 cgd ip->ip_ttl -= IPTTLDEC;
1010 1.1 cgd
1011 1.19 mycroft sin = satosin(&ipforward_rt.ro_dst);
1012 1.1 cgd if ((rt = ipforward_rt.ro_rt) == 0 ||
1013 1.1 cgd ip->ip_dst.s_addr != sin->sin_addr.s_addr) {
1014 1.1 cgd if (ipforward_rt.ro_rt) {
1015 1.1 cgd RTFREE(ipforward_rt.ro_rt);
1016 1.1 cgd ipforward_rt.ro_rt = 0;
1017 1.1 cgd }
1018 1.1 cgd sin->sin_family = AF_INET;
1019 1.1 cgd sin->sin_len = sizeof(*sin);
1020 1.1 cgd sin->sin_addr = ip->ip_dst;
1021 1.1 cgd
1022 1.1 cgd rtalloc(&ipforward_rt);
1023 1.1 cgd if (ipforward_rt.ro_rt == 0) {
1024 1.13 mycroft icmp_error(m, ICMP_UNREACH, ICMP_UNREACH_HOST, dest, 0);
1025 1.1 cgd return;
1026 1.1 cgd }
1027 1.1 cgd rt = ipforward_rt.ro_rt;
1028 1.1 cgd }
1029 1.1 cgd
1030 1.1 cgd /*
1031 1.1 cgd * Save at most 64 bytes of the packet in case
1032 1.1 cgd * we need to generate an ICMP message to the src.
1033 1.1 cgd */
1034 1.1 cgd mcopy = m_copy(m, 0, imin((int)ip->ip_len, 64));
1035 1.1 cgd
1036 1.1 cgd /*
1037 1.1 cgd * If forwarding packet using same interface that it came in on,
1038 1.1 cgd * perhaps should send a redirect to sender to shortcut a hop.
1039 1.1 cgd * Only send redirect if source is sending directly to us,
1040 1.1 cgd * and if packet was not source routed (or has any options).
1041 1.1 cgd * Also, don't send redirect if forwarding using a default route
1042 1.1 cgd * or a route modified by a redirect.
1043 1.1 cgd */
1044 1.1 cgd if (rt->rt_ifp == m->m_pkthdr.rcvif &&
1045 1.1 cgd (rt->rt_flags & (RTF_DYNAMIC|RTF_MODIFIED)) == 0 &&
1046 1.1 cgd satosin(rt_key(rt))->sin_addr.s_addr != 0 &&
1047 1.1 cgd ipsendredirects && !srcrt) {
1048 1.19 mycroft if (rt->rt_ifa &&
1049 1.19 mycroft (ip->ip_src.s_addr & ifatoia(rt->rt_ifa)->ia_subnetmask) ==
1050 1.19 mycroft ifatoia(rt->rt_ifa)->ia_subnet) {
1051 1.1 cgd if (rt->rt_flags & RTF_GATEWAY)
1052 1.13 mycroft dest = satosin(rt->rt_gateway)->sin_addr.s_addr;
1053 1.1 cgd else
1054 1.13 mycroft dest = ip->ip_dst.s_addr;
1055 1.13 mycroft /* Router requirements says to only send host redirects */
1056 1.1 cgd type = ICMP_REDIRECT;
1057 1.13 mycroft code = ICMP_REDIRECT_HOST;
1058 1.1 cgd #ifdef DIAGNOSTIC
1059 1.1 cgd if (ipprintfs)
1060 1.15 cgd printf("redirect (%d) to %lx\n", code, (u_int32_t)dest);
1061 1.1 cgd #endif
1062 1.1 cgd }
1063 1.1 cgd }
1064 1.1 cgd
1065 1.13 mycroft error = ip_output(m, (struct mbuf *)0, &ipforward_rt, IP_FORWARDING
1066 1.9 mycroft #ifdef DIRECTED_BROADCAST
1067 1.13 mycroft | IP_ALLOWBROADCAST
1068 1.9 mycroft #endif
1069 1.13 mycroft , 0);
1070 1.1 cgd if (error)
1071 1.1 cgd ipstat.ips_cantforward++;
1072 1.1 cgd else {
1073 1.1 cgd ipstat.ips_forward++;
1074 1.1 cgd if (type)
1075 1.1 cgd ipstat.ips_redirectsent++;
1076 1.1 cgd else {
1077 1.1 cgd if (mcopy)
1078 1.1 cgd m_freem(mcopy);
1079 1.1 cgd return;
1080 1.1 cgd }
1081 1.1 cgd }
1082 1.1 cgd if (mcopy == NULL)
1083 1.1 cgd return;
1084 1.13 mycroft destifp = NULL;
1085 1.13 mycroft
1086 1.1 cgd switch (error) {
1087 1.1 cgd
1088 1.1 cgd case 0: /* forwarded, but need redirect */
1089 1.1 cgd /* type, code set above */
1090 1.1 cgd break;
1091 1.1 cgd
1092 1.1 cgd case ENETUNREACH: /* shouldn't happen, checked above */
1093 1.1 cgd case EHOSTUNREACH:
1094 1.1 cgd case ENETDOWN:
1095 1.1 cgd case EHOSTDOWN:
1096 1.1 cgd default:
1097 1.1 cgd type = ICMP_UNREACH;
1098 1.1 cgd code = ICMP_UNREACH_HOST;
1099 1.1 cgd break;
1100 1.1 cgd
1101 1.1 cgd case EMSGSIZE:
1102 1.1 cgd type = ICMP_UNREACH;
1103 1.1 cgd code = ICMP_UNREACH_NEEDFRAG;
1104 1.13 mycroft if (ipforward_rt.ro_rt)
1105 1.13 mycroft destifp = ipforward_rt.ro_rt->rt_ifp;
1106 1.1 cgd ipstat.ips_cantfrag++;
1107 1.1 cgd break;
1108 1.1 cgd
1109 1.1 cgd case ENOBUFS:
1110 1.1 cgd type = ICMP_SOURCEQUENCH;
1111 1.1 cgd code = 0;
1112 1.1 cgd break;
1113 1.1 cgd }
1114 1.13 mycroft icmp_error(mcopy, type, code, dest, destifp);
1115 1.13 mycroft }
1116 1.13 mycroft
1117 1.13 mycroft int
1118 1.13 mycroft ip_sysctl(name, namelen, oldp, oldlenp, newp, newlen)
1119 1.13 mycroft int *name;
1120 1.13 mycroft u_int namelen;
1121 1.13 mycroft void *oldp;
1122 1.13 mycroft size_t *oldlenp;
1123 1.13 mycroft void *newp;
1124 1.13 mycroft size_t newlen;
1125 1.13 mycroft {
1126 1.13 mycroft /* All sysctl names at this level are terminal. */
1127 1.13 mycroft if (namelen != 1)
1128 1.13 mycroft return (ENOTDIR);
1129 1.13 mycroft
1130 1.13 mycroft switch (name[0]) {
1131 1.13 mycroft case IPCTL_FORWARDING:
1132 1.13 mycroft return (sysctl_int(oldp, oldlenp, newp, newlen, &ipforwarding));
1133 1.13 mycroft case IPCTL_SENDREDIRECTS:
1134 1.13 mycroft return (sysctl_int(oldp, oldlenp, newp, newlen,
1135 1.13 mycroft &ipsendredirects));
1136 1.13 mycroft case IPCTL_DEFTTL:
1137 1.13 mycroft return (sysctl_int(oldp, oldlenp, newp, newlen, &ip_defttl));
1138 1.13 mycroft #ifdef notyet
1139 1.13 mycroft case IPCTL_DEFMTU:
1140 1.13 mycroft return (sysctl_int(oldp, oldlenp, newp, newlen, &ip_mtu));
1141 1.13 mycroft #endif
1142 1.13 mycroft default:
1143 1.13 mycroft return (EOPNOTSUPP);
1144 1.13 mycroft }
1145 1.13 mycroft /* NOTREACHED */
1146 1.1 cgd }
1147