ip_input.c revision 1.10 1 1.1 cgd /*
2 1.1 cgd * Copyright (c) 1982, 1986, 1988 Regents of the University of California.
3 1.1 cgd * All rights reserved.
4 1.1 cgd *
5 1.1 cgd * Redistribution and use in source and binary forms, with or without
6 1.1 cgd * modification, are permitted provided that the following conditions
7 1.1 cgd * are met:
8 1.1 cgd * 1. Redistributions of source code must retain the above copyright
9 1.1 cgd * notice, this list of conditions and the following disclaimer.
10 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
11 1.1 cgd * notice, this list of conditions and the following disclaimer in the
12 1.1 cgd * documentation and/or other materials provided with the distribution.
13 1.1 cgd * 3. All advertising materials mentioning features or use of this software
14 1.1 cgd * must display the following acknowledgement:
15 1.1 cgd * This product includes software developed by the University of
16 1.1 cgd * California, Berkeley and its contributors.
17 1.1 cgd * 4. Neither the name of the University nor the names of its contributors
18 1.1 cgd * may be used to endorse or promote products derived from this software
19 1.1 cgd * without specific prior written permission.
20 1.1 cgd *
21 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
22 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
26 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
27 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
28 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
29 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
30 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31 1.1 cgd * SUCH DAMAGE.
32 1.1 cgd *
33 1.3 cgd * from: @(#)ip_input.c 7.19 (Berkeley) 5/25/91
34 1.10 brezak * $Id: ip_input.c,v 1.10 1994/01/29 11:58:01 brezak Exp $
35 1.1 cgd */
36 1.1 cgd
37 1.5 mycroft #include <sys/param.h>
38 1.5 mycroft #include <sys/systm.h>
39 1.5 mycroft #include <sys/malloc.h>
40 1.5 mycroft #include <sys/mbuf.h>
41 1.5 mycroft #include <sys/domain.h>
42 1.5 mycroft #include <sys/protosw.h>
43 1.5 mycroft #include <sys/socket.h>
44 1.5 mycroft #include <sys/errno.h>
45 1.5 mycroft #include <sys/time.h>
46 1.5 mycroft #include <sys/kernel.h>
47 1.1 cgd
48 1.5 mycroft #include <net/if.h>
49 1.5 mycroft #include <net/route.h>
50 1.1 cgd
51 1.5 mycroft #include <netinet/in.h>
52 1.5 mycroft #include <netinet/in_systm.h>
53 1.5 mycroft #include <netinet/ip.h>
54 1.5 mycroft #include <netinet/in_pcb.h>
55 1.5 mycroft #include <netinet/in_var.h>
56 1.5 mycroft #include <netinet/ip_var.h>
57 1.5 mycroft #include <netinet/ip_icmp.h>
58 1.8 mycroft #include <netinet/ip_mroute.h>
59 1.1 cgd
60 1.1 cgd #ifndef IPFORWARDING
61 1.1 cgd #ifdef GATEWAY
62 1.1 cgd #define IPFORWARDING 1 /* forward IP packets not for us */
63 1.1 cgd #else /* GATEWAY */
64 1.1 cgd #define IPFORWARDING 0 /* don't forward IP packets not for us */
65 1.1 cgd #endif /* GATEWAY */
66 1.1 cgd #endif /* IPFORWARDING */
67 1.1 cgd #ifndef IPSENDREDIRECTS
68 1.1 cgd #define IPSENDREDIRECTS 1
69 1.1 cgd #endif
70 1.1 cgd int ipforwarding = IPFORWARDING;
71 1.1 cgd int ipsendredirects = IPSENDREDIRECTS;
72 1.1 cgd #ifdef DIAGNOSTIC
73 1.1 cgd int ipprintfs = 0;
74 1.1 cgd #endif
75 1.1 cgd
76 1.1 cgd extern struct domain inetdomain;
77 1.1 cgd extern struct protosw inetsw[];
78 1.1 cgd u_char ip_protox[IPPROTO_MAX];
79 1.1 cgd int ipqmaxlen = IFQ_MAXLEN;
80 1.1 cgd struct in_ifaddr *in_ifaddr; /* first inet address */
81 1.1 cgd
82 1.1 cgd /*
83 1.1 cgd * We need to save the IP options in case a protocol wants to respond
84 1.1 cgd * to an incoming packet over the same route if the packet got here
85 1.1 cgd * using IP source routing. This allows connection establishment and
86 1.1 cgd * maintenance when the remote end is on a network that is not known
87 1.1 cgd * to us.
88 1.1 cgd */
89 1.1 cgd int ip_nhops = 0;
90 1.1 cgd static struct ip_srcrt {
91 1.1 cgd struct in_addr dst; /* final destination */
92 1.1 cgd char nop; /* one NOP to align */
93 1.1 cgd char srcopt[IPOPT_OFFSET + 1]; /* OPTVAL, OLEN and OFFSET */
94 1.1 cgd struct in_addr route[MAX_IPOPTLEN/sizeof(struct in_addr)];
95 1.1 cgd } ip_srcrt;
96 1.1 cgd
97 1.1 cgd #ifdef GATEWAY
98 1.1 cgd extern int if_index;
99 1.1 cgd u_long *ip_ifmatrix;
100 1.1 cgd #endif
101 1.1 cgd
102 1.8 mycroft static void ip_forward __P((struct mbuf *, int));
103 1.8 mycroft static void save_rte __P((u_char *, struct in_addr));
104 1.8 mycroft
105 1.1 cgd /*
106 1.1 cgd * IP initialization: fill in IP protocol switch table.
107 1.1 cgd * All protocols not implemented in kernel go to raw IP protocol handler.
108 1.1 cgd */
109 1.8 mycroft void
110 1.1 cgd ip_init()
111 1.1 cgd {
112 1.1 cgd register struct protosw *pr;
113 1.1 cgd register int i;
114 1.1 cgd
115 1.1 cgd pr = pffindproto(PF_INET, IPPROTO_RAW, SOCK_RAW);
116 1.1 cgd if (pr == 0)
117 1.1 cgd panic("ip_init");
118 1.1 cgd for (i = 0; i < IPPROTO_MAX; i++)
119 1.1 cgd ip_protox[i] = pr - inetsw;
120 1.1 cgd for (pr = inetdomain.dom_protosw;
121 1.1 cgd pr < inetdomain.dom_protoswNPROTOSW; pr++)
122 1.1 cgd if (pr->pr_domain->dom_family == PF_INET &&
123 1.1 cgd pr->pr_protocol && pr->pr_protocol != IPPROTO_RAW)
124 1.1 cgd ip_protox[pr->pr_protocol] = pr - inetsw;
125 1.1 cgd ipq.next = ipq.prev = &ipq;
126 1.1 cgd ip_id = time.tv_sec & 0xffff;
127 1.1 cgd ipintrq.ifq_maxlen = ipqmaxlen;
128 1.1 cgd #ifdef GATEWAY
129 1.1 cgd i = (if_index + 1) * (if_index + 1) * sizeof (u_long);
130 1.1 cgd if ((ip_ifmatrix = (u_long *) malloc(i, M_RTABLE, M_WAITOK)) == 0)
131 1.1 cgd panic("no memory for ip_ifmatrix");
132 1.1 cgd #endif
133 1.1 cgd }
134 1.1 cgd
135 1.1 cgd struct ip *ip_reass();
136 1.1 cgd struct sockaddr_in ipaddr = { sizeof(ipaddr), AF_INET };
137 1.1 cgd struct route ipforward_rt;
138 1.1 cgd
139 1.1 cgd /*
140 1.1 cgd * Ip input routine. Checksum and byte swap header. If fragmented
141 1.1 cgd * try to reassemble. Process options. Pass to next level.
142 1.1 cgd */
143 1.8 mycroft void
144 1.1 cgd ipintr()
145 1.1 cgd {
146 1.1 cgd register struct ip *ip;
147 1.1 cgd register struct mbuf *m;
148 1.1 cgd register struct ipq *fp;
149 1.1 cgd register struct in_ifaddr *ia;
150 1.1 cgd int hlen, s;
151 1.2 cgd #ifdef PARANOID
152 1.2 cgd static int busy = 0;
153 1.1 cgd
154 1.2 cgd if (busy)
155 1.2 cgd panic("ipintr: called recursively\n");
156 1.2 cgd ++busy;
157 1.2 cgd #endif
158 1.1 cgd next:
159 1.1 cgd /*
160 1.1 cgd * Get next datagram off input queue and get IP header
161 1.1 cgd * in first mbuf.
162 1.1 cgd */
163 1.1 cgd s = splimp();
164 1.1 cgd IF_DEQUEUE(&ipintrq, m);
165 1.1 cgd splx(s);
166 1.2 cgd if (m == 0) {
167 1.2 cgd #ifdef PARANOID
168 1.2 cgd --busy;
169 1.2 cgd #endif
170 1.1 cgd return;
171 1.2 cgd }
172 1.1 cgd #ifdef DIAGNOSTIC
173 1.1 cgd if ((m->m_flags & M_PKTHDR) == 0)
174 1.1 cgd panic("ipintr no HDR");
175 1.1 cgd #endif
176 1.1 cgd /*
177 1.1 cgd * If no IP addresses have been set yet but the interfaces
178 1.1 cgd * are receiving, can't do anything with incoming packets yet.
179 1.1 cgd */
180 1.1 cgd if (in_ifaddr == NULL)
181 1.1 cgd goto bad;
182 1.1 cgd ipstat.ips_total++;
183 1.1 cgd if (m->m_len < sizeof (struct ip) &&
184 1.1 cgd (m = m_pullup(m, sizeof (struct ip))) == 0) {
185 1.1 cgd ipstat.ips_toosmall++;
186 1.1 cgd goto next;
187 1.1 cgd }
188 1.1 cgd ip = mtod(m, struct ip *);
189 1.1 cgd hlen = ip->ip_hl << 2;
190 1.1 cgd if (hlen < sizeof(struct ip)) { /* minimum header length */
191 1.1 cgd ipstat.ips_badhlen++;
192 1.1 cgd goto bad;
193 1.1 cgd }
194 1.1 cgd if (hlen > m->m_len) {
195 1.1 cgd if ((m = m_pullup(m, hlen)) == 0) {
196 1.1 cgd ipstat.ips_badhlen++;
197 1.1 cgd goto next;
198 1.1 cgd }
199 1.1 cgd ip = mtod(m, struct ip *);
200 1.1 cgd }
201 1.1 cgd if (ip->ip_sum = in_cksum(m, hlen)) {
202 1.1 cgd ipstat.ips_badsum++;
203 1.1 cgd goto bad;
204 1.1 cgd }
205 1.1 cgd
206 1.1 cgd /*
207 1.1 cgd * Convert fields to host representation.
208 1.1 cgd */
209 1.1 cgd NTOHS(ip->ip_len);
210 1.1 cgd if (ip->ip_len < hlen) {
211 1.1 cgd ipstat.ips_badlen++;
212 1.1 cgd goto bad;
213 1.1 cgd }
214 1.1 cgd NTOHS(ip->ip_id);
215 1.1 cgd NTOHS(ip->ip_off);
216 1.1 cgd
217 1.1 cgd /*
218 1.1 cgd * Check that the amount of data in the buffers
219 1.1 cgd * is as at least much as the IP header would have us expect.
220 1.1 cgd * Trim mbufs if longer than we expect.
221 1.1 cgd * Drop packet if shorter than we expect.
222 1.1 cgd */
223 1.1 cgd if (m->m_pkthdr.len < ip->ip_len) {
224 1.1 cgd ipstat.ips_tooshort++;
225 1.1 cgd goto bad;
226 1.1 cgd }
227 1.1 cgd if (m->m_pkthdr.len > ip->ip_len) {
228 1.1 cgd if (m->m_len == m->m_pkthdr.len) {
229 1.1 cgd m->m_len = ip->ip_len;
230 1.1 cgd m->m_pkthdr.len = ip->ip_len;
231 1.1 cgd } else
232 1.1 cgd m_adj(m, ip->ip_len - m->m_pkthdr.len);
233 1.1 cgd }
234 1.1 cgd
235 1.1 cgd /*
236 1.1 cgd * Process options and, if not destined for us,
237 1.1 cgd * ship it on. ip_dooptions returns 1 when an
238 1.1 cgd * error was detected (causing an icmp message
239 1.1 cgd * to be sent and the original packet to be freed).
240 1.1 cgd */
241 1.1 cgd ip_nhops = 0; /* for source routed packets */
242 1.1 cgd if (hlen > sizeof (struct ip) && ip_dooptions(m))
243 1.1 cgd goto next;
244 1.1 cgd
245 1.1 cgd /*
246 1.1 cgd * Check our list of addresses, to see if the packet is for us.
247 1.1 cgd */
248 1.1 cgd for (ia = in_ifaddr; ia; ia = ia->ia_next) {
249 1.1 cgd #define satosin(sa) ((struct sockaddr_in *)(sa))
250 1.1 cgd
251 1.1 cgd if (IA_SIN(ia)->sin_addr.s_addr == ip->ip_dst.s_addr)
252 1.1 cgd goto ours;
253 1.1 cgd if (
254 1.1 cgd #ifdef DIRECTED_BROADCAST
255 1.1 cgd ia->ia_ifp == m->m_pkthdr.rcvif &&
256 1.1 cgd #endif
257 1.1 cgd (ia->ia_ifp->if_flags & IFF_BROADCAST)) {
258 1.1 cgd u_long t;
259 1.1 cgd
260 1.1 cgd if (satosin(&ia->ia_broadaddr)->sin_addr.s_addr ==
261 1.1 cgd ip->ip_dst.s_addr)
262 1.1 cgd goto ours;
263 1.1 cgd if (ip->ip_dst.s_addr == ia->ia_netbroadcast.s_addr)
264 1.1 cgd goto ours;
265 1.1 cgd /*
266 1.1 cgd * Look for all-0's host part (old broadcast addr),
267 1.1 cgd * either for subnet or net.
268 1.1 cgd */
269 1.1 cgd t = ntohl(ip->ip_dst.s_addr);
270 1.1 cgd if (t == ia->ia_subnet)
271 1.1 cgd goto ours;
272 1.1 cgd if (t == ia->ia_net)
273 1.1 cgd goto ours;
274 1.1 cgd }
275 1.1 cgd }
276 1.4 hpeyerl #ifdef MULTICAST
277 1.4 hpeyerl if (IN_MULTICAST(ntohl(ip->ip_dst.s_addr))) {
278 1.4 hpeyerl struct in_multi *inm;
279 1.4 hpeyerl #ifdef MROUTING
280 1.4 hpeyerl extern struct socket *ip_mrouter;
281 1.10 brezak
282 1.10 brezak if (m->m_flags & M_EXT) {
283 1.10 brezak if ((m = m_pullup(m, hlen)) == 0) {
284 1.10 brezak ipstat.ips_toosmall++;
285 1.10 brezak goto next;
286 1.10 brezak }
287 1.10 brezak ip = mtod(m, struct ip *);
288 1.10 brezak }
289 1.4 hpeyerl
290 1.4 hpeyerl if (ip_mrouter) {
291 1.4 hpeyerl /*
292 1.4 hpeyerl * If we are acting as a multicast router, all
293 1.4 hpeyerl * incoming multicast packets are passed to the
294 1.4 hpeyerl * kernel-level multicast forwarding function.
295 1.4 hpeyerl * The packet is returned (relatively) intact; if
296 1.4 hpeyerl * ip_mforward() returns a non-zero value, the packet
297 1.4 hpeyerl * must be discarded, else it may be accepted below.
298 1.4 hpeyerl *
299 1.4 hpeyerl * (The IP ident field is put in the same byte order
300 1.4 hpeyerl * as expected when ip_mforward() is called from
301 1.4 hpeyerl * ip_output().)
302 1.4 hpeyerl */
303 1.4 hpeyerl ip->ip_id = htons(ip->ip_id);
304 1.4 hpeyerl if (ip_mforward(ip, m->m_pkthdr.rcvif, m) != 0) {
305 1.4 hpeyerl m_freem(m);
306 1.4 hpeyerl goto next;
307 1.4 hpeyerl }
308 1.4 hpeyerl ip->ip_id = ntohs(ip->ip_id);
309 1.4 hpeyerl
310 1.4 hpeyerl /*
311 1.4 hpeyerl * The process-level routing demon needs to receive
312 1.4 hpeyerl * all multicast IGMP packets, whether or not this
313 1.4 hpeyerl * host belongs to their destination groups.
314 1.4 hpeyerl */
315 1.4 hpeyerl if (ip->ip_p == IPPROTO_IGMP)
316 1.4 hpeyerl goto ours;
317 1.4 hpeyerl }
318 1.4 hpeyerl #endif
319 1.4 hpeyerl /*
320 1.4 hpeyerl * See if we belong to the destination multicast group on the
321 1.4 hpeyerl * arrival interface.
322 1.4 hpeyerl */
323 1.4 hpeyerl IN_LOOKUP_MULTI(ip->ip_dst, m->m_pkthdr.rcvif, inm);
324 1.4 hpeyerl if (inm == NULL) {
325 1.4 hpeyerl m_freem(m);
326 1.4 hpeyerl goto next;
327 1.4 hpeyerl }
328 1.4 hpeyerl goto ours;
329 1.4 hpeyerl }
330 1.4 hpeyerl #endif
331 1.1 cgd if (ip->ip_dst.s_addr == (u_long)INADDR_BROADCAST)
332 1.1 cgd goto ours;
333 1.1 cgd if (ip->ip_dst.s_addr == INADDR_ANY)
334 1.1 cgd goto ours;
335 1.1 cgd
336 1.1 cgd /*
337 1.1 cgd * Not for us; forward if possible and desirable.
338 1.1 cgd */
339 1.1 cgd if (ipforwarding == 0) {
340 1.1 cgd ipstat.ips_cantforward++;
341 1.1 cgd m_freem(m);
342 1.1 cgd } else
343 1.1 cgd ip_forward(m, 0);
344 1.1 cgd goto next;
345 1.1 cgd
346 1.1 cgd ours:
347 1.1 cgd /*
348 1.1 cgd * If offset or IP_MF are set, must reassemble.
349 1.1 cgd * Otherwise, nothing need be done.
350 1.1 cgd * (We could look in the reassembly queue to see
351 1.1 cgd * if the packet was previously fragmented,
352 1.1 cgd * but it's not worth the time; just let them time out.)
353 1.1 cgd */
354 1.1 cgd if (ip->ip_off &~ IP_DF) {
355 1.1 cgd if (m->m_flags & M_EXT) { /* XXX */
356 1.1 cgd if ((m = m_pullup(m, sizeof (struct ip))) == 0) {
357 1.1 cgd ipstat.ips_toosmall++;
358 1.1 cgd goto next;
359 1.1 cgd }
360 1.1 cgd ip = mtod(m, struct ip *);
361 1.1 cgd }
362 1.1 cgd /*
363 1.1 cgd * Look for queue of fragments
364 1.1 cgd * of this datagram.
365 1.1 cgd */
366 1.1 cgd for (fp = ipq.next; fp != &ipq; fp = fp->next)
367 1.1 cgd if (ip->ip_id == fp->ipq_id &&
368 1.1 cgd ip->ip_src.s_addr == fp->ipq_src.s_addr &&
369 1.1 cgd ip->ip_dst.s_addr == fp->ipq_dst.s_addr &&
370 1.1 cgd ip->ip_p == fp->ipq_p)
371 1.1 cgd goto found;
372 1.1 cgd fp = 0;
373 1.1 cgd found:
374 1.1 cgd
375 1.1 cgd /*
376 1.1 cgd * Adjust ip_len to not reflect header,
377 1.1 cgd * set ip_mff if more fragments are expected,
378 1.1 cgd * convert offset of this to bytes.
379 1.1 cgd */
380 1.1 cgd ip->ip_len -= hlen;
381 1.1 cgd ((struct ipasfrag *)ip)->ipf_mff = 0;
382 1.1 cgd if (ip->ip_off & IP_MF)
383 1.1 cgd ((struct ipasfrag *)ip)->ipf_mff = 1;
384 1.1 cgd ip->ip_off <<= 3;
385 1.1 cgd
386 1.1 cgd /*
387 1.1 cgd * If datagram marked as having more fragments
388 1.1 cgd * or if this is not the first fragment,
389 1.1 cgd * attempt reassembly; if it succeeds, proceed.
390 1.1 cgd */
391 1.1 cgd if (((struct ipasfrag *)ip)->ipf_mff || ip->ip_off) {
392 1.1 cgd ipstat.ips_fragments++;
393 1.1 cgd ip = ip_reass((struct ipasfrag *)ip, fp);
394 1.1 cgd if (ip == 0)
395 1.1 cgd goto next;
396 1.1 cgd else
397 1.1 cgd ipstat.ips_reassembled++;
398 1.1 cgd m = dtom(ip);
399 1.1 cgd } else
400 1.1 cgd if (fp)
401 1.1 cgd ip_freef(fp);
402 1.1 cgd } else
403 1.1 cgd ip->ip_len -= hlen;
404 1.1 cgd
405 1.1 cgd /*
406 1.1 cgd * Switch out to protocol's input routine.
407 1.1 cgd */
408 1.1 cgd ipstat.ips_delivered++;
409 1.1 cgd (*inetsw[ip_protox[ip->ip_p]].pr_input)(m, hlen);
410 1.1 cgd goto next;
411 1.1 cgd bad:
412 1.1 cgd m_freem(m);
413 1.1 cgd goto next;
414 1.1 cgd }
415 1.1 cgd
416 1.1 cgd /*
417 1.1 cgd * Take incoming datagram fragment and try to
418 1.1 cgd * reassemble it into whole datagram. If a chain for
419 1.1 cgd * reassembly of this datagram already exists, then it
420 1.1 cgd * is given as fp; otherwise have to make a chain.
421 1.1 cgd */
422 1.1 cgd struct ip *
423 1.1 cgd ip_reass(ip, fp)
424 1.1 cgd register struct ipasfrag *ip;
425 1.1 cgd register struct ipq *fp;
426 1.1 cgd {
427 1.1 cgd register struct mbuf *m = dtom(ip);
428 1.1 cgd register struct ipasfrag *q;
429 1.1 cgd struct mbuf *t;
430 1.1 cgd int hlen = ip->ip_hl << 2;
431 1.1 cgd int i, next;
432 1.1 cgd
433 1.1 cgd /*
434 1.1 cgd * Presence of header sizes in mbufs
435 1.1 cgd * would confuse code below.
436 1.1 cgd */
437 1.1 cgd m->m_data += hlen;
438 1.1 cgd m->m_len -= hlen;
439 1.1 cgd
440 1.1 cgd /*
441 1.1 cgd * If first fragment to arrive, create a reassembly queue.
442 1.1 cgd */
443 1.1 cgd if (fp == 0) {
444 1.1 cgd if ((t = m_get(M_DONTWAIT, MT_FTABLE)) == NULL)
445 1.1 cgd goto dropfrag;
446 1.1 cgd fp = mtod(t, struct ipq *);
447 1.1 cgd insque(fp, &ipq);
448 1.1 cgd fp->ipq_ttl = IPFRAGTTL;
449 1.1 cgd fp->ipq_p = ip->ip_p;
450 1.1 cgd fp->ipq_id = ip->ip_id;
451 1.1 cgd fp->ipq_next = fp->ipq_prev = (struct ipasfrag *)fp;
452 1.1 cgd fp->ipq_src = ((struct ip *)ip)->ip_src;
453 1.1 cgd fp->ipq_dst = ((struct ip *)ip)->ip_dst;
454 1.1 cgd q = (struct ipasfrag *)fp;
455 1.1 cgd goto insert;
456 1.1 cgd }
457 1.1 cgd
458 1.1 cgd /*
459 1.1 cgd * Find a segment which begins after this one does.
460 1.1 cgd */
461 1.1 cgd for (q = fp->ipq_next; q != (struct ipasfrag *)fp; q = q->ipf_next)
462 1.1 cgd if (q->ip_off > ip->ip_off)
463 1.1 cgd break;
464 1.1 cgd
465 1.1 cgd /*
466 1.1 cgd * If there is a preceding segment, it may provide some of
467 1.1 cgd * our data already. If so, drop the data from the incoming
468 1.1 cgd * segment. If it provides all of our data, drop us.
469 1.1 cgd */
470 1.1 cgd if (q->ipf_prev != (struct ipasfrag *)fp) {
471 1.1 cgd i = q->ipf_prev->ip_off + q->ipf_prev->ip_len - ip->ip_off;
472 1.1 cgd if (i > 0) {
473 1.1 cgd if (i >= ip->ip_len)
474 1.1 cgd goto dropfrag;
475 1.1 cgd m_adj(dtom(ip), i);
476 1.1 cgd ip->ip_off += i;
477 1.1 cgd ip->ip_len -= i;
478 1.1 cgd }
479 1.1 cgd }
480 1.1 cgd
481 1.1 cgd /*
482 1.1 cgd * While we overlap succeeding segments trim them or,
483 1.1 cgd * if they are completely covered, dequeue them.
484 1.1 cgd */
485 1.1 cgd while (q != (struct ipasfrag *)fp && ip->ip_off + ip->ip_len > q->ip_off) {
486 1.1 cgd i = (ip->ip_off + ip->ip_len) - q->ip_off;
487 1.1 cgd if (i < q->ip_len) {
488 1.1 cgd q->ip_len -= i;
489 1.1 cgd q->ip_off += i;
490 1.1 cgd m_adj(dtom(q), i);
491 1.1 cgd break;
492 1.1 cgd }
493 1.1 cgd q = q->ipf_next;
494 1.1 cgd m_freem(dtom(q->ipf_prev));
495 1.1 cgd ip_deq(q->ipf_prev);
496 1.1 cgd }
497 1.1 cgd
498 1.1 cgd insert:
499 1.1 cgd /*
500 1.1 cgd * Stick new segment in its place;
501 1.1 cgd * check for complete reassembly.
502 1.1 cgd */
503 1.1 cgd ip_enq(ip, q->ipf_prev);
504 1.1 cgd next = 0;
505 1.1 cgd for (q = fp->ipq_next; q != (struct ipasfrag *)fp; q = q->ipf_next) {
506 1.1 cgd if (q->ip_off != next)
507 1.1 cgd return (0);
508 1.1 cgd next += q->ip_len;
509 1.1 cgd }
510 1.1 cgd if (q->ipf_prev->ipf_mff)
511 1.1 cgd return (0);
512 1.1 cgd
513 1.1 cgd /*
514 1.1 cgd * Reassembly is complete; concatenate fragments.
515 1.1 cgd */
516 1.1 cgd q = fp->ipq_next;
517 1.1 cgd m = dtom(q);
518 1.1 cgd t = m->m_next;
519 1.1 cgd m->m_next = 0;
520 1.1 cgd m_cat(m, t);
521 1.1 cgd q = q->ipf_next;
522 1.1 cgd while (q != (struct ipasfrag *)fp) {
523 1.1 cgd t = dtom(q);
524 1.1 cgd q = q->ipf_next;
525 1.1 cgd m_cat(m, t);
526 1.1 cgd }
527 1.1 cgd
528 1.1 cgd /*
529 1.1 cgd * Create header for new ip packet by
530 1.1 cgd * modifying header of first packet;
531 1.1 cgd * dequeue and discard fragment reassembly header.
532 1.1 cgd * Make header visible.
533 1.1 cgd */
534 1.1 cgd ip = fp->ipq_next;
535 1.1 cgd ip->ip_len = next;
536 1.1 cgd ((struct ip *)ip)->ip_src = fp->ipq_src;
537 1.1 cgd ((struct ip *)ip)->ip_dst = fp->ipq_dst;
538 1.1 cgd remque(fp);
539 1.1 cgd (void) m_free(dtom(fp));
540 1.1 cgd m = dtom(ip);
541 1.1 cgd m->m_len += (ip->ip_hl << 2);
542 1.1 cgd m->m_data -= (ip->ip_hl << 2);
543 1.1 cgd /* some debugging cruft by sklower, below, will go away soon */
544 1.1 cgd if (m->m_flags & M_PKTHDR) { /* XXX this should be done elsewhere */
545 1.1 cgd register int plen = 0;
546 1.1 cgd for (t = m; m; m = m->m_next)
547 1.1 cgd plen += m->m_len;
548 1.1 cgd t->m_pkthdr.len = plen;
549 1.1 cgd }
550 1.1 cgd return ((struct ip *)ip);
551 1.1 cgd
552 1.1 cgd dropfrag:
553 1.1 cgd ipstat.ips_fragdropped++;
554 1.1 cgd m_freem(m);
555 1.1 cgd return (0);
556 1.1 cgd }
557 1.1 cgd
558 1.1 cgd /*
559 1.1 cgd * Free a fragment reassembly header and all
560 1.1 cgd * associated datagrams.
561 1.1 cgd */
562 1.8 mycroft void
563 1.1 cgd ip_freef(fp)
564 1.1 cgd struct ipq *fp;
565 1.1 cgd {
566 1.1 cgd register struct ipasfrag *q, *p;
567 1.1 cgd
568 1.1 cgd for (q = fp->ipq_next; q != (struct ipasfrag *)fp; q = p) {
569 1.1 cgd p = q->ipf_next;
570 1.1 cgd ip_deq(q);
571 1.1 cgd m_freem(dtom(q));
572 1.1 cgd }
573 1.1 cgd remque(fp);
574 1.1 cgd (void) m_free(dtom(fp));
575 1.1 cgd }
576 1.1 cgd
577 1.1 cgd /*
578 1.1 cgd * Put an ip fragment on a reassembly chain.
579 1.1 cgd * Like insque, but pointers in middle of structure.
580 1.1 cgd */
581 1.8 mycroft void
582 1.1 cgd ip_enq(p, prev)
583 1.1 cgd register struct ipasfrag *p, *prev;
584 1.1 cgd {
585 1.1 cgd
586 1.1 cgd p->ipf_prev = prev;
587 1.1 cgd p->ipf_next = prev->ipf_next;
588 1.1 cgd prev->ipf_next->ipf_prev = p;
589 1.1 cgd prev->ipf_next = p;
590 1.1 cgd }
591 1.1 cgd
592 1.1 cgd /*
593 1.1 cgd * To ip_enq as remque is to insque.
594 1.1 cgd */
595 1.8 mycroft void
596 1.1 cgd ip_deq(p)
597 1.1 cgd register struct ipasfrag *p;
598 1.1 cgd {
599 1.1 cgd
600 1.1 cgd p->ipf_prev->ipf_next = p->ipf_next;
601 1.1 cgd p->ipf_next->ipf_prev = p->ipf_prev;
602 1.1 cgd }
603 1.1 cgd
604 1.1 cgd /*
605 1.1 cgd * IP timer processing;
606 1.1 cgd * if a timer expires on a reassembly
607 1.1 cgd * queue, discard it.
608 1.1 cgd */
609 1.8 mycroft void
610 1.1 cgd ip_slowtimo()
611 1.1 cgd {
612 1.1 cgd register struct ipq *fp;
613 1.1 cgd int s = splnet();
614 1.1 cgd
615 1.1 cgd fp = ipq.next;
616 1.1 cgd if (fp == 0) {
617 1.1 cgd splx(s);
618 1.1 cgd return;
619 1.1 cgd }
620 1.1 cgd while (fp != &ipq) {
621 1.1 cgd --fp->ipq_ttl;
622 1.1 cgd fp = fp->next;
623 1.1 cgd if (fp->prev->ipq_ttl == 0) {
624 1.1 cgd ipstat.ips_fragtimeout++;
625 1.1 cgd ip_freef(fp->prev);
626 1.1 cgd }
627 1.1 cgd }
628 1.1 cgd splx(s);
629 1.1 cgd }
630 1.1 cgd
631 1.1 cgd /*
632 1.1 cgd * Drain off all datagram fragments.
633 1.1 cgd */
634 1.8 mycroft void
635 1.1 cgd ip_drain()
636 1.1 cgd {
637 1.1 cgd
638 1.1 cgd while (ipq.next != &ipq) {
639 1.1 cgd ipstat.ips_fragdropped++;
640 1.1 cgd ip_freef(ipq.next);
641 1.1 cgd }
642 1.1 cgd }
643 1.1 cgd
644 1.1 cgd extern struct in_ifaddr *ifptoia();
645 1.1 cgd struct in_ifaddr *ip_rtaddr();
646 1.1 cgd
647 1.1 cgd /*
648 1.1 cgd * Do option processing on a datagram,
649 1.1 cgd * possibly discarding it if bad options are encountered,
650 1.1 cgd * or forwarding it if source-routed.
651 1.1 cgd * Returns 1 if packet has been forwarded/freed,
652 1.1 cgd * 0 if the packet should be processed further.
653 1.1 cgd */
654 1.8 mycroft int
655 1.1 cgd ip_dooptions(m)
656 1.1 cgd struct mbuf *m;
657 1.1 cgd {
658 1.1 cgd register struct ip *ip = mtod(m, struct ip *);
659 1.1 cgd register u_char *cp;
660 1.1 cgd register struct ip_timestamp *ipt;
661 1.1 cgd register struct in_ifaddr *ia;
662 1.1 cgd int opt, optlen, cnt, off, code, type = ICMP_PARAMPROB, forward = 0;
663 1.1 cgd struct in_addr *sin;
664 1.1 cgd n_time ntime;
665 1.1 cgd
666 1.1 cgd cp = (u_char *)(ip + 1);
667 1.1 cgd cnt = (ip->ip_hl << 2) - sizeof (struct ip);
668 1.1 cgd for (; cnt > 0; cnt -= optlen, cp += optlen) {
669 1.1 cgd opt = cp[IPOPT_OPTVAL];
670 1.1 cgd if (opt == IPOPT_EOL)
671 1.1 cgd break;
672 1.1 cgd if (opt == IPOPT_NOP)
673 1.1 cgd optlen = 1;
674 1.1 cgd else {
675 1.1 cgd optlen = cp[IPOPT_OLEN];
676 1.1 cgd if (optlen <= 0 || optlen > cnt) {
677 1.1 cgd code = &cp[IPOPT_OLEN] - (u_char *)ip;
678 1.1 cgd goto bad;
679 1.1 cgd }
680 1.1 cgd }
681 1.1 cgd switch (opt) {
682 1.1 cgd
683 1.1 cgd default:
684 1.1 cgd break;
685 1.1 cgd
686 1.1 cgd /*
687 1.1 cgd * Source routing with record.
688 1.1 cgd * Find interface with current destination address.
689 1.1 cgd * If none on this machine then drop if strictly routed,
690 1.1 cgd * or do nothing if loosely routed.
691 1.1 cgd * Record interface address and bring up next address
692 1.1 cgd * component. If strictly routed make sure next
693 1.1 cgd * address is on directly accessible net.
694 1.1 cgd */
695 1.1 cgd case IPOPT_LSRR:
696 1.1 cgd case IPOPT_SSRR:
697 1.1 cgd if ((off = cp[IPOPT_OFFSET]) < IPOPT_MINOFF) {
698 1.1 cgd code = &cp[IPOPT_OFFSET] - (u_char *)ip;
699 1.1 cgd goto bad;
700 1.1 cgd }
701 1.1 cgd ipaddr.sin_addr = ip->ip_dst;
702 1.1 cgd ia = (struct in_ifaddr *)
703 1.1 cgd ifa_ifwithaddr((struct sockaddr *)&ipaddr);
704 1.1 cgd if (ia == 0) {
705 1.1 cgd if (opt == IPOPT_SSRR) {
706 1.1 cgd type = ICMP_UNREACH;
707 1.1 cgd code = ICMP_UNREACH_SRCFAIL;
708 1.1 cgd goto bad;
709 1.1 cgd }
710 1.1 cgd /*
711 1.1 cgd * Loose routing, and not at next destination
712 1.1 cgd * yet; nothing to do except forward.
713 1.1 cgd */
714 1.1 cgd break;
715 1.1 cgd }
716 1.1 cgd off--; /* 0 origin */
717 1.1 cgd if (off > optlen - sizeof(struct in_addr)) {
718 1.1 cgd /*
719 1.1 cgd * End of source route. Should be for us.
720 1.1 cgd */
721 1.1 cgd save_rte(cp, ip->ip_src);
722 1.1 cgd break;
723 1.1 cgd }
724 1.1 cgd /*
725 1.1 cgd * locate outgoing interface
726 1.1 cgd */
727 1.1 cgd bcopy((caddr_t)(cp + off), (caddr_t)&ipaddr.sin_addr,
728 1.1 cgd sizeof(ipaddr.sin_addr));
729 1.1 cgd if (opt == IPOPT_SSRR) {
730 1.1 cgd #define INA struct in_ifaddr *
731 1.1 cgd #define SA struct sockaddr *
732 1.1 cgd if ((ia = (INA)ifa_ifwithdstaddr((SA)&ipaddr)) == 0)
733 1.1 cgd ia = in_iaonnetof(in_netof(ipaddr.sin_addr));
734 1.1 cgd } else
735 1.1 cgd ia = ip_rtaddr(ipaddr.sin_addr);
736 1.1 cgd if (ia == 0) {
737 1.1 cgd type = ICMP_UNREACH;
738 1.1 cgd code = ICMP_UNREACH_SRCFAIL;
739 1.1 cgd goto bad;
740 1.1 cgd }
741 1.1 cgd ip->ip_dst = ipaddr.sin_addr;
742 1.1 cgd bcopy((caddr_t)&(IA_SIN(ia)->sin_addr),
743 1.1 cgd (caddr_t)(cp + off), sizeof(struct in_addr));
744 1.1 cgd cp[IPOPT_OFFSET] += sizeof(struct in_addr);
745 1.1 cgd forward = 1;
746 1.1 cgd break;
747 1.1 cgd
748 1.1 cgd case IPOPT_RR:
749 1.1 cgd if ((off = cp[IPOPT_OFFSET]) < IPOPT_MINOFF) {
750 1.1 cgd code = &cp[IPOPT_OFFSET] - (u_char *)ip;
751 1.1 cgd goto bad;
752 1.1 cgd }
753 1.1 cgd /*
754 1.1 cgd * If no space remains, ignore.
755 1.1 cgd */
756 1.1 cgd off--; /* 0 origin */
757 1.1 cgd if (off > optlen - sizeof(struct in_addr))
758 1.1 cgd break;
759 1.1 cgd bcopy((caddr_t)(&ip->ip_dst), (caddr_t)&ipaddr.sin_addr,
760 1.1 cgd sizeof(ipaddr.sin_addr));
761 1.1 cgd /*
762 1.1 cgd * locate outgoing interface; if we're the destination,
763 1.1 cgd * use the incoming interface (should be same).
764 1.1 cgd */
765 1.1 cgd if ((ia = (INA)ifa_ifwithaddr((SA)&ipaddr)) == 0 &&
766 1.1 cgd (ia = ip_rtaddr(ipaddr.sin_addr)) == 0) {
767 1.1 cgd type = ICMP_UNREACH;
768 1.1 cgd code = ICMP_UNREACH_HOST;
769 1.1 cgd goto bad;
770 1.1 cgd }
771 1.1 cgd bcopy((caddr_t)&(IA_SIN(ia)->sin_addr),
772 1.1 cgd (caddr_t)(cp + off), sizeof(struct in_addr));
773 1.1 cgd cp[IPOPT_OFFSET] += sizeof(struct in_addr);
774 1.1 cgd break;
775 1.1 cgd
776 1.1 cgd case IPOPT_TS:
777 1.1 cgd code = cp - (u_char *)ip;
778 1.1 cgd ipt = (struct ip_timestamp *)cp;
779 1.1 cgd if (ipt->ipt_len < 5)
780 1.1 cgd goto bad;
781 1.1 cgd if (ipt->ipt_ptr > ipt->ipt_len - sizeof (long)) {
782 1.1 cgd if (++ipt->ipt_oflw == 0)
783 1.1 cgd goto bad;
784 1.1 cgd break;
785 1.1 cgd }
786 1.1 cgd sin = (struct in_addr *)(cp + ipt->ipt_ptr - 1);
787 1.1 cgd switch (ipt->ipt_flg) {
788 1.1 cgd
789 1.1 cgd case IPOPT_TS_TSONLY:
790 1.1 cgd break;
791 1.1 cgd
792 1.1 cgd case IPOPT_TS_TSANDADDR:
793 1.1 cgd if (ipt->ipt_ptr + sizeof(n_time) +
794 1.1 cgd sizeof(struct in_addr) > ipt->ipt_len)
795 1.1 cgd goto bad;
796 1.1 cgd ia = ifptoia(m->m_pkthdr.rcvif);
797 1.1 cgd bcopy((caddr_t)&IA_SIN(ia)->sin_addr,
798 1.1 cgd (caddr_t)sin, sizeof(struct in_addr));
799 1.1 cgd ipt->ipt_ptr += sizeof(struct in_addr);
800 1.1 cgd break;
801 1.1 cgd
802 1.1 cgd case IPOPT_TS_PRESPEC:
803 1.1 cgd if (ipt->ipt_ptr + sizeof(n_time) +
804 1.1 cgd sizeof(struct in_addr) > ipt->ipt_len)
805 1.1 cgd goto bad;
806 1.1 cgd bcopy((caddr_t)sin, (caddr_t)&ipaddr.sin_addr,
807 1.1 cgd sizeof(struct in_addr));
808 1.1 cgd if (ifa_ifwithaddr((SA)&ipaddr) == 0)
809 1.1 cgd continue;
810 1.1 cgd ipt->ipt_ptr += sizeof(struct in_addr);
811 1.1 cgd break;
812 1.1 cgd
813 1.1 cgd default:
814 1.1 cgd goto bad;
815 1.1 cgd }
816 1.1 cgd ntime = iptime();
817 1.1 cgd bcopy((caddr_t)&ntime, (caddr_t)cp + ipt->ipt_ptr - 1,
818 1.1 cgd sizeof(n_time));
819 1.1 cgd ipt->ipt_ptr += sizeof(n_time);
820 1.1 cgd }
821 1.1 cgd }
822 1.1 cgd if (forward) {
823 1.1 cgd ip_forward(m, 1);
824 1.1 cgd return (1);
825 1.1 cgd } else
826 1.1 cgd return (0);
827 1.1 cgd bad:
828 1.7 mycroft {
829 1.7 mycroft register struct in_addr foo = {};
830 1.7 mycroft icmp_error(m, type, code, foo);
831 1.7 mycroft }
832 1.1 cgd return (1);
833 1.1 cgd }
834 1.1 cgd
835 1.1 cgd /*
836 1.1 cgd * Given address of next destination (final or next hop),
837 1.1 cgd * return internet address info of interface to be used to get there.
838 1.1 cgd */
839 1.1 cgd struct in_ifaddr *
840 1.1 cgd ip_rtaddr(dst)
841 1.1 cgd struct in_addr dst;
842 1.1 cgd {
843 1.1 cgd register struct sockaddr_in *sin;
844 1.1 cgd
845 1.1 cgd sin = (struct sockaddr_in *) &ipforward_rt.ro_dst;
846 1.1 cgd
847 1.1 cgd if (ipforward_rt.ro_rt == 0 || dst.s_addr != sin->sin_addr.s_addr) {
848 1.1 cgd if (ipforward_rt.ro_rt) {
849 1.1 cgd RTFREE(ipforward_rt.ro_rt);
850 1.1 cgd ipforward_rt.ro_rt = 0;
851 1.1 cgd }
852 1.1 cgd sin->sin_family = AF_INET;
853 1.1 cgd sin->sin_len = sizeof(*sin);
854 1.1 cgd sin->sin_addr = dst;
855 1.1 cgd
856 1.1 cgd rtalloc(&ipforward_rt);
857 1.1 cgd }
858 1.1 cgd if (ipforward_rt.ro_rt == 0)
859 1.1 cgd return ((struct in_ifaddr *)0);
860 1.1 cgd return ((struct in_ifaddr *) ipforward_rt.ro_rt->rt_ifa);
861 1.1 cgd }
862 1.1 cgd
863 1.1 cgd /*
864 1.1 cgd * Save incoming source route for use in replies,
865 1.1 cgd * to be picked up later by ip_srcroute if the receiver is interested.
866 1.1 cgd */
867 1.8 mycroft static void
868 1.1 cgd save_rte(option, dst)
869 1.1 cgd u_char *option;
870 1.1 cgd struct in_addr dst;
871 1.1 cgd {
872 1.1 cgd unsigned olen;
873 1.1 cgd
874 1.1 cgd olen = option[IPOPT_OLEN];
875 1.1 cgd #ifdef DIAGNOSTIC
876 1.1 cgd if (ipprintfs)
877 1.1 cgd printf("save_rte: olen %d\n", olen);
878 1.1 cgd #endif
879 1.1 cgd if (olen > sizeof(ip_srcrt) - (1 + sizeof(dst)))
880 1.1 cgd return;
881 1.1 cgd bcopy((caddr_t)option, (caddr_t)ip_srcrt.srcopt, olen);
882 1.1 cgd ip_nhops = (olen - IPOPT_OFFSET - 1) / sizeof(struct in_addr);
883 1.1 cgd ip_srcrt.dst = dst;
884 1.1 cgd }
885 1.1 cgd
886 1.1 cgd /*
887 1.1 cgd * Retrieve incoming source route for use in replies,
888 1.1 cgd * in the same form used by setsockopt.
889 1.1 cgd * The first hop is placed before the options, will be removed later.
890 1.1 cgd */
891 1.1 cgd struct mbuf *
892 1.1 cgd ip_srcroute()
893 1.1 cgd {
894 1.1 cgd register struct in_addr *p, *q;
895 1.1 cgd register struct mbuf *m;
896 1.1 cgd
897 1.1 cgd if (ip_nhops == 0)
898 1.1 cgd return ((struct mbuf *)0);
899 1.1 cgd m = m_get(M_DONTWAIT, MT_SOOPTS);
900 1.1 cgd if (m == 0)
901 1.1 cgd return ((struct mbuf *)0);
902 1.1 cgd
903 1.6 mycroft #define OPTSIZ (sizeof(ip_srcrt.nop) + sizeof(ip_srcrt.srcopt))
904 1.1 cgd
905 1.1 cgd /* length is (nhops+1)*sizeof(addr) + sizeof(nop + srcrt header) */
906 1.1 cgd m->m_len = ip_nhops * sizeof(struct in_addr) + sizeof(struct in_addr) +
907 1.1 cgd OPTSIZ;
908 1.1 cgd #ifdef DIAGNOSTIC
909 1.1 cgd if (ipprintfs)
910 1.1 cgd printf("ip_srcroute: nhops %d mlen %d", ip_nhops, m->m_len);
911 1.1 cgd #endif
912 1.1 cgd
913 1.1 cgd /*
914 1.1 cgd * First save first hop for return route
915 1.1 cgd */
916 1.1 cgd p = &ip_srcrt.route[ip_nhops - 1];
917 1.1 cgd *(mtod(m, struct in_addr *)) = *p--;
918 1.1 cgd #ifdef DIAGNOSTIC
919 1.1 cgd if (ipprintfs)
920 1.1 cgd printf(" hops %lx", ntohl(mtod(m, struct in_addr *)->s_addr));
921 1.1 cgd #endif
922 1.1 cgd
923 1.1 cgd /*
924 1.1 cgd * Copy option fields and padding (nop) to mbuf.
925 1.1 cgd */
926 1.1 cgd ip_srcrt.nop = IPOPT_NOP;
927 1.1 cgd ip_srcrt.srcopt[IPOPT_OFFSET] = IPOPT_MINOFF;
928 1.1 cgd bcopy((caddr_t)&ip_srcrt.nop,
929 1.1 cgd mtod(m, caddr_t) + sizeof(struct in_addr), OPTSIZ);
930 1.1 cgd q = (struct in_addr *)(mtod(m, caddr_t) +
931 1.1 cgd sizeof(struct in_addr) + OPTSIZ);
932 1.1 cgd #undef OPTSIZ
933 1.1 cgd /*
934 1.1 cgd * Record return path as an IP source route,
935 1.1 cgd * reversing the path (pointers are now aligned).
936 1.1 cgd */
937 1.1 cgd while (p >= ip_srcrt.route) {
938 1.1 cgd #ifdef DIAGNOSTIC
939 1.1 cgd if (ipprintfs)
940 1.1 cgd printf(" %lx", ntohl(q->s_addr));
941 1.1 cgd #endif
942 1.1 cgd *q++ = *p--;
943 1.1 cgd }
944 1.1 cgd /*
945 1.1 cgd * Last hop goes to final destination.
946 1.1 cgd */
947 1.1 cgd *q = ip_srcrt.dst;
948 1.1 cgd #ifdef DIAGNOSTIC
949 1.1 cgd if (ipprintfs)
950 1.1 cgd printf(" %lx\n", ntohl(q->s_addr));
951 1.1 cgd #endif
952 1.1 cgd return (m);
953 1.1 cgd }
954 1.1 cgd
955 1.1 cgd /*
956 1.1 cgd * Strip out IP options, at higher
957 1.1 cgd * level protocol in the kernel.
958 1.1 cgd * Second argument is buffer to which options
959 1.1 cgd * will be moved, and return value is their length.
960 1.1 cgd * XXX should be deleted; last arg currently ignored.
961 1.1 cgd */
962 1.8 mycroft void
963 1.1 cgd ip_stripoptions(m, mopt)
964 1.1 cgd register struct mbuf *m;
965 1.1 cgd struct mbuf *mopt;
966 1.1 cgd {
967 1.1 cgd register int i;
968 1.1 cgd struct ip *ip = mtod(m, struct ip *);
969 1.1 cgd register caddr_t opts;
970 1.1 cgd int olen;
971 1.1 cgd
972 1.1 cgd olen = (ip->ip_hl<<2) - sizeof (struct ip);
973 1.1 cgd opts = (caddr_t)(ip + 1);
974 1.1 cgd i = m->m_len - (sizeof (struct ip) + olen);
975 1.1 cgd bcopy(opts + olen, opts, (unsigned)i);
976 1.1 cgd m->m_len -= olen;
977 1.1 cgd if (m->m_flags & M_PKTHDR)
978 1.1 cgd m->m_pkthdr.len -= olen;
979 1.1 cgd ip->ip_hl = sizeof(struct ip) >> 2;
980 1.1 cgd }
981 1.1 cgd
982 1.1 cgd u_char inetctlerrmap[PRC_NCMDS] = {
983 1.1 cgd 0, 0, 0, 0,
984 1.1 cgd 0, EMSGSIZE, EHOSTDOWN, EHOSTUNREACH,
985 1.1 cgd EHOSTUNREACH, EHOSTUNREACH, ECONNREFUSED, ECONNREFUSED,
986 1.1 cgd EMSGSIZE, EHOSTUNREACH, 0, 0,
987 1.1 cgd 0, 0, 0, 0,
988 1.1 cgd ENOPROTOOPT
989 1.1 cgd };
990 1.1 cgd
991 1.1 cgd /*
992 1.1 cgd * Forward a packet. If some error occurs return the sender
993 1.1 cgd * an icmp packet. Note we can't always generate a meaningful
994 1.1 cgd * icmp message because icmp doesn't have a large enough repertoire
995 1.1 cgd * of codes and types.
996 1.1 cgd *
997 1.1 cgd * If not forwarding, just drop the packet. This could be confusing
998 1.1 cgd * if ipforwarding was zero but some routing protocol was advancing
999 1.1 cgd * us as a gateway to somewhere. However, we must let the routing
1000 1.1 cgd * protocol deal with that.
1001 1.1 cgd *
1002 1.1 cgd * The srcrt parameter indicates whether the packet is being forwarded
1003 1.1 cgd * via a source route.
1004 1.1 cgd */
1005 1.8 mycroft static void
1006 1.1 cgd ip_forward(m, srcrt)
1007 1.1 cgd struct mbuf *m;
1008 1.1 cgd int srcrt;
1009 1.1 cgd {
1010 1.1 cgd register struct ip *ip = mtod(m, struct ip *);
1011 1.1 cgd register struct sockaddr_in *sin;
1012 1.1 cgd register struct rtentry *rt;
1013 1.1 cgd int error, type = 0, code;
1014 1.1 cgd struct mbuf *mcopy;
1015 1.1 cgd struct in_addr dest;
1016 1.1 cgd
1017 1.1 cgd dest.s_addr = 0;
1018 1.1 cgd #ifdef DIAGNOSTIC
1019 1.1 cgd if (ipprintfs)
1020 1.1 cgd printf("forward: src %x dst %x ttl %x\n", ip->ip_src,
1021 1.1 cgd ip->ip_dst, ip->ip_ttl);
1022 1.1 cgd #endif
1023 1.1 cgd if (m->m_flags & M_BCAST || in_canforward(ip->ip_dst) == 0) {
1024 1.1 cgd ipstat.ips_cantforward++;
1025 1.1 cgd m_freem(m);
1026 1.1 cgd return;
1027 1.1 cgd }
1028 1.1 cgd HTONS(ip->ip_id);
1029 1.1 cgd if (ip->ip_ttl <= IPTTLDEC) {
1030 1.1 cgd icmp_error(m, ICMP_TIMXCEED, ICMP_TIMXCEED_INTRANS, dest);
1031 1.1 cgd return;
1032 1.1 cgd }
1033 1.1 cgd ip->ip_ttl -= IPTTLDEC;
1034 1.1 cgd
1035 1.1 cgd sin = (struct sockaddr_in *)&ipforward_rt.ro_dst;
1036 1.1 cgd if ((rt = ipforward_rt.ro_rt) == 0 ||
1037 1.1 cgd ip->ip_dst.s_addr != sin->sin_addr.s_addr) {
1038 1.1 cgd if (ipforward_rt.ro_rt) {
1039 1.1 cgd RTFREE(ipforward_rt.ro_rt);
1040 1.1 cgd ipforward_rt.ro_rt = 0;
1041 1.1 cgd }
1042 1.1 cgd sin->sin_family = AF_INET;
1043 1.1 cgd sin->sin_len = sizeof(*sin);
1044 1.1 cgd sin->sin_addr = ip->ip_dst;
1045 1.1 cgd
1046 1.1 cgd rtalloc(&ipforward_rt);
1047 1.1 cgd if (ipforward_rt.ro_rt == 0) {
1048 1.1 cgd icmp_error(m, ICMP_UNREACH, ICMP_UNREACH_HOST, dest);
1049 1.1 cgd return;
1050 1.1 cgd }
1051 1.1 cgd rt = ipforward_rt.ro_rt;
1052 1.1 cgd }
1053 1.1 cgd
1054 1.1 cgd /*
1055 1.1 cgd * Save at most 64 bytes of the packet in case
1056 1.1 cgd * we need to generate an ICMP message to the src.
1057 1.1 cgd */
1058 1.1 cgd mcopy = m_copy(m, 0, imin((int)ip->ip_len, 64));
1059 1.1 cgd
1060 1.1 cgd #ifdef GATEWAY
1061 1.1 cgd ip_ifmatrix[rt->rt_ifp->if_index +
1062 1.1 cgd if_index * m->m_pkthdr.rcvif->if_index]++;
1063 1.1 cgd #endif
1064 1.1 cgd /*
1065 1.1 cgd * If forwarding packet using same interface that it came in on,
1066 1.1 cgd * perhaps should send a redirect to sender to shortcut a hop.
1067 1.1 cgd * Only send redirect if source is sending directly to us,
1068 1.1 cgd * and if packet was not source routed (or has any options).
1069 1.1 cgd * Also, don't send redirect if forwarding using a default route
1070 1.1 cgd * or a route modified by a redirect.
1071 1.1 cgd */
1072 1.1 cgd #define satosin(sa) ((struct sockaddr_in *)(sa))
1073 1.1 cgd if (rt->rt_ifp == m->m_pkthdr.rcvif &&
1074 1.1 cgd (rt->rt_flags & (RTF_DYNAMIC|RTF_MODIFIED)) == 0 &&
1075 1.1 cgd satosin(rt_key(rt))->sin_addr.s_addr != 0 &&
1076 1.1 cgd ipsendredirects && !srcrt) {
1077 1.1 cgd struct in_ifaddr *ia;
1078 1.1 cgd u_long src = ntohl(ip->ip_src.s_addr);
1079 1.1 cgd u_long dst = ntohl(ip->ip_dst.s_addr);
1080 1.1 cgd
1081 1.1 cgd if ((ia = ifptoia(m->m_pkthdr.rcvif)) &&
1082 1.1 cgd (src & ia->ia_subnetmask) == ia->ia_subnet) {
1083 1.1 cgd if (rt->rt_flags & RTF_GATEWAY)
1084 1.1 cgd dest = satosin(rt->rt_gateway)->sin_addr;
1085 1.1 cgd else
1086 1.1 cgd dest = ip->ip_dst;
1087 1.1 cgd /*
1088 1.1 cgd * If the destination is reached by a route to host,
1089 1.1 cgd * is on a subnet of a local net, or is directly
1090 1.1 cgd * on the attached net (!), use host redirect.
1091 1.1 cgd * (We may be the correct first hop for other subnets.)
1092 1.1 cgd */
1093 1.1 cgd #define RTA(rt) ((struct in_ifaddr *)(rt->rt_ifa))
1094 1.1 cgd type = ICMP_REDIRECT;
1095 1.1 cgd if ((rt->rt_flags & RTF_HOST) ||
1096 1.1 cgd (rt->rt_flags & RTF_GATEWAY) == 0)
1097 1.1 cgd code = ICMP_REDIRECT_HOST;
1098 1.1 cgd else if (RTA(rt)->ia_subnetmask != RTA(rt)->ia_netmask &&
1099 1.1 cgd (dst & RTA(rt)->ia_netmask) == RTA(rt)->ia_net)
1100 1.1 cgd code = ICMP_REDIRECT_HOST;
1101 1.1 cgd else
1102 1.1 cgd code = ICMP_REDIRECT_NET;
1103 1.1 cgd #ifdef DIAGNOSTIC
1104 1.1 cgd if (ipprintfs)
1105 1.1 cgd printf("redirect (%d) to %x\n", code, dest.s_addr);
1106 1.1 cgd #endif
1107 1.1 cgd }
1108 1.1 cgd }
1109 1.1 cgd
1110 1.9 mycroft error = ip_output(m, NULL, &ipforward_rt, IP_FORWARDING
1111 1.9 mycroft #ifdef DIRECTED_BROADCAST
1112 1.9 mycroft | IP_ALLOWBROADCAST
1113 1.9 mycroft #endif
1114 1.9 mycroft , NULL);
1115 1.1 cgd if (error)
1116 1.1 cgd ipstat.ips_cantforward++;
1117 1.1 cgd else {
1118 1.1 cgd ipstat.ips_forward++;
1119 1.1 cgd if (type)
1120 1.1 cgd ipstat.ips_redirectsent++;
1121 1.1 cgd else {
1122 1.1 cgd if (mcopy)
1123 1.1 cgd m_freem(mcopy);
1124 1.1 cgd return;
1125 1.1 cgd }
1126 1.1 cgd }
1127 1.1 cgd if (mcopy == NULL)
1128 1.1 cgd return;
1129 1.1 cgd switch (error) {
1130 1.1 cgd
1131 1.1 cgd case 0: /* forwarded, but need redirect */
1132 1.1 cgd /* type, code set above */
1133 1.1 cgd break;
1134 1.1 cgd
1135 1.1 cgd case ENETUNREACH: /* shouldn't happen, checked above */
1136 1.1 cgd case EHOSTUNREACH:
1137 1.1 cgd case ENETDOWN:
1138 1.1 cgd case EHOSTDOWN:
1139 1.1 cgd default:
1140 1.1 cgd type = ICMP_UNREACH;
1141 1.1 cgd code = ICMP_UNREACH_HOST;
1142 1.1 cgd break;
1143 1.1 cgd
1144 1.1 cgd case EMSGSIZE:
1145 1.1 cgd type = ICMP_UNREACH;
1146 1.1 cgd code = ICMP_UNREACH_NEEDFRAG;
1147 1.1 cgd ipstat.ips_cantfrag++;
1148 1.1 cgd break;
1149 1.1 cgd
1150 1.1 cgd case ENOBUFS:
1151 1.1 cgd type = ICMP_SOURCEQUENCH;
1152 1.1 cgd code = 0;
1153 1.1 cgd break;
1154 1.1 cgd }
1155 1.1 cgd icmp_error(mcopy, type, code, dest);
1156 1.1 cgd }
1157