Home | History | Annotate | Line # | Download | only in netinet
ip_input.c revision 1.60
      1  1.60       kml /*	$NetBSD: ip_input.c,v 1.60 1998/04/29 03:44:11 kml Exp $	*/
      2  1.58       tls 
      3  1.58       tls /*-
      4  1.58       tls  * Copyright (c) 1998 The NetBSD Foundation, Inc.
      5  1.58       tls  * All rights reserved.
      6  1.58       tls  *
      7  1.58       tls  * This code is derived from software contributed to The NetBSD Foundation
      8  1.58       tls  * by Public Access Networks Corporation ("Panix").  It was developed under
      9  1.58       tls  * contract to Panix by Eric Haszlakiewicz and Thor Lancelot Simon.
     10  1.58       tls  *
     11  1.58       tls  * Redistribution and use in source and binary forms, with or without
     12  1.58       tls  * modification, are permitted provided that the following conditions
     13  1.58       tls  * are met:
     14  1.58       tls  * 1. Redistributions of source code must retain the above copyright
     15  1.58       tls  *    notice, this list of conditions and the following disclaimer.
     16  1.58       tls  * 2. Redistributions in binary form must reproduce the above copyright
     17  1.58       tls  *    notice, this list of conditions and the following disclaimer in the
     18  1.58       tls  *    documentation and/or other materials provided with the distribution.
     19  1.58       tls  * 3. All advertising materials mentioning features or use of this software
     20  1.58       tls  *    must display the following acknowledgement:
     21  1.58       tls  *	This product includes software developed by the NetBSD
     22  1.58       tls  *	Foundation, Inc. and its contributors.
     23  1.58       tls  * 4. Neither the name of The NetBSD Foundation nor the names of its
     24  1.58       tls  *    contributors may be used to endorse or promote products derived
     25  1.58       tls  *    from this software without specific prior written permission.
     26  1.58       tls  *
     27  1.58       tls  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     28  1.58       tls  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     29  1.58       tls  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     30  1.58       tls  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     31  1.58       tls  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     32  1.58       tls  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     33  1.58       tls  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     34  1.58       tls  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     35  1.58       tls  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     36  1.58       tls  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     37  1.58       tls  * POSSIBILITY OF SUCH DAMAGE.
     38  1.58       tls  */
     39  1.14       cgd 
     40   1.1       cgd /*
     41  1.13   mycroft  * Copyright (c) 1982, 1986, 1988, 1993
     42  1.13   mycroft  *	The Regents of the University of California.  All rights reserved.
     43   1.1       cgd  *
     44   1.1       cgd  * Redistribution and use in source and binary forms, with or without
     45   1.1       cgd  * modification, are permitted provided that the following conditions
     46   1.1       cgd  * are met:
     47   1.1       cgd  * 1. Redistributions of source code must retain the above copyright
     48   1.1       cgd  *    notice, this list of conditions and the following disclaimer.
     49   1.1       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     50   1.1       cgd  *    notice, this list of conditions and the following disclaimer in the
     51   1.1       cgd  *    documentation and/or other materials provided with the distribution.
     52   1.1       cgd  * 3. All advertising materials mentioning features or use of this software
     53   1.1       cgd  *    must display the following acknowledgement:
     54   1.1       cgd  *	This product includes software developed by the University of
     55   1.1       cgd  *	California, Berkeley and its contributors.
     56   1.1       cgd  * 4. Neither the name of the University nor the names of its contributors
     57   1.1       cgd  *    may be used to endorse or promote products derived from this software
     58   1.1       cgd  *    without specific prior written permission.
     59   1.1       cgd  *
     60   1.1       cgd  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     61   1.1       cgd  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     62   1.1       cgd  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     63   1.1       cgd  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     64   1.1       cgd  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     65   1.1       cgd  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     66   1.1       cgd  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     67   1.1       cgd  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     68   1.1       cgd  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     69   1.1       cgd  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     70   1.1       cgd  * SUCH DAMAGE.
     71   1.1       cgd  *
     72  1.14       cgd  *	@(#)ip_input.c	8.2 (Berkeley) 1/4/94
     73   1.1       cgd  */
     74  1.55    scottr 
     75  1.55    scottr #include "opt_mrouting.h"
     76   1.1       cgd 
     77   1.5   mycroft #include <sys/param.h>
     78   1.5   mycroft #include <sys/systm.h>
     79   1.5   mycroft #include <sys/malloc.h>
     80   1.5   mycroft #include <sys/mbuf.h>
     81   1.5   mycroft #include <sys/domain.h>
     82   1.5   mycroft #include <sys/protosw.h>
     83   1.5   mycroft #include <sys/socket.h>
     84  1.44   thorpej #include <sys/socketvar.h>
     85   1.5   mycroft #include <sys/errno.h>
     86   1.5   mycroft #include <sys/time.h>
     87   1.5   mycroft #include <sys/kernel.h>
     88  1.28  christos #include <sys/proc.h>
     89  1.28  christos 
     90  1.28  christos #include <vm/vm.h>
     91  1.28  christos #include <sys/sysctl.h>
     92   1.1       cgd 
     93   1.5   mycroft #include <net/if.h>
     94  1.44   thorpej #include <net/if_dl.h>
     95   1.5   mycroft #include <net/route.h>
     96  1.45       mrg #include <net/pfil.h>
     97   1.1       cgd 
     98   1.5   mycroft #include <netinet/in.h>
     99   1.5   mycroft #include <netinet/in_systm.h>
    100   1.5   mycroft #include <netinet/ip.h>
    101   1.5   mycroft #include <netinet/in_pcb.h>
    102   1.5   mycroft #include <netinet/in_var.h>
    103   1.5   mycroft #include <netinet/ip_var.h>
    104   1.5   mycroft #include <netinet/ip_icmp.h>
    105  1.44   thorpej 
    106   1.1       cgd #ifndef	IPFORWARDING
    107   1.1       cgd #ifdef GATEWAY
    108   1.1       cgd #define	IPFORWARDING	1	/* forward IP packets not for us */
    109   1.1       cgd #else /* GATEWAY */
    110   1.1       cgd #define	IPFORWARDING	0	/* don't forward IP packets not for us */
    111   1.1       cgd #endif /* GATEWAY */
    112   1.1       cgd #endif /* IPFORWARDING */
    113   1.1       cgd #ifndef	IPSENDREDIRECTS
    114   1.1       cgd #define	IPSENDREDIRECTS	1
    115   1.1       cgd #endif
    116  1.26   thorpej #ifndef IPFORWSRCRT
    117  1.47       cjs #define	IPFORWSRCRT	1	/* forward source-routed packets */
    118  1.47       cjs #endif
    119  1.47       cjs #ifndef IPALLOWSRCRT
    120  1.48       mrg #define	IPALLOWSRCRT	1	/* allow source-routed packets */
    121  1.26   thorpej #endif
    122  1.53       kml #ifndef IPMTUDISC
    123  1.53       kml #define IPMTUDISC	0
    124  1.53       kml #endif
    125  1.60       kml #ifndef IPMTUDISCTIMEOUT
    126  1.60       kml #define IPMTUDISCTIMEOUT (1 * 60)	/* experimental short timeout value! */
    127  1.60       kml #endif
    128  1.53       kml 
    129  1.27   thorpej /*
    130  1.27   thorpej  * Note: DIRECTED_BROADCAST is handled this way so that previous
    131  1.27   thorpej  * configuration using this option will Just Work.
    132  1.27   thorpej  */
    133  1.27   thorpej #ifndef IPDIRECTEDBCAST
    134  1.27   thorpej #ifdef DIRECTED_BROADCAST
    135  1.27   thorpej #define IPDIRECTEDBCAST	1
    136  1.27   thorpej #else
    137  1.27   thorpej #define	IPDIRECTEDBCAST	0
    138  1.27   thorpej #endif /* DIRECTED_BROADCAST */
    139  1.27   thorpej #endif /* IPDIRECTEDBCAST */
    140   1.1       cgd int	ipforwarding = IPFORWARDING;
    141   1.1       cgd int	ipsendredirects = IPSENDREDIRECTS;
    142  1.13   mycroft int	ip_defttl = IPDEFTTL;
    143  1.26   thorpej int	ip_forwsrcrt = IPFORWSRCRT;
    144  1.27   thorpej int	ip_directedbcast = IPDIRECTEDBCAST;
    145  1.47       cjs int	ip_allowsrcrt = IPALLOWSRCRT;
    146  1.53       kml int	ip_mtudisc = IPMTUDISC;
    147  1.60       kml u_int	ip_mtudisc_timeout = IPMTUDISCTIMEOUT;
    148   1.1       cgd #ifdef DIAGNOSTIC
    149   1.1       cgd int	ipprintfs = 0;
    150   1.1       cgd #endif
    151   1.1       cgd 
    152  1.60       kml struct rttimer_queue *ip_mtudisc_timeout_q = NULL;
    153  1.60       kml 
    154   1.1       cgd extern	struct domain inetdomain;
    155   1.1       cgd extern	struct protosw inetsw[];
    156   1.1       cgd u_char	ip_protox[IPPROTO_MAX];
    157   1.1       cgd int	ipqmaxlen = IFQ_MAXLEN;
    158  1.22   mycroft struct	in_ifaddrhead in_ifaddr;
    159  1.57       tls struct	in_ifaddrhashhead *in_ifaddrhashtbl;
    160  1.13   mycroft struct	ifqueue ipintrq;
    161   1.1       cgd 
    162   1.1       cgd /*
    163   1.1       cgd  * We need to save the IP options in case a protocol wants to respond
    164   1.1       cgd  * to an incoming packet over the same route if the packet got here
    165   1.1       cgd  * using IP source routing.  This allows connection establishment and
    166   1.1       cgd  * maintenance when the remote end is on a network that is not known
    167   1.1       cgd  * to us.
    168   1.1       cgd  */
    169   1.1       cgd int	ip_nhops = 0;
    170   1.1       cgd static	struct ip_srcrt {
    171   1.1       cgd 	struct	in_addr dst;			/* final destination */
    172   1.1       cgd 	char	nop;				/* one NOP to align */
    173   1.1       cgd 	char	srcopt[IPOPT_OFFSET + 1];	/* OPTVAL, OLEN and OFFSET */
    174   1.1       cgd 	struct	in_addr route[MAX_IPOPTLEN/sizeof(struct in_addr)];
    175   1.1       cgd } ip_srcrt;
    176   1.1       cgd 
    177  1.13   mycroft static void save_rte __P((u_char *, struct in_addr));
    178  1.35   mycroft 
    179   1.1       cgd /*
    180   1.1       cgd  * IP initialization: fill in IP protocol switch table.
    181   1.1       cgd  * All protocols not implemented in kernel go to raw IP protocol handler.
    182   1.1       cgd  */
    183   1.8   mycroft void
    184   1.1       cgd ip_init()
    185   1.1       cgd {
    186   1.1       cgd 	register struct protosw *pr;
    187   1.1       cgd 	register int i;
    188   1.1       cgd 
    189   1.1       cgd 	pr = pffindproto(PF_INET, IPPROTO_RAW, SOCK_RAW);
    190   1.1       cgd 	if (pr == 0)
    191   1.1       cgd 		panic("ip_init");
    192   1.1       cgd 	for (i = 0; i < IPPROTO_MAX; i++)
    193   1.1       cgd 		ip_protox[i] = pr - inetsw;
    194   1.1       cgd 	for (pr = inetdomain.dom_protosw;
    195   1.1       cgd 	    pr < inetdomain.dom_protoswNPROTOSW; pr++)
    196   1.1       cgd 		if (pr->pr_domain->dom_family == PF_INET &&
    197   1.1       cgd 		    pr->pr_protocol && pr->pr_protocol != IPPROTO_RAW)
    198   1.1       cgd 			ip_protox[pr->pr_protocol] = pr - inetsw;
    199  1.25       cgd 	LIST_INIT(&ipq);
    200   1.1       cgd 	ip_id = time.tv_sec & 0xffff;
    201   1.1       cgd 	ipintrq.ifq_maxlen = ipqmaxlen;
    202  1.22   mycroft 	TAILQ_INIT(&in_ifaddr);
    203  1.57       tls 	in_ifaddrhashtbl =
    204  1.57       tls 	    hashinit(IN_IFADDR_HASH_SIZE, M_IFADDR, M_WAITOK, &in_ifaddrhash);
    205  1.60       kml 	if (ip_mtudisc != 0)
    206  1.60       kml 		ip_mtudisc_timeout_q =
    207  1.60       kml 		    rt_timer_queue_create(ip_mtudisc_timeout);
    208   1.1       cgd }
    209   1.1       cgd 
    210   1.1       cgd struct	sockaddr_in ipaddr = { sizeof(ipaddr), AF_INET };
    211   1.1       cgd struct	route ipforward_rt;
    212   1.1       cgd 
    213   1.1       cgd /*
    214   1.1       cgd  * Ip input routine.  Checksum and byte swap header.  If fragmented
    215   1.1       cgd  * try to reassemble.  Process options.  Pass to next level.
    216   1.1       cgd  */
    217   1.8   mycroft void
    218   1.1       cgd ipintr()
    219   1.1       cgd {
    220  1.33       mrg 	register struct ip *ip = NULL;
    221   1.1       cgd 	register struct mbuf *m;
    222   1.1       cgd 	register struct ipq *fp;
    223   1.1       cgd 	register struct in_ifaddr *ia;
    224  1.57       tls 	register struct ifaddr *ifa;
    225  1.25       cgd 	struct ipqent *ipqe;
    226  1.35   mycroft 	int hlen = 0, mff, len, s;
    227  1.36       mrg #ifdef PFIL_HOOKS
    228  1.33       mrg 	struct packet_filter_hook *pfh;
    229  1.33       mrg 	struct mbuf *m0;
    230  1.43       mrg 	int rv;
    231  1.36       mrg #endif /* PFIL_HOOKS */
    232   1.1       cgd 
    233   1.1       cgd next:
    234   1.1       cgd 	/*
    235   1.1       cgd 	 * Get next datagram off input queue and get IP header
    236   1.1       cgd 	 * in first mbuf.
    237   1.1       cgd 	 */
    238   1.1       cgd 	s = splimp();
    239   1.1       cgd 	IF_DEQUEUE(&ipintrq, m);
    240   1.1       cgd 	splx(s);
    241  1.13   mycroft 	if (m == 0)
    242   1.1       cgd 		return;
    243   1.1       cgd #ifdef	DIAGNOSTIC
    244   1.1       cgd 	if ((m->m_flags & M_PKTHDR) == 0)
    245   1.1       cgd 		panic("ipintr no HDR");
    246   1.1       cgd #endif
    247   1.1       cgd 	/*
    248   1.1       cgd 	 * If no IP addresses have been set yet but the interfaces
    249   1.1       cgd 	 * are receiving, can't do anything with incoming packets yet.
    250   1.1       cgd 	 */
    251  1.22   mycroft 	if (in_ifaddr.tqh_first == 0)
    252   1.1       cgd 		goto bad;
    253   1.1       cgd 	ipstat.ips_total++;
    254   1.1       cgd 	if (m->m_len < sizeof (struct ip) &&
    255   1.1       cgd 	    (m = m_pullup(m, sizeof (struct ip))) == 0) {
    256   1.1       cgd 		ipstat.ips_toosmall++;
    257   1.1       cgd 		goto next;
    258   1.1       cgd 	}
    259   1.1       cgd 	ip = mtod(m, struct ip *);
    260  1.13   mycroft 	if (ip->ip_v != IPVERSION) {
    261  1.13   mycroft 		ipstat.ips_badvers++;
    262  1.13   mycroft 		goto bad;
    263  1.13   mycroft 	}
    264   1.1       cgd 	hlen = ip->ip_hl << 2;
    265   1.1       cgd 	if (hlen < sizeof(struct ip)) {	/* minimum header length */
    266   1.1       cgd 		ipstat.ips_badhlen++;
    267   1.1       cgd 		goto bad;
    268   1.1       cgd 	}
    269   1.1       cgd 	if (hlen > m->m_len) {
    270   1.1       cgd 		if ((m = m_pullup(m, hlen)) == 0) {
    271   1.1       cgd 			ipstat.ips_badhlen++;
    272   1.1       cgd 			goto next;
    273   1.1       cgd 		}
    274   1.1       cgd 		ip = mtod(m, struct ip *);
    275   1.1       cgd 	}
    276  1.28  christos 	if ((ip->ip_sum = in_cksum(m, hlen)) != 0) {
    277   1.1       cgd 		ipstat.ips_badsum++;
    278   1.1       cgd 		goto bad;
    279   1.1       cgd 	}
    280   1.1       cgd 
    281   1.1       cgd 	/*
    282   1.1       cgd 	 * Convert fields to host representation.
    283   1.1       cgd 	 */
    284   1.1       cgd 	NTOHS(ip->ip_len);
    285   1.1       cgd 	NTOHS(ip->ip_id);
    286   1.1       cgd 	NTOHS(ip->ip_off);
    287  1.35   mycroft 	len = ip->ip_len;
    288   1.1       cgd 
    289   1.1       cgd 	/*
    290   1.1       cgd 	 * Check that the amount of data in the buffers
    291   1.1       cgd 	 * is as at least much as the IP header would have us expect.
    292   1.1       cgd 	 * Trim mbufs if longer than we expect.
    293   1.1       cgd 	 * Drop packet if shorter than we expect.
    294   1.1       cgd 	 */
    295  1.35   mycroft 	if (m->m_pkthdr.len < len) {
    296   1.1       cgd 		ipstat.ips_tooshort++;
    297   1.1       cgd 		goto bad;
    298   1.1       cgd 	}
    299  1.35   mycroft 	if (m->m_pkthdr.len > len) {
    300   1.1       cgd 		if (m->m_len == m->m_pkthdr.len) {
    301  1.35   mycroft 			m->m_len = len;
    302  1.35   mycroft 			m->m_pkthdr.len = len;
    303   1.1       cgd 		} else
    304  1.35   mycroft 			m_adj(m, len - m->m_pkthdr.len);
    305   1.1       cgd 	}
    306   1.1       cgd 
    307  1.36       mrg #ifdef PFIL_HOOKS
    308  1.33       mrg 	/*
    309  1.33       mrg 	 * Run through list of hooks for input packets.
    310  1.33       mrg 	 */
    311  1.33       mrg 	m0 = m;
    312  1.59       mrg 	for (pfh = pfil_hook_get(PFIL_IN); pfh; pfh = pfh->pfil_link.tqe_next)
    313  1.33       mrg 		if (pfh->pfil_func) {
    314  1.43       mrg 			rv = pfh->pfil_func(ip, hlen, m->m_pkthdr.rcvif, 0, &m0);
    315  1.43       mrg 			if (rv)
    316  1.40     veego 				goto next;
    317  1.49  christos 			ip = mtod(m = m0, struct ip *);
    318  1.33       mrg 		}
    319  1.36       mrg #endif /* PFIL_HOOKS */
    320  1.33       mrg 
    321   1.1       cgd 	/*
    322   1.1       cgd 	 * Process options and, if not destined for us,
    323   1.1       cgd 	 * ship it on.  ip_dooptions returns 1 when an
    324   1.1       cgd 	 * error was detected (causing an icmp message
    325   1.1       cgd 	 * to be sent and the original packet to be freed).
    326   1.1       cgd 	 */
    327   1.1       cgd 	ip_nhops = 0;		/* for source routed packets */
    328   1.1       cgd 	if (hlen > sizeof (struct ip) && ip_dooptions(m))
    329   1.1       cgd 		goto next;
    330   1.1       cgd 
    331   1.1       cgd 	/*
    332   1.1       cgd 	 * Check our list of addresses, to see if the packet is for us.
    333   1.1       cgd 	 */
    334  1.57       tls 	INADDR_TO_IA(ip->ip_dst, ia);
    335  1.57       tls 	if (ia != NULL) goto ours;
    336  1.57       tls 	if (m->m_pkthdr.rcvif->if_flags & IFF_BROADCAST) {
    337  1.57       tls 		for (ifa = m->m_pkthdr.rcvif->if_addrlist.tqh_first;
    338  1.57       tls 		    ifa != NULL; ifa = ifa->ifa_list.tqe_next) {
    339  1.57       tls 			if (ifa->ifa_addr->sa_family != AF_INET) continue;
    340  1.57       tls 			ia = ifatoia(ifa);
    341  1.35   mycroft 			if (in_hosteq(ip->ip_dst, ia->ia_broadaddr.sin_addr) ||
    342  1.35   mycroft 			    in_hosteq(ip->ip_dst, ia->ia_netbroadcast) ||
    343  1.20   mycroft 			    /*
    344  1.20   mycroft 			     * Look for all-0's host part (old broadcast addr),
    345  1.20   mycroft 			     * either for subnet or net.
    346  1.20   mycroft 			     */
    347  1.20   mycroft 			    ip->ip_dst.s_addr == ia->ia_subnet ||
    348  1.18   mycroft 			    ip->ip_dst.s_addr == ia->ia_net)
    349   1.1       cgd 				goto ours;
    350  1.57       tls 			/*
    351  1.57       tls 			 * An interface with IP address zero accepts
    352  1.57       tls 			 * all packets that arrive on that interface.
    353  1.57       tls 			 */
    354  1.57       tls 			if (in_nullhost(ia->ia_addr.sin_addr))
    355  1.57       tls 				goto ours;
    356   1.1       cgd 		}
    357   1.1       cgd 	}
    358  1.18   mycroft 	if (IN_MULTICAST(ip->ip_dst.s_addr)) {
    359   1.4   hpeyerl 		struct in_multi *inm;
    360   1.4   hpeyerl #ifdef MROUTING
    361   1.4   hpeyerl 		extern struct socket *ip_mrouter;
    362  1.10    brezak 
    363  1.10    brezak 		if (m->m_flags & M_EXT) {
    364  1.10    brezak 			if ((m = m_pullup(m, hlen)) == 0) {
    365  1.10    brezak 				ipstat.ips_toosmall++;
    366  1.10    brezak 				goto next;
    367  1.10    brezak 			}
    368  1.10    brezak 			ip = mtod(m, struct ip *);
    369  1.10    brezak 		}
    370   1.4   hpeyerl 
    371   1.4   hpeyerl 		if (ip_mrouter) {
    372   1.4   hpeyerl 			/*
    373   1.4   hpeyerl 			 * If we are acting as a multicast router, all
    374   1.4   hpeyerl 			 * incoming multicast packets are passed to the
    375   1.4   hpeyerl 			 * kernel-level multicast forwarding function.
    376   1.4   hpeyerl 			 * The packet is returned (relatively) intact; if
    377   1.4   hpeyerl 			 * ip_mforward() returns a non-zero value, the packet
    378   1.4   hpeyerl 			 * must be discarded, else it may be accepted below.
    379   1.4   hpeyerl 			 *
    380   1.4   hpeyerl 			 * (The IP ident field is put in the same byte order
    381   1.4   hpeyerl 			 * as expected when ip_mforward() is called from
    382   1.4   hpeyerl 			 * ip_output().)
    383   1.4   hpeyerl 			 */
    384   1.4   hpeyerl 			ip->ip_id = htons(ip->ip_id);
    385  1.13   mycroft 			if (ip_mforward(m, m->m_pkthdr.rcvif) != 0) {
    386  1.13   mycroft 				ipstat.ips_cantforward++;
    387   1.4   hpeyerl 				m_freem(m);
    388   1.4   hpeyerl 				goto next;
    389   1.4   hpeyerl 			}
    390   1.4   hpeyerl 			ip->ip_id = ntohs(ip->ip_id);
    391   1.4   hpeyerl 
    392   1.4   hpeyerl 			/*
    393   1.4   hpeyerl 			 * The process-level routing demon needs to receive
    394   1.4   hpeyerl 			 * all multicast IGMP packets, whether or not this
    395   1.4   hpeyerl 			 * host belongs to their destination groups.
    396   1.4   hpeyerl 			 */
    397   1.4   hpeyerl 			if (ip->ip_p == IPPROTO_IGMP)
    398   1.4   hpeyerl 				goto ours;
    399  1.13   mycroft 			ipstat.ips_forward++;
    400   1.4   hpeyerl 		}
    401   1.4   hpeyerl #endif
    402   1.4   hpeyerl 		/*
    403   1.4   hpeyerl 		 * See if we belong to the destination multicast group on the
    404   1.4   hpeyerl 		 * arrival interface.
    405   1.4   hpeyerl 		 */
    406   1.4   hpeyerl 		IN_LOOKUP_MULTI(ip->ip_dst, m->m_pkthdr.rcvif, inm);
    407   1.4   hpeyerl 		if (inm == NULL) {
    408  1.13   mycroft 			ipstat.ips_cantforward++;
    409   1.4   hpeyerl 			m_freem(m);
    410   1.4   hpeyerl 			goto next;
    411   1.4   hpeyerl 		}
    412   1.4   hpeyerl 		goto ours;
    413   1.4   hpeyerl 	}
    414  1.19   mycroft 	if (ip->ip_dst.s_addr == INADDR_BROADCAST ||
    415  1.35   mycroft 	    in_nullhost(ip->ip_dst))
    416   1.1       cgd 		goto ours;
    417   1.1       cgd 
    418   1.1       cgd 	/*
    419   1.1       cgd 	 * Not for us; forward if possible and desirable.
    420   1.1       cgd 	 */
    421   1.1       cgd 	if (ipforwarding == 0) {
    422   1.1       cgd 		ipstat.ips_cantforward++;
    423   1.1       cgd 		m_freem(m);
    424   1.1       cgd 	} else
    425   1.1       cgd 		ip_forward(m, 0);
    426   1.1       cgd 	goto next;
    427   1.1       cgd 
    428   1.1       cgd ours:
    429   1.1       cgd 	/*
    430   1.1       cgd 	 * If offset or IP_MF are set, must reassemble.
    431   1.1       cgd 	 * Otherwise, nothing need be done.
    432   1.1       cgd 	 * (We could look in the reassembly queue to see
    433   1.1       cgd 	 * if the packet was previously fragmented,
    434   1.1       cgd 	 * but it's not worth the time; just let them time out.)
    435   1.1       cgd 	 */
    436  1.37     perry 	if (ip->ip_off & ~(IP_DF|IP_RF)) {
    437   1.1       cgd 		/*
    438   1.1       cgd 		 * Look for queue of fragments
    439   1.1       cgd 		 * of this datagram.
    440   1.1       cgd 		 */
    441  1.25       cgd 		for (fp = ipq.lh_first; fp != NULL; fp = fp->ipq_q.le_next)
    442   1.1       cgd 			if (ip->ip_id == fp->ipq_id &&
    443  1.35   mycroft 			    in_hosteq(ip->ip_src, fp->ipq_src) &&
    444  1.35   mycroft 			    in_hosteq(ip->ip_dst, fp->ipq_dst) &&
    445   1.1       cgd 			    ip->ip_p == fp->ipq_p)
    446   1.1       cgd 				goto found;
    447   1.1       cgd 		fp = 0;
    448   1.1       cgd found:
    449   1.1       cgd 
    450   1.1       cgd 		/*
    451   1.1       cgd 		 * Adjust ip_len to not reflect header,
    452  1.25       cgd 		 * set ipqe_mff if more fragments are expected,
    453   1.1       cgd 		 * convert offset of this to bytes.
    454   1.1       cgd 		 */
    455   1.1       cgd 		ip->ip_len -= hlen;
    456  1.25       cgd 		mff = (ip->ip_off & IP_MF) != 0;
    457  1.25       cgd 		if (mff) {
    458  1.16       cgd 		        /*
    459  1.16       cgd 		         * Make sure that fragments have a data length
    460  1.16       cgd 			 * that's a non-zero multiple of 8 bytes.
    461  1.16       cgd 		         */
    462  1.17       cgd 			if (ip->ip_len == 0 || (ip->ip_len & 0x7) != 0) {
    463  1.16       cgd 				ipstat.ips_badfrags++;
    464  1.16       cgd 				goto bad;
    465  1.16       cgd 			}
    466  1.16       cgd 		}
    467   1.1       cgd 		ip->ip_off <<= 3;
    468   1.1       cgd 
    469   1.1       cgd 		/*
    470   1.1       cgd 		 * If datagram marked as having more fragments
    471   1.1       cgd 		 * or if this is not the first fragment,
    472   1.1       cgd 		 * attempt reassembly; if it succeeds, proceed.
    473   1.1       cgd 		 */
    474  1.25       cgd 		if (mff || ip->ip_off) {
    475   1.1       cgd 			ipstat.ips_fragments++;
    476  1.25       cgd 			MALLOC(ipqe, struct ipqent *, sizeof (struct ipqent),
    477  1.25       cgd 			    M_IPQ, M_NOWAIT);
    478  1.25       cgd 			if (ipqe == NULL) {
    479  1.25       cgd 				ipstat.ips_rcvmemdrop++;
    480  1.25       cgd 				goto bad;
    481  1.25       cgd 			}
    482  1.25       cgd 			ipqe->ipqe_mff = mff;
    483  1.50   thorpej 			ipqe->ipqe_m = m;
    484  1.25       cgd 			ipqe->ipqe_ip = ip;
    485  1.50   thorpej 			m = ip_reass(ipqe, fp);
    486  1.50   thorpej 			if (m == 0)
    487   1.1       cgd 				goto next;
    488  1.13   mycroft 			ipstat.ips_reassembled++;
    489  1.50   thorpej 			ip = mtod(m, struct ip *);
    490   1.1       cgd 		} else
    491   1.1       cgd 			if (fp)
    492   1.1       cgd 				ip_freef(fp);
    493   1.1       cgd 	} else
    494   1.1       cgd 		ip->ip_len -= hlen;
    495   1.1       cgd 
    496   1.1       cgd 	/*
    497   1.1       cgd 	 * Switch out to protocol's input routine.
    498   1.1       cgd 	 */
    499   1.1       cgd 	ipstat.ips_delivered++;
    500   1.1       cgd 	(*inetsw[ip_protox[ip->ip_p]].pr_input)(m, hlen);
    501   1.1       cgd 	goto next;
    502   1.1       cgd bad:
    503   1.1       cgd 	m_freem(m);
    504   1.1       cgd 	goto next;
    505   1.1       cgd }
    506   1.1       cgd 
    507   1.1       cgd /*
    508   1.1       cgd  * Take incoming datagram fragment and try to
    509   1.1       cgd  * reassemble it into whole datagram.  If a chain for
    510   1.1       cgd  * reassembly of this datagram already exists, then it
    511   1.1       cgd  * is given as fp; otherwise have to make a chain.
    512   1.1       cgd  */
    513  1.50   thorpej struct mbuf *
    514  1.25       cgd ip_reass(ipqe, fp)
    515  1.25       cgd 	register struct ipqent *ipqe;
    516   1.1       cgd 	register struct ipq *fp;
    517   1.1       cgd {
    518  1.50   thorpej 	register struct mbuf *m = ipqe->ipqe_m;
    519  1.25       cgd 	register struct ipqent *nq, *p, *q;
    520  1.25       cgd 	struct ip *ip;
    521   1.1       cgd 	struct mbuf *t;
    522  1.25       cgd 	int hlen = ipqe->ipqe_ip->ip_hl << 2;
    523   1.1       cgd 	int i, next;
    524   1.1       cgd 
    525   1.1       cgd 	/*
    526   1.1       cgd 	 * Presence of header sizes in mbufs
    527   1.1       cgd 	 * would confuse code below.
    528   1.1       cgd 	 */
    529   1.1       cgd 	m->m_data += hlen;
    530   1.1       cgd 	m->m_len -= hlen;
    531   1.1       cgd 
    532   1.1       cgd 	/*
    533   1.1       cgd 	 * If first fragment to arrive, create a reassembly queue.
    534   1.1       cgd 	 */
    535   1.1       cgd 	if (fp == 0) {
    536  1.50   thorpej 		MALLOC(fp, struct ipq *, sizeof (struct ipq),
    537  1.50   thorpej 		    M_FTABLE, M_NOWAIT);
    538  1.50   thorpej 		if (fp == NULL)
    539   1.1       cgd 			goto dropfrag;
    540  1.25       cgd 		LIST_INSERT_HEAD(&ipq, fp, ipq_q);
    541   1.1       cgd 		fp->ipq_ttl = IPFRAGTTL;
    542  1.25       cgd 		fp->ipq_p = ipqe->ipqe_ip->ip_p;
    543  1.25       cgd 		fp->ipq_id = ipqe->ipqe_ip->ip_id;
    544  1.25       cgd 		LIST_INIT(&fp->ipq_fragq);
    545  1.25       cgd 		fp->ipq_src = ipqe->ipqe_ip->ip_src;
    546  1.25       cgd 		fp->ipq_dst = ipqe->ipqe_ip->ip_dst;
    547  1.25       cgd 		p = NULL;
    548   1.1       cgd 		goto insert;
    549   1.1       cgd 	}
    550   1.1       cgd 
    551   1.1       cgd 	/*
    552   1.1       cgd 	 * Find a segment which begins after this one does.
    553   1.1       cgd 	 */
    554  1.25       cgd 	for (p = NULL, q = fp->ipq_fragq.lh_first; q != NULL;
    555  1.25       cgd 	    p = q, q = q->ipqe_q.le_next)
    556  1.25       cgd 		if (q->ipqe_ip->ip_off > ipqe->ipqe_ip->ip_off)
    557   1.1       cgd 			break;
    558   1.1       cgd 
    559   1.1       cgd 	/*
    560   1.1       cgd 	 * If there is a preceding segment, it may provide some of
    561   1.1       cgd 	 * our data already.  If so, drop the data from the incoming
    562   1.1       cgd 	 * segment.  If it provides all of our data, drop us.
    563   1.1       cgd 	 */
    564  1.25       cgd 	if (p != NULL) {
    565  1.25       cgd 		i = p->ipqe_ip->ip_off + p->ipqe_ip->ip_len -
    566  1.25       cgd 		    ipqe->ipqe_ip->ip_off;
    567   1.1       cgd 		if (i > 0) {
    568  1.25       cgd 			if (i >= ipqe->ipqe_ip->ip_len)
    569   1.1       cgd 				goto dropfrag;
    570  1.50   thorpej 			m_adj(ipqe->ipqe_m, i);
    571  1.25       cgd 			ipqe->ipqe_ip->ip_off += i;
    572  1.25       cgd 			ipqe->ipqe_ip->ip_len -= i;
    573   1.1       cgd 		}
    574   1.1       cgd 	}
    575   1.1       cgd 
    576   1.1       cgd 	/*
    577   1.1       cgd 	 * While we overlap succeeding segments trim them or,
    578   1.1       cgd 	 * if they are completely covered, dequeue them.
    579   1.1       cgd 	 */
    580  1.25       cgd 	for (; q != NULL && ipqe->ipqe_ip->ip_off + ipqe->ipqe_ip->ip_len >
    581  1.25       cgd 	    q->ipqe_ip->ip_off; q = nq) {
    582  1.25       cgd 		i = (ipqe->ipqe_ip->ip_off + ipqe->ipqe_ip->ip_len) -
    583  1.25       cgd 		    q->ipqe_ip->ip_off;
    584  1.25       cgd 		if (i < q->ipqe_ip->ip_len) {
    585  1.25       cgd 			q->ipqe_ip->ip_len -= i;
    586  1.25       cgd 			q->ipqe_ip->ip_off += i;
    587  1.50   thorpej 			m_adj(q->ipqe_m, i);
    588   1.1       cgd 			break;
    589   1.1       cgd 		}
    590  1.25       cgd 		nq = q->ipqe_q.le_next;
    591  1.50   thorpej 		m_freem(q->ipqe_m);
    592  1.25       cgd 		LIST_REMOVE(q, ipqe_q);
    593  1.25       cgd 		FREE(q, M_IPQ);
    594   1.1       cgd 	}
    595   1.1       cgd 
    596   1.1       cgd insert:
    597   1.1       cgd 	/*
    598   1.1       cgd 	 * Stick new segment in its place;
    599   1.1       cgd 	 * check for complete reassembly.
    600   1.1       cgd 	 */
    601  1.25       cgd 	if (p == NULL) {
    602  1.25       cgd 		LIST_INSERT_HEAD(&fp->ipq_fragq, ipqe, ipqe_q);
    603  1.25       cgd 	} else {
    604  1.25       cgd 		LIST_INSERT_AFTER(p, ipqe, ipqe_q);
    605  1.25       cgd 	}
    606   1.1       cgd 	next = 0;
    607  1.25       cgd 	for (p = NULL, q = fp->ipq_fragq.lh_first; q != NULL;
    608  1.25       cgd 	    p = q, q = q->ipqe_q.le_next) {
    609  1.25       cgd 		if (q->ipqe_ip->ip_off != next)
    610   1.1       cgd 			return (0);
    611  1.25       cgd 		next += q->ipqe_ip->ip_len;
    612   1.1       cgd 	}
    613  1.25       cgd 	if (p->ipqe_mff)
    614   1.1       cgd 		return (0);
    615   1.1       cgd 
    616   1.1       cgd 	/*
    617  1.41   thorpej 	 * Reassembly is complete.  Check for a bogus message size and
    618  1.41   thorpej 	 * concatenate fragments.
    619   1.1       cgd 	 */
    620  1.25       cgd 	q = fp->ipq_fragq.lh_first;
    621  1.25       cgd 	ip = q->ipqe_ip;
    622  1.41   thorpej 	if ((next + (ip->ip_hl << 2)) > IP_MAXPACKET) {
    623  1.41   thorpej 		ipstat.ips_toolong++;
    624  1.41   thorpej 		ip_freef(fp);
    625  1.41   thorpej 		return (0);
    626  1.41   thorpej 	}
    627  1.50   thorpej 	m = q->ipqe_m;
    628   1.1       cgd 	t = m->m_next;
    629   1.1       cgd 	m->m_next = 0;
    630   1.1       cgd 	m_cat(m, t);
    631  1.25       cgd 	nq = q->ipqe_q.le_next;
    632  1.25       cgd 	FREE(q, M_IPQ);
    633  1.25       cgd 	for (q = nq; q != NULL; q = nq) {
    634  1.50   thorpej 		t = q->ipqe_m;
    635  1.25       cgd 		nq = q->ipqe_q.le_next;
    636  1.25       cgd 		FREE(q, M_IPQ);
    637   1.1       cgd 		m_cat(m, t);
    638   1.1       cgd 	}
    639   1.1       cgd 
    640   1.1       cgd 	/*
    641   1.1       cgd 	 * Create header for new ip packet by
    642   1.1       cgd 	 * modifying header of first packet;
    643   1.1       cgd 	 * dequeue and discard fragment reassembly header.
    644   1.1       cgd 	 * Make header visible.
    645   1.1       cgd 	 */
    646   1.1       cgd 	ip->ip_len = next;
    647  1.25       cgd 	ip->ip_src = fp->ipq_src;
    648  1.25       cgd 	ip->ip_dst = fp->ipq_dst;
    649  1.25       cgd 	LIST_REMOVE(fp, ipq_q);
    650  1.50   thorpej 	FREE(fp, M_FTABLE);
    651   1.1       cgd 	m->m_len += (ip->ip_hl << 2);
    652   1.1       cgd 	m->m_data -= (ip->ip_hl << 2);
    653   1.1       cgd 	/* some debugging cruft by sklower, below, will go away soon */
    654   1.1       cgd 	if (m->m_flags & M_PKTHDR) { /* XXX this should be done elsewhere */
    655   1.1       cgd 		register int plen = 0;
    656  1.50   thorpej 		for (t = m; t; t = t->m_next)
    657  1.50   thorpej 			plen += t->m_len;
    658  1.50   thorpej 		m->m_pkthdr.len = plen;
    659   1.1       cgd 	}
    660  1.50   thorpej 	return (m);
    661   1.1       cgd 
    662   1.1       cgd dropfrag:
    663   1.1       cgd 	ipstat.ips_fragdropped++;
    664   1.1       cgd 	m_freem(m);
    665  1.25       cgd 	FREE(ipqe, M_IPQ);
    666   1.1       cgd 	return (0);
    667   1.1       cgd }
    668   1.1       cgd 
    669   1.1       cgd /*
    670   1.1       cgd  * Free a fragment reassembly header and all
    671   1.1       cgd  * associated datagrams.
    672   1.1       cgd  */
    673   1.8   mycroft void
    674   1.1       cgd ip_freef(fp)
    675   1.1       cgd 	struct ipq *fp;
    676   1.1       cgd {
    677  1.25       cgd 	register struct ipqent *q, *p;
    678   1.1       cgd 
    679  1.25       cgd 	for (q = fp->ipq_fragq.lh_first; q != NULL; q = p) {
    680  1.25       cgd 		p = q->ipqe_q.le_next;
    681  1.50   thorpej 		m_freem(q->ipqe_m);
    682  1.25       cgd 		LIST_REMOVE(q, ipqe_q);
    683  1.25       cgd 		FREE(q, M_IPQ);
    684   1.1       cgd 	}
    685  1.25       cgd 	LIST_REMOVE(fp, ipq_q);
    686  1.50   thorpej 	FREE(fp, M_FTABLE);
    687   1.1       cgd }
    688   1.1       cgd 
    689   1.1       cgd /*
    690   1.1       cgd  * IP timer processing;
    691   1.1       cgd  * if a timer expires on a reassembly
    692   1.1       cgd  * queue, discard it.
    693   1.1       cgd  */
    694   1.8   mycroft void
    695   1.1       cgd ip_slowtimo()
    696   1.1       cgd {
    697  1.25       cgd 	register struct ipq *fp, *nfp;
    698  1.24   mycroft 	int s = splsoftnet();
    699   1.1       cgd 
    700  1.25       cgd 	for (fp = ipq.lh_first; fp != NULL; fp = nfp) {
    701  1.25       cgd 		nfp = fp->ipq_q.le_next;
    702  1.25       cgd 		if (--fp->ipq_ttl == 0) {
    703   1.1       cgd 			ipstat.ips_fragtimeout++;
    704  1.25       cgd 			ip_freef(fp);
    705   1.1       cgd 		}
    706   1.1       cgd 	}
    707   1.1       cgd 	splx(s);
    708   1.1       cgd }
    709   1.1       cgd 
    710   1.1       cgd /*
    711   1.1       cgd  * Drain off all datagram fragments.
    712   1.1       cgd  */
    713   1.8   mycroft void
    714   1.1       cgd ip_drain()
    715   1.1       cgd {
    716   1.1       cgd 
    717  1.25       cgd 	while (ipq.lh_first != NULL) {
    718   1.1       cgd 		ipstat.ips_fragdropped++;
    719  1.25       cgd 		ip_freef(ipq.lh_first);
    720   1.1       cgd 	}
    721   1.1       cgd }
    722   1.1       cgd 
    723   1.1       cgd /*
    724   1.1       cgd  * Do option processing on a datagram,
    725   1.1       cgd  * possibly discarding it if bad options are encountered,
    726   1.1       cgd  * or forwarding it if source-routed.
    727   1.1       cgd  * Returns 1 if packet has been forwarded/freed,
    728   1.1       cgd  * 0 if the packet should be processed further.
    729   1.1       cgd  */
    730   1.8   mycroft int
    731   1.1       cgd ip_dooptions(m)
    732   1.1       cgd 	struct mbuf *m;
    733   1.1       cgd {
    734   1.1       cgd 	register struct ip *ip = mtod(m, struct ip *);
    735   1.1       cgd 	register u_char *cp;
    736   1.1       cgd 	register struct ip_timestamp *ipt;
    737   1.1       cgd 	register struct in_ifaddr *ia;
    738   1.1       cgd 	int opt, optlen, cnt, off, code, type = ICMP_PARAMPROB, forward = 0;
    739  1.13   mycroft 	struct in_addr *sin, dst;
    740   1.1       cgd 	n_time ntime;
    741   1.1       cgd 
    742  1.13   mycroft 	dst = ip->ip_dst;
    743   1.1       cgd 	cp = (u_char *)(ip + 1);
    744   1.1       cgd 	cnt = (ip->ip_hl << 2) - sizeof (struct ip);
    745   1.1       cgd 	for (; cnt > 0; cnt -= optlen, cp += optlen) {
    746   1.1       cgd 		opt = cp[IPOPT_OPTVAL];
    747   1.1       cgd 		if (opt == IPOPT_EOL)
    748   1.1       cgd 			break;
    749   1.1       cgd 		if (opt == IPOPT_NOP)
    750   1.1       cgd 			optlen = 1;
    751   1.1       cgd 		else {
    752   1.1       cgd 			optlen = cp[IPOPT_OLEN];
    753   1.1       cgd 			if (optlen <= 0 || optlen > cnt) {
    754   1.1       cgd 				code = &cp[IPOPT_OLEN] - (u_char *)ip;
    755   1.1       cgd 				goto bad;
    756   1.1       cgd 			}
    757   1.1       cgd 		}
    758   1.1       cgd 		switch (opt) {
    759   1.1       cgd 
    760   1.1       cgd 		default:
    761   1.1       cgd 			break;
    762   1.1       cgd 
    763   1.1       cgd 		/*
    764   1.1       cgd 		 * Source routing with record.
    765   1.1       cgd 		 * Find interface with current destination address.
    766   1.1       cgd 		 * If none on this machine then drop if strictly routed,
    767   1.1       cgd 		 * or do nothing if loosely routed.
    768   1.1       cgd 		 * Record interface address and bring up next address
    769   1.1       cgd 		 * component.  If strictly routed make sure next
    770   1.1       cgd 		 * address is on directly accessible net.
    771   1.1       cgd 		 */
    772   1.1       cgd 		case IPOPT_LSRR:
    773   1.1       cgd 		case IPOPT_SSRR:
    774  1.47       cjs 			if (ip_allowsrcrt == 0) {
    775  1.47       cjs 				type = ICMP_UNREACH;
    776  1.47       cjs 				code = ICMP_UNREACH_NET_PROHIB;
    777  1.47       cjs 				goto bad;
    778  1.47       cjs 			}
    779   1.1       cgd 			if ((off = cp[IPOPT_OFFSET]) < IPOPT_MINOFF) {
    780   1.1       cgd 				code = &cp[IPOPT_OFFSET] - (u_char *)ip;
    781   1.1       cgd 				goto bad;
    782   1.1       cgd 			}
    783   1.1       cgd 			ipaddr.sin_addr = ip->ip_dst;
    784  1.19   mycroft 			ia = ifatoia(ifa_ifwithaddr(sintosa(&ipaddr)));
    785   1.1       cgd 			if (ia == 0) {
    786   1.1       cgd 				if (opt == IPOPT_SSRR) {
    787   1.1       cgd 					type = ICMP_UNREACH;
    788   1.1       cgd 					code = ICMP_UNREACH_SRCFAIL;
    789   1.1       cgd 					goto bad;
    790   1.1       cgd 				}
    791   1.1       cgd 				/*
    792   1.1       cgd 				 * Loose routing, and not at next destination
    793   1.1       cgd 				 * yet; nothing to do except forward.
    794   1.1       cgd 				 */
    795   1.1       cgd 				break;
    796   1.1       cgd 			}
    797   1.1       cgd 			off--;			/* 0 origin */
    798   1.1       cgd 			if (off > optlen - sizeof(struct in_addr)) {
    799   1.1       cgd 				/*
    800   1.1       cgd 				 * End of source route.  Should be for us.
    801   1.1       cgd 				 */
    802   1.1       cgd 				save_rte(cp, ip->ip_src);
    803   1.1       cgd 				break;
    804   1.1       cgd 			}
    805   1.1       cgd 			/*
    806   1.1       cgd 			 * locate outgoing interface
    807   1.1       cgd 			 */
    808   1.1       cgd 			bcopy((caddr_t)(cp + off), (caddr_t)&ipaddr.sin_addr,
    809   1.1       cgd 			    sizeof(ipaddr.sin_addr));
    810   1.1       cgd 			if (opt == IPOPT_SSRR) {
    811   1.1       cgd #define	INA	struct in_ifaddr *
    812   1.1       cgd #define	SA	struct sockaddr *
    813  1.29       mrg 			    ia = (INA)ifa_ifwithladdr((SA)&ipaddr);
    814   1.1       cgd 			} else
    815   1.1       cgd 				ia = ip_rtaddr(ipaddr.sin_addr);
    816   1.1       cgd 			if (ia == 0) {
    817   1.1       cgd 				type = ICMP_UNREACH;
    818   1.1       cgd 				code = ICMP_UNREACH_SRCFAIL;
    819   1.1       cgd 				goto bad;
    820   1.1       cgd 			}
    821   1.1       cgd 			ip->ip_dst = ipaddr.sin_addr;
    822  1.20   mycroft 			bcopy((caddr_t)&ia->ia_addr.sin_addr,
    823   1.1       cgd 			    (caddr_t)(cp + off), sizeof(struct in_addr));
    824   1.1       cgd 			cp[IPOPT_OFFSET] += sizeof(struct in_addr);
    825  1.13   mycroft 			/*
    826  1.13   mycroft 			 * Let ip_intr's mcast routing check handle mcast pkts
    827  1.13   mycroft 			 */
    828  1.18   mycroft 			forward = !IN_MULTICAST(ip->ip_dst.s_addr);
    829   1.1       cgd 			break;
    830   1.1       cgd 
    831   1.1       cgd 		case IPOPT_RR:
    832   1.1       cgd 			if ((off = cp[IPOPT_OFFSET]) < IPOPT_MINOFF) {
    833   1.1       cgd 				code = &cp[IPOPT_OFFSET] - (u_char *)ip;
    834   1.1       cgd 				goto bad;
    835   1.1       cgd 			}
    836   1.1       cgd 			/*
    837   1.1       cgd 			 * If no space remains, ignore.
    838   1.1       cgd 			 */
    839   1.1       cgd 			off--;			/* 0 origin */
    840   1.1       cgd 			if (off > optlen - sizeof(struct in_addr))
    841   1.1       cgd 				break;
    842   1.1       cgd 			bcopy((caddr_t)(&ip->ip_dst), (caddr_t)&ipaddr.sin_addr,
    843   1.1       cgd 			    sizeof(ipaddr.sin_addr));
    844   1.1       cgd 			/*
    845   1.1       cgd 			 * locate outgoing interface; if we're the destination,
    846   1.1       cgd 			 * use the incoming interface (should be same).
    847   1.1       cgd 			 */
    848   1.1       cgd 			if ((ia = (INA)ifa_ifwithaddr((SA)&ipaddr)) == 0 &&
    849   1.1       cgd 			    (ia = ip_rtaddr(ipaddr.sin_addr)) == 0) {
    850   1.1       cgd 				type = ICMP_UNREACH;
    851   1.1       cgd 				code = ICMP_UNREACH_HOST;
    852   1.1       cgd 				goto bad;
    853   1.1       cgd 			}
    854  1.20   mycroft 			bcopy((caddr_t)&ia->ia_addr.sin_addr,
    855   1.1       cgd 			    (caddr_t)(cp + off), sizeof(struct in_addr));
    856   1.1       cgd 			cp[IPOPT_OFFSET] += sizeof(struct in_addr);
    857   1.1       cgd 			break;
    858   1.1       cgd 
    859   1.1       cgd 		case IPOPT_TS:
    860   1.1       cgd 			code = cp - (u_char *)ip;
    861   1.1       cgd 			ipt = (struct ip_timestamp *)cp;
    862   1.1       cgd 			if (ipt->ipt_len < 5)
    863   1.1       cgd 				goto bad;
    864  1.15       cgd 			if (ipt->ipt_ptr > ipt->ipt_len - sizeof (int32_t)) {
    865   1.1       cgd 				if (++ipt->ipt_oflw == 0)
    866   1.1       cgd 					goto bad;
    867   1.1       cgd 				break;
    868   1.1       cgd 			}
    869   1.1       cgd 			sin = (struct in_addr *)(cp + ipt->ipt_ptr - 1);
    870   1.1       cgd 			switch (ipt->ipt_flg) {
    871   1.1       cgd 
    872   1.1       cgd 			case IPOPT_TS_TSONLY:
    873   1.1       cgd 				break;
    874   1.1       cgd 
    875   1.1       cgd 			case IPOPT_TS_TSANDADDR:
    876   1.1       cgd 				if (ipt->ipt_ptr + sizeof(n_time) +
    877   1.1       cgd 				    sizeof(struct in_addr) > ipt->ipt_len)
    878   1.1       cgd 					goto bad;
    879  1.13   mycroft 				ipaddr.sin_addr = dst;
    880  1.13   mycroft 				ia = (INA)ifaof_ifpforaddr((SA)&ipaddr,
    881  1.13   mycroft 							    m->m_pkthdr.rcvif);
    882  1.13   mycroft 				if (ia == 0)
    883  1.13   mycroft 					continue;
    884  1.20   mycroft 				bcopy((caddr_t)&ia->ia_addr.sin_addr,
    885   1.1       cgd 				    (caddr_t)sin, sizeof(struct in_addr));
    886   1.1       cgd 				ipt->ipt_ptr += sizeof(struct in_addr);
    887   1.1       cgd 				break;
    888   1.1       cgd 
    889   1.1       cgd 			case IPOPT_TS_PRESPEC:
    890   1.1       cgd 				if (ipt->ipt_ptr + sizeof(n_time) +
    891   1.1       cgd 				    sizeof(struct in_addr) > ipt->ipt_len)
    892   1.1       cgd 					goto bad;
    893   1.1       cgd 				bcopy((caddr_t)sin, (caddr_t)&ipaddr.sin_addr,
    894   1.1       cgd 				    sizeof(struct in_addr));
    895   1.1       cgd 				if (ifa_ifwithaddr((SA)&ipaddr) == 0)
    896   1.1       cgd 					continue;
    897   1.1       cgd 				ipt->ipt_ptr += sizeof(struct in_addr);
    898   1.1       cgd 				break;
    899   1.1       cgd 
    900   1.1       cgd 			default:
    901   1.1       cgd 				goto bad;
    902   1.1       cgd 			}
    903   1.1       cgd 			ntime = iptime();
    904   1.1       cgd 			bcopy((caddr_t)&ntime, (caddr_t)cp + ipt->ipt_ptr - 1,
    905   1.1       cgd 			    sizeof(n_time));
    906   1.1       cgd 			ipt->ipt_ptr += sizeof(n_time);
    907   1.1       cgd 		}
    908   1.1       cgd 	}
    909   1.1       cgd 	if (forward) {
    910  1.26   thorpej 		if (ip_forwsrcrt == 0) {
    911  1.26   thorpej 			type = ICMP_UNREACH;
    912  1.26   thorpej 			code = ICMP_UNREACH_SRCFAIL;
    913  1.26   thorpej 			goto bad;
    914  1.26   thorpej 		}
    915   1.1       cgd 		ip_forward(m, 1);
    916   1.1       cgd 		return (1);
    917  1.13   mycroft 	}
    918  1.13   mycroft 	return (0);
    919   1.1       cgd bad:
    920  1.13   mycroft 	ip->ip_len -= ip->ip_hl << 2;   /* XXX icmp_error adds in hdr length */
    921  1.13   mycroft 	icmp_error(m, type, code, 0, 0);
    922  1.13   mycroft 	ipstat.ips_badoptions++;
    923   1.1       cgd 	return (1);
    924   1.1       cgd }
    925   1.1       cgd 
    926   1.1       cgd /*
    927   1.1       cgd  * Given address of next destination (final or next hop),
    928   1.1       cgd  * return internet address info of interface to be used to get there.
    929   1.1       cgd  */
    930   1.1       cgd struct in_ifaddr *
    931   1.1       cgd ip_rtaddr(dst)
    932   1.1       cgd 	 struct in_addr dst;
    933   1.1       cgd {
    934   1.1       cgd 	register struct sockaddr_in *sin;
    935   1.1       cgd 
    936  1.19   mycroft 	sin = satosin(&ipforward_rt.ro_dst);
    937   1.1       cgd 
    938  1.35   mycroft 	if (ipforward_rt.ro_rt == 0 || !in_hosteq(dst, sin->sin_addr)) {
    939   1.1       cgd 		if (ipforward_rt.ro_rt) {
    940   1.1       cgd 			RTFREE(ipforward_rt.ro_rt);
    941   1.1       cgd 			ipforward_rt.ro_rt = 0;
    942   1.1       cgd 		}
    943   1.1       cgd 		sin->sin_family = AF_INET;
    944   1.1       cgd 		sin->sin_len = sizeof(*sin);
    945   1.1       cgd 		sin->sin_addr = dst;
    946   1.1       cgd 
    947   1.1       cgd 		rtalloc(&ipforward_rt);
    948   1.1       cgd 	}
    949   1.1       cgd 	if (ipforward_rt.ro_rt == 0)
    950   1.1       cgd 		return ((struct in_ifaddr *)0);
    951  1.19   mycroft 	return (ifatoia(ipforward_rt.ro_rt->rt_ifa));
    952   1.1       cgd }
    953   1.1       cgd 
    954   1.1       cgd /*
    955   1.1       cgd  * Save incoming source route for use in replies,
    956   1.1       cgd  * to be picked up later by ip_srcroute if the receiver is interested.
    957   1.1       cgd  */
    958  1.13   mycroft void
    959   1.1       cgd save_rte(option, dst)
    960   1.1       cgd 	u_char *option;
    961   1.1       cgd 	struct in_addr dst;
    962   1.1       cgd {
    963   1.1       cgd 	unsigned olen;
    964   1.1       cgd 
    965   1.1       cgd 	olen = option[IPOPT_OLEN];
    966   1.1       cgd #ifdef DIAGNOSTIC
    967   1.1       cgd 	if (ipprintfs)
    968  1.39  christos 		printf("save_rte: olen %d\n", olen);
    969   1.1       cgd #endif
    970   1.1       cgd 	if (olen > sizeof(ip_srcrt) - (1 + sizeof(dst)))
    971   1.1       cgd 		return;
    972   1.1       cgd 	bcopy((caddr_t)option, (caddr_t)ip_srcrt.srcopt, olen);
    973   1.1       cgd 	ip_nhops = (olen - IPOPT_OFFSET - 1) / sizeof(struct in_addr);
    974   1.1       cgd 	ip_srcrt.dst = dst;
    975   1.1       cgd }
    976   1.1       cgd 
    977   1.1       cgd /*
    978   1.1       cgd  * Retrieve incoming source route for use in replies,
    979   1.1       cgd  * in the same form used by setsockopt.
    980   1.1       cgd  * The first hop is placed before the options, will be removed later.
    981   1.1       cgd  */
    982   1.1       cgd struct mbuf *
    983   1.1       cgd ip_srcroute()
    984   1.1       cgd {
    985   1.1       cgd 	register struct in_addr *p, *q;
    986   1.1       cgd 	register struct mbuf *m;
    987   1.1       cgd 
    988   1.1       cgd 	if (ip_nhops == 0)
    989   1.1       cgd 		return ((struct mbuf *)0);
    990   1.1       cgd 	m = m_get(M_DONTWAIT, MT_SOOPTS);
    991   1.1       cgd 	if (m == 0)
    992   1.1       cgd 		return ((struct mbuf *)0);
    993   1.1       cgd 
    994  1.13   mycroft #define OPTSIZ	(sizeof(ip_srcrt.nop) + sizeof(ip_srcrt.srcopt))
    995   1.1       cgd 
    996   1.1       cgd 	/* length is (nhops+1)*sizeof(addr) + sizeof(nop + srcrt header) */
    997   1.1       cgd 	m->m_len = ip_nhops * sizeof(struct in_addr) + sizeof(struct in_addr) +
    998   1.1       cgd 	    OPTSIZ;
    999   1.1       cgd #ifdef DIAGNOSTIC
   1000   1.1       cgd 	if (ipprintfs)
   1001  1.39  christos 		printf("ip_srcroute: nhops %d mlen %d", ip_nhops, m->m_len);
   1002   1.1       cgd #endif
   1003   1.1       cgd 
   1004   1.1       cgd 	/*
   1005   1.1       cgd 	 * First save first hop for return route
   1006   1.1       cgd 	 */
   1007   1.1       cgd 	p = &ip_srcrt.route[ip_nhops - 1];
   1008   1.1       cgd 	*(mtod(m, struct in_addr *)) = *p--;
   1009   1.1       cgd #ifdef DIAGNOSTIC
   1010   1.1       cgd 	if (ipprintfs)
   1011  1.39  christos 		printf(" hops %x", ntohl(mtod(m, struct in_addr *)->s_addr));
   1012   1.1       cgd #endif
   1013   1.1       cgd 
   1014   1.1       cgd 	/*
   1015   1.1       cgd 	 * Copy option fields and padding (nop) to mbuf.
   1016   1.1       cgd 	 */
   1017   1.1       cgd 	ip_srcrt.nop = IPOPT_NOP;
   1018   1.1       cgd 	ip_srcrt.srcopt[IPOPT_OFFSET] = IPOPT_MINOFF;
   1019   1.1       cgd 	bcopy((caddr_t)&ip_srcrt.nop,
   1020   1.1       cgd 	    mtod(m, caddr_t) + sizeof(struct in_addr), OPTSIZ);
   1021   1.1       cgd 	q = (struct in_addr *)(mtod(m, caddr_t) +
   1022   1.1       cgd 	    sizeof(struct in_addr) + OPTSIZ);
   1023   1.1       cgd #undef OPTSIZ
   1024   1.1       cgd 	/*
   1025   1.1       cgd 	 * Record return path as an IP source route,
   1026   1.1       cgd 	 * reversing the path (pointers are now aligned).
   1027   1.1       cgd 	 */
   1028   1.1       cgd 	while (p >= ip_srcrt.route) {
   1029   1.1       cgd #ifdef DIAGNOSTIC
   1030   1.1       cgd 		if (ipprintfs)
   1031  1.39  christos 			printf(" %x", ntohl(q->s_addr));
   1032   1.1       cgd #endif
   1033   1.1       cgd 		*q++ = *p--;
   1034   1.1       cgd 	}
   1035   1.1       cgd 	/*
   1036   1.1       cgd 	 * Last hop goes to final destination.
   1037   1.1       cgd 	 */
   1038   1.1       cgd 	*q = ip_srcrt.dst;
   1039   1.1       cgd #ifdef DIAGNOSTIC
   1040   1.1       cgd 	if (ipprintfs)
   1041  1.39  christos 		printf(" %x\n", ntohl(q->s_addr));
   1042   1.1       cgd #endif
   1043   1.1       cgd 	return (m);
   1044   1.1       cgd }
   1045   1.1       cgd 
   1046   1.1       cgd /*
   1047   1.1       cgd  * Strip out IP options, at higher
   1048   1.1       cgd  * level protocol in the kernel.
   1049   1.1       cgd  * Second argument is buffer to which options
   1050   1.1       cgd  * will be moved, and return value is their length.
   1051   1.1       cgd  * XXX should be deleted; last arg currently ignored.
   1052   1.1       cgd  */
   1053   1.8   mycroft void
   1054   1.1       cgd ip_stripoptions(m, mopt)
   1055   1.1       cgd 	register struct mbuf *m;
   1056   1.1       cgd 	struct mbuf *mopt;
   1057   1.1       cgd {
   1058   1.1       cgd 	register int i;
   1059   1.1       cgd 	struct ip *ip = mtod(m, struct ip *);
   1060   1.1       cgd 	register caddr_t opts;
   1061   1.1       cgd 	int olen;
   1062   1.1       cgd 
   1063   1.1       cgd 	olen = (ip->ip_hl<<2) - sizeof (struct ip);
   1064   1.1       cgd 	opts = (caddr_t)(ip + 1);
   1065   1.1       cgd 	i = m->m_len - (sizeof (struct ip) + olen);
   1066   1.1       cgd 	bcopy(opts  + olen, opts, (unsigned)i);
   1067   1.1       cgd 	m->m_len -= olen;
   1068   1.1       cgd 	if (m->m_flags & M_PKTHDR)
   1069   1.1       cgd 		m->m_pkthdr.len -= olen;
   1070   1.1       cgd 	ip->ip_hl = sizeof(struct ip) >> 2;
   1071   1.1       cgd }
   1072   1.1       cgd 
   1073  1.23   mycroft int inetctlerrmap[PRC_NCMDS] = {
   1074   1.1       cgd 	0,		0,		0,		0,
   1075   1.1       cgd 	0,		EMSGSIZE,	EHOSTDOWN,	EHOSTUNREACH,
   1076   1.1       cgd 	EHOSTUNREACH,	EHOSTUNREACH,	ECONNREFUSED,	ECONNREFUSED,
   1077   1.1       cgd 	EMSGSIZE,	EHOSTUNREACH,	0,		0,
   1078   1.1       cgd 	0,		0,		0,		0,
   1079   1.1       cgd 	ENOPROTOOPT
   1080   1.1       cgd };
   1081   1.1       cgd 
   1082   1.1       cgd /*
   1083   1.1       cgd  * Forward a packet.  If some error occurs return the sender
   1084   1.1       cgd  * an icmp packet.  Note we can't always generate a meaningful
   1085   1.1       cgd  * icmp message because icmp doesn't have a large enough repertoire
   1086   1.1       cgd  * of codes and types.
   1087   1.1       cgd  *
   1088   1.1       cgd  * If not forwarding, just drop the packet.  This could be confusing
   1089   1.1       cgd  * if ipforwarding was zero but some routing protocol was advancing
   1090   1.1       cgd  * us as a gateway to somewhere.  However, we must let the routing
   1091   1.1       cgd  * protocol deal with that.
   1092   1.1       cgd  *
   1093   1.1       cgd  * The srcrt parameter indicates whether the packet is being forwarded
   1094   1.1       cgd  * via a source route.
   1095   1.1       cgd  */
   1096  1.13   mycroft void
   1097   1.1       cgd ip_forward(m, srcrt)
   1098   1.1       cgd 	struct mbuf *m;
   1099   1.1       cgd 	int srcrt;
   1100   1.1       cgd {
   1101   1.1       cgd 	register struct ip *ip = mtod(m, struct ip *);
   1102   1.1       cgd 	register struct sockaddr_in *sin;
   1103   1.1       cgd 	register struct rtentry *rt;
   1104  1.28  christos 	int error, type = 0, code = 0;
   1105   1.1       cgd 	struct mbuf *mcopy;
   1106  1.13   mycroft 	n_long dest;
   1107  1.13   mycroft 	struct ifnet *destifp;
   1108   1.1       cgd 
   1109  1.13   mycroft 	dest = 0;
   1110   1.1       cgd #ifdef DIAGNOSTIC
   1111   1.1       cgd 	if (ipprintfs)
   1112  1.39  christos 		printf("forward: src %x dst %x ttl %x\n",
   1113  1.35   mycroft 		    ip->ip_src.s_addr, ip->ip_dst.s_addr, ip->ip_ttl);
   1114   1.1       cgd #endif
   1115   1.1       cgd 	if (m->m_flags & M_BCAST || in_canforward(ip->ip_dst) == 0) {
   1116   1.1       cgd 		ipstat.ips_cantforward++;
   1117   1.1       cgd 		m_freem(m);
   1118   1.1       cgd 		return;
   1119   1.1       cgd 	}
   1120   1.1       cgd 	HTONS(ip->ip_id);
   1121   1.1       cgd 	if (ip->ip_ttl <= IPTTLDEC) {
   1122  1.13   mycroft 		icmp_error(m, ICMP_TIMXCEED, ICMP_TIMXCEED_INTRANS, dest, 0);
   1123   1.1       cgd 		return;
   1124   1.1       cgd 	}
   1125   1.1       cgd 	ip->ip_ttl -= IPTTLDEC;
   1126   1.1       cgd 
   1127  1.19   mycroft 	sin = satosin(&ipforward_rt.ro_dst);
   1128   1.1       cgd 	if ((rt = ipforward_rt.ro_rt) == 0 ||
   1129  1.35   mycroft 	    !in_hosteq(ip->ip_dst, sin->sin_addr)) {
   1130   1.1       cgd 		if (ipforward_rt.ro_rt) {
   1131   1.1       cgd 			RTFREE(ipforward_rt.ro_rt);
   1132   1.1       cgd 			ipforward_rt.ro_rt = 0;
   1133   1.1       cgd 		}
   1134   1.1       cgd 		sin->sin_family = AF_INET;
   1135  1.35   mycroft 		sin->sin_len = sizeof(struct sockaddr_in);
   1136   1.1       cgd 		sin->sin_addr = ip->ip_dst;
   1137   1.1       cgd 
   1138   1.1       cgd 		rtalloc(&ipforward_rt);
   1139   1.1       cgd 		if (ipforward_rt.ro_rt == 0) {
   1140  1.13   mycroft 			icmp_error(m, ICMP_UNREACH, ICMP_UNREACH_HOST, dest, 0);
   1141   1.1       cgd 			return;
   1142   1.1       cgd 		}
   1143   1.1       cgd 		rt = ipforward_rt.ro_rt;
   1144   1.1       cgd 	}
   1145   1.1       cgd 
   1146   1.1       cgd 	/*
   1147  1.34   mycroft 	 * Save at most 68 bytes of the packet in case
   1148   1.1       cgd 	 * we need to generate an ICMP message to the src.
   1149   1.1       cgd 	 */
   1150  1.34   mycroft 	mcopy = m_copy(m, 0, imin((int)ip->ip_len, 68));
   1151   1.1       cgd 
   1152   1.1       cgd 	/*
   1153   1.1       cgd 	 * If forwarding packet using same interface that it came in on,
   1154   1.1       cgd 	 * perhaps should send a redirect to sender to shortcut a hop.
   1155   1.1       cgd 	 * Only send redirect if source is sending directly to us,
   1156   1.1       cgd 	 * and if packet was not source routed (or has any options).
   1157   1.1       cgd 	 * Also, don't send redirect if forwarding using a default route
   1158   1.1       cgd 	 * or a route modified by a redirect.
   1159   1.1       cgd 	 */
   1160   1.1       cgd 	if (rt->rt_ifp == m->m_pkthdr.rcvif &&
   1161   1.1       cgd 	    (rt->rt_flags & (RTF_DYNAMIC|RTF_MODIFIED)) == 0 &&
   1162  1.35   mycroft 	    !in_nullhost(satosin(rt_key(rt))->sin_addr) &&
   1163   1.1       cgd 	    ipsendredirects && !srcrt) {
   1164  1.19   mycroft 		if (rt->rt_ifa &&
   1165  1.19   mycroft 		    (ip->ip_src.s_addr & ifatoia(rt->rt_ifa)->ia_subnetmask) ==
   1166  1.19   mycroft 		    ifatoia(rt->rt_ifa)->ia_subnet) {
   1167   1.1       cgd 		    if (rt->rt_flags & RTF_GATEWAY)
   1168  1.13   mycroft 			dest = satosin(rt->rt_gateway)->sin_addr.s_addr;
   1169   1.1       cgd 		    else
   1170  1.13   mycroft 			dest = ip->ip_dst.s_addr;
   1171  1.13   mycroft 		    /* Router requirements says to only send host redirects */
   1172   1.1       cgd 		    type = ICMP_REDIRECT;
   1173  1.13   mycroft 		    code = ICMP_REDIRECT_HOST;
   1174   1.1       cgd #ifdef DIAGNOSTIC
   1175   1.1       cgd 		    if (ipprintfs)
   1176  1.39  christos 		    	printf("redirect (%d) to %x\n", code, (u_int32_t)dest);
   1177   1.1       cgd #endif
   1178   1.1       cgd 		}
   1179   1.1       cgd 	}
   1180   1.1       cgd 
   1181  1.27   thorpej 	error = ip_output(m, (struct mbuf *)0, &ipforward_rt,
   1182  1.27   thorpej 	    (IP_FORWARDING | (ip_directedbcast ? IP_ALLOWBROADCAST : 0)), 0);
   1183   1.1       cgd 	if (error)
   1184   1.1       cgd 		ipstat.ips_cantforward++;
   1185   1.1       cgd 	else {
   1186   1.1       cgd 		ipstat.ips_forward++;
   1187   1.1       cgd 		if (type)
   1188   1.1       cgd 			ipstat.ips_redirectsent++;
   1189   1.1       cgd 		else {
   1190   1.1       cgd 			if (mcopy)
   1191   1.1       cgd 				m_freem(mcopy);
   1192   1.1       cgd 			return;
   1193   1.1       cgd 		}
   1194   1.1       cgd 	}
   1195   1.1       cgd 	if (mcopy == NULL)
   1196   1.1       cgd 		return;
   1197  1.13   mycroft 	destifp = NULL;
   1198  1.13   mycroft 
   1199   1.1       cgd 	switch (error) {
   1200   1.1       cgd 
   1201   1.1       cgd 	case 0:				/* forwarded, but need redirect */
   1202   1.1       cgd 		/* type, code set above */
   1203   1.1       cgd 		break;
   1204   1.1       cgd 
   1205   1.1       cgd 	case ENETUNREACH:		/* shouldn't happen, checked above */
   1206   1.1       cgd 	case EHOSTUNREACH:
   1207   1.1       cgd 	case ENETDOWN:
   1208   1.1       cgd 	case EHOSTDOWN:
   1209   1.1       cgd 	default:
   1210   1.1       cgd 		type = ICMP_UNREACH;
   1211   1.1       cgd 		code = ICMP_UNREACH_HOST;
   1212   1.1       cgd 		break;
   1213   1.1       cgd 
   1214   1.1       cgd 	case EMSGSIZE:
   1215   1.1       cgd 		type = ICMP_UNREACH;
   1216   1.1       cgd 		code = ICMP_UNREACH_NEEDFRAG;
   1217  1.13   mycroft 		if (ipforward_rt.ro_rt)
   1218  1.13   mycroft 			destifp = ipforward_rt.ro_rt->rt_ifp;
   1219   1.1       cgd 		ipstat.ips_cantfrag++;
   1220   1.1       cgd 		break;
   1221   1.1       cgd 
   1222   1.1       cgd 	case ENOBUFS:
   1223   1.1       cgd 		type = ICMP_SOURCEQUENCH;
   1224   1.1       cgd 		code = 0;
   1225   1.1       cgd 		break;
   1226   1.1       cgd 	}
   1227  1.13   mycroft 	icmp_error(mcopy, type, code, dest, destifp);
   1228  1.44   thorpej }
   1229  1.44   thorpej 
   1230  1.44   thorpej void
   1231  1.44   thorpej ip_savecontrol(inp, mp, ip, m)
   1232  1.44   thorpej 	register struct inpcb *inp;
   1233  1.44   thorpej 	register struct mbuf **mp;
   1234  1.44   thorpej 	register struct ip *ip;
   1235  1.44   thorpej 	register struct mbuf *m;
   1236  1.44   thorpej {
   1237  1.44   thorpej 
   1238  1.44   thorpej 	if (inp->inp_socket->so_options & SO_TIMESTAMP) {
   1239  1.44   thorpej 		struct timeval tv;
   1240  1.44   thorpej 
   1241  1.44   thorpej 		microtime(&tv);
   1242  1.44   thorpej 		*mp = sbcreatecontrol((caddr_t) &tv, sizeof(tv),
   1243  1.44   thorpej 		    SCM_TIMESTAMP, SOL_SOCKET);
   1244  1.44   thorpej 		if (*mp)
   1245  1.44   thorpej 			mp = &(*mp)->m_next;
   1246  1.44   thorpej 	}
   1247  1.44   thorpej 	if (inp->inp_flags & INP_RECVDSTADDR) {
   1248  1.44   thorpej 		*mp = sbcreatecontrol((caddr_t) &ip->ip_dst,
   1249  1.44   thorpej 		    sizeof(struct in_addr), IP_RECVDSTADDR, IPPROTO_IP);
   1250  1.44   thorpej 		if (*mp)
   1251  1.44   thorpej 			mp = &(*mp)->m_next;
   1252  1.44   thorpej 	}
   1253  1.44   thorpej #ifdef notyet
   1254  1.44   thorpej 	/*
   1255  1.44   thorpej 	 * XXX
   1256  1.44   thorpej 	 * Moving these out of udp_input() made them even more broken
   1257  1.44   thorpej 	 * than they already were.
   1258  1.44   thorpej 	 *	- fenner (at) parc.xerox.com
   1259  1.44   thorpej 	 */
   1260  1.44   thorpej 	/* options were tossed already */
   1261  1.44   thorpej 	if (inp->inp_flags & INP_RECVOPTS) {
   1262  1.44   thorpej 		*mp = sbcreatecontrol((caddr_t) opts_deleted_above,
   1263  1.44   thorpej 		    sizeof(struct in_addr), IP_RECVOPTS, IPPROTO_IP);
   1264  1.44   thorpej 		if (*mp)
   1265  1.44   thorpej 			mp = &(*mp)->m_next;
   1266  1.44   thorpej 	}
   1267  1.44   thorpej 	/* ip_srcroute doesn't do what we want here, need to fix */
   1268  1.44   thorpej 	if (inp->inp_flags & INP_RECVRETOPTS) {
   1269  1.44   thorpej 		*mp = sbcreatecontrol((caddr_t) ip_srcroute(),
   1270  1.44   thorpej 		    sizeof(struct in_addr), IP_RECVRETOPTS, IPPROTO_IP);
   1271  1.44   thorpej 		if (*mp)
   1272  1.44   thorpej 			mp = &(*mp)->m_next;
   1273  1.44   thorpej 	}
   1274  1.44   thorpej #endif
   1275  1.44   thorpej 	if (inp->inp_flags & INP_RECVIF) {
   1276  1.44   thorpej 		struct sockaddr_dl sdl;
   1277  1.44   thorpej 
   1278  1.44   thorpej 		sdl.sdl_len = offsetof(struct sockaddr_dl, sdl_data[0]);
   1279  1.44   thorpej 		sdl.sdl_family = AF_LINK;
   1280  1.44   thorpej 		sdl.sdl_index = m->m_pkthdr.rcvif ?
   1281  1.44   thorpej 		    m->m_pkthdr.rcvif->if_index : 0;
   1282  1.44   thorpej 		sdl.sdl_nlen = sdl.sdl_alen = sdl.sdl_slen = 0;
   1283  1.44   thorpej 		*mp = sbcreatecontrol((caddr_t) &sdl, sdl.sdl_len,
   1284  1.44   thorpej 		    IP_RECVIF, IPPROTO_IP);
   1285  1.44   thorpej 		if (*mp)
   1286  1.44   thorpej 			mp = &(*mp)->m_next;
   1287  1.44   thorpej 	}
   1288  1.13   mycroft }
   1289  1.13   mycroft 
   1290  1.13   mycroft int
   1291  1.13   mycroft ip_sysctl(name, namelen, oldp, oldlenp, newp, newlen)
   1292  1.13   mycroft 	int *name;
   1293  1.13   mycroft 	u_int namelen;
   1294  1.13   mycroft 	void *oldp;
   1295  1.13   mycroft 	size_t *oldlenp;
   1296  1.13   mycroft 	void *newp;
   1297  1.13   mycroft 	size_t newlen;
   1298  1.13   mycroft {
   1299  1.52   thorpej 	extern int subnetsarelocal;
   1300  1.52   thorpej 
   1301  1.54     lukem 	int error, old;
   1302  1.54     lukem 
   1303  1.13   mycroft 	/* All sysctl names at this level are terminal. */
   1304  1.13   mycroft 	if (namelen != 1)
   1305  1.13   mycroft 		return (ENOTDIR);
   1306  1.13   mycroft 
   1307  1.13   mycroft 	switch (name[0]) {
   1308  1.13   mycroft 	case IPCTL_FORWARDING:
   1309  1.13   mycroft 		return (sysctl_int(oldp, oldlenp, newp, newlen, &ipforwarding));
   1310  1.13   mycroft 	case IPCTL_SENDREDIRECTS:
   1311  1.13   mycroft 		return (sysctl_int(oldp, oldlenp, newp, newlen,
   1312  1.13   mycroft 			&ipsendredirects));
   1313  1.13   mycroft 	case IPCTL_DEFTTL:
   1314  1.13   mycroft 		return (sysctl_int(oldp, oldlenp, newp, newlen, &ip_defttl));
   1315  1.13   mycroft #ifdef notyet
   1316  1.13   mycroft 	case IPCTL_DEFMTU:
   1317  1.13   mycroft 		return (sysctl_int(oldp, oldlenp, newp, newlen, &ip_mtu));
   1318  1.13   mycroft #endif
   1319  1.26   thorpej 	case IPCTL_FORWSRCRT:
   1320  1.47       cjs 		/* Don't allow this to change in a secure environment.  */
   1321  1.26   thorpej 		if (securelevel > 0)
   1322  1.46       cjs 			return (sysctl_rdint(oldp, oldlenp, newp,
   1323  1.46       cjs 			    ip_forwsrcrt));
   1324  1.46       cjs 		else
   1325  1.46       cjs 			return (sysctl_int(oldp, oldlenp, newp, newlen,
   1326  1.46       cjs 			    &ip_forwsrcrt));
   1327  1.27   thorpej 	case IPCTL_DIRECTEDBCAST:
   1328  1.27   thorpej 		return (sysctl_int(oldp, oldlenp, newp, newlen,
   1329  1.27   thorpej 		    &ip_directedbcast));
   1330  1.47       cjs 	case IPCTL_ALLOWSRCRT:
   1331  1.47       cjs 		return (sysctl_int(oldp, oldlenp, newp, newlen,
   1332  1.47       cjs 		    &ip_allowsrcrt));
   1333  1.52   thorpej 	case IPCTL_SUBNETSARELOCAL:
   1334  1.52   thorpej 		return (sysctl_int(oldp, oldlenp, newp, newlen,
   1335  1.52   thorpej 		    &subnetsarelocal));
   1336  1.53       kml 	case IPCTL_MTUDISC:
   1337  1.60       kml 		error = sysctl_int(oldp, oldlenp, newp, newlen,
   1338  1.60       kml 		    &ip_mtudisc);
   1339  1.60       kml 		if (ip_mtudisc != 0 && ip_mtudisc_timeout_q == NULL) {
   1340  1.60       kml 			ip_mtudisc_timeout_q =
   1341  1.60       kml 			    rt_timer_queue_create(ip_mtudisc_timeout);
   1342  1.60       kml 		} else if (ip_mtudisc == 0 && ip_mtudisc_timeout_q != NULL) {
   1343  1.60       kml 			rt_timer_queue_destroy(ip_mtudisc_timeout_q, TRUE);
   1344  1.60       kml 			ip_mtudisc_timeout_q = NULL;
   1345  1.60       kml 		}
   1346  1.60       kml 		return error;
   1347  1.54     lukem 	case IPCTL_ANONPORTMIN:
   1348  1.54     lukem 		old = anonportmin;
   1349  1.54     lukem 		error = sysctl_int(oldp, oldlenp, newp, newlen, &anonportmin);
   1350  1.54     lukem 		if (anonportmin >= anonportmax || anonportmin > 65535
   1351  1.54     lukem #ifndef IPNOPRIVPORTS
   1352  1.54     lukem 		    || anonportmin < IPPORT_RESERVED
   1353  1.54     lukem #endif
   1354  1.54     lukem 		    ) {
   1355  1.54     lukem 			anonportmin = old;
   1356  1.54     lukem 			return (EINVAL);
   1357  1.54     lukem 		}
   1358  1.54     lukem 		return (error);
   1359  1.54     lukem 	case IPCTL_ANONPORTMAX:
   1360  1.54     lukem 		old = anonportmax;
   1361  1.54     lukem 		error = sysctl_int(oldp, oldlenp, newp, newlen, &anonportmax);
   1362  1.54     lukem 		if (anonportmin >= anonportmax || anonportmax > 65535
   1363  1.54     lukem #ifndef IPNOPRIVPORTS
   1364  1.54     lukem 		    || anonportmax < IPPORT_RESERVED
   1365  1.54     lukem #endif
   1366  1.54     lukem 		    ) {
   1367  1.54     lukem 			anonportmax = old;
   1368  1.54     lukem 			return (EINVAL);
   1369  1.54     lukem 		}
   1370  1.60       kml 		return (error);
   1371  1.60       kml 	case IPCTL_MTUDISCTIMEOUT:
   1372  1.60       kml 		error = sysctl_int(oldp, oldlenp, newp, newlen,
   1373  1.60       kml 		   &ip_mtudisc_timeout);
   1374  1.60       kml 		if (ip_mtudisc_timeout_q != NULL)
   1375  1.60       kml 			rt_timer_queue_change(ip_mtudisc_timeout_q,
   1376  1.60       kml 					      ip_mtudisc_timeout);
   1377  1.54     lukem 		return (error);
   1378  1.13   mycroft 	default:
   1379  1.13   mycroft 		return (EOPNOTSUPP);
   1380  1.13   mycroft 	}
   1381  1.13   mycroft 	/* NOTREACHED */
   1382   1.1       cgd }
   1383