Home | History | Annotate | Line # | Download | only in net
route.c revision 1.81
      1  1.81     joerg /*	$NetBSD: route.c,v 1.81 2006/12/07 19:37:08 joerg Exp $	*/
      2  1.18       kml 
      3  1.18       kml /*-
      4  1.18       kml  * Copyright (c) 1998 The NetBSD Foundation, Inc.
      5  1.18       kml  * All rights reserved.
      6  1.18       kml  *
      7  1.18       kml  * This code is derived from software contributed to The NetBSD Foundation
      8  1.18       kml  * by Kevin M. Lahey of the Numerical Aerospace Simulation Facility,
      9  1.18       kml  * NASA Ames Research Center.
     10  1.18       kml  *
     11  1.18       kml  * Redistribution and use in source and binary forms, with or without
     12  1.18       kml  * modification, are permitted provided that the following conditions
     13  1.18       kml  * are met:
     14  1.18       kml  * 1. Redistributions of source code must retain the above copyright
     15  1.18       kml  *    notice, this list of conditions and the following disclaimer.
     16  1.18       kml  * 2. Redistributions in binary form must reproduce the above copyright
     17  1.18       kml  *    notice, this list of conditions and the following disclaimer in the
     18  1.18       kml  *    documentation and/or other materials provided with the distribution.
     19  1.18       kml  * 3. All advertising materials mentioning features or use of this software
     20  1.18       kml  *    must display the following acknowledgement:
     21  1.18       kml  *	This product includes software developed by the NetBSD
     22  1.18       kml  *	Foundation, Inc. and its contributors.
     23  1.18       kml  * 4. Neither the name of The NetBSD Foundation nor the names of its
     24  1.18       kml  *    contributors may be used to endorse or promote products derived
     25  1.18       kml  *    from this software without specific prior written permission.
     26  1.18       kml  *
     27  1.18       kml  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     28  1.18       kml  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     29  1.18       kml  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     30  1.18       kml  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     31  1.18       kml  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     32  1.18       kml  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     33  1.18       kml  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     34  1.18       kml  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     35  1.18       kml  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     36  1.18       kml  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     37  1.18       kml  * POSSIBILITY OF SUCH DAMAGE.
     38  1.18       kml  */
     39  1.11       cgd 
     40   1.1       cgd /*
     41  1.25    itojun  * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
     42  1.25    itojun  * All rights reserved.
     43  1.65     perry  *
     44  1.25    itojun  * Redistribution and use in source and binary forms, with or without
     45  1.25    itojun  * modification, are permitted provided that the following conditions
     46  1.25    itojun  * are met:
     47  1.25    itojun  * 1. Redistributions of source code must retain the above copyright
     48  1.25    itojun  *    notice, this list of conditions and the following disclaimer.
     49  1.25    itojun  * 2. Redistributions in binary form must reproduce the above copyright
     50  1.25    itojun  *    notice, this list of conditions and the following disclaimer in the
     51  1.25    itojun  *    documentation and/or other materials provided with the distribution.
     52  1.25    itojun  * 3. Neither the name of the project nor the names of its contributors
     53  1.25    itojun  *    may be used to endorse or promote products derived from this software
     54  1.25    itojun  *    without specific prior written permission.
     55  1.65     perry  *
     56  1.25    itojun  * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
     57  1.25    itojun  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     58  1.25    itojun  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     59  1.25    itojun  * ARE DISCLAIMED.  IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
     60  1.25    itojun  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     61  1.25    itojun  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     62  1.25    itojun  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     63  1.25    itojun  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     64  1.25    itojun  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     65  1.25    itojun  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     66  1.25    itojun  * SUCH DAMAGE.
     67  1.25    itojun  */
     68  1.25    itojun 
     69  1.25    itojun /*
     70  1.10   mycroft  * Copyright (c) 1980, 1986, 1991, 1993
     71  1.10   mycroft  *	The Regents of the University of California.  All rights reserved.
     72   1.1       cgd  *
     73   1.1       cgd  * Redistribution and use in source and binary forms, with or without
     74   1.1       cgd  * modification, are permitted provided that the following conditions
     75   1.1       cgd  * are met:
     76   1.1       cgd  * 1. Redistributions of source code must retain the above copyright
     77   1.1       cgd  *    notice, this list of conditions and the following disclaimer.
     78   1.1       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     79   1.1       cgd  *    notice, this list of conditions and the following disclaimer in the
     80   1.1       cgd  *    documentation and/or other materials provided with the distribution.
     81  1.58       agc  * 3. Neither the name of the University nor the names of its contributors
     82   1.1       cgd  *    may be used to endorse or promote products derived from this software
     83   1.1       cgd  *    without specific prior written permission.
     84   1.1       cgd  *
     85   1.1       cgd  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     86   1.1       cgd  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     87   1.1       cgd  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     88   1.1       cgd  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     89   1.1       cgd  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     90   1.1       cgd  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     91   1.1       cgd  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     92   1.1       cgd  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     93   1.1       cgd  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     94   1.1       cgd  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     95   1.1       cgd  * SUCH DAMAGE.
     96   1.1       cgd  *
     97  1.17  christos  *	@(#)route.c	8.3 (Berkeley) 1/9/95
     98   1.1       cgd  */
     99  1.50     lukem 
    100  1.50     lukem #include <sys/cdefs.h>
    101  1.81     joerg __KERNEL_RCSID(0, "$NetBSD: route.c,v 1.81 2006/12/07 19:37:08 joerg Exp $");
    102   1.2       cgd 
    103   1.5   mycroft #include <sys/param.h>
    104   1.5   mycroft #include <sys/systm.h>
    105  1.35   thorpej #include <sys/callout.h>
    106   1.5   mycroft #include <sys/proc.h>
    107   1.5   mycroft #include <sys/mbuf.h>
    108   1.5   mycroft #include <sys/socket.h>
    109   1.5   mycroft #include <sys/socketvar.h>
    110   1.5   mycroft #include <sys/domain.h>
    111   1.5   mycroft #include <sys/protosw.h>
    112  1.18       kml #include <sys/kernel.h>
    113   1.5   mycroft #include <sys/ioctl.h>
    114  1.22   thorpej #include <sys/pool.h>
    115   1.1       cgd 
    116   1.5   mycroft #include <net/if.h>
    117   1.5   mycroft #include <net/route.h>
    118   1.5   mycroft #include <net/raw_cb.h>
    119   1.1       cgd 
    120   1.5   mycroft #include <netinet/in.h>
    121   1.5   mycroft #include <netinet/in_var.h>
    122   1.1       cgd 
    123   1.5   mycroft 
    124  1.52      matt struct	route_cb route_cb;	/* NOTE(review): not referenced in this part of the file; see <net/route.h> */
    125  1.52      matt struct	rtstat	rtstat;	/* routing statistics counters (e.g. rts_unreach, rts_badredirect) */
    126  1.52      matt struct	radix_node_head *rt_tables[AF_MAX+1];	/* radix tree heads, indexed by sa_family */
    127   1.1       cgd 
    128   1.1       cgd int	rttrash;		/* routes not in table but not freed */
    129   1.1       cgd struct	sockaddr wildcard;	/* zero valued cookie for wildcard searches */
    130   1.1       cgd 
                        /* Pools sized for struct rtentry and struct rttimer; rtfree() returns entries to rtentry_pool. */
    131  1.61    simonb POOL_INIT(rtentry_pool, sizeof(struct rtentry), 0, 0, 0, "rtentpl", NULL);
    132  1.61    simonb POOL_INIT(rttimer_pool, sizeof(struct rttimer), 0, 0, 0, "rttmrpl", NULL);
    133  1.22   thorpej 
    134  1.35   thorpej struct callout rt_timer_ch; /* callout for rt_timer_timer() */
    135  1.35   thorpej 
                        /* File-local helpers used when deleting routes and flushing cloned children. */
    136  1.60      matt static int rtdeletemsg(struct rtentry *);
    137  1.60      matt static int rtflushclone1(struct radix_node *, void *);
    138  1.60      matt static void rtflushclone(struct radix_node_head *, struct rtentry *);
    139  1.40    itojun 
    140  1.81     joerg struct ifaddr *
    141  1.81     joerg rt_get_ifa(struct rtentry *rt)
    142  1.81     joerg {
    143  1.81     joerg 	struct ifaddr *ifa;
    144  1.81     joerg 
    145  1.81     joerg 	if ((ifa = rt->rt_ifa) == NULL)
    146  1.81     joerg 		return ifa;
    147  1.81     joerg 	else if (ifa->ifa_getifa == NULL)
    148  1.81     joerg 		return ifa;
    149  1.81     joerg #if 0
    150  1.81     joerg 	else if (ifa->ifa_seqno != NULL && *ifa->ifa_seqno == rt->rt_ifa_seqno)
    151  1.81     joerg 		return ifa;
    152  1.81     joerg #endif
    153  1.81     joerg 	else {
    154  1.81     joerg 		ifa = (*ifa->ifa_getifa)(ifa, rt_key(rt));
    155  1.81     joerg 		rt_replace_ifa(rt, ifa);
    156  1.81     joerg 		return ifa;
    157  1.81     joerg 	}
    158  1.81     joerg }
    159  1.81     joerg 
    160  1.80     joerg static void
    161  1.80     joerg rt_set_ifa1(struct rtentry *rt, struct ifaddr *ifa)
    162  1.80     joerg {
    163  1.80     joerg 	rt->rt_ifa = ifa;
    164  1.80     joerg 	if (ifa->ifa_seqno != NULL)
    165  1.80     joerg 		rt->rt_ifa_seqno = *ifa->ifa_seqno;
    166  1.80     joerg }
    167  1.80     joerg 
    168  1.80     joerg void
    169  1.80     joerg rt_replace_ifa(struct rtentry *rt, struct ifaddr *ifa)
    170  1.80     joerg {
    171  1.80     joerg 	IFAREF(ifa);
    172  1.80     joerg 	IFAFREE(rt->rt_ifa);
    173  1.80     joerg 	rt_set_ifa1(rt, ifa);
    174  1.80     joerg }
    175  1.80     joerg 
/*
 * Attach ifa to a route: take a reference on the address and install
 * the pointer.  Unlike rt_replace_ifa(), nothing is released.
 */
static void
rt_set_ifa(struct rtentry *rt, struct ifaddr *ifa)
{
	IFAREF(ifa);

	rt_set_ifa1(rt, ifa);
}
    182  1.80     joerg 
    183  1.10   mycroft void
    184  1.60      matt rtable_init(void **table)
    185  1.10   mycroft {
    186  1.10   mycroft 	struct domain *dom;
    187  1.64      matt 	DOMAIN_FOREACH(dom)
    188  1.10   mycroft 		if (dom->dom_rtattach)
    189  1.10   mycroft 			dom->dom_rtattach(&table[dom->dom_family],
    190  1.10   mycroft 			    dom->dom_rtoffset);
    191  1.10   mycroft }
    192   1.1       cgd 
    193   1.9   mycroft void
    194  1.60      matt route_init(void)
    195   1.1       cgd {
    196  1.22   thorpej 
    197  1.10   mycroft 	rn_init();	/* initialize all zeroes, all ones, mask table */
    198  1.10   mycroft 	rtable_init((void **)rt_tables);
    199   1.1       cgd }
    200   1.1       cgd 
    201   1.1       cgd /*
    202   1.1       cgd  * Packet routing routines.
    203   1.1       cgd  */
    204   1.9   mycroft void
    205  1.60      matt rtalloc(struct route *ro)
    206   1.1       cgd {
    207  1.75    dyoung 	if (ro->ro_rt != NULL) {
    208  1.75    dyoung 		if (ro->ro_rt->rt_ifp != NULL &&
    209  1.75    dyoung 		    (ro->ro_rt->rt_flags & RTF_UP) != 0)
    210  1.75    dyoung 			return;
    211  1.75    dyoung 		RTFREE(ro->ro_rt);
    212  1.75    dyoung 	}
    213   1.1       cgd 	ro->ro_rt = rtalloc1(&ro->ro_dst, 1);
    214   1.1       cgd }
    215  1.25    itojun 
    216   1.1       cgd struct rtentry *
    217  1.60      matt rtalloc1(const struct sockaddr *dst, int report)
    218   1.1       cgd {
    219  1.36  augustss 	struct radix_node_head *rnh = rt_tables[dst->sa_family];
    220  1.36  augustss 	struct rtentry *rt;
    221  1.36  augustss 	struct radix_node *rn;
    222  1.68  christos 	struct rtentry *newrt = NULL;
    223  1.10   mycroft 	struct rt_addrinfo info;
    224  1.13   mycroft 	int  s = splsoftnet(), err = 0, msgtype = RTM_MISS;
    225   1.1       cgd 
    226  1.66  christos 	if (rnh && (rn = rnh->rnh_matchaddr(dst, rnh)) &&
    227   1.1       cgd 	    ((rn->rn_flags & RNF_ROOT) == 0)) {
    228   1.1       cgd 		newrt = rt = (struct rtentry *)rn;
    229   1.1       cgd 		if (report && (rt->rt_flags & RTF_CLONING)) {
    230  1.68  christos 			err = rtrequest(RTM_RESOLVE, dst, NULL, NULL, 0,
    231  1.68  christos 			    &newrt);
    232   1.8       cgd 			if (err) {
    233   1.8       cgd 				newrt = rt;
    234   1.8       cgd 				rt->rt_refcnt++;
    235   1.8       cgd 				goto miss;
    236   1.8       cgd 			}
    237  1.69  christos 			KASSERT(newrt != NULL);
    238   1.8       cgd 			if ((rt = newrt) && (rt->rt_flags & RTF_XRESOLVE)) {
    239   1.8       cgd 				msgtype = RTM_RESOLVE;
    240   1.8       cgd 				goto miss;
    241   1.8       cgd 			}
    242  1.39    itojun 			/* Inform listeners of the new route */
    243  1.44   thorpej 			memset(&info, 0, sizeof(info));
    244  1.39    itojun 			info.rti_info[RTAX_DST] = rt_key(rt);
    245  1.39    itojun 			info.rti_info[RTAX_NETMASK] = rt_mask(rt);
    246  1.39    itojun 			info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
    247  1.39    itojun 			if (rt->rt_ifp != NULL) {
    248  1.65     perry 				info.rti_info[RTAX_IFP] =
    249  1.49      matt 				    TAILQ_FIRST(&rt->rt_ifp->if_addrlist)->ifa_addr;
    250  1.39    itojun 				info.rti_info[RTAX_IFA] = rt->rt_ifa->ifa_addr;
    251  1.39    itojun 			}
    252  1.39    itojun 			rt_missmsg(RTM_ADD, &info, rt->rt_flags, 0);
    253   1.1       cgd 		} else
    254   1.1       cgd 			rt->rt_refcnt++;
    255   1.1       cgd 	} else {
    256   1.1       cgd 		rtstat.rts_unreach++;
    257  1.10   mycroft 	miss:	if (report) {
    258  1.44   thorpej 			memset((caddr_t)&info, 0, sizeof(info));
    259  1.10   mycroft 			info.rti_info[RTAX_DST] = dst;
    260  1.10   mycroft 			rt_missmsg(msgtype, &info, 0, err);
    261  1.10   mycroft 		}
    262   1.1       cgd 	}
    263   1.1       cgd 	splx(s);
    264   1.1       cgd 	return (newrt);
    265   1.1       cgd }
    266   1.1       cgd 
    267   1.9   mycroft void
    268  1.60      matt rtfree(struct rtentry *rt)
    269   1.1       cgd {
    270  1.36  augustss 	struct ifaddr *ifa;
    271  1.10   mycroft 
    272  1.68  christos 	if (rt == NULL)
    273   1.1       cgd 		panic("rtfree");
    274   1.1       cgd 	rt->rt_refcnt--;
    275   1.1       cgd 	if (rt->rt_refcnt <= 0 && (rt->rt_flags & RTF_UP) == 0) {
    276   1.1       cgd 		if (rt->rt_nodes->rn_flags & (RNF_ACTIVE | RNF_ROOT))
    277   1.1       cgd 			panic ("rtfree 2");
    278  1.10   mycroft 		rttrash--;
    279  1.10   mycroft 		if (rt->rt_refcnt < 0) {
    280  1.16  christos 			printf("rtfree: %p not freed (neg refs)\n", rt);
    281  1.10   mycroft 			return;
    282  1.10   mycroft 		}
    283  1.54    itojun 		rt_timer_remove_all(rt, 0);
    284  1.10   mycroft 		ifa = rt->rt_ifa;
    285  1.78    dyoung 		rt->rt_ifa = NULL;
    286  1.10   mycroft 		IFAFREE(ifa);
    287  1.78    dyoung 		rt->rt_ifp = NULL;
    288  1.10   mycroft 		Free(rt_key(rt));
    289  1.22   thorpej 		pool_put(&rtentry_pool, rt);
    290   1.1       cgd 	}
    291   1.1       cgd }
    292   1.1       cgd 
    293  1.10   mycroft void
    294  1.60      matt ifafree(struct ifaddr *ifa)
    295  1.10   mycroft {
    296  1.30   thorpej 
    297  1.30   thorpej #ifdef DIAGNOSTIC
    298  1.10   mycroft 	if (ifa == NULL)
    299  1.30   thorpej 		panic("ifafree: null ifa");
    300  1.30   thorpej 	if (ifa->ifa_refcnt != 0)
    301  1.30   thorpej 		panic("ifafree: ifa_refcnt != 0 (%d)", ifa->ifa_refcnt);
    302  1.30   thorpej #endif
    303  1.31   thorpej #ifdef IFAREF_DEBUG
    304  1.31   thorpej 	printf("ifafree: freeing ifaddr %p\n", ifa);
    305  1.31   thorpej #endif
    306  1.30   thorpej 	free(ifa, M_IFADDR);
    307  1.10   mycroft }
    308  1.10   mycroft 
    309   1.1       cgd /*
    310   1.1       cgd  * Force a routing table entry to the specified
    311   1.1       cgd  * destination to go through the given gateway.
    312   1.1       cgd  * Normally called as a result of a routing redirect
    313   1.1       cgd  * message from the network layer.
    314   1.1       cgd  *
    315  1.13   mycroft  * N.B.: must be called at splsoftnet
    316   1.1       cgd  */
    317  1.14  christos void
    318  1.60      matt rtredirect(const struct sockaddr *dst, const struct sockaddr *gateway,
    319  1.60      matt 	const struct sockaddr *netmask, int flags, const struct sockaddr *src,
    320  1.60      matt 	struct rtentry **rtp)
    321   1.1       cgd {
    322  1.36  augustss 	struct rtentry *rt;
    323   1.1       cgd 	int error = 0;
    324  1.68  christos 	u_quad_t *stat = NULL;
    325  1.10   mycroft 	struct rt_addrinfo info;
    326  1.10   mycroft 	struct ifaddr *ifa;
    327   1.1       cgd 
    328   1.1       cgd 	/* verify the gateway is directly reachable */
    329  1.68  christos 	if ((ifa = ifa_ifwithnet(gateway)) == NULL) {
    330   1.1       cgd 		error = ENETUNREACH;
    331   1.8       cgd 		goto out;
    332   1.1       cgd 	}
    333   1.1       cgd 	rt = rtalloc1(dst, 0);
    334   1.1       cgd 	/*
    335   1.1       cgd 	 * If the redirect isn't from our current router for this dst,
    336   1.1       cgd 	 * it's either old or wrong.  If it redirects us to ourselves,
    337   1.1       cgd 	 * we have a routing loop, perhaps as a result of an interface
    338   1.1       cgd 	 * going down recently.
    339   1.1       cgd 	 */
    340  1.45    itojun #define	equal(a1, a2) \
    341  1.45    itojun 	((a1)->sa_len == (a2)->sa_len && \
    342  1.66  christos 	 memcmp((a1), (a2), (a1)->sa_len) == 0)
    343  1.10   mycroft 	if (!(flags & RTF_DONE) && rt &&
    344  1.10   mycroft 	     (!equal(src, rt->rt_gateway) || rt->rt_ifa != ifa))
    345   1.1       cgd 		error = EINVAL;
    346   1.1       cgd 	else if (ifa_ifwithaddr(gateway))
    347   1.1       cgd 		error = EHOSTUNREACH;
    348   1.1       cgd 	if (error)
    349   1.1       cgd 		goto done;
    350   1.1       cgd 	/*
    351   1.1       cgd 	 * Create a new entry if we just got back a wildcard entry
    352  1.33     soren 	 * or the lookup failed.  This is necessary for hosts
    353   1.1       cgd 	 * which use routing redirects generated by smart gateways
    354   1.1       cgd 	 * to dynamically build the routing tables.
    355   1.1       cgd 	 */
    356  1.68  christos 	if ((rt == NULL) || (rt_mask(rt) && rt_mask(rt)->sa_len < 2))
    357   1.1       cgd 		goto create;
    358   1.1       cgd 	/*
    359   1.1       cgd 	 * Don't listen to the redirect if it's
    360  1.65     perry 	 * for a route to an interface.
    361   1.1       cgd 	 */
    362   1.1       cgd 	if (rt->rt_flags & RTF_GATEWAY) {
    363   1.1       cgd 		if (((rt->rt_flags & RTF_HOST) == 0) && (flags & RTF_HOST)) {
    364   1.1       cgd 			/*
    365   1.1       cgd 			 * Changing from route to net => route to host.
    366   1.1       cgd 			 * Create new route, rather than smashing route to net.
    367   1.1       cgd 			 */
    368   1.1       cgd 		create:
    369  1.39    itojun 			if (rt)
    370  1.39    itojun 				rtfree(rt);
    371   1.1       cgd 			flags |=  RTF_GATEWAY | RTF_DYNAMIC;
    372  1.39    itojun 			info.rti_info[RTAX_DST] = dst;
    373  1.39    itojun 			info.rti_info[RTAX_GATEWAY] = gateway;
    374  1.39    itojun 			info.rti_info[RTAX_NETMASK] = netmask;
    375  1.39    itojun 			info.rti_ifa = ifa;
    376  1.39    itojun 			info.rti_flags = flags;
    377  1.39    itojun 			rt = NULL;
    378  1.39    itojun 			error = rtrequest1(RTM_ADD, &info, &rt);
    379  1.39    itojun 			if (rt != NULL)
    380  1.39    itojun 				flags = rt->rt_flags;
    381   1.1       cgd 			stat = &rtstat.rts_dynamic;
    382   1.1       cgd 		} else {
    383   1.1       cgd 			/*
    384   1.1       cgd 			 * Smash the current notion of the gateway to
    385   1.1       cgd 			 * this destination.  Should check about netmask!!!
    386   1.1       cgd 			 */
    387  1.10   mycroft 			rt->rt_flags |= RTF_MODIFIED;
    388  1.10   mycroft 			flags |= RTF_MODIFIED;
    389  1.10   mycroft 			stat = &rtstat.rts_newgateway;
    390  1.10   mycroft 			rt_setgate(rt, rt_key(rt), gateway);
    391   1.1       cgd 		}
    392   1.1       cgd 	} else
    393   1.1       cgd 		error = EHOSTUNREACH;
    394   1.1       cgd done:
    395   1.1       cgd 	if (rt) {
    396   1.1       cgd 		if (rtp && !error)
    397   1.1       cgd 			*rtp = rt;
    398   1.1       cgd 		else
    399   1.1       cgd 			rtfree(rt);
    400   1.1       cgd 	}
    401   1.8       cgd out:
    402   1.1       cgd 	if (error)
    403   1.1       cgd 		rtstat.rts_badredirect++;
    404   1.8       cgd 	else if (stat != NULL)
    405   1.8       cgd 		(*stat)++;
    406  1.44   thorpej 	memset((caddr_t)&info, 0, sizeof(info));
    407  1.10   mycroft 	info.rti_info[RTAX_DST] = dst;
    408  1.10   mycroft 	info.rti_info[RTAX_GATEWAY] = gateway;
    409  1.10   mycroft 	info.rti_info[RTAX_NETMASK] = netmask;
    410  1.10   mycroft 	info.rti_info[RTAX_AUTHOR] = src;
    411  1.10   mycroft 	rt_missmsg(RTM_REDIRECT, &info, flags, error);
    412   1.1       cgd }
    413   1.1       cgd 
    414   1.1       cgd /*
    415  1.40    itojun  * Delete a route and generate a message
    416  1.40    itojun  */
    417  1.40    itojun static int
    418  1.60      matt rtdeletemsg(struct rtentry *rt)
    419  1.40    itojun {
    420  1.40    itojun 	int error;
    421  1.40    itojun 	struct rt_addrinfo info;
    422  1.40    itojun 
    423  1.40    itojun 	/*
    424  1.40    itojun 	 * Request the new route so that the entry is not actually
    425  1.40    itojun 	 * deleted.  That will allow the information being reported to
    426  1.40    itojun 	 * be accurate (and consistent with route_output()).
    427  1.40    itojun 	 */
    428  1.44   thorpej 	memset((caddr_t)&info, 0, sizeof(info));
    429  1.40    itojun 	info.rti_info[RTAX_DST] = rt_key(rt);
    430  1.40    itojun 	info.rti_info[RTAX_NETMASK] = rt_mask(rt);
    431  1.40    itojun 	info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
    432  1.40    itojun 	info.rti_flags = rt->rt_flags;
    433  1.40    itojun 	error = rtrequest1(RTM_DELETE, &info, &rt);
    434  1.40    itojun 
    435  1.40    itojun 	rt_missmsg(RTM_DELETE, &info, info.rti_flags, error);
    436  1.40    itojun 
    437  1.40    itojun 	/* Adjust the refcount */
    438  1.40    itojun 	if (error == 0 && rt->rt_refcnt <= 0) {
    439  1.40    itojun 		rt->rt_refcnt++;
    440  1.40    itojun 		rtfree(rt);
    441  1.40    itojun 	}
    442  1.40    itojun 	return (error);
    443  1.40    itojun }
    444  1.40    itojun 
    445  1.41    itojun static int
    446  1.60      matt rtflushclone1(struct radix_node *rn, void *arg)
    447  1.41    itojun {
    448  1.41    itojun 	struct rtentry *rt, *parent;
    449  1.41    itojun 
    450  1.41    itojun 	rt = (struct rtentry *)rn;
    451  1.41    itojun 	parent = (struct rtentry *)arg;
    452  1.41    itojun 	if ((rt->rt_flags & RTF_CLONED) != 0 && rt->rt_parent == parent)
    453  1.41    itojun 		rtdeletemsg(rt);
    454  1.41    itojun 	return 0;
    455  1.41    itojun }
    456  1.41    itojun 
    457  1.41    itojun static void
    458  1.60      matt rtflushclone(struct radix_node_head *rnh, struct rtentry *parent)
    459  1.41    itojun {
    460  1.41    itojun 
    461  1.41    itojun #ifdef DIAGNOSTIC
    462  1.41    itojun 	if (!parent || (parent->rt_flags & RTF_CLONING) == 0)
    463  1.41    itojun 		panic("rtflushclone: called with a non-cloning route");
    464  1.41    itojun 	if (!rnh->rnh_walktree)
    465  1.41    itojun 		panic("rtflushclone: no rnh_walktree");
    466  1.41    itojun #endif
    467  1.42    itojun 	rnh->rnh_walktree(rnh, rtflushclone1, (void *)parent);
    468  1.41    itojun }
    469  1.41    itojun 
    470  1.40    itojun /*
    471  1.22   thorpej  * Routing table ioctl interface.
    472  1.22   thorpej  */
    473   1.9   mycroft int
    474  1.76  christos rtioctl(u_long req, caddr_t data, struct lwp *l)
    475   1.1       cgd {
    476   1.1       cgd 	return (EOPNOTSUPP);
    477   1.1       cgd }
    478   1.1       cgd 
    479   1.1       cgd struct ifaddr *
    480  1.60      matt ifa_ifwithroute(int flags, const struct sockaddr *dst,
    481  1.60      matt 	const struct sockaddr *gateway)
    482   1.1       cgd {
    483  1.36  augustss 	struct ifaddr *ifa;
    484   1.1       cgd 	if ((flags & RTF_GATEWAY) == 0) {
    485   1.1       cgd 		/*
    486   1.1       cgd 		 * If we are adding a route to an interface,
    487   1.1       cgd 		 * and the interface is a pt to pt link
    488   1.1       cgd 		 * we should search for the destination
    489   1.1       cgd 		 * as our clue to the interface.  Otherwise
    490   1.1       cgd 		 * we can use the local address.
    491   1.1       cgd 		 */
    492  1.68  christos 		ifa = NULL;
    493  1.65     perry 		if (flags & RTF_HOST)
    494   1.1       cgd 			ifa = ifa_ifwithdstaddr(dst);
    495  1.68  christos 		if (ifa == NULL)
    496   1.1       cgd 			ifa = ifa_ifwithaddr(gateway);
    497   1.1       cgd 	} else {
    498   1.1       cgd 		/*
    499   1.1       cgd 		 * If we are adding a route to a remote net
    500   1.1       cgd 		 * or host, the gateway may still be on the
    501   1.1       cgd 		 * other end of a pt to pt link.
    502   1.1       cgd 		 */
    503   1.1       cgd 		ifa = ifa_ifwithdstaddr(gateway);
    504   1.1       cgd 	}
    505  1.68  christos 	if (ifa == NULL)
    506   1.1       cgd 		ifa = ifa_ifwithnet(gateway);
    507  1.68  christos 	if (ifa == NULL) {
    508   1.1       cgd 		struct rtentry *rt = rtalloc1(dst, 0);
    509  1.68  christos 		if (rt == NULL)
    510  1.68  christos 			return NULL;
    511   1.1       cgd 		rt->rt_refcnt--;
    512  1.68  christos 		if ((ifa = rt->rt_ifa) == NULL)
    513  1.68  christos 			return NULL;
    514   1.1       cgd 	}
    515   1.1       cgd 	if (ifa->ifa_addr->sa_family != dst->sa_family) {
    516  1.10   mycroft 		struct ifaddr *oifa = ifa;
    517   1.1       cgd 		ifa = ifaof_ifpforaddr(dst, ifa->ifa_ifp);
    518   1.1       cgd 		if (ifa == 0)
    519   1.1       cgd 			ifa = oifa;
    520   1.1       cgd 	}
    521   1.1       cgd 	return (ifa);
    522   1.1       cgd }
    523   1.1       cgd 
/*
 * Round a up to the next multiple of sizeof(long); a value that is not
 * greater than zero yields sizeof(long).  The argument is fully
 * parenthesized so expressions such as ROUNDUP(x & y) expand correctly.
 * It is still evaluated more than once, so it must be free of side
 * effects.
 */
#define ROUNDUP(a) \
	((a) > 0 ? (1 + (((a) - 1) | (sizeof(long) - 1))) : sizeof(long))
    525   1.1       cgd 
    526   1.9   mycroft int
    527  1.60      matt rtrequest(int req, const struct sockaddr *dst, const struct sockaddr *gateway,
    528  1.60      matt 	const struct sockaddr *netmask, int flags, struct rtentry **ret_nrt)
    529   1.1       cgd {
    530  1.39    itojun 	struct rt_addrinfo info;
    531  1.39    itojun 
    532  1.44   thorpej 	memset(&info, 0, sizeof(info));
    533  1.39    itojun 	info.rti_flags = flags;
    534  1.39    itojun 	info.rti_info[RTAX_DST] = dst;
    535  1.39    itojun 	info.rti_info[RTAX_GATEWAY] = gateway;
    536  1.39    itojun 	info.rti_info[RTAX_NETMASK] = netmask;
    537  1.39    itojun 	return rtrequest1(req, &info, ret_nrt);
    538  1.39    itojun }
    539  1.39    itojun 
    540  1.39    itojun int
    541  1.60      matt rt_getifa(struct rt_addrinfo *info)
    542  1.39    itojun {
    543  1.39    itojun 	struct ifaddr *ifa;
    544  1.68  christos 	const struct sockaddr *dst = info->rti_info[RTAX_DST];
    545  1.68  christos 	const struct sockaddr *gateway = info->rti_info[RTAX_GATEWAY];
    546  1.68  christos 	const struct sockaddr *ifaaddr = info->rti_info[RTAX_IFA];
    547  1.68  christos 	const struct sockaddr *ifpaddr = info->rti_info[RTAX_IFP];
    548  1.68  christos 	int flags = info->rti_flags;
    549  1.39    itojun 
    550  1.39    itojun 	/*
    551  1.39    itojun 	 * ifp may be specified by sockaddr_dl when protocol address
    552  1.39    itojun 	 * is ambiguous
    553  1.39    itojun 	 */
    554  1.39    itojun 	if (info->rti_ifp == NULL && ifpaddr != NULL
    555  1.39    itojun 	    && ifpaddr->sa_family == AF_LINK &&
    556  1.59      matt 	    (ifa = ifa_ifwithnet((const struct sockaddr *)ifpaddr)) != NULL)
    557  1.39    itojun 		info->rti_ifp = ifa->ifa_ifp;
    558  1.39    itojun 	if (info->rti_ifa == NULL && ifaaddr != NULL)
    559  1.39    itojun 		info->rti_ifa = ifa_ifwithaddr(ifaaddr);
    560  1.39    itojun 	if (info->rti_ifa == NULL) {
    561  1.59      matt 		const struct sockaddr *sa;
    562  1.39    itojun 
    563  1.39    itojun 		sa = ifaaddr != NULL ? ifaaddr :
    564  1.39    itojun 		    (gateway != NULL ? gateway : dst);
    565  1.39    itojun 		if (sa != NULL && info->rti_ifp != NULL)
    566  1.39    itojun 			info->rti_ifa = ifaof_ifpforaddr(sa, info->rti_ifp);
    567  1.39    itojun 		else if (dst != NULL && gateway != NULL)
    568  1.39    itojun 			info->rti_ifa = ifa_ifwithroute(flags, dst, gateway);
    569  1.39    itojun 		else if (sa != NULL)
    570  1.39    itojun 			info->rti_ifa = ifa_ifwithroute(flags, sa, sa);
    571  1.39    itojun 	}
    572  1.74    dyoung 	if ((ifa = info->rti_ifa) == NULL)
    573  1.74    dyoung 		return ENETUNREACH;
    574  1.74    dyoung 	if (ifa->ifa_getifa != NULL)
    575  1.74    dyoung 		info->rti_ifa = ifa = (*ifa->ifa_getifa)(ifa, dst);
    576  1.74    dyoung 	if (info->rti_ifp == NULL)
    577  1.74    dyoung 		info->rti_ifp = ifa->ifa_ifp;
    578  1.74    dyoung 	return 0;
    579  1.39    itojun }
    580  1.39    itojun 
/*
 * Carry out routing request `req' using the addresses and flags in `info'.
 *
 * req:     RTM_DELETE, RTM_RESOLVE and RTM_ADD are handled; any other
 *          value falls out of the switch and 0 is returned.
 * info:    rti_info[RTAX_DST], [RTAX_GATEWAY], [RTAX_NETMASK] and
 *          rti_flags are read.  RTAX_DST is dereferenced unconditionally,
 *          so the caller must supply it.  For RTM_ADD, rt_getifa(info) is
 *          called when rti_ifa is not already set.
 * ret_nrt: RTM_DELETE  - if non-NULL, receives the entry removed from the
 *                        tree (it is then not released here).
 *          RTM_RESOLVE - must be non-NULL and point at the RTF_CLONING
 *                        parent on entry; receives the new entry.
 *          RTM_ADD     - if non-NULL, receives the new entry with its
 *                        rt_refcnt incremented.
 *
 * Returns 0 on success, otherwise ESRCH, EINVAL, ENOBUFS, EEXIST or the
 * error reported by rt_getifa().  The whole body runs between
 * splsoftnet() and the splx() at the `bad' label.
 */
int
rtrequest1(int req, struct rt_addrinfo *info, struct rtentry **ret_nrt)
{
	int s = splsoftnet();
	int error = 0;
	struct rtentry *rt, *crt;
	struct radix_node *rn;
	struct radix_node_head *rnh;
	struct ifaddr *ifa;
	struct sockaddr_storage deldst;
	const struct sockaddr *dst = info->rti_info[RTAX_DST];
	const struct sockaddr *gateway = info->rti_info[RTAX_GATEWAY];
	const struct sockaddr *netmask = info->rti_info[RTAX_NETMASK];
	int flags = info->rti_flags;
/* Record the error and leave through the common splx() exit. */
#define senderr(x) { error = x ; goto bad; }

	/* No table registered for this address family. */
	if ((rnh = rt_tables[dst->sa_family]) == NULL)
		senderr(ESRCH);
	/* Host routes never carry a netmask. */
	if (flags & RTF_HOST)
		netmask = NULL;
	switch (req) {
	case RTM_DELETE:
		if (netmask) {
			/* Look up by the masked destination, built in deldst. */
			rt_maskedcopy(dst, (struct sockaddr *)&deldst, netmask);
			dst = (struct sockaddr *)&deldst;
		}
		if ((rn = rnh->rnh_lookup(dst, netmask, rnh)) == NULL)
			senderr(ESRCH);
		rt = (struct rtentry *)rn;
		if ((rt->rt_flags & RTF_CLONING) != 0) {
			/* clean up any cloned children */
			rtflushclone(rnh, rt);
		}
		if ((rn = rnh->rnh_deladdr(dst, netmask, rnh)) == NULL)
			senderr(ESRCH);
		/* A node returned by rnh_deladdr must not be active or a root. */
		if (rn->rn_flags & (RNF_ACTIVE | RNF_ROOT))
			panic ("rtrequest delete");
		rt = (struct rtentry *)rn;
		/* Drop the cached gateway route, if any. */
		if (rt->rt_gwroute) {
			RTFREE(rt->rt_gwroute);
			rt->rt_gwroute = NULL;
		}
		/* Undo the reference RTM_RESOLVE took on the cloning parent. */
		if (rt->rt_parent) {
			rt->rt_parent->rt_refcnt--;
			rt->rt_parent = NULL;
		}
		rt->rt_flags &= ~RTF_UP;
		/* Let the interface address see the deletion. */
		if ((ifa = rt->rt_ifa) && ifa->ifa_rtrequest)
			ifa->ifa_rtrequest(RTM_DELETE, rt, info);
		rttrash++;
		/*
		 * Either hand the unlinked entry to the caller, or, when it
		 * is unreferenced, bump the count and let rtfree() release it.
		 */
		if (ret_nrt)
			*ret_nrt = rt;
		else if (rt->rt_refcnt <= 0) {
			rt->rt_refcnt++;
			rtfree(rt);
		}
		break;

	case RTM_RESOLVE:
		/* *ret_nrt is the parent route to clone from. */
		if (ret_nrt == NULL || (rt = *ret_nrt) == NULL)
			senderr(EINVAL);
		if ((rt->rt_flags & RTF_CLONING) == 0)
			senderr(EINVAL);
		/* Inherit ifa, flags, gateway and genmask from the parent. */
		ifa = rt->rt_ifa;
		flags = rt->rt_flags & ~(RTF_CLONING | RTF_STATIC);
		flags |= RTF_CLONED;
		gateway = rt->rt_gateway;
		/* Without a genmask the clone becomes a host route. */
		if ((netmask = rt->rt_genmask) == NULL)
			flags |= RTF_HOST;
		goto makeroute;

	case RTM_ADD:
		if (info->rti_ifa == NULL && (error = rt_getifa(info)))
			senderr(error);
		ifa = info->rti_ifa;
	makeroute:
		/* Already at splsoftnet() so pool_get/pool_put are safe */
		rt = pool_get(&rtentry_pool, PR_NOWAIT);
		if (rt == NULL)
			senderr(ENOBUFS);
		Bzero(rt, sizeof(*rt));
		rt->rt_flags = RTF_UP | flags;
		LIST_INIT(&rt->rt_timer);
		/* rt_setgate() allocates the key/gateway storage. */
		if (rt_setgate(rt, dst, gateway)) {
			pool_put(&rtentry_pool, rt);
			senderr(ENOBUFS);
		}
		/* Fill in the key: masked when a netmask applies. */
		if (netmask) {
			rt_maskedcopy(dst, rt_key(rt), netmask);
		} else
			Bcopy(dst, rt_key(rt), dst->sa_len);
		rt_set_ifa(rt, ifa);
		rt->rt_ifp = ifa->ifa_ifp;
		if (req == RTM_RESOLVE) {
			rt->rt_rmx = (*ret_nrt)->rt_rmx; /* copy metrics */
			/* Remember the parent and hold a reference on it. */
			rt->rt_parent = *ret_nrt;
			rt->rt_parent->rt_refcnt++;
		}
		rn = rnh->rnh_addaddr(rt_key(rt), netmask, rnh, rt->rt_nodes);
		/*
		 * Insertion failed: if the entry in the way is a cloned
		 * route, delete it and retry the insertion once.
		 */
		if (rn == NULL && (crt = rtalloc1(rt_key(rt), 0)) != NULL) {
			/* overwrite cloned route */
			if ((crt->rt_flags & RTF_CLONED) != 0) {
				rtdeletemsg(crt);
				rn = rnh->rnh_addaddr(rt_key(rt),
				    netmask, rnh, rt->rt_nodes);
			}
			RTFREE(crt);
		}
		if (rn == NULL) {
			/*
			 * Still could not insert: release everything set up
			 * above and report EEXIST.
			 * NOTE(review): IFAFREE presumably balances a reference
			 * taken by rt_set_ifa() - confirm.
			 */
			IFAFREE(ifa);
			if ((rt->rt_flags & RTF_CLONED) != 0 && rt->rt_parent)
				rtfree(rt->rt_parent);
			if (rt->rt_gwroute)
				rtfree(rt->rt_gwroute);
			Free(rt_key(rt));
			pool_put(&rtentry_pool, rt);
			senderr(EEXIST);
		}
		/* Let the interface address see the new route. */
		if (ifa->ifa_rtrequest)
			ifa->ifa_rtrequest(req, rt, info);
		if (ret_nrt) {
			*ret_nrt = rt;
			rt->rt_refcnt++;
		}
		if ((rt->rt_flags & RTF_CLONING) != 0) {
			/* clean up any cloned children */
			rtflushclone(rnh, rt);
		}
		break;
	}
bad:
	splx(s);
	return (error);
}
    715   1.1       cgd 
    716  1.10   mycroft int
    717  1.60      matt rt_setgate( struct rtentry *rt0, const struct sockaddr *dst,
    718  1.60      matt 	const struct sockaddr *gate)
    719  1.10   mycroft {
    720  1.59      matt 	char *new, *old;
    721  1.53   thorpej 	u_int dlen = ROUNDUP(dst->sa_len), glen = ROUNDUP(gate->sa_len);
    722  1.36  augustss 	struct rtentry *rt = rt0;
    723  1.10   mycroft 
    724  1.68  christos 	if (rt->rt_gateway == NULL || glen > ROUNDUP(rt->rt_gateway->sa_len)) {
    725  1.10   mycroft 		old = (caddr_t)rt_key(rt);
    726  1.10   mycroft 		R_Malloc(new, caddr_t, dlen + glen);
    727  1.68  christos 		if (new == NULL)
    728  1.10   mycroft 			return 1;
    729  1.32    itojun 		Bzero(new, dlen + glen);
    730  1.10   mycroft 		rt->rt_nodes->rn_key = new;
    731  1.10   mycroft 	} else {
    732  1.66  christos 		new = __UNCONST(rt->rt_nodes->rn_key); /*XXXUNCONST*/
    733  1.68  christos 		old = NULL;
    734  1.10   mycroft 	}
    735  1.10   mycroft 	Bcopy(gate, (rt->rt_gateway = (struct sockaddr *)(new + dlen)), glen);
    736  1.10   mycroft 	if (old) {
    737  1.10   mycroft 		Bcopy(dst, new, dlen);
    738  1.10   mycroft 		Free(old);
    739  1.10   mycroft 	}
    740  1.10   mycroft 	if (rt->rt_gwroute) {
    741  1.68  christos 		RTFREE(rt->rt_gwroute);
    742  1.68  christos 		rt->rt_gwroute = NULL;
    743  1.10   mycroft 	}
    744  1.10   mycroft 	if (rt->rt_flags & RTF_GATEWAY) {
    745  1.10   mycroft 		rt->rt_gwroute = rtalloc1(gate, 1);
    746  1.27      matt 		/*
    747  1.27      matt 		 * If we switched gateways, grab the MTU from the new
    748  1.47    itojun 		 * gateway route if the current MTU, if the current MTU is
    749  1.47    itojun 		 * greater than the MTU of gateway.
    750  1.47    itojun 		 * Note that, if the MTU of gateway is 0, we will reset the
    751  1.47    itojun 		 * MTU of the route to run PMTUD again from scratch. XXX
    752  1.27      matt 		 */
    753  1.27      matt 		if (rt->rt_gwroute
    754  1.27      matt 		    && !(rt->rt_rmx.rmx_locks & RTV_MTU)
    755  1.47    itojun 		    && rt->rt_rmx.rmx_mtu
    756  1.47    itojun 		    && rt->rt_rmx.rmx_mtu > rt->rt_gwroute->rt_rmx.rmx_mtu) {
    757  1.27      matt 			rt->rt_rmx.rmx_mtu = rt->rt_gwroute->rt_rmx.rmx_mtu;
    758  1.27      matt 		}
    759  1.10   mycroft 	}
    760  1.10   mycroft 	return 0;
    761  1.10   mycroft }
    762  1.10   mycroft 
/*
 * Write `src' AND `netmask' into `dst', byte by byte.
 *
 * The first byte of each sockaddr is taken as its length.  The first two
 * bytes of `src' (sa_len and sa_family) are copied unmasked.  The bytes
 * after them are ANDed with the corresponding mask bytes, up to the shorter
 * of the two lengths.  Whatever remains of `dst' up to the length of `src'
 * is zero-filled.
 */
void
rt_maskedcopy(const struct sockaddr *src, struct sockaddr *dst,
	const struct sockaddr *netmask)
{
	const unsigned char *in = (const unsigned char *)src;
	const unsigned char *mask = (const unsigned char *)netmask;
	unsigned char *out = (unsigned char *)dst;
	unsigned char *src_end = out + in[0];	/* dst end per src length */
	unsigned char *and_end = out + mask[0];	/* dst end per mask length */

	/* Never mask beyond the length of the source address. */
	if (and_end > src_end)
		and_end = src_end;

	/* sa_len and sa_family go through untouched. */
	*out++ = *in++;
	*out++ = *in++;
	mask += 2;

	for (; out < and_end; out++)
		*out = *in++ & *mask++;

	/* Bytes not covered by the mask are cleared. */
	if (out < src_end)
		memset(out, 0, (unsigned)(src_end - out));
}
    782  1.10   mycroft 
    783   1.1       cgd /*
    784  1.29  sommerfe  * Set up or tear down a routing table entry, normally
    785   1.1       cgd  * for an interface.
    786   1.1       cgd  */
    787   1.9   mycroft int
    788  1.60      matt rtinit(struct ifaddr *ifa, int cmd, int flags)
    789   1.1       cgd {
    790  1.36  augustss 	struct rtentry *rt;
    791  1.36  augustss 	struct sockaddr *dst, *odst;
    792  1.29  sommerfe 	struct sockaddr_storage deldst;
    793  1.68  christos 	struct rtentry *nrt = NULL;
    794   1.1       cgd 	int error;
    795  1.39    itojun 	struct rt_addrinfo info;
    796   1.1       cgd 
    797   1.1       cgd 	dst = flags & RTF_HOST ? ifa->ifa_dstaddr : ifa->ifa_addr;
    798   1.1       cgd 	if (cmd == RTM_DELETE) {
    799   1.1       cgd 		if ((flags & RTF_HOST) == 0 && ifa->ifa_netmask) {
    800  1.29  sommerfe 			/* Delete subnet route for this interface */
    801  1.29  sommerfe 			odst = dst;
    802  1.29  sommerfe 			dst = (struct sockaddr *)&deldst;
    803  1.29  sommerfe 			rt_maskedcopy(odst, dst, ifa->ifa_netmask);
    804   1.1       cgd 		}
    805  1.14  christos 		if ((rt = rtalloc1(dst, 0)) != NULL) {
    806   1.1       cgd 			rt->rt_refcnt--;
    807  1.29  sommerfe 			if (rt->rt_ifa != ifa)
    808   1.1       cgd 				return (flags & RTF_HOST ? EHOSTUNREACH
    809   1.1       cgd 							: ENETUNREACH);
    810   1.1       cgd 		}
    811   1.1       cgd 	}
    812  1.44   thorpej 	memset(&info, 0, sizeof(info));
    813  1.39    itojun 	info.rti_ifa = ifa;
    814  1.39    itojun 	info.rti_flags = flags | ifa->ifa_flags;
    815  1.39    itojun 	info.rti_info[RTAX_DST] = dst;
    816  1.39    itojun 	info.rti_info[RTAX_GATEWAY] = ifa->ifa_addr;
    817  1.39    itojun 	/*
    818  1.39    itojun 	 * XXX here, it seems that we are assuming that ifa_netmask is NULL
    819  1.39    itojun 	 * for RTF_HOST.  bsdi4 passes NULL explicitly (via intermediate
    820  1.39    itojun 	 * variable) when RTF_HOST is 1.  still not sure if i can safely
    821  1.39    itojun 	 * change it to meet bsdi4 behavior.
    822  1.39    itojun 	 */
    823  1.39    itojun 	info.rti_info[RTAX_NETMASK] = ifa->ifa_netmask;
    824  1.39    itojun 	error = rtrequest1(cmd, &info, &nrt);
    825  1.10   mycroft 	if (cmd == RTM_DELETE && error == 0 && (rt = nrt)) {
    826  1.10   mycroft 		rt_newaddrmsg(cmd, ifa, error, nrt);
    827  1.10   mycroft 		if (rt->rt_refcnt <= 0) {
    828  1.10   mycroft 			rt->rt_refcnt++;
    829  1.10   mycroft 			rtfree(rt);
    830  1.10   mycroft 		}
    831  1.10   mycroft 	}
    832  1.10   mycroft 	if (cmd == RTM_ADD && error == 0 && (rt = nrt)) {
    833  1.10   mycroft 		rt->rt_refcnt--;
    834  1.10   mycroft 		if (rt->rt_ifa != ifa) {
    835  1.17  christos 			printf("rtinit: wrong ifa (%p) was (%p)\n", ifa,
    836  1.17  christos 				rt->rt_ifa);
    837  1.10   mycroft 			if (rt->rt_ifa->ifa_rtrequest)
    838  1.39    itojun 				rt->rt_ifa->ifa_rtrequest(RTM_DELETE, rt, NULL);
    839  1.74    dyoung 			rt_replace_ifa(rt, ifa);
    840  1.10   mycroft 			rt->rt_ifp = ifa->ifa_ifp;
    841  1.10   mycroft 			if (ifa->ifa_rtrequest)
    842  1.39    itojun 				ifa->ifa_rtrequest(RTM_ADD, rt, NULL);
    843  1.10   mycroft 		}
    844  1.10   mycroft 		rt_newaddrmsg(cmd, ifa, error, nrt);
    845   1.1       cgd 	}
    846   1.1       cgd 	return (error);
    847  1.18       kml }
    848  1.18       kml 
    849  1.18       kml /*
    850  1.18       kml  * Route timer routines.  These routines allow functions to be called
    851  1.18       kml  * for various routes at any time.  This is useful in supporting
    852  1.18       kml  * path MTU discovery and redirect route deletion.
    853  1.18       kml  *
    854  1.18       kml  * This is similar to some BSDI internal functions, but it provides
    855  1.18       kml  * for multiple queues for efficiency's sake...
    856  1.18       kml  */
    857  1.18       kml 
    858  1.18       kml LIST_HEAD(, rttimer_queue) rttimer_queue_head;
    859  1.18       kml static int rt_init_done = 0;
    860  1.18       kml 
    861  1.60      matt #define RTTIMER_CALLOUT(r)	do {					\
    862  1.60      matt 		if (r->rtt_func != NULL) {				\
    863  1.60      matt 			(*r->rtt_func)(r->rtt_rt, r);			\
    864  1.60      matt 		} else {						\
    865  1.60      matt 			rtrequest((int) RTM_DELETE,			\
    866  1.60      matt 				  (struct sockaddr *)rt_key(r->rtt_rt),	\
    867  1.60      matt 				  0, 0, 0, 0);				\
    868  1.60      matt 		}							\
    869  1.60      matt 	} while (/*CONSTCOND*/0)
    870  1.18       kml 
    871  1.65     perry /*
    872  1.18       kml  * Some subtle order problems with domain initialization mean that
    873  1.18       kml  * we cannot count on this being run from rt_init before various
    874  1.18       kml  * protocol initializations are done.  Therefore, we make sure
    875  1.18       kml  * that this is run when the first queue is added...
    876  1.18       kml  */
    877  1.18       kml 
    878  1.65     perry void
    879  1.60      matt rt_timer_init(void)
    880  1.18       kml {
    881  1.18       kml 	assert(rt_init_done == 0);
    882  1.18       kml 
    883  1.18       kml 	LIST_INIT(&rttimer_queue_head);
    884  1.35   thorpej 	callout_init(&rt_timer_ch);
    885  1.35   thorpej 	callout_reset(&rt_timer_ch, hz, rt_timer_timer, NULL);
    886  1.18       kml 	rt_init_done = 1;
    887  1.18       kml }
    888  1.18       kml 
    889  1.18       kml struct rttimer_queue *
    890  1.60      matt rt_timer_queue_create(u_int timeout)
    891  1.18       kml {
    892  1.18       kml 	struct rttimer_queue *rtq;
    893  1.18       kml 
    894  1.18       kml 	if (rt_init_done == 0)
    895  1.18       kml 		rt_timer_init();
    896  1.18       kml 
    897  1.18       kml 	R_Malloc(rtq, struct rttimer_queue *, sizeof *rtq);
    898  1.18       kml 	if (rtq == NULL)
    899  1.65     perry 		return (NULL);
    900  1.32    itojun 	Bzero(rtq, sizeof *rtq);
    901  1.18       kml 
    902  1.18       kml 	rtq->rtq_timeout = timeout;
    903  1.37    itojun 	rtq->rtq_count = 0;
    904  1.24   thorpej 	TAILQ_INIT(&rtq->rtq_head);
    905  1.18       kml 	LIST_INSERT_HEAD(&rttimer_queue_head, rtq, rtq_link);
    906  1.18       kml 
    907  1.24   thorpej 	return (rtq);
    908  1.18       kml }
    909  1.18       kml 
    910  1.18       kml void
    911  1.60      matt rt_timer_queue_change(struct rttimer_queue *rtq, long timeout)
    912  1.18       kml {
    913  1.24   thorpej 
    914  1.18       kml 	rtq->rtq_timeout = timeout;
    915  1.18       kml }
    916  1.18       kml 
    917  1.18       kml void
    918  1.60      matt rt_timer_queue_remove_all(struct rttimer_queue *rtq, int destroy)
    919  1.18       kml {
    920  1.24   thorpej 	struct rttimer *r;
    921  1.18       kml 
    922  1.24   thorpej 	while ((r = TAILQ_FIRST(&rtq->rtq_head)) != NULL) {
    923  1.18       kml 		LIST_REMOVE(r, rtt_link);
    924  1.24   thorpej 		TAILQ_REMOVE(&rtq->rtq_head, r, rtt_next);
    925  1.24   thorpej 		if (destroy)
    926  1.18       kml 			RTTIMER_CALLOUT(r);
    927  1.72       tls 		/* we are already at splsoftnet */
    928  1.22   thorpej 		pool_put(&rttimer_pool, r);
    929  1.37    itojun 		if (rtq->rtq_count > 0)
    930  1.37    itojun 			rtq->rtq_count--;
    931  1.37    itojun 		else
    932  1.55    itojun 			printf("rt_timer_queue_remove_all: "
    933  1.55    itojun 			    "rtq_count reached 0\n");
    934  1.18       kml 	}
    935  1.55    itojun }
    936  1.55    itojun 
    937  1.55    itojun void
    938  1.60      matt rt_timer_queue_destroy(struct rttimer_queue *rtq, int destroy)
    939  1.55    itojun {
    940  1.55    itojun 
    941  1.55    itojun 	rt_timer_queue_remove_all(rtq, destroy);
    942  1.18       kml 
    943  1.18       kml 	LIST_REMOVE(rtq, rtq_link);
    944  1.22   thorpej 
    945  1.22   thorpej 	/*
    946  1.22   thorpej 	 * Caller is responsible for freeing the rttimer_queue structure.
    947  1.22   thorpej 	 */
    948  1.18       kml }
    949  1.18       kml 
    950  1.37    itojun unsigned long
    951  1.60      matt rt_timer_count(struct rttimer_queue *rtq)
    952  1.37    itojun {
    953  1.37    itojun 	return rtq->rtq_count;
    954  1.37    itojun }
    955  1.37    itojun 
    956  1.65     perry void
    957  1.60      matt rt_timer_remove_all(struct rtentry *rt, int destroy)
    958  1.18       kml {
    959  1.24   thorpej 	struct rttimer *r;
    960  1.18       kml 
    961  1.24   thorpej 	while ((r = LIST_FIRST(&rt->rt_timer)) != NULL) {
    962  1.18       kml 		LIST_REMOVE(r, rtt_link);
    963  1.24   thorpej 		TAILQ_REMOVE(&r->rtt_queue->rtq_head, r, rtt_next);
    964  1.54    itojun 		if (destroy)
    965  1.54    itojun 			RTTIMER_CALLOUT(r);
    966  1.37    itojun 		if (r->rtt_queue->rtq_count > 0)
    967  1.37    itojun 			r->rtt_queue->rtq_count--;
    968  1.37    itojun 		else
    969  1.37    itojun 			printf("rt_timer_remove_all: rtq_count reached 0\n");
    970  1.72       tls 		/* we are already at splsoftnet */
    971  1.38    itojun 		pool_put(&rttimer_pool, r);
    972  1.18       kml 	}
    973  1.18       kml }
    974  1.18       kml 
    975  1.65     perry int
    976  1.60      matt rt_timer_add(struct rtentry *rt,
    977  1.60      matt 	void (*func)(struct rtentry *, struct rttimer *),
    978  1.60      matt 	struct rttimer_queue *queue)
    979  1.18       kml {
    980  1.24   thorpej 	struct rttimer *r;
    981  1.72       tls 	int s;
    982  1.18       kml 
    983  1.24   thorpej 	/*
    984  1.24   thorpej 	 * If there's already a timer with this action, destroy it before
    985  1.24   thorpej 	 * we add a new one.
    986  1.24   thorpej 	 */
    987  1.24   thorpej 	for (r = LIST_FIRST(&rt->rt_timer); r != NULL;
    988  1.24   thorpej 	     r = LIST_NEXT(r, rtt_link)) {
    989  1.18       kml 		if (r->rtt_func == func) {
    990  1.18       kml 			LIST_REMOVE(r, rtt_link);
    991  1.24   thorpej 			TAILQ_REMOVE(&r->rtt_queue->rtq_head, r, rtt_next);
    992  1.37    itojun 			if (r->rtt_queue->rtq_count > 0)
    993  1.37    itojun 				r->rtt_queue->rtq_count--;
    994  1.37    itojun 			else
    995  1.37    itojun 				printf("rt_timer_add: rtq_count reached 0\n");
    996  1.72       tls 			s = splsoftnet();
    997  1.38    itojun 			pool_put(&rttimer_pool, r);
    998  1.72       tls 			splx(s);
    999  1.18       kml 			break;  /* only one per list, so we can quit... */
   1000  1.18       kml 		}
   1001  1.18       kml 	}
   1002  1.18       kml 
   1003  1.72       tls 	s = splsoftnet();
   1004  1.24   thorpej 	r = pool_get(&rttimer_pool, PR_NOWAIT);
   1005  1.72       tls 	splx(s);
   1006  1.24   thorpej 	if (r == NULL)
   1007  1.24   thorpej 		return (ENOBUFS);
   1008  1.32    itojun 	Bzero(r, sizeof(*r));
   1009  1.24   thorpej 
   1010  1.24   thorpej 	r->rtt_rt = rt;
   1011  1.70    kardel 	r->rtt_time = time_uptime;
   1012  1.24   thorpej 	r->rtt_func = func;
   1013  1.24   thorpej 	r->rtt_queue = queue;
   1014  1.24   thorpej 	LIST_INSERT_HEAD(&rt->rt_timer, r, rtt_link);
   1015  1.24   thorpej 	TAILQ_INSERT_TAIL(&queue->rtq_head, r, rtt_next);
   1016  1.37    itojun 	r->rtt_queue->rtq_count++;
   1017  1.65     perry 
   1018  1.24   thorpej 	return (0);
   1019  1.18       kml }
   1020  1.18       kml 
   1021  1.18       kml /* ARGSUSED */
   1022  1.18       kml void
   1023  1.76  christos rt_timer_timer(void *arg)
   1024  1.18       kml {
   1025  1.24   thorpej 	struct rttimer_queue *rtq;
   1026  1.24   thorpej 	struct rttimer *r;
   1027  1.24   thorpej 	int s;
   1028  1.21       kml 
   1029  1.24   thorpej 	s = splsoftnet();
   1030  1.65     perry 	for (rtq = LIST_FIRST(&rttimer_queue_head); rtq != NULL;
   1031  1.18       kml 	     rtq = LIST_NEXT(rtq, rtq_link)) {
   1032  1.24   thorpej 		while ((r = TAILQ_FIRST(&rtq->rtq_head)) != NULL &&
   1033  1.70    kardel 		    (r->rtt_time + rtq->rtq_timeout) < time_uptime) {
   1034  1.24   thorpej 			LIST_REMOVE(r, rtt_link);
   1035  1.24   thorpej 			TAILQ_REMOVE(&rtq->rtq_head, r, rtt_next);
   1036  1.24   thorpej 			RTTIMER_CALLOUT(r);
   1037  1.24   thorpej 			pool_put(&rttimer_pool, r);
   1038  1.37    itojun 			if (rtq->rtq_count > 0)
   1039  1.37    itojun 				rtq->rtq_count--;
   1040  1.37    itojun 			else
   1041  1.37    itojun 				printf("rt_timer_timer: rtq_count reached 0\n");
   1042  1.18       kml 		}
   1043  1.18       kml 	}
   1044  1.24   thorpej 	splx(s);
   1045  1.18       kml 
   1046  1.35   thorpej 	callout_reset(&rt_timer_ch, hz, rt_timer_timer, NULL);
   1047   1.1       cgd }
   1048