Home | History | Annotate | Line # | Download | only in net
if_gre.c revision 1.88.2.3
      1  1.88.2.3        ad /*	$NetBSD: if_gre.c,v 1.88.2.3 2007/04/10 13:26:47 ad Exp $ */
      2       1.4   thorpej 
      3       1.1       hwr /*
      4       1.4   thorpej  * Copyright (c) 1998 The NetBSD Foundation, Inc.
      5       1.1       hwr  * All rights reserved.
      6       1.1       hwr  *
      7       1.1       hwr  * This code is derived from software contributed to The NetBSD Foundation
      8       1.1       hwr  * by Heiko W.Rupp <hwr (at) pilhuhn.de>
      9       1.1       hwr  *
     10      1.56        is  * IPv6-over-GRE contributed by Gert Doering <gert (at) greenie.muc.de>
     11      1.56        is  *
     12       1.1       hwr  * Redistribution and use in source and binary forms, with or without
     13       1.1       hwr  * modification, are permitted provided that the following conditions
     14       1.1       hwr  * are met:
     15       1.1       hwr  * 1. Redistributions of source code must retain the above copyright
     16       1.1       hwr  *    notice, this list of conditions and the following disclaimer.
     17       1.1       hwr  * 2. Redistributions in binary form must reproduce the above copyright
     18       1.1       hwr  *    notice, this list of conditions and the following disclaimer in the
     19       1.1       hwr  *    documentation and/or other materials provided with the distribution.
     20       1.1       hwr  * 3. All advertising materials mentioning features or use of this software
     21       1.1       hwr  *    must display the following acknowledgement:
     22       1.1       hwr  *        This product includes software developed by the NetBSD
     23       1.1       hwr  *        Foundation, Inc. and its contributors.
     24       1.1       hwr  * 4. Neither the name of The NetBSD Foundation nor the names of its
     25       1.1       hwr  *    contributors may be used to endorse or promote products derived
     26       1.1       hwr  *    from this software without specific prior written permission.
     27       1.1       hwr  *
     28       1.1       hwr  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     29       1.1       hwr  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     30       1.1       hwr  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     31       1.1       hwr  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     32       1.1       hwr  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     33       1.1       hwr  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     34       1.1       hwr  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     35       1.1       hwr  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     36       1.1       hwr  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     37       1.1       hwr  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     38       1.1       hwr  * POSSIBILITY OF SUCH DAMAGE.
     39       1.1       hwr  */
     40       1.1       hwr 
     41       1.1       hwr /*
     42       1.1       hwr  * Encapsulate L3 protocols into IP
     43       1.1       hwr  * See RFC 1701 and 1702 for more details.
     44       1.1       hwr  * If_gre is compatible with Cisco GRE tunnels, so you can
     45       1.1       hwr  * have a NetBSD box as the other end of a tunnel interface of a Cisco
     46       1.1       hwr  * router. See gre(4) for more details.
     47       1.6       hwr  * Also supported: minimal IP-in-IP encapsulation (protocol 55) per RFC 2004.
     48       1.1       hwr  */
     49      1.22     lukem 
     50      1.22     lukem #include <sys/cdefs.h>
     51  1.88.2.3        ad __KERNEL_RCSID(0, "$NetBSD: if_gre.c,v 1.88.2.3 2007/04/10 13:26:47 ad Exp $");
     52       1.1       hwr 
     53      1.62    dyoung #include "opt_gre.h"
     54       1.1       hwr #include "opt_inet.h"
     55       1.1       hwr #include "bpfilter.h"
     56       1.1       hwr 
     57      1.54  christos #ifdef INET
     58       1.1       hwr #include <sys/param.h>
     59      1.62    dyoung #include <sys/file.h>
     60      1.62    dyoung #include <sys/filedesc.h>
     61       1.1       hwr #include <sys/malloc.h>
     62       1.1       hwr #include <sys/mbuf.h>
     63      1.13    martin #include <sys/proc.h>
     64       1.1       hwr #include <sys/protosw.h>
     65       1.1       hwr #include <sys/socket.h>
     66      1.62    dyoung #include <sys/socketvar.h>
     67       1.1       hwr #include <sys/ioctl.h>
     68      1.10   thorpej #include <sys/queue.h>
     69       1.1       hwr #if __NetBSD__
     70       1.1       hwr #include <sys/systm.h>
     71      1.62    dyoung #include <sys/sysctl.h>
     72      1.60      elad #include <sys/kauth.h>
     73       1.1       hwr #endif
     74       1.1       hwr 
     75      1.62    dyoung #include <sys/kthread.h>
     76      1.62    dyoung 
     77       1.1       hwr #include <machine/cpu.h>
     78       1.1       hwr 
     79       1.1       hwr #include <net/ethertypes.h>
     80       1.1       hwr #include <net/if.h>
     81       1.1       hwr #include <net/if_types.h>
     82       1.1       hwr #include <net/netisr.h>
     83       1.1       hwr #include <net/route.h>
     84       1.1       hwr 
     85       1.1       hwr #ifdef INET
     86       1.1       hwr #include <netinet/in.h>
     87       1.1       hwr #include <netinet/in_systm.h>
     88       1.1       hwr #include <netinet/in_var.h>
     89       1.1       hwr #include <netinet/ip.h>
     90       1.1       hwr #include <netinet/ip_var.h>
     91       1.1       hwr #else
     92       1.4   thorpej #error "Huh? if_gre without inet?"
     93       1.1       hwr #endif
     94       1.1       hwr 
     95       1.1       hwr 
     96       1.1       hwr #ifdef NETATALK
     97       1.1       hwr #include <netatalk/at.h>
     98       1.1       hwr #include <netatalk/at_var.h>
     99       1.1       hwr #include <netatalk/at_extern.h>
    100       1.1       hwr #endif
    101       1.1       hwr 
    102       1.1       hwr #if NBPFILTER > 0
    103       1.1       hwr #include <sys/time.h>
    104       1.1       hwr #include <net/bpf.h>
    105       1.1       hwr #endif
    106       1.1       hwr 
    107       1.1       hwr #include <net/if_gre.h>
    108       1.1       hwr 
    109      1.20    itojun /*
    110      1.27    martin  * It is not easy to calculate the right value for a GRE MTU.
    111      1.27    martin  * We leave this task to the admin and use the same default that
    112      1.27    martin  * other vendors use.
    113      1.20    itojun  */
    114      1.27    martin #define GREMTU 1476
    115       1.1       hwr 
    /*
     * GRE_DPRINTF(sc, fmt, ...): debug printf for this driver.
     *
     * With GRE_DEBUG defined, the message is printed only when the softc's
     * interface has IFF_DEBUG set in if_flags.  Without GRE_DEBUG the macro
     * expands to an empty statement, so its arguments are never evaluated.
     */
    116      1.62    dyoung #ifdef GRE_DEBUG
    117      1.62    dyoung #define	GRE_DPRINTF(__sc, __fmt, ...)				\
    118      1.62    dyoung 	do {							\
    119      1.62    dyoung 		if (((__sc)->sc_if.if_flags & IFF_DEBUG) != 0)	\
    120      1.62    dyoung 			printf(__fmt, __VA_ARGS__);		\
    121      1.62    dyoung 	} while (/*CONSTCOND*/0)
    122      1.62    dyoung #else
    123      1.62    dyoung #define	GRE_DPRINTF(__sc, __fmt, ...)	do { } while (/*CONSTCOND*/0)
    124      1.62    dyoung #endif /* GRE_DEBUG */
    125      1.62    dyoung 
    /* List of gre softcs; gre_clone_create() inserts, gre_clone_destroy() removes. */
    126      1.11   thorpej struct gre_softc_head gre_softc_list;
    /* TTL that gre_socreate1() sets (IP_TTL) on the UDP encapsulation socket. */
    127      1.26    martin int ip_gre_ttl = GRE_TTL;
    128       1.1       hwr 
    129      1.59   thorpej static int	gre_clone_create(struct if_clone *, int);
    130      1.59   thorpej static int	gre_clone_destroy(struct ifnet *);
    131      1.10   thorpej 
    /* Interface cloner for "gre" interfaces, wired to the create/destroy hooks above. */
    132      1.59   thorpej static struct if_clone gre_cloner =
    133      1.10   thorpej     IF_CLONE_INITIALIZER("gre", gre_clone_create, gre_clone_destroy);
    134       1.1       hwr 
    /* ifnet if_output / if_ioctl handlers installed by gre_clone_create(). */
    135      1.84    dyoung static int	gre_output(struct ifnet *, struct mbuf *,
    136      1.84    dyoung 			   const struct sockaddr *, struct rtentry *);
    137      1.88  christos static int	gre_ioctl(struct ifnet *, u_long, void *);
    138       1.1       hwr 
    139      1.59   thorpej static int	gre_compute_route(struct gre_softc *sc);
    140      1.59   thorpej 
    /* Socket name helpers; gre_getsockname() is used by gre_socreate1(). */
    141      1.62    dyoung static int gre_getsockname(struct socket *, struct mbuf *, struct lwp *);
    142      1.62    dyoung static int gre_getpeername(struct socket *, struct mbuf *, struct lwp *);
    143      1.62    dyoung static int gre_getnames(struct socket *, struct lwp *, struct sockaddr_in *,
    144      1.62    dyoung     struct sockaddr_in *);
    145      1.62    dyoung 
    /*
     * Mark a worker as stopped: clear the flag at `running' and wake up any
     * thread sleeping on that address (gre_join() sleeps there).
     */
    146      1.62    dyoung static void
    147      1.82    dyoung gre_stop(volatile int *running)
    148      1.62    dyoung {
    149      1.62    dyoung 	*running = 0;
    150      1.62    dyoung 	wakeup(running);
    151      1.62    dyoung }
    152      1.62    dyoung 
    /*
     * Wait until the flag at `running' becomes zero.
     *
     * The flag is tested at splnet; the previous level is restored around
     * each tsleep() on the flag's address (no timeout), which gre_stop()
     * wakes.  Returns immediately if the flag is already zero.
     */
    153      1.62    dyoung static void
    154      1.82    dyoung gre_join(volatile int *running)
    155      1.62    dyoung {
    156      1.62    dyoung 	int s;
    157      1.62    dyoung 
    158      1.62    dyoung 	s = splnet();
    159      1.62    dyoung 	while (*running != 0) {
    160      1.62    dyoung 		splx(s);
    161      1.62    dyoung 		tsleep(running, PSOCK, "grejoin", 0);
    162      1.62    dyoung 		s = splnet();
    163      1.62    dyoung 	}
    164      1.62    dyoung 	splx(s);
    165      1.62    dyoung }
    166      1.62    dyoung 
    /*
     * Tell the worker in gre_thread1() that there is something to do: set
     * sc_waitchan to 1 and wake sleepers on its address.  The worker resets
     * sc_waitchan to 0 each time it starts a pass.
     */
    167      1.62    dyoung static void
    168      1.62    dyoung gre_wakeup(struct gre_softc *sc)
    169      1.62    dyoung {
    170      1.62    dyoung 	GRE_DPRINTF(sc, "%s: enter\n", __func__);
    171      1.62    dyoung 	sc->sc_waitchan = 1;
    172      1.62    dyoung 	wakeup(&sc->sc_waitchan);
    173      1.62    dyoung }
    174      1.62    dyoung 
    /*
     * Cloner "create" hook: allocate and attach a new gre interface.
     *
     * ifc  - cloner; its ifc_name supplies the interface name prefix.
     * unit - unit number appended to the name.
     *
     * The softc is allocated with M_WAITOK and zeroed, so every field not
     * set below starts out as 0/NULL.  Always returns 0.
     */
    175      1.59   thorpej static int
    176      1.59   thorpej gre_clone_create(struct if_clone *ifc, int unit)
    177       1.1       hwr {
    178       1.8  explorer 	struct gre_softc *sc;
    179       1.1       hwr 
    180      1.10   thorpej 	sc = malloc(sizeof(struct gre_softc), M_DEVBUF, M_WAITOK);
    181      1.10   thorpej 	memset(sc, 0, sizeof(struct gre_softc));
    182      1.10   thorpej 
    183      1.50    itojun 	snprintf(sc->sc_if.if_xname, sizeof(sc->sc_if.if_xname), "%s%d",
    184      1.50    itojun 	    ifc->ifc_name, unit);
    185      1.10   thorpej 	sc->sc_if.if_softc = sc;
    186      1.51      tron 	sc->sc_if.if_type = IFT_TUNNEL;
    187      1.34    itojun 	sc->sc_if.if_addrlen = 0;
    188      1.10   thorpej 	sc->sc_if.if_hdrlen = 24; /* IP + GRE */
    189      1.15   thorpej 	sc->sc_if.if_dlt = DLT_NULL;
    190      1.20    itojun 	sc->sc_if.if_mtu = GREMTU;
    191      1.10   thorpej 	sc->sc_if.if_flags = IFF_POINTOPOINT|IFF_MULTICAST;
    192      1.10   thorpej 	sc->sc_if.if_output = gre_output;
    193      1.10   thorpej 	sc->sc_if.if_ioctl = gre_ioctl;
                            	/* Tunnel endpoints start unset; gre_output() refuses to send until both are set. */
    194      1.10   thorpej 	sc->g_dst.s_addr = sc->g_src.s_addr = INADDR_ANY;
    195      1.62    dyoung 	sc->g_dstport = sc->g_srcport = 0;
                            	/* Default encapsulation is plain GRE; gre_thread1() only runs for IPPROTO_UDP. */
    196      1.75    dyoung 	sc->sc_proto = IPPROTO_GRE;
    197      1.64    dyoung 	sc->sc_snd.ifq_maxlen = 256;
    198      1.35    itojun 	sc->sc_if.if_flags |= IFF_LINK0;
    199      1.10   thorpej 	if_attach(&sc->sc_if);
    200      1.16   thorpej 	if_alloc_sadl(&sc->sc_if);
    201       1.1       hwr #if NBPFILTER > 0
    202      1.14   thorpej 	bpfattach(&sc->sc_if, DLT_NULL, sizeof(u_int32_t));
    203       1.1       hwr #endif
    204      1.10   thorpej 	LIST_INSERT_HEAD(&gre_softc_list, sc, sc_list);
    205      1.87    dyoung 	return 0;
    206      1.10   thorpej }
    207       1.1       hwr 
    /*
     * Cloner "destroy" hook: tear down a gre interface and free its softc.
     *
     * Order of operations:
     *  1. unlink the softc from gre_softc_list and detach bpf;
     *  2. at splnet, clear IFF_UP and wake the worker so that gre_thread1()
     *     sees the interface is down and exits;
     *  3. gre_join() until the worker has cleared sc_thread (returns at once
     *     if sc_thread is already 0);
     *  4. at splnet, free the cached route and detach the interface;
     *  5. close sc_fp if one is held, then free the softc.
     *
     * Always returns 0.
     */
    208      1.59   thorpej static int
    209      1.59   thorpej gre_clone_destroy(struct ifnet *ifp)
    210      1.10   thorpej {
    211      1.77    dyoung 	int s;
    212      1.10   thorpej 	struct gre_softc *sc = ifp->if_softc;
    213      1.10   thorpej 
    214      1.10   thorpej 	LIST_REMOVE(sc, sc_list);
    215      1.10   thorpej #if NBPFILTER > 0
    216      1.10   thorpej 	bpfdetach(ifp);
    217      1.10   thorpej #endif
    218      1.77    dyoung 	s = splnet();
    219      1.77    dyoung 	ifp->if_flags &= ~IFF_UP;
    220      1.62    dyoung 	gre_wakeup(sc);
    221      1.77    dyoung 	splx(s);
    222      1.62    dyoung 	gre_join(&sc->sc_thread);
    223      1.77    dyoung 	s = splnet();
    224      1.85    dyoung 	rtcache_free(&sc->route);
    225      1.77    dyoung 	if_detach(ifp);
    226      1.77    dyoung 	splx(s);
    227      1.62    dyoung 	if (sc->sc_fp != NULL) {
    228      1.62    dyoung 		closef(sc->sc_fp, curlwp);
    229      1.62    dyoung 		sc->sc_fp = NULL;
    230      1.62    dyoung 	}
    231      1.10   thorpej 	free(sc, M_DEVBUF);
    232      1.53     peter 
    233      1.87    dyoung 	return 0;
    234       1.1       hwr }
    235       1.1       hwr 
    /*
     * Socket upcall installed by gre_upcall_add().  `arg' is the gre softc;
     * `so' and `waitflag' are not used.  It only wakes the worker thread,
     * which does the actual receive in gre_thread1().
     */
    236      1.62    dyoung static void
    237      1.88  christos gre_receive(struct socket *so, void *arg, int waitflag)
    238      1.62    dyoung {
    239      1.62    dyoung 	struct gre_softc *sc = (struct gre_softc *)arg;
    240      1.62    dyoung 
    241      1.62    dyoung 	GRE_DPRINTF(sc, "%s: enter\n", __func__);
    242      1.62    dyoung 
    243      1.62    dyoung 	gre_wakeup(sc);
    244      1.62    dyoung }
    245      1.62    dyoung 
    /*
     * Install gre_receive() as the upcall on `so', with `arg' (the gre softc)
     * as its argument, and set SB_UPCALL on the receive buffer.  Any upcall
     * previously set on the socket is overwritten.
     */
    246      1.62    dyoung static void
    247      1.88  christos gre_upcall_add(struct socket *so, void *arg)
    248      1.62    dyoung {
    249      1.62    dyoung 	/* XXX What if the kernel already set an upcall? */
    250      1.62    dyoung 	so->so_upcallarg = arg;
    251      1.62    dyoung 	so->so_upcall = gre_receive;
    252      1.62    dyoung 	so->so_rcv.sb_flags |= SB_UPCALL;
    253      1.62    dyoung }
    254      1.62    dyoung 
    /*
     * Undo gre_upcall_add(): clear SB_UPCALL on the receive buffer first,
     * then reset the upcall argument and function pointer to NULL.
     */
    255      1.62    dyoung static void
    256      1.62    dyoung gre_upcall_remove(struct socket *so)
    257      1.62    dyoung {
    258      1.62    dyoung 	/* XXX Clears the upcall unconditionally, even one we did not install. */
    259      1.62    dyoung 	so->so_rcv.sb_flags &= ~SB_UPCALL;
    260      1.62    dyoung 	so->so_upcallarg = NULL;
    261      1.62    dyoung 	so->so_upcall = NULL;
    262      1.62    dyoung }
    263      1.62    dyoung 
    /*
     * Dispose of a socket: remove the upcall, shut down both directions,
     * close the socket and set the caller's pointer to NULL.  The return
     * values of soshutdown() and soclose() are ignored.  *sop must be
     * non-NULL on entry.
     */
    264      1.62    dyoung static void
    265      1.62    dyoung gre_sodestroy(struct socket **sop)
    266      1.62    dyoung {
    267      1.62    dyoung 	gre_upcall_remove(*sop);
    268      1.62    dyoung 	soshutdown(*sop, SHUT_RDWR);
    269      1.62    dyoung 	soclose(*sop);
    270      1.62    dyoung 	*sop = NULL;
    271      1.62    dyoung }
    272      1.62    dyoung 
    /*
     * Allocate an MT_SONAME mbuf (M_WAIT) for passing a socket address or
     * option value, and MCLAIM it to the socket's so_mowner.  Returns the
     * mbuf, or NULL if m_get() returned NULL.
     */
    273      1.62    dyoung static struct mbuf *
    274      1.74  christos gre_getsockmbuf(struct socket *so)
    275      1.62    dyoung {
    276      1.62    dyoung 	struct mbuf *m;
    277      1.62    dyoung 
    278      1.62    dyoung 	m = m_get(M_WAIT, MT_SONAME);
    279      1.62    dyoung 	if (m != NULL)
    280      1.62    dyoung 		MCLAIM(m, so->so_mowner);
    281      1.62    dyoung 	return m;
    282      1.62    dyoung }
    283      1.62    dyoung 
    /*
     * Create the UDP socket used for GRE-over-UDP encapsulation.
     *
     * sc  - softc supplying g_src/g_srcport (bind) and g_dst/g_dstport
     *       (connect); also passed as the upcall argument.
     * l   - lwp on whose behalf the socket calls are made.
     * sp  - out: on success, receives a copy of sc->sc_soparm so the caller
     *       can later detect parameter changes.
     * sop - out: the new socket.
     *
     * Steps: socreate, install the receive upcall, bind to the source
     * address, learn the kernel-chosen port if g_srcport was 0 (stored back
     * into sc->g_srcport), connect to the destination, then set IP_TTL to
     * ip_gre_ttl.  A single mbuf `m' is reused for all address arguments
     * and for the TTL option value.
     *
     * Returns 0 on success or an errno.  If socreate() itself fails, its
     * error is returned directly; on any later failure the socket is
     * destroyed and *sop is set to NULL.  Failure to set the TTL is only
     * logged and does not fail the call.
     */
    284      1.62    dyoung static int
    285      1.62    dyoung gre_socreate1(struct gre_softc *sc, struct lwp *l, struct gre_soparm *sp,
    286      1.62    dyoung     struct socket **sop)
    287      1.62    dyoung {
    288      1.62    dyoung 	int rc;
    289      1.62    dyoung 	struct mbuf *m;
    290      1.62    dyoung 	struct sockaddr_in *sin;
    291      1.62    dyoung 	struct socket *so;
    292      1.62    dyoung 
    293      1.62    dyoung 	GRE_DPRINTF(sc, "%s: enter\n", __func__);
    294      1.62    dyoung 	rc = socreate(AF_INET, sop, SOCK_DGRAM, IPPROTO_UDP, l);
    295      1.62    dyoung 	if (rc != 0) {
    296      1.62    dyoung 		GRE_DPRINTF(sc, "%s: socreate failed\n", __func__);
    297      1.62    dyoung 		return rc;
    298      1.62    dyoung 	}
    299      1.62    dyoung 
    300      1.62    dyoung 	so = *sop;
    301      1.62    dyoung 
                            	/* The upcall goes in before bind/connect; gre_sodestroy() removes it on failure. */
    302  1.88.2.3        ad 	gre_upcall_add(so, sc);
    303      1.62    dyoung 	if ((m = gre_getsockmbuf(so)) == NULL) {
    304      1.62    dyoung 		rc = ENOBUFS;
    305      1.62    dyoung 		goto out;
    306      1.62    dyoung 	}
                            	/* Build the local (source) address in the mbuf for sobind(). */
    307      1.62    dyoung 	sin = mtod(m, struct sockaddr_in *);
    308      1.62    dyoung 	sin->sin_len = m->m_len = sizeof(struct sockaddr_in);
    309      1.62    dyoung 	sin->sin_family = AF_INET;
    310      1.62    dyoung 	sin->sin_addr = sc->g_src;
    311      1.62    dyoung 	sin->sin_port = sc->g_srcport;
    312      1.62    dyoung 
    313      1.62    dyoung 	GRE_DPRINTF(sc, "%s: bind 0x%08" PRIx32 " port %d\n", __func__,
    314      1.62    dyoung 	    sin->sin_addr.s_addr, ntohs(sin->sin_port));
    315      1.62    dyoung 	if ((rc = sobind(so, m, l)) != 0) {
    316      1.62    dyoung 		GRE_DPRINTF(sc, "%s: sobind failed\n", __func__);
    317      1.62    dyoung 		goto out;
    318      1.62    dyoung 	}
    319      1.62    dyoung 
                            	/*
                            	 * No source port configured: read back the port from the
                            	 * socket and remember it in the softc.  Presumably
                            	 * gre_getsockname() writes the bound address into m, which
                            	 * sin still points at; confirm against its definition.
                            	 */
    320      1.62    dyoung 	if (sc->g_srcport == 0) {
    321      1.69    dyoung 		if ((rc = gre_getsockname(so, m, l)) != 0) {
    322      1.62    dyoung 			GRE_DPRINTF(sc, "%s: gre_getsockname failed\n",
    323      1.62    dyoung 			    __func__);
    324      1.62    dyoung 			goto out;
    325      1.62    dyoung 		}
    326      1.62    dyoung 		sc->g_srcport = sin->sin_port;
    327      1.62    dyoung 	}
    328      1.62    dyoung 
                            	/* Reuse the same sockaddr for the remote end; only address and port change. */
    329      1.62    dyoung 	sin->sin_addr = sc->g_dst;
    330      1.62    dyoung 	sin->sin_port = sc->g_dstport;
    331      1.62    dyoung 
    332      1.68    dyoung 	if ((rc = soconnect(so, m, l)) != 0) {
    333      1.62    dyoung 		GRE_DPRINTF(sc, "%s: soconnect failed\n", __func__);
    334      1.62    dyoung 		goto out;
    335      1.62    dyoung 	}
    336      1.62    dyoung 
                            	/*
                            	 * Reuse the mbuf once more as the IP_TTL option value.  m is
                            	 * set to NULL right after the call, so the option mbuf is
                            	 * presumably consumed by pr_ctloutput; confirm.
                            	 */
    337      1.62    dyoung 	*mtod(m, int *) = ip_gre_ttl;
    338      1.76    dyoung 	m->m_len = sizeof(int);
    339      1.62    dyoung 	rc = (*so->so_proto->pr_ctloutput)(PRCO_SETOPT, so, IPPROTO_IP, IP_TTL,
    340      1.62    dyoung 	    &m);
    341      1.62    dyoung 	m = NULL;
    342      1.62    dyoung 	if (rc != 0) {
                            		/* Best effort: a socket with the wrong TTL is still usable. */
    343      1.62    dyoung 		printf("%s: setopt ttl failed\n", __func__);
    344      1.62    dyoung 		rc = 0;
    345      1.62    dyoung 	}
    346      1.62    dyoung out:
    347      1.62    dyoung 	m_freem(m);
    348      1.62    dyoung 
    349      1.62    dyoung 	if (rc != 0)
    350      1.62    dyoung 		gre_sodestroy(sop);
    351      1.62    dyoung 	else
    352      1.63    dyoung 		*sp = sc->sc_soparm;
    353      1.62    dyoung 
    354      1.62    dyoung 	return rc;
    355      1.62    dyoung }
    356      1.62    dyoung 
    /*
     * Body of the per-interface worker thread for GRE-over-UDP.
     *
     * sc - softc of the interface being served.
     * l  - lwp of the worker, passed on to the socket calls.
     *
     * Runs at splnet except while sleeping.  Sets IFF_RUNNING, then loops:
     *  - sleep until gre_wakeup() sets sc_waitchan;
     *  - exit if the interface is no longer IFF_UP or sc_proto is no longer
     *    IPPROTO_UDP;
     *  - if there is no socket yet, or sc_soparm differs from the cached
     *    copy `sp', release the old socket and obtain a new one: either the
     *    one behind sc_fp (borrowed, file reference held) or a fresh one
     *    from gre_socreate1();
     *  - drain the socket without blocking, handing packets to gre_input3();
     *  - drain sc_snd, sending each queued mbuf on the socket.
     *
     * On exit it releases the socket, clears IFF_RUNNING (only if sc_proto
     * is still IPPROTO_UDP), frees anything left on sc_snd and calls
     * gre_stop(&sc->sc_thread) so that gre_join() callers may proceed.
     */
    357      1.62    dyoung static void
    358      1.62    dyoung gre_thread1(struct gre_softc *sc, struct lwp *l)
    359      1.62    dyoung {
    360      1.62    dyoung 	int flags, rc, s;
    361      1.62    dyoung 	const struct gre_h *gh;
    362      1.62    dyoung 	struct ifnet *ifp = &sc->sc_if;
    363      1.62    dyoung 	struct mbuf *m;
    364      1.62    dyoung 	struct socket *so = NULL;
    365      1.62    dyoung 	struct uio uio;
    366      1.62    dyoung 	struct gre_soparm sp;
    367      1.62    dyoung 
    368      1.62    dyoung 	GRE_DPRINTF(sc, "%s: enter\n", __func__);
    369      1.62    dyoung 	s = splnet();
    370      1.62    dyoung 
                            	/* Pretend we were woken so the first pass runs without sleeping. */
    371      1.62    dyoung 	sc->sc_waitchan = 1;
    372      1.62    dyoung 
                            	/* sp is compared with memcmp() below, so it is fully zeroed here first. */
    373      1.62    dyoung 	memset(&sp, 0, sizeof(sp));
    374      1.62    dyoung 	memset(&uio, 0, sizeof(uio));
    375      1.62    dyoung 
    376      1.62    dyoung 	ifp->if_flags |= IFF_RUNNING;
    377      1.62    dyoung 
    378      1.62    dyoung 	for (;;) {
    379      1.62    dyoung 		while (sc->sc_waitchan == 0) {
    380      1.62    dyoung 			splx(s);
    381      1.62    dyoung 			GRE_DPRINTF(sc, "%s: sleeping\n", __func__);
    382      1.62    dyoung 			tsleep(&sc->sc_waitchan, PSOCK, "grewait", 0);
    383      1.62    dyoung 			s = splnet();
    384      1.62    dyoung 		}
    385      1.62    dyoung 		sc->sc_waitchan = 0;
    386      1.62    dyoung 		GRE_DPRINTF(sc, "%s: awake\n", __func__);
    387      1.62    dyoung 		if ((ifp->if_flags & IFF_UP) != IFF_UP) {
    388      1.62    dyoung 			GRE_DPRINTF(sc, "%s: not up & running; exiting\n",
    389      1.62    dyoung 			    __func__);
    390      1.62    dyoung 			break;
    391      1.62    dyoung 		}
    392      1.75    dyoung 		if (sc->sc_proto != IPPROTO_UDP) {
    393      1.62    dyoung 			GRE_DPRINTF(sc, "%s: not udp; exiting\n", __func__);
    394      1.62    dyoung 			break;
    395      1.62    dyoung 		}
    396      1.62    dyoung 		/* XXX optimize */
    397      1.69    dyoung 		if (so == NULL || memcmp(&sp, &sc->sc_soparm, sizeof(sp)) != 0){
    398      1.62    dyoung 			GRE_DPRINTF(sc, "%s: parameters changed\n", __func__);
    399      1.62    dyoung 
                            			/*
                            			 * Release the previous socket.  One borrowed
                            			 * from a file is only un-referenced; one we
                            			 * created ourselves is destroyed.
                            			 * NOTE(review): unlike the exit path below, the
                            			 * upcall is not removed from a borrowed socket
                            			 * here; confirm that is intended.
                            			 */
    400      1.62    dyoung 			if (sp.sp_fp != NULL) {
    401      1.62    dyoung 				FILE_UNUSE(sp.sp_fp, NULL);
    402      1.62    dyoung 				sp.sp_fp = NULL;
    403      1.62    dyoung 				so = NULL;
    404      1.62    dyoung 			} else if (so != NULL)
    405      1.62    dyoung 				gre_sodestroy(&so);
    406      1.62    dyoung 
                            			/*
                            			 * Prefer the socket behind sc_fp when one is
                            			 * set; otherwise create, bind and connect one.
                            			 * If creation fails the thread exits via `out',
                            			 * skipping the socket release below.
                            			 */
    407      1.62    dyoung 			if (sc->sc_fp != NULL) {
    408      1.62    dyoung 				so = (struct socket *)sc->sc_fp->f_data;
    409  1.88.2.3        ad 				gre_upcall_add(so, sc);
    410      1.63    dyoung 				sp = sc->sc_soparm;
    411      1.62    dyoung 				FILE_USE(sp.sp_fp);
    412      1.62    dyoung 			} else if (gre_socreate1(sc, l, &sp, &so) != 0)
    413      1.62    dyoung 				goto out;
    414      1.62    dyoung 		}
                            		/* Receive: drain the socket without blocking. */
    415      1.62    dyoung 		for (;;) {
    416      1.62    dyoung 			flags = MSG_DONTWAIT;
                            			/* Upper bound on the bytes requested per call; data comes back in m. */
    417      1.62    dyoung 			uio.uio_resid = 1000000;
    418      1.62    dyoung 			rc = (*so->so_receive)(so, NULL, &uio, &m, NULL,
    419      1.62    dyoung 			    &flags);
    420      1.62    dyoung 			/* TBD Back off if ECONNREFUSED (indicates
    421      1.62    dyoung 			 * ICMP Port Unreachable)?
    422      1.62    dyoung 			 */
    423      1.62    dyoung 			if (rc == EWOULDBLOCK) {
    424      1.62    dyoung 				GRE_DPRINTF(sc, "%s: so_receive EWOULDBLOCK\n",
    425      1.62    dyoung 				    __func__);
    426      1.62    dyoung 				break;
    427      1.62    dyoung 			} else if (rc != 0 || m == NULL) {
                            				/*
                            				 * NOTE(review): any other error is
                            				 * retried immediately, so an error that
                            				 * does not clear would keep this loop
                            				 * spinning at splnet; confirm.  This
                            				 * message passes if_xname where the
                            				 * others pass __func__.
                            				 */
    428      1.62    dyoung 				GRE_DPRINTF(sc, "%s: rc %d m %p\n",
    429      1.62    dyoung 				    ifp->if_xname, rc, (void *)m);
    430      1.62    dyoung 				continue;
    431      1.62    dyoung 			} else
    432      1.62    dyoung 				GRE_DPRINTF(sc, "%s: so_receive ok\n",
    433      1.62    dyoung 				    __func__);
                            			/* Make the fixed GRE header contiguous before reading it. */
    434      1.62    dyoung 			if (m->m_len < sizeof(*gh) &&
    435      1.62    dyoung 			    (m = m_pullup(m, sizeof(*gh))) == NULL) {
    436      1.62    dyoung 				GRE_DPRINTF(sc, "%s: m_pullup failed\n",
    437      1.62    dyoung 				    __func__);
    438      1.62    dyoung 				continue;
    439      1.62    dyoung 			}
    440      1.62    dyoung 			gh = mtod(m, const struct gre_h *);
    441      1.62    dyoung 
                            			/*
                            			 * hlen is 0 because the packet starts at the GRE
                            			 * header.  gre_input3() returns 0 only when it
                            			 * did not consume the mbuf, so it is freed here.
                            			 */
    442  1.88.2.3        ad 			if (gre_input3(sc, m, 0, gh) == 0) {
    443      1.62    dyoung 				GRE_DPRINTF(sc, "%s: dropping unsupported\n",
    444      1.62    dyoung 				    __func__);
    445      1.62    dyoung 				m_freem(m);
    446      1.62    dyoung 			}
    447      1.62    dyoung 		}
                            		/* Transmit: push everything queued on sc_snd out through the socket. */
    448      1.62    dyoung 		for (;;) {
    449      1.62    dyoung 			IF_DEQUEUE(&sc->sc_snd, m);
    450      1.62    dyoung 			if (m == NULL)
    451      1.62    dyoung 				break;
    452      1.62    dyoung 			GRE_DPRINTF(sc, "%s: dequeue\n", __func__);
    453      1.62    dyoung 			if ((so->so_state & SS_ISCONNECTED) == 0) {
    454      1.62    dyoung 				GRE_DPRINTF(sc, "%s: not connected\n",
    455      1.62    dyoung 				    __func__);
    456      1.62    dyoung 				m_freem(m);
    457      1.62    dyoung 				continue;
    458      1.62    dyoung 			}
                            			/* m is not freed here on error; presumably so_send consumes it. Confirm. */
    459      1.62    dyoung 			rc = (*so->so_send)(so, NULL, NULL, m, NULL, 0, l);
    460      1.62    dyoung 			/* XXX handle ENOBUFS? */
    461      1.62    dyoung 			if (rc != 0)
    462      1.62    dyoung 				GRE_DPRINTF(sc, "%s: so_send failed\n",
    463      1.62    dyoung 				    __func__);
    464      1.62    dyoung 		}
    465      1.62    dyoung 		/* Give the software interrupt queues a chance to
    466      1.62    dyoung 		 * run, or else when I send a ping from gre0 to gre1 on
    467      1.62    dyoung 		 * the same host, gre0 will not wake for the reply.
    468      1.62    dyoung 		 */
    469      1.62    dyoung 		splx(s);
    470      1.62    dyoung 		s = splnet();
    471      1.62    dyoung 	}
                            	/* Normal exit: give back a borrowed socket, or destroy our own. */
    472      1.62    dyoung 	if (sp.sp_fp != NULL) {
    473      1.62    dyoung 		GRE_DPRINTF(sc, "%s: removing upcall\n", __func__);
    474      1.62    dyoung 		gre_upcall_remove(so);
    475      1.62    dyoung 		FILE_UNUSE(sp.sp_fp, NULL);
    476      1.62    dyoung 		sp.sp_fp = NULL;
    477      1.66    dyoung 	} else if (so != NULL)
    478      1.62    dyoung 		gre_sodestroy(&so);
    479      1.62    dyoung out:
    480      1.62    dyoung 	GRE_DPRINTF(sc, "%s: stopping\n", __func__);
    481      1.75    dyoung 	if (sc->sc_proto == IPPROTO_UDP)
    482      1.62    dyoung 		ifp->if_flags &= ~IFF_RUNNING;
                            	/* Discard whatever is still queued for transmission. */
    483      1.64    dyoung 	while (!IF_IS_EMPTY(&sc->sc_snd)) {
    484      1.64    dyoung 		IF_DEQUEUE(&sc->sc_snd, m);
    485      1.64    dyoung 		m_freem(m);
    486      1.64    dyoung 	}
    487      1.62    dyoung 	gre_stop(&sc->sc_thread);
    488      1.62    dyoung 	/* must not touch sc after this! */
                            	/*
                            	 * NOTE(review): with GRE_DEBUG defined, the GRE_DPRINTF below
                            	 * reads sc->sc_if.if_flags, which contradicts the comment
                            	 * above; gre_clone_destroy() frees sc after gre_join().
                            	 */
    489      1.62    dyoung 	GRE_DPRINTF(sc, "%s: restore ipl\n", __func__);
    490      1.62    dyoung 	splx(s);
    491      1.62    dyoung }
    492      1.62    dyoung 
    /*
     * Thread entry point: `arg' is the gre softc.  Runs gre_thread1() on
     * behalf of curlwp, then exits the kernel thread with status 0.
     */
    493      1.62    dyoung static void
    494      1.62    dyoung gre_thread(void *arg)
    495      1.62    dyoung {
    496      1.62    dyoung 	struct gre_softc *sc = (struct gre_softc *)arg;
    497      1.62    dyoung 
    498      1.62    dyoung 	gre_thread1(sc, curlwp);
    499      1.62    dyoung 	/* must not touch sc after this! */
    500      1.62    dyoung 	kthread_exit(0);
    501      1.62    dyoung }
    502      1.62    dyoung 
    /*
     * Decapsulate one received GRE packet and queue the payload for the
     * matching protocol input routine.
     *
     * sc   - softc of the receiving gre interface (counters, bpf, rcvif).
     * m    - the packet; m_pkthdr.len must be valid.
     * hlen - number of bytes in front of the GRE header (gre_thread1()
     *        passes 0); the GRE header length is added to it here.
     * gh   - pointer to the GRE header.
     *
     * Return value and mbuf ownership:
     *   1      - the packet was handled: enqueued on the protocol queue,
     *            or dropped and freed because that queue was full.
     *   0      - not supported (routing present, or unhandled ethertype);
     *            the mbuf is NOT freed and remains the caller's.
     *   EINVAL - the computed header length exceeds the packet length;
     *            the mbuf has been freed.
     *
     * if_ipackets/if_ibytes are updated before any validation, so rejected
     * packets are counted as well.
     */
    503      1.62    dyoung int
    504  1.88.2.3        ad gre_input3(struct gre_softc *sc, struct mbuf *m, int hlen,
    505      1.62    dyoung     const struct gre_h *gh)
    506      1.62    dyoung {
    507      1.62    dyoung 	u_int16_t flags;
    508      1.62    dyoung #if NBPFILTER > 0
    509      1.62    dyoung 	u_int32_t af = AF_INET;		/* af passed to BPF tap */
    510      1.62    dyoung #endif
    511      1.62    dyoung 	int s, isr;
    512      1.62    dyoung 	struct ifqueue *ifq;
    513      1.62    dyoung 
    514      1.62    dyoung 	sc->sc_if.if_ipackets++;
    515      1.62    dyoung 	sc->sc_if.if_ibytes += m->m_pkthdr.len;
    516      1.62    dyoung 
    517  1.88.2.3        ad 	hlen += sizeof(struct gre_h);
    518      1.62    dyoung 
    519  1.88.2.3        ad 	/* process GRE flags as packet can be of variable len */
    520  1.88.2.3        ad 	flags = ntohs(gh->flags);
    521      1.62    dyoung 
    522  1.88.2.3        ad 	/* Checksum & Offset are present */
    523  1.88.2.3        ad 	if ((flags & GRE_CP) | (flags & GRE_RP))
    524  1.88.2.3        ad 		hlen += 4;
    525  1.88.2.3        ad 	/* We don't support routing fields (variable length) */
    526  1.88.2.3        ad 	if (flags & GRE_RP) {
    527  1.88.2.3        ad 		sc->sc_if.if_ierrors++;
    528  1.88.2.3        ad 		return 0;
    529  1.88.2.3        ad 	}
                            	/* Each of these optional fields adds 4 bytes to the header. */
    530  1.88.2.3        ad 	if (flags & GRE_KP)
    531  1.88.2.3        ad 		hlen += 4;
    532  1.88.2.3        ad 	if (flags & GRE_SP)
    533  1.88.2.3        ad 		hlen += 4;
    534  1.88.2.3        ad 
                            	/*
                            	 * Pick the input queue and netisr from the payload ethertype.
                            	 * NOTE(review): the ETHERTYPE_IP comment below says no
                            	 * schednetisr() is needed, but one is always issued at the end
                            	 * of this function; the comment looks stale.
                            	 */
    535  1.88.2.3        ad 	switch (ntohs(gh->ptype)) { /* ethertypes */
    536  1.88.2.3        ad 	case ETHERTYPE_IP: /* shouldn't need a schednetisr(), as */
    537  1.88.2.3        ad 		ifq = &ipintrq;          /* we are in ip_input */
    538  1.88.2.3        ad 		isr = NETISR_IP;
    539  1.88.2.3        ad 		break;
    540      1.62    dyoung #ifdef NETATALK
    541  1.88.2.3        ad 	case ETHERTYPE_ATALK:
    542  1.88.2.3        ad 		ifq = &atintrq1;
    543  1.88.2.3        ad 		isr = NETISR_ATALK;
    544      1.62    dyoung #if NBPFILTER > 0
    545  1.88.2.3        ad 		af = AF_APPLETALK;
    546      1.62    dyoung #endif
    547  1.88.2.3        ad 		break;
    548      1.62    dyoung #endif
    549      1.62    dyoung #ifdef INET6
    550  1.88.2.3        ad 	case ETHERTYPE_IPV6:
    551  1.88.2.3        ad 		GRE_DPRINTF(sc, "%s: IPv6 packet\n", __func__);
    552  1.88.2.3        ad 		ifq = &ip6intrq;
    553  1.88.2.3        ad 		isr = NETISR_IPV6;
    554      1.62    dyoung #if NBPFILTER > 0
    555  1.88.2.3        ad 		af = AF_INET6;
    556      1.62    dyoung #endif
    557      1.62    dyoung 		break;
    558  1.88.2.3        ad #endif
    559  1.88.2.3        ad 	default:	   /* others not yet supported */
    560  1.88.2.3        ad 		GRE_DPRINTF(sc, "%s: unhandled ethertype 0x%04x\n", __func__,
    561  1.88.2.3        ad 		    ntohs(gh->ptype));
    562  1.88.2.3        ad 		sc->sc_if.if_noproto++;
    563      1.87    dyoung 		return 0;
    564      1.62    dyoung 	}
    565      1.62    dyoung 
                            	/* Header claims more bytes than the packet holds: free it and report EINVAL. */
    566      1.62    dyoung 	if (hlen > m->m_pkthdr.len) {
    567      1.62    dyoung 		m_freem(m);
    568      1.62    dyoung 		sc->sc_if.if_ierrors++;
    569      1.87    dyoung 		return EINVAL;
    570      1.62    dyoung 	}
                            	/* Strip everything up to the end of the GRE header, leaving the payload. */
    571      1.62    dyoung 	m_adj(m, hlen);
    572      1.62    dyoung 
    573      1.62    dyoung #if NBPFILTER > 0
    574      1.62    dyoung 	if (sc->sc_if.if_bpf != NULL)
    575      1.62    dyoung 		bpf_mtap_af(sc->sc_if.if_bpf, af, m);
    576      1.62    dyoung #endif /*NBPFILTER > 0*/
    577      1.62    dyoung 
    578      1.62    dyoung 	m->m_pkthdr.rcvif = &sc->sc_if;
    579      1.62    dyoung 
    580      1.62    dyoung 	s = splnet();		/* possible */
    581      1.62    dyoung 	if (IF_QFULL(ifq)) {
    582      1.62    dyoung 		IF_DROP(ifq);
    583      1.62    dyoung 		m_freem(m);
    584      1.62    dyoung 	} else {
    585      1.62    dyoung 		IF_ENQUEUE(ifq, m);
    586      1.62    dyoung 	}
    587      1.62    dyoung 	/* we need schednetisr since the address family may change */
    588      1.62    dyoung 	schednetisr(isr);
    589      1.62    dyoung 	splx(s);
    590      1.62    dyoung 
    591      1.87    dyoung 	return 1;	/* packet is done, no further processing needed */
    592      1.62    dyoung }
    593      1.62    dyoung 
    594      1.20    itojun /*
    595       1.1       hwr  * The output routine. Takes a packet and encapsulates it in the protocol
    596      1.75    dyoung  * given by sc->sc_proto. See also RFC 1701 and RFC 2004.
    597       1.1       hwr  */
    598      1.59   thorpej static int
    599      1.84    dyoung gre_output(struct ifnet *ifp, struct mbuf *m, const struct sockaddr *dst,
    600      1.74  christos 	   struct rtentry *rt)
    601       1.1       hwr {
    602  1.88.2.3        ad 	int error = 0, hlen, msiz;
    603      1.10   thorpej 	struct gre_softc *sc = ifp->if_softc;
    604      1.62    dyoung 	struct greip *gi;
    605      1.62    dyoung 	struct gre_h *gh;
    606      1.62    dyoung 	struct ip *eip, *ip;
    607      1.56        is 	u_int8_t ip_tos = 0;
    608      1.48    itojun 	u_int16_t etype = 0;
    609      1.20    itojun 	struct mobile_h mob_h;
    610      1.24    martin 
    611      1.39    itojun 	if ((ifp->if_flags & (IFF_UP | IFF_RUNNING)) == 0 ||
    612      1.37    itojun 	    sc->g_src.s_addr == INADDR_ANY || sc->g_dst.s_addr == INADDR_ANY) {
    613      1.37    itojun 		m_freem(m);
    614      1.38    itojun 		error = ENETDOWN;
    615      1.38    itojun 		goto end;
    616      1.37    itojun 	}
    617       1.1       hwr 
    618      1.62    dyoung 	gi = NULL;
    619      1.41    itojun 	ip = NULL;
    620       1.1       hwr 
    621       1.1       hwr #if NBPFILTER >0
    622      1.52  christos 	if (ifp->if_bpf)
    623      1.52  christos 		bpf_mtap_af(ifp->if_bpf, dst->sa_family, m);
    624       1.1       hwr #endif
    625       1.1       hwr 
    626      1.26    martin 	m->m_flags &= ~(M_BCAST|M_MCAST);
    627       1.1       hwr 
    628      1.75    dyoung 	switch (sc->sc_proto) {
    629      1.62    dyoung 	case IPPROTO_MOBILE:
    630  1.88.2.3        ad 		if (dst->sa_family != AF_INET) {
    631       1.3       hwr 			IF_DROP(&ifp->if_snd);
    632       1.3       hwr 			m_freem(m);
    633      1.38    itojun 			error = EINVAL;
    634      1.38    itojun 			goto end;
    635       1.3       hwr 		}
    636  1.88.2.3        ad 
    637  1.88.2.3        ad 		if (M_UNWRITABLE(m, sizeof(*ip)) &&
    638  1.88.2.3        ad 		    (m = m_pullup(m, sizeof(*ip))) == NULL) {
    639  1.88.2.3        ad 			error = ENOBUFS;
    640  1.88.2.3        ad 			goto end;
    641  1.88.2.3        ad 		}
    642  1.88.2.3        ad 		ip = mtod(m, struct ip *);
    643  1.88.2.3        ad 
    644  1.88.2.3        ad 		memset(&mob_h, 0, MOB_H_SIZ_L);
    645  1.88.2.3        ad 		mob_h.proto = (ip->ip_p) << 8;
    646  1.88.2.3        ad 		mob_h.odst = ip->ip_dst.s_addr;
    647  1.88.2.3        ad 		ip->ip_dst.s_addr = sc->g_dst.s_addr;
    648  1.88.2.3        ad 
    649  1.88.2.3        ad 		/*
    650  1.88.2.3        ad 		 * If the packet comes from our host, we only change
    651  1.88.2.3        ad 		 * the destination address in the IP header.
    652  1.88.2.3        ad 		 * Else we also need to save and change the source
    653  1.88.2.3        ad 		 */
    654  1.88.2.3        ad 		if (in_hosteq(ip->ip_src, sc->g_src)) {
    655  1.88.2.3        ad 			msiz = MOB_H_SIZ_S;
    656  1.88.2.3        ad 		} else {
    657  1.88.2.3        ad 			mob_h.proto |= MOB_H_SBIT;
    658  1.88.2.3        ad 			mob_h.osrc = ip->ip_src.s_addr;
    659  1.88.2.3        ad 			ip->ip_src.s_addr = sc->g_src.s_addr;
    660  1.88.2.3        ad 			msiz = MOB_H_SIZ_L;
    661  1.88.2.3        ad 		}
    662  1.88.2.3        ad 		HTONS(mob_h.proto);
    663  1.88.2.3        ad 		mob_h.hcrc = gre_in_cksum((u_int16_t *)&mob_h, msiz);
    664  1.88.2.3        ad 
    665  1.88.2.3        ad 		M_PREPEND(m, msiz, M_DONTWAIT);
    666  1.88.2.3        ad 		if (m == NULL) {
    667  1.88.2.3        ad 			error = ENOBUFS;
    668  1.88.2.3        ad 			goto end;
    669  1.88.2.3        ad 		}
    670  1.88.2.3        ad 		/* XXX Assuming that ip does not dangle after
    671  1.88.2.3        ad 		 * M_PREPEND.  In practice, that's true, but
    672  1.88.2.3        ad 		 * that's not in M_PREPEND's contract.
    673  1.88.2.3        ad 		 */
    674  1.88.2.3        ad 		memmove(mtod(m, void *), ip, sizeof(*ip));
    675  1.88.2.3        ad 		ip = mtod(m, struct ip *);
    676  1.88.2.3        ad 		memcpy(ip + 1, &mob_h, (size_t)msiz);
    677  1.88.2.3        ad 		ip->ip_len = htons(ntohs(ip->ip_len) + msiz);
    678      1.62    dyoung 		break;
    679      1.62    dyoung 	case IPPROTO_UDP:
    680      1.62    dyoung 	case IPPROTO_GRE:
    681      1.62    dyoung 		GRE_DPRINTF(sc, "%s: dst->sa_family=%d\n", __func__,
    682      1.62    dyoung 		    dst->sa_family);
    683      1.20    itojun 		switch (dst->sa_family) {
    684       1.1       hwr 		case AF_INET:
    685      1.41    itojun 			ip = mtod(m, struct ip *);
    686      1.56        is 			ip_tos = ip->ip_tos;
    687       1.8  explorer 			etype = ETHERTYPE_IP;
    688       1.1       hwr 			break;
    689       1.1       hwr #ifdef NETATALK
    690       1.1       hwr 		case AF_APPLETALK:
    691       1.8  explorer 			etype = ETHERTYPE_ATALK;
    692       1.1       hwr 			break;
    693       1.1       hwr #endif
    694      1.56        is #ifdef INET6
    695      1.56        is 		case AF_INET6:
    696      1.56        is 			etype = ETHERTYPE_IPV6;
    697      1.56        is 			break;
    698      1.56        is #endif
    699       1.1       hwr 		default:
    700       1.1       hwr 			IF_DROP(&ifp->if_snd);
    701       1.1       hwr 			m_freem(m);
    702      1.38    itojun 			error = EAFNOSUPPORT;
    703      1.38    itojun 			goto end;
    704       1.1       hwr 		}
    705      1.62    dyoung 		break;
    706      1.62    dyoung 	default:
    707       1.1       hwr 		IF_DROP(&ifp->if_snd);
    708       1.1       hwr 		m_freem(m);
    709      1.38    itojun 		error = EINVAL;
    710      1.38    itojun 		goto end;
    711       1.1       hwr 	}
    712       1.1       hwr 
    713      1.75    dyoung 	switch (sc->sc_proto) {
    714      1.62    dyoung 	case IPPROTO_GRE:
    715      1.62    dyoung 		hlen = sizeof(struct greip);
    716      1.62    dyoung 		break;
    717      1.62    dyoung 	case IPPROTO_UDP:
    718      1.62    dyoung 		hlen = sizeof(struct gre_h);
    719      1.62    dyoung 		break;
    720      1.62    dyoung 	default:
    721      1.62    dyoung 		hlen = 0;
    722      1.62    dyoung 		break;
    723      1.62    dyoung 	}
    724      1.62    dyoung 
    725      1.62    dyoung 	M_PREPEND(m, hlen, M_DONTWAIT);
    726      1.62    dyoung 
    727      1.62    dyoung 	if (m == NULL) {
    728       1.1       hwr 		IF_DROP(&ifp->if_snd);
    729      1.38    itojun 		error = ENOBUFS;
    730      1.38    itojun 		goto end;
    731       1.1       hwr 	}
    732       1.1       hwr 
    733      1.75    dyoung 	switch (sc->sc_proto) {
    734      1.62    dyoung 	case IPPROTO_UDP:
    735      1.62    dyoung 		gh = mtod(m, struct gre_h *);
    736      1.62    dyoung 		memset(gh, 0, sizeof(*gh));
    737      1.62    dyoung 		gh->ptype = htons(etype);
    738      1.62    dyoung 		/* XXX Need to handle IP ToS.  Look at how I handle IP TTL. */
    739      1.62    dyoung 		break;
    740      1.62    dyoung 	case IPPROTO_GRE:
    741      1.62    dyoung 		gi = mtod(m, struct greip *);
    742      1.62    dyoung 		gh = &gi->gi_g;
    743      1.62    dyoung 		eip = &gi->gi_i;
    744       1.1       hwr 		/* we don't have any GRE flags for now */
    745      1.62    dyoung 		memset(gh, 0, sizeof(*gh));
    746      1.62    dyoung 		gh->ptype = htons(etype);
    747      1.62    dyoung 		eip->ip_src = sc->g_src;
    748      1.62    dyoung 		eip->ip_dst = sc->g_dst;
    749      1.62    dyoung 		eip->ip_hl = (sizeof(struct ip)) >> 2;
    750      1.62    dyoung 		eip->ip_ttl = ip_gre_ttl;
    751      1.62    dyoung 		eip->ip_tos = ip_tos;
    752      1.62    dyoung 		eip->ip_len = htons(m->m_pkthdr.len);
    753      1.75    dyoung 		eip->ip_p = sc->sc_proto;
    754      1.62    dyoung 		break;
    755      1.62    dyoung 	case IPPROTO_MOBILE:
    756      1.62    dyoung 		eip = mtod(m, struct ip *);
    757      1.75    dyoung 		eip->ip_p = sc->sc_proto;
    758      1.62    dyoung 		break;
    759      1.62    dyoung 	default:
    760      1.62    dyoung 		error = EPROTONOSUPPORT;
    761      1.62    dyoung 		m_freem(m);
    762      1.62    dyoung 		goto end;
    763       1.3       hwr 	}
    764       1.1       hwr 
    765       1.1       hwr 	ifp->if_opackets++;
    766       1.8  explorer 	ifp->if_obytes += m->m_pkthdr.len;
    767      1.62    dyoung 
    768       1.1       hwr 	/* send it off */
    769      1.75    dyoung 	if (sc->sc_proto == IPPROTO_UDP) {
    770      1.62    dyoung 		if (IF_QFULL(&sc->sc_snd)) {
    771      1.62    dyoung 			IF_DROP(&sc->sc_snd);
    772      1.62    dyoung 			error = ENOBUFS;
    773      1.62    dyoung 			m_freem(m);
    774      1.62    dyoung 		} else {
    775      1.62    dyoung 			IF_ENQUEUE(&sc->sc_snd, m);
    776      1.62    dyoung 			gre_wakeup(sc);
    777      1.62    dyoung 			error = 0;
    778      1.62    dyoung 		}
    779      1.81     joerg 		goto end;
    780      1.81     joerg 	}
    781      1.86    dyoung 	if (sc->route.ro_rt == NULL)
    782      1.86    dyoung 		rtcache_init(&sc->route);
    783      1.86    dyoung 	else
    784      1.86    dyoung 		rtcache_check(&sc->route);
    785      1.81     joerg 	if (sc->route.ro_rt == NULL)
    786      1.81     joerg 		goto end;
    787      1.83    dyoung 	if (sc->route.ro_rt->rt_ifp->if_softc == sc)
    788      1.81     joerg 		rtcache_free(&sc->route);
    789      1.81     joerg 	else
    790      1.62    dyoung 		error = ip_output(m, NULL, &sc->route, 0,
    791      1.62    dyoung 		    (struct ip_moptions *)NULL, (struct socket *)NULL);
    792      1.38    itojun   end:
    793       1.8  explorer 	if (error)
    794       1.1       hwr 		ifp->if_oerrors++;
    795      1.87    dyoung 	return error;
    796       1.1       hwr }
    797       1.1       hwr 
    798      1.71    dyoung /* gre_kick must be synchronized with network interrupts in order
    799      1.71    dyoung  * to synchronize access to gre_softc members, so call it with
    800      1.71    dyoung  * interrupt priority level set to IPL_NET or greater.
    801      1.71    dyoung  */
    802      1.62    dyoung static int
    803      1.62    dyoung gre_kick(struct gre_softc *sc)
    804      1.62    dyoung {
    805      1.62    dyoung 	int rc;
    806      1.62    dyoung 	struct ifnet *ifp = &sc->sc_if;
    807      1.62    dyoung 
    808      1.75    dyoung 	if (sc->sc_proto == IPPROTO_UDP && (ifp->if_flags & IFF_UP) == IFF_UP &&
    809      1.62    dyoung 	    !sc->sc_thread) {
    810      1.62    dyoung 		sc->sc_thread = 1;
    811  1.88.2.2        ad 		rc = kthread_create(PRI_NONE, false, gre_thread, (void *)sc,
    812  1.88.2.1        ad 		    NULL, ifp->if_xname);
    813      1.62    dyoung 		if (rc != 0)
    814      1.62    dyoung 			gre_stop(&sc->sc_thread);
    815      1.62    dyoung 		return rc;
    816      1.62    dyoung 	} else {
    817      1.62    dyoung 		gre_wakeup(sc);
    818      1.62    dyoung 		return 0;
    819      1.62    dyoung 	}
    820      1.62    dyoung }
    821      1.62    dyoung 
    822      1.62    dyoung static int
    823      1.62    dyoung gre_getname(struct socket *so, int req, struct mbuf *nam, struct lwp *l)
    824      1.62    dyoung {
    825      1.62    dyoung 	int s, error;
    826      1.62    dyoung 
    827      1.62    dyoung 	s = splsoftnet();
    828  1.88.2.3        ad 	error = (*so->so_proto->pr_usrreq)(so, req, NULL, nam, NULL, l);
    829      1.62    dyoung 	splx(s);
    830      1.62    dyoung 	return error;
    831      1.62    dyoung }
    832      1.62    dyoung 
    833      1.62    dyoung static int
    834      1.62    dyoung gre_getsockname(struct socket *so, struct mbuf *nam, struct lwp *l)
    835      1.62    dyoung {
    836      1.62    dyoung 	return gre_getname(so, PRU_SOCKADDR, nam, l);
    837      1.62    dyoung }
    838      1.62    dyoung 
    839      1.62    dyoung static int
    840      1.62    dyoung gre_getpeername(struct socket *so, struct mbuf *nam, struct lwp *l)
    841      1.62    dyoung {
    842      1.62    dyoung 	return gre_getname(so, PRU_PEERADDR, nam, l);
    843      1.62    dyoung }
    844      1.62    dyoung 
    845      1.62    dyoung static int
    846      1.62    dyoung gre_getnames(struct socket *so, struct lwp *l, struct sockaddr_in *src,
    847      1.62    dyoung     struct sockaddr_in *dst)
    848      1.62    dyoung {
    849      1.62    dyoung 	struct mbuf *m;
    850      1.62    dyoung 	struct sockaddr_in *sin;
    851      1.62    dyoung 	int rc;
    852      1.62    dyoung 
    853      1.62    dyoung 	if ((m = gre_getsockmbuf(so)) == NULL)
    854      1.62    dyoung 		return ENOBUFS;
    855      1.62    dyoung 
    856      1.62    dyoung 	sin = mtod(m, struct sockaddr_in *);
    857      1.62    dyoung 
    858      1.62    dyoung 	if ((rc = gre_getsockname(so, m, l)) != 0)
    859      1.62    dyoung 		goto out;
    860      1.62    dyoung 	if (sin->sin_family != AF_INET) {
    861      1.62    dyoung 		rc = EAFNOSUPPORT;
    862      1.62    dyoung 		goto out;
    863      1.62    dyoung 	}
    864      1.62    dyoung 	*src = *sin;
    865      1.62    dyoung 
    866      1.62    dyoung 	if ((rc = gre_getpeername(so, m, l)) != 0)
    867      1.62    dyoung 		goto out;
    868      1.62    dyoung 	if (sin->sin_family != AF_INET) {
    869      1.62    dyoung 		rc = EAFNOSUPPORT;
    870      1.62    dyoung 		goto out;
    871      1.62    dyoung 	}
    872      1.62    dyoung 	*dst = *sin;
    873      1.62    dyoung 
    874      1.62    dyoung out:
    875      1.62    dyoung 	m_freem(m);
    876      1.62    dyoung 	return rc;
    877      1.62    dyoung }
    878      1.62    dyoung 
    879      1.59   thorpej static int
    880      1.88  christos gre_ioctl(struct ifnet *ifp, u_long cmd, void *data)
    881       1.1       hwr {
    882      1.62    dyoung 	u_char oproto;
    883      1.62    dyoung 	struct file *fp, *ofp;
    884      1.62    dyoung 	struct socket *so;
    885      1.62    dyoung 	struct sockaddr_in dst, src;
    886      1.62    dyoung 	struct proc *p = curproc;	/* XXX */
    887      1.61        ad 	struct lwp *l = curlwp;	/* XXX */
    888       1.8  explorer 	struct ifreq *ifr = (struct ifreq *)data;
    889      1.28    itojun 	struct if_laddrreq *lifr = (struct if_laddrreq *)data;
    890       1.8  explorer 	struct gre_softc *sc = ifp->if_softc;
    891       1.1       hwr 	int s;
    892       1.1       hwr 	struct sockaddr_in si;
    893       1.8  explorer 	struct sockaddr *sa = NULL;
    894      1.80  christos 	int error = 0;
    895       1.1       hwr 
    896      1.61        ad 	switch (cmd) {
    897      1.61        ad 	case SIOCSIFFLAGS:
    898      1.61        ad 	case SIOCSIFMTU:
    899      1.61        ad 	case GRESPROTO:
    900      1.61        ad 	case GRESADDRD:
    901      1.61        ad 	case GRESADDRS:
    902      1.62    dyoung 	case GRESSOCK:
    903      1.62    dyoung 	case GREDSOCK:
    904      1.61        ad 	case SIOCSLIFPHYADDR:
    905      1.61        ad 	case SIOCDIFPHYADDR:
    906      1.70      elad 		if (kauth_authorize_network(l->l_cred, KAUTH_NETWORK_INTERFACE,
    907      1.70      elad 		    KAUTH_REQ_NETWORK_INTERFACE_SETPRIV, ifp, (void *)cmd,
    908      1.70      elad 		    NULL) != 0)
    909      1.87    dyoung 			return EPERM;
    910      1.61        ad 		break;
    911      1.61        ad 	default:
    912      1.61        ad 		break;
    913      1.61        ad 	}
    914       1.1       hwr 
    915      1.18   thorpej 	s = splnet();
    916      1.20    itojun 	switch (cmd) {
    917      1.20    itojun 	case SIOCSIFADDR:
    918      1.36    itojun 		ifp->if_flags |= IFF_UP;
    919      1.78    dyoung 		if ((error = gre_kick(sc)) != 0)
    920      1.78    dyoung 			ifp->if_flags &= ~IFF_UP;
    921      1.36    itojun 		break;
    922      1.55     perry 	case SIOCSIFDSTADDR:
    923       1.1       hwr 		break;
    924       1.1       hwr 	case SIOCSIFFLAGS:
    925      1.75    dyoung 		oproto = sc->sc_proto;
    926      1.62    dyoung 		switch (ifr->ifr_flags & (IFF_LINK0|IFF_LINK2)) {
    927      1.62    dyoung 		case IFF_LINK0|IFF_LINK2:
    928      1.75    dyoung 			sc->sc_proto = IPPROTO_UDP;
    929      1.62    dyoung 			if (oproto != IPPROTO_UDP)
    930      1.62    dyoung 				ifp->if_flags &= ~IFF_RUNNING;
    931      1.62    dyoung 			error = gre_kick(sc);
    932      1.62    dyoung 			break;
    933      1.62    dyoung 		case IFF_LINK0:
    934      1.75    dyoung 			sc->sc_proto = IPPROTO_GRE;
    935      1.62    dyoung 			gre_wakeup(sc);
    936      1.62    dyoung 			goto recompute;
    937      1.62    dyoung 		case 0:
    938      1.75    dyoung 			sc->sc_proto = IPPROTO_MOBILE;
    939      1.62    dyoung 			gre_wakeup(sc);
    940      1.62    dyoung 			goto recompute;
    941      1.62    dyoung 		}
    942       1.1       hwr 		break;
    943      1.20    itojun 	case SIOCSIFMTU:
    944      1.27    martin 		if (ifr->ifr_mtu < 576) {
    945       1.1       hwr 			error = EINVAL;
    946       1.1       hwr 			break;
    947       1.1       hwr 		}
    948       1.1       hwr 		ifp->if_mtu = ifr->ifr_mtu;
    949       1.1       hwr 		break;
    950       1.1       hwr 	case SIOCGIFMTU:
    951       1.1       hwr 		ifr->ifr_mtu = sc->sc_if.if_mtu;
    952       1.1       hwr 		break;
    953       1.1       hwr 	case SIOCADDMULTI:
    954       1.1       hwr 	case SIOCDELMULTI:
    955       1.8  explorer 		if (ifr == 0) {
    956       1.1       hwr 			error = EAFNOSUPPORT;
    957       1.1       hwr 			break;
    958       1.1       hwr 		}
    959       1.8  explorer 		switch (ifr->ifr_addr.sa_family) {
    960       1.1       hwr #ifdef INET
    961       1.1       hwr 		case AF_INET:
    962       1.1       hwr 			break;
    963       1.1       hwr #endif
    964      1.56        is #ifdef INET6
    965      1.56        is 		case AF_INET6:
    966      1.56        is 			break;
    967      1.56        is #endif
    968       1.1       hwr 		default:
    969       1.1       hwr 			error = EAFNOSUPPORT;
    970       1.1       hwr 			break;
    971       1.1       hwr 		}
    972       1.1       hwr 		break;
    973       1.1       hwr 	case GRESPROTO:
    974      1.75    dyoung 		oproto = sc->sc_proto;
    975      1.75    dyoung 		sc->sc_proto = ifr->ifr_flags;
    976      1.75    dyoung 		switch (sc->sc_proto) {
    977      1.62    dyoung 		case IPPROTO_UDP:
    978      1.62    dyoung 			ifp->if_flags |= IFF_LINK0|IFF_LINK2;
    979      1.62    dyoung 			if (oproto != IPPROTO_UDP)
    980      1.62    dyoung 				ifp->if_flags &= ~IFF_RUNNING;
    981      1.62    dyoung 			error = gre_kick(sc);
    982      1.62    dyoung 			break;
    983      1.40    itojun 		case IPPROTO_GRE:
    984       1.3       hwr 			ifp->if_flags |= IFF_LINK0;
    985      1.62    dyoung 			ifp->if_flags &= ~IFF_LINK2;
    986      1.62    dyoung 			goto recompute;
    987      1.40    itojun 		case IPPROTO_MOBILE:
    988      1.62    dyoung 			ifp->if_flags &= ~(IFF_LINK0|IFF_LINK2);
    989      1.62    dyoung 			goto recompute;
    990       1.1       hwr 		default:
    991      1.40    itojun 			error = EPROTONOSUPPORT;
    992      1.35    itojun 			break;
    993       1.1       hwr 		}
    994       1.1       hwr 		break;
    995       1.1       hwr 	case GREGPROTO:
    996      1.75    dyoung 		ifr->ifr_flags = sc->sc_proto;
    997       1.1       hwr 		break;
    998       1.1       hwr 	case GRESADDRS:
    999       1.1       hwr 	case GRESADDRD:
   1000       1.1       hwr 		/*
   1001      1.20    itojun 		 * set tunnel endpoints, compute a less specific route
   1002      1.20    itojun 		 * to the remote end and mark if as up
   1003      1.20    itojun 		 */
   1004       1.1       hwr 		sa = &ifr->ifr_addr;
   1005      1.62    dyoung 		if (cmd == GRESADDRS) {
   1006       1.1       hwr 			sc->g_src = (satosin(sa))->sin_addr;
   1007      1.62    dyoung 			sc->g_srcport = satosin(sa)->sin_port;
   1008      1.62    dyoung 		}
   1009      1.62    dyoung 		if (cmd == GRESADDRD) {
   1010      1.75    dyoung 			if (sc->sc_proto == IPPROTO_UDP &&
   1011      1.62    dyoung 			    satosin(sa)->sin_port == 0) {
   1012      1.62    dyoung 				error = EINVAL;
   1013      1.62    dyoung 				break;
   1014      1.62    dyoung 			}
   1015       1.1       hwr 			sc->g_dst = (satosin(sa))->sin_addr;
   1016      1.62    dyoung 			sc->g_dstport = satosin(sa)->sin_port;
   1017      1.62    dyoung 		}
   1018      1.30    itojun 	recompute:
   1019      1.75    dyoung 		if (sc->sc_proto == IPPROTO_UDP ||
   1020      1.62    dyoung 		    (sc->g_src.s_addr != INADDR_ANY &&
   1021      1.62    dyoung 		     sc->g_dst.s_addr != INADDR_ANY)) {
   1022      1.62    dyoung 			if (sc->sc_fp != NULL) {
   1023      1.62    dyoung 				closef(sc->sc_fp, l);
   1024      1.62    dyoung 				sc->sc_fp = NULL;
   1025      1.62    dyoung 			}
   1026      1.81     joerg 			rtcache_free(&sc->route);
   1027      1.75    dyoung 			if (sc->sc_proto == IPPROTO_UDP)
   1028      1.62    dyoung 				error = gre_kick(sc);
   1029      1.62    dyoung 			else if (gre_compute_route(sc) == 0)
   1030      1.39    itojun 				ifp->if_flags |= IFF_RUNNING;
   1031      1.39    itojun 			else
   1032      1.39    itojun 				ifp->if_flags &= ~IFF_RUNNING;
   1033       1.1       hwr 		}
   1034       1.1       hwr 		break;
   1035       1.1       hwr 	case GREGADDRS:
   1036      1.33    itojun 		memset(&si, 0, sizeof(si));
   1037      1.28    itojun 		si.sin_family = AF_INET;
   1038      1.28    itojun 		si.sin_len = sizeof(struct sockaddr_in);
   1039       1.1       hwr 		si.sin_addr.s_addr = sc->g_src.s_addr;
   1040       1.8  explorer 		sa = sintosa(&si);
   1041       1.1       hwr 		ifr->ifr_addr = *sa;
   1042       1.1       hwr 		break;
   1043       1.1       hwr 	case GREGADDRD:
   1044      1.33    itojun 		memset(&si, 0, sizeof(si));
   1045      1.28    itojun 		si.sin_family = AF_INET;
   1046      1.28    itojun 		si.sin_len = sizeof(struct sockaddr_in);
   1047       1.1       hwr 		si.sin_addr.s_addr = sc->g_dst.s_addr;
   1048       1.8  explorer 		sa = sintosa(&si);
   1049       1.1       hwr 		ifr->ifr_addr = *sa;
   1050      1.28    itojun 		break;
   1051      1.62    dyoung 	case GREDSOCK:
   1052      1.75    dyoung 		if (sc->sc_proto != IPPROTO_UDP)
   1053      1.62    dyoung 			return EINVAL;
   1054      1.63    dyoung 		if (sc->sc_fp != NULL) {
   1055      1.63    dyoung 			closef(sc->sc_fp, l);
   1056      1.63    dyoung 			sc->sc_fp = NULL;
   1057      1.63    dyoung 			error = gre_kick(sc);
   1058      1.63    dyoung 		}
   1059      1.62    dyoung 		break;
   1060      1.62    dyoung 	case GRESSOCK:
   1061      1.75    dyoung 		if (sc->sc_proto != IPPROTO_UDP)
   1062      1.62    dyoung 			return EINVAL;
   1063      1.62    dyoung 		/* getsock() will FILE_USE() the descriptor for us */
   1064      1.62    dyoung 		if ((error = getsock(p->p_fd, (int)ifr->ifr_value, &fp)) != 0)
   1065      1.62    dyoung 			break;
   1066      1.62    dyoung 		so = (struct socket *)fp->f_data;
   1067      1.62    dyoung 		if (so->so_type != SOCK_DGRAM) {
   1068      1.62    dyoung 			FILE_UNUSE(fp, NULL);
   1069      1.62    dyoung 			error = EINVAL;
   1070      1.62    dyoung 			break;
   1071      1.62    dyoung 		}
   1072      1.62    dyoung 		/* check address */
   1073      1.62    dyoung 		if ((error = gre_getnames(so, curlwp, &src, &dst)) != 0) {
   1074      1.62    dyoung 			FILE_UNUSE(fp, NULL);
   1075      1.62    dyoung 			break;
   1076      1.62    dyoung 		}
   1077      1.62    dyoung 
   1078      1.62    dyoung 		fp->f_count++;
   1079      1.62    dyoung 
   1080      1.62    dyoung 		ofp = sc->sc_fp;
   1081      1.62    dyoung 		sc->sc_fp = fp;
   1082      1.62    dyoung 		if ((error = gre_kick(sc)) != 0) {
   1083      1.62    dyoung 			closef(fp, l);
   1084      1.62    dyoung 			sc->sc_fp = ofp;
   1085      1.62    dyoung 			break;
   1086      1.62    dyoung 		}
   1087      1.62    dyoung 		sc->g_src = src.sin_addr;
   1088      1.62    dyoung 		sc->g_srcport = src.sin_port;
   1089      1.62    dyoung 		sc->g_dst = dst.sin_addr;
   1090      1.62    dyoung 		sc->g_dstport = dst.sin_port;
   1091      1.62    dyoung 		if (ofp != NULL)
   1092      1.62    dyoung 			closef(ofp, l);
   1093      1.62    dyoung 		break;
   1094      1.28    itojun 	case SIOCSLIFPHYADDR:
   1095      1.28    itojun 		if (lifr->addr.ss_family != AF_INET ||
   1096      1.31    itojun 		    lifr->dstaddr.ss_family != AF_INET) {
   1097      1.31    itojun 			error = EAFNOSUPPORT;
   1098      1.31    itojun 			break;
   1099      1.31    itojun 		}
   1100      1.28    itojun 		if (lifr->addr.ss_len != sizeof(si) ||
   1101      1.31    itojun 		    lifr->dstaddr.ss_len != sizeof(si)) {
   1102      1.31    itojun 			error = EINVAL;
   1103      1.31    itojun 			break;
   1104      1.31    itojun 		}
   1105      1.62    dyoung 		sc->g_src = satosin(&lifr->addr)->sin_addr;
   1106      1.62    dyoung 		sc->g_dst = satosin(&lifr->dstaddr)->sin_addr;
   1107      1.62    dyoung 		sc->g_srcport = satosin(&lifr->addr)->sin_port;
   1108      1.62    dyoung 		sc->g_dstport = satosin(&lifr->dstaddr)->sin_port;
   1109      1.30    itojun 		goto recompute;
   1110      1.28    itojun 	case SIOCDIFPHYADDR:
   1111      1.28    itojun 		sc->g_src.s_addr = INADDR_ANY;
   1112      1.28    itojun 		sc->g_dst.s_addr = INADDR_ANY;
   1113      1.62    dyoung 		sc->g_srcport = 0;
   1114      1.62    dyoung 		sc->g_dstport = 0;
   1115      1.62    dyoung 		goto recompute;
   1116      1.28    itojun 	case SIOCGLIFPHYADDR:
   1117      1.28    itojun 		if (sc->g_src.s_addr == INADDR_ANY ||
   1118      1.28    itojun 		    sc->g_dst.s_addr == INADDR_ANY) {
   1119      1.28    itojun 			error = EADDRNOTAVAIL;
   1120      1.28    itojun 			break;
   1121      1.28    itojun 		}
   1122      1.33    itojun 		memset(&si, 0, sizeof(si));
   1123      1.28    itojun 		si.sin_family = AF_INET;
   1124      1.28    itojun 		si.sin_len = sizeof(struct sockaddr_in);
   1125      1.62    dyoung 		si.sin_addr = sc->g_src;
   1126      1.75    dyoung 		if (sc->sc_proto == IPPROTO_UDP)
   1127      1.62    dyoung 			si.sin_port = sc->g_srcport;
   1128      1.33    itojun 		memcpy(&lifr->addr, &si, sizeof(si));
   1129      1.62    dyoung 		si.sin_addr = sc->g_dst;
   1130      1.75    dyoung 		if (sc->sc_proto == IPPROTO_UDP)
   1131      1.62    dyoung 			si.sin_port = sc->g_dstport;
   1132      1.33    itojun 		memcpy(&lifr->dstaddr, &si, sizeof(si));
   1133       1.1       hwr 		break;
   1134       1.1       hwr 	default:
   1135       1.1       hwr 		error = EINVAL;
   1136      1.31    itojun 		break;
   1137       1.1       hwr 	}
   1138       1.1       hwr 	splx(s);
   1139      1.87    dyoung 	return error;
   1140       1.1       hwr }
   1141       1.1       hwr 
   1142      1.20    itojun /*
   1143      1.78    dyoung  * Compute a route to our destination.
   1144       1.1       hwr  */
   1145      1.59   thorpej static int
   1146       1.8  explorer gre_compute_route(struct gre_softc *sc)
   1147       1.1       hwr {
   1148       1.1       hwr 	struct route *ro;
   1149       1.1       hwr 
   1150       1.8  explorer 	ro = &sc->route;
   1151      1.20    itojun 
   1152       1.8  explorer 	memset(ro, 0, sizeof(struct route));
   1153      1.73    dyoung 	satosin(&ro->ro_dst)->sin_addr = sc->g_dst;
   1154       1.8  explorer 	ro->ro_dst.sa_family = AF_INET;
   1155       1.8  explorer 	ro->ro_dst.sa_len = sizeof(ro->ro_dst);
   1156       1.8  explorer 
   1157      1.81     joerg 	rtcache_init(ro);
   1158      1.81     joerg 
   1159      1.81     joerg 	if (ro->ro_rt == NULL || ro->ro_rt->rt_ifp->if_softc == sc) {
   1160  1.88.2.3        ad 		GRE_DPRINTF(sc, "%s: route to %s %s\n", sc->sc_if.if_xname,
   1161  1.88.2.3        ad 		    inet_ntoa(satocsin(rtcache_getdst(ro))->sin_addr),
   1162  1.88.2.3        ad 		    (ro->ro_rt == NULL)
   1163  1.88.2.3        ad 		        ?  "does not exist"
   1164  1.88.2.3        ad 			: "loops back to ourself");
   1165      1.81     joerg 		rtcache_free(ro);
   1166      1.81     joerg 		return EADDRNOTAVAIL;
   1167      1.25    martin 	}
   1168      1.25    martin 
   1169      1.25    martin 	return 0;
   1170       1.1       hwr }
   1171       1.1       hwr 
   1172       1.3       hwr /*
   1173      1.20    itojun  * do a checksum of a buffer - much like in_cksum, which operates on
   1174      1.20    itojun  * mbufs.
   1175       1.3       hwr  */
   1176      1.48    itojun u_int16_t
   1177      1.48    itojun gre_in_cksum(u_int16_t *p, u_int len)
   1178       1.3       hwr {
   1179      1.48    itojun 	u_int32_t sum = 0;
   1180       1.3       hwr 	int nwords = len >> 1;
   1181      1.20    itojun 
   1182       1.3       hwr 	while (nwords-- != 0)
   1183       1.3       hwr 		sum += *p++;
   1184      1.20    itojun 
   1185      1.20    itojun 	if (len & 1) {
   1186      1.20    itojun 		union {
   1187      1.20    itojun 			u_short w;
   1188      1.20    itojun 			u_char c[2];
   1189      1.20    itojun 		} u;
   1190      1.20    itojun 		u.c[0] = *(u_char *)p;
   1191      1.20    itojun 		u.c[1] = 0;
   1192      1.20    itojun 		sum += u.w;
   1193      1.20    itojun 	}
   1194      1.20    itojun 
   1195      1.20    itojun 	/* end-around-carry */
   1196      1.20    itojun 	sum = (sum >> 16) + (sum & 0xffff);
   1197      1.20    itojun 	sum += (sum >> 16);
   1198      1.87    dyoung 	return ~sum;
   1199       1.3       hwr }
   1200      1.54  christos #endif
   1201      1.54  christos 
   1202      1.59   thorpej void	greattach(int);
   1203      1.54  christos 
   1204      1.54  christos /* ARGSUSED */
   1205      1.54  christos void
   1206      1.74  christos greattach(int count)
   1207      1.54  christos {
   1208      1.54  christos #ifdef INET
   1209      1.54  christos 	LIST_INIT(&gre_softc_list);
   1210      1.54  christos 	if_clone_attach(&gre_cloner);
   1211      1.54  christos #endif
   1212      1.54  christos }
   1213