Home | History | Annotate | Line # | Download | only in net
if_gre.c revision 1.84
      1  1.84    dyoung /*	$NetBSD: if_gre.c,v 1.84 2007/02/17 22:34:08 dyoung Exp $ */
      2   1.4   thorpej 
      3   1.1       hwr /*
      4   1.4   thorpej  * Copyright (c) 1998 The NetBSD Foundation, Inc.
      5   1.1       hwr  * All rights reserved.
      6   1.1       hwr  *
      7   1.1       hwr  * This code is derived from software contributed to The NetBSD Foundation
      8   1.1       hwr  * by Heiko W.Rupp <hwr (at) pilhuhn.de>
      9   1.1       hwr  *
     10  1.56        is  * IPv6-over-GRE contributed by Gert Doering <gert (at) greenie.muc.de>
     11  1.56        is  *
     12   1.1       hwr  * Redistribution and use in source and binary forms, with or without
     13   1.1       hwr  * modification, are permitted provided that the following conditions
     14   1.1       hwr  * are met:
     15   1.1       hwr  * 1. Redistributions of source code must retain the above copyright
     16   1.1       hwr  *    notice, this list of conditions and the following disclaimer.
     17   1.1       hwr  * 2. Redistributions in binary form must reproduce the above copyright
     18   1.1       hwr  *    notice, this list of conditions and the following disclaimer in the
     19   1.1       hwr  *    documentation and/or other materials provided with the distribution.
     20   1.1       hwr  * 3. All advertising materials mentioning features or use of this software
     21   1.1       hwr  *    must display the following acknowledgement:
     22   1.1       hwr  *        This product includes software developed by the NetBSD
     23   1.1       hwr  *        Foundation, Inc. and its contributors.
     24   1.1       hwr  * 4. Neither the name of The NetBSD Foundation nor the names of its
     25   1.1       hwr  *    contributors may be used to endorse or promote products derived
     26   1.1       hwr  *    from this software without specific prior written permission.
     27   1.1       hwr  *
     28   1.1       hwr  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     29   1.1       hwr  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     30   1.1       hwr  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     31   1.1       hwr  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     32   1.1       hwr  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     33   1.1       hwr  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     34   1.1       hwr  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     35   1.1       hwr  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     36   1.1       hwr  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     37   1.1       hwr  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     38   1.1       hwr  * POSSIBILITY OF SUCH DAMAGE.
     39   1.1       hwr  */
     40   1.1       hwr 
     41   1.1       hwr /*
     42   1.1       hwr  * Encapsulate L3 protocols into IP
     43   1.1       hwr  * See RFC 1701 and 1702 for more details.
     44   1.1       hwr  * If_gre is compatible with Cisco GRE tunnels, so you can
     45   1.1       hwr  * have a NetBSD box as the other end of a tunnel interface of a Cisco
     46   1.1       hwr  * router. See gre(4) for more details.
     47   1.6       hwr  * Also supported:  IP in IP encaps (proto 55) as of RFC 2004
     48   1.1       hwr  */
     49  1.22     lukem 
     50  1.22     lukem #include <sys/cdefs.h>
     51  1.84    dyoung __KERNEL_RCSID(0, "$NetBSD: if_gre.c,v 1.84 2007/02/17 22:34:08 dyoung Exp $");
     52   1.1       hwr 
     53  1.62    dyoung #include "opt_gre.h"
     54   1.1       hwr #include "opt_inet.h"
     55   1.1       hwr #include "bpfilter.h"
     56   1.1       hwr 
     57  1.54  christos #ifdef INET
     58   1.1       hwr #include <sys/param.h>
     59  1.62    dyoung #include <sys/file.h>
     60  1.62    dyoung #include <sys/filedesc.h>
     61   1.1       hwr #include <sys/malloc.h>
     62   1.1       hwr #include <sys/mbuf.h>
     63  1.13    martin #include <sys/proc.h>
     64   1.1       hwr #include <sys/protosw.h>
     65   1.1       hwr #include <sys/socket.h>
     66  1.62    dyoung #include <sys/socketvar.h>
     67   1.1       hwr #include <sys/ioctl.h>
     68  1.10   thorpej #include <sys/queue.h>
     69   1.1       hwr #if __NetBSD__
     70   1.1       hwr #include <sys/systm.h>
     71  1.62    dyoung #include <sys/sysctl.h>
     72  1.60      elad #include <sys/kauth.h>
     73   1.1       hwr #endif
     74   1.1       hwr 
     75  1.62    dyoung #include <sys/kthread.h>
     76  1.62    dyoung 
     77   1.1       hwr #include <machine/cpu.h>
     78   1.1       hwr 
     79   1.1       hwr #include <net/ethertypes.h>
     80   1.1       hwr #include <net/if.h>
     81   1.1       hwr #include <net/if_types.h>
     82   1.1       hwr #include <net/netisr.h>
     83   1.1       hwr #include <net/route.h>
     84   1.1       hwr 
     85   1.1       hwr #ifdef INET
     86   1.1       hwr #include <netinet/in.h>
     87   1.1       hwr #include <netinet/in_systm.h>
     88   1.1       hwr #include <netinet/in_var.h>
     89   1.1       hwr #include <netinet/ip.h>
     90   1.1       hwr #include <netinet/ip_var.h>
     91   1.1       hwr #else
     92   1.4   thorpej #error "Huh? if_gre without inet?"
     93   1.1       hwr #endif
     94   1.1       hwr 
     95   1.1       hwr 
     96   1.1       hwr #ifdef NETATALK
     97   1.1       hwr #include <netatalk/at.h>
     98   1.1       hwr #include <netatalk/at_var.h>
     99   1.1       hwr #include <netatalk/at_extern.h>
    100   1.1       hwr #endif
    101   1.1       hwr 
    102   1.1       hwr #if NBPFILTER > 0
    103   1.1       hwr #include <sys/time.h>
    104   1.1       hwr #include <net/bpf.h>
    105   1.1       hwr #endif
    106   1.1       hwr 
    107   1.1       hwr #include <net/if_gre.h>
    108   1.1       hwr 
/*
 * It is not easy to calculate the right value for a GRE MTU.
 * We leave this task to the admin and use the same default that
 * other vendors use.
 */
#define GREMTU 1476

/*
 * GRE_DPRINTF(softc, fmt, ...): debugging printf.
 *
 * With GRE_DEBUG defined, prints only when the softc's interface has
 * IFF_DEBUG set.  Without GRE_DEBUG it expands to an empty statement and
 * evaluates none of its arguments.  At least one argument must follow the
 * format string (every caller in this file passes __func__ or similar).
 */
#ifdef GRE_DEBUG
#define	GRE_DPRINTF(softc_, fmt_, ...)					\
	do {								\
		if (((softc_)->sc_if.if_flags & IFF_DEBUG) != 0)	\
			printf(fmt_, __VA_ARGS__);			\
	} while (/*CONSTCOND*/0)
#else
#define	GRE_DPRINTF(softc_, fmt_, ...)	do { } while (/*CONSTCOND*/0)
#endif /* GRE_DEBUG */
    125  1.62    dyoung 
    126  1.11   thorpej struct gre_softc_head gre_softc_list;
    127  1.26    martin int ip_gre_ttl = GRE_TTL;
    128   1.1       hwr 
    129  1.59   thorpej static int	gre_clone_create(struct if_clone *, int);
    130  1.59   thorpej static int	gre_clone_destroy(struct ifnet *);
    131  1.10   thorpej 
    132  1.59   thorpej static struct if_clone gre_cloner =
    133  1.10   thorpej     IF_CLONE_INITIALIZER("gre", gre_clone_create, gre_clone_destroy);
    134   1.1       hwr 
    135  1.84    dyoung static int	gre_output(struct ifnet *, struct mbuf *,
    136  1.84    dyoung 			   const struct sockaddr *, struct rtentry *);
    137  1.59   thorpej static int	gre_ioctl(struct ifnet *, u_long, caddr_t);
    138   1.1       hwr 
    139  1.59   thorpej static int	gre_compute_route(struct gre_softc *sc);
    140  1.59   thorpej 
    141  1.62    dyoung static int gre_getsockname(struct socket *, struct mbuf *, struct lwp *);
    142  1.62    dyoung static int gre_getpeername(struct socket *, struct mbuf *, struct lwp *);
    143  1.62    dyoung static int gre_getnames(struct socket *, struct lwp *, struct sockaddr_in *,
    144  1.62    dyoung     struct sockaddr_in *);
    145  1.62    dyoung 
/*
 * Announce that a worker has finished: clear the flag at *running, then
 * wake anything sleeping on the flag's address (gre_join() sleeps there).
 */
static void
gre_stop(volatile int *running)
{
	*running = 0;
	wakeup(running);
}
    152  1.62    dyoung 
    153  1.62    dyoung static void
    154  1.82    dyoung gre_join(volatile int *running)
    155  1.62    dyoung {
    156  1.62    dyoung 	int s;
    157  1.62    dyoung 
    158  1.62    dyoung 	s = splnet();
    159  1.62    dyoung 	while (*running != 0) {
    160  1.62    dyoung 		splx(s);
    161  1.62    dyoung 		tsleep(running, PSOCK, "grejoin", 0);
    162  1.62    dyoung 		s = splnet();
    163  1.62    dyoung 	}
    164  1.62    dyoung 	splx(s);
    165  1.62    dyoung }
    166  1.62    dyoung 
    167  1.62    dyoung static void
    168  1.62    dyoung gre_wakeup(struct gre_softc *sc)
    169  1.62    dyoung {
    170  1.62    dyoung 	GRE_DPRINTF(sc, "%s: enter\n", __func__);
    171  1.62    dyoung 	sc->sc_waitchan = 1;
    172  1.62    dyoung 	wakeup(&sc->sc_waitchan);
    173  1.62    dyoung }
    174  1.62    dyoung 
    175  1.59   thorpej static int
    176  1.59   thorpej gre_clone_create(struct if_clone *ifc, int unit)
    177   1.1       hwr {
    178   1.8  explorer 	struct gre_softc *sc;
    179   1.1       hwr 
    180  1.10   thorpej 	sc = malloc(sizeof(struct gre_softc), M_DEVBUF, M_WAITOK);
    181  1.10   thorpej 	memset(sc, 0, sizeof(struct gre_softc));
    182  1.10   thorpej 
    183  1.50    itojun 	snprintf(sc->sc_if.if_xname, sizeof(sc->sc_if.if_xname), "%s%d",
    184  1.50    itojun 	    ifc->ifc_name, unit);
    185  1.10   thorpej 	sc->sc_if.if_softc = sc;
    186  1.51      tron 	sc->sc_if.if_type = IFT_TUNNEL;
    187  1.34    itojun 	sc->sc_if.if_addrlen = 0;
    188  1.10   thorpej 	sc->sc_if.if_hdrlen = 24; /* IP + GRE */
    189  1.15   thorpej 	sc->sc_if.if_dlt = DLT_NULL;
    190  1.20    itojun 	sc->sc_if.if_mtu = GREMTU;
    191  1.10   thorpej 	sc->sc_if.if_flags = IFF_POINTOPOINT|IFF_MULTICAST;
    192  1.10   thorpej 	sc->sc_if.if_output = gre_output;
    193  1.10   thorpej 	sc->sc_if.if_ioctl = gre_ioctl;
    194  1.10   thorpej 	sc->g_dst.s_addr = sc->g_src.s_addr = INADDR_ANY;
    195  1.62    dyoung 	sc->g_dstport = sc->g_srcport = 0;
    196  1.75    dyoung 	sc->sc_proto = IPPROTO_GRE;
    197  1.64    dyoung 	sc->sc_snd.ifq_maxlen = 256;
    198  1.35    itojun 	sc->sc_if.if_flags |= IFF_LINK0;
    199  1.10   thorpej 	if_attach(&sc->sc_if);
    200  1.16   thorpej 	if_alloc_sadl(&sc->sc_if);
    201   1.1       hwr #if NBPFILTER > 0
    202  1.14   thorpej 	bpfattach(&sc->sc_if, DLT_NULL, sizeof(u_int32_t));
    203   1.1       hwr #endif
    204  1.10   thorpej 	LIST_INSERT_HEAD(&gre_softc_list, sc, sc_list);
    205  1.10   thorpej 	return (0);
    206  1.10   thorpej }
    207   1.1       hwr 
    208  1.59   thorpej static int
    209  1.59   thorpej gre_clone_destroy(struct ifnet *ifp)
    210  1.10   thorpej {
    211  1.77    dyoung 	int s;
    212  1.10   thorpej 	struct gre_softc *sc = ifp->if_softc;
    213  1.10   thorpej 
    214  1.10   thorpej 	LIST_REMOVE(sc, sc_list);
    215  1.10   thorpej #if NBPFILTER > 0
    216  1.10   thorpej 	bpfdetach(ifp);
    217  1.10   thorpej #endif
    218  1.77    dyoung 	s = splnet();
    219  1.77    dyoung 	ifp->if_flags &= ~IFF_UP;
    220  1.62    dyoung 	gre_wakeup(sc);
    221  1.77    dyoung 	splx(s);
    222  1.62    dyoung 	gre_join(&sc->sc_thread);
    223  1.77    dyoung 	s = splnet();
    224  1.77    dyoung 	if_detach(ifp);
    225  1.77    dyoung 	splx(s);
    226  1.62    dyoung 	if (sc->sc_fp != NULL) {
    227  1.62    dyoung 		closef(sc->sc_fp, curlwp);
    228  1.62    dyoung 		sc->sc_fp = NULL;
    229  1.62    dyoung 	}
    230  1.10   thorpej 	free(sc, M_DEVBUF);
    231  1.53     peter 
    232  1.53     peter 	return (0);
    233   1.1       hwr }
    234   1.1       hwr 
    235  1.62    dyoung static void
    236  1.74  christos gre_receive(struct socket *so, caddr_t arg, int waitflag)
    237  1.62    dyoung {
    238  1.62    dyoung 	struct gre_softc *sc = (struct gre_softc *)arg;
    239  1.62    dyoung 
    240  1.62    dyoung 	GRE_DPRINTF(sc, "%s: enter\n", __func__);
    241  1.62    dyoung 
    242  1.62    dyoung 	gre_wakeup(sc);
    243  1.62    dyoung }
    244  1.62    dyoung 
    245  1.62    dyoung static void
    246  1.62    dyoung gre_upcall_add(struct socket *so, caddr_t arg)
    247  1.62    dyoung {
    248  1.62    dyoung 	/* XXX What if the kernel already set an upcall? */
    249  1.62    dyoung 	so->so_upcallarg = arg;
    250  1.62    dyoung 	so->so_upcall = gre_receive;
    251  1.62    dyoung 	so->so_rcv.sb_flags |= SB_UPCALL;
    252  1.62    dyoung }
    253  1.62    dyoung 
    254  1.62    dyoung static void
    255  1.62    dyoung gre_upcall_remove(struct socket *so)
    256  1.62    dyoung {
    257  1.62    dyoung 	/* XXX What if the kernel already set an upcall? */
    258  1.62    dyoung 	so->so_rcv.sb_flags &= ~SB_UPCALL;
    259  1.62    dyoung 	so->so_upcallarg = NULL;
    260  1.62    dyoung 	so->so_upcall = NULL;
    261  1.62    dyoung }
    262  1.62    dyoung 
    263  1.62    dyoung static void
    264  1.62    dyoung gre_sodestroy(struct socket **sop)
    265  1.62    dyoung {
    266  1.62    dyoung 	gre_upcall_remove(*sop);
    267  1.62    dyoung 	soshutdown(*sop, SHUT_RDWR);
    268  1.62    dyoung 	soclose(*sop);
    269  1.62    dyoung 	*sop = NULL;
    270  1.62    dyoung }
    271  1.62    dyoung 
    272  1.62    dyoung static struct mbuf *
    273  1.74  christos gre_getsockmbuf(struct socket *so)
    274  1.62    dyoung {
    275  1.62    dyoung 	struct mbuf *m;
    276  1.62    dyoung 
    277  1.62    dyoung 	m = m_get(M_WAIT, MT_SONAME);
    278  1.62    dyoung 	if (m != NULL)
    279  1.62    dyoung 		MCLAIM(m, so->so_mowner);
    280  1.62    dyoung 	return m;
    281  1.62    dyoung }
    282  1.62    dyoung 
    283  1.62    dyoung static int
    284  1.62    dyoung gre_socreate1(struct gre_softc *sc, struct lwp *l, struct gre_soparm *sp,
    285  1.62    dyoung     struct socket **sop)
    286  1.62    dyoung {
    287  1.62    dyoung 	int rc;
    288  1.62    dyoung 	struct mbuf *m;
    289  1.62    dyoung 	struct sockaddr_in *sin;
    290  1.62    dyoung 	struct socket *so;
    291  1.62    dyoung 
    292  1.62    dyoung 	GRE_DPRINTF(sc, "%s: enter\n", __func__);
    293  1.62    dyoung 	rc = socreate(AF_INET, sop, SOCK_DGRAM, IPPROTO_UDP, l);
    294  1.62    dyoung 	if (rc != 0) {
    295  1.62    dyoung 		GRE_DPRINTF(sc, "%s: socreate failed\n", __func__);
    296  1.62    dyoung 		return rc;
    297  1.62    dyoung 	}
    298  1.62    dyoung 
    299  1.62    dyoung 	so = *sop;
    300  1.62    dyoung 
    301  1.62    dyoung 	gre_upcall_add(so, (caddr_t)sc);
    302  1.62    dyoung 	if ((m = gre_getsockmbuf(so)) == NULL) {
    303  1.62    dyoung 		rc = ENOBUFS;
    304  1.62    dyoung 		goto out;
    305  1.62    dyoung 	}
    306  1.62    dyoung 	sin = mtod(m, struct sockaddr_in *);
    307  1.62    dyoung 	sin->sin_len = m->m_len = sizeof(struct sockaddr_in);
    308  1.62    dyoung 	sin->sin_family = AF_INET;
    309  1.62    dyoung 	sin->sin_addr = sc->g_src;
    310  1.62    dyoung 	sin->sin_port = sc->g_srcport;
    311  1.62    dyoung 
    312  1.62    dyoung 	GRE_DPRINTF(sc, "%s: bind 0x%08" PRIx32 " port %d\n", __func__,
    313  1.62    dyoung 	    sin->sin_addr.s_addr, ntohs(sin->sin_port));
    314  1.62    dyoung 	if ((rc = sobind(so, m, l)) != 0) {
    315  1.62    dyoung 		GRE_DPRINTF(sc, "%s: sobind failed\n", __func__);
    316  1.62    dyoung 		goto out;
    317  1.62    dyoung 	}
    318  1.62    dyoung 
    319  1.62    dyoung 	if (sc->g_srcport == 0) {
    320  1.69    dyoung 		if ((rc = gre_getsockname(so, m, l)) != 0) {
    321  1.62    dyoung 			GRE_DPRINTF(sc, "%s: gre_getsockname failed\n",
    322  1.62    dyoung 			    __func__);
    323  1.62    dyoung 			goto out;
    324  1.62    dyoung 		}
    325  1.62    dyoung 		sc->g_srcport = sin->sin_port;
    326  1.62    dyoung 	}
    327  1.62    dyoung 
    328  1.62    dyoung 	sin->sin_addr = sc->g_dst;
    329  1.62    dyoung 	sin->sin_port = sc->g_dstport;
    330  1.62    dyoung 
    331  1.68    dyoung 	if ((rc = soconnect(so, m, l)) != 0) {
    332  1.62    dyoung 		GRE_DPRINTF(sc, "%s: soconnect failed\n", __func__);
    333  1.62    dyoung 		goto out;
    334  1.62    dyoung 	}
    335  1.62    dyoung 
    336  1.62    dyoung 	*mtod(m, int *) = ip_gre_ttl;
    337  1.76    dyoung 	m->m_len = sizeof(int);
    338  1.62    dyoung 	rc = (*so->so_proto->pr_ctloutput)(PRCO_SETOPT, so, IPPROTO_IP, IP_TTL,
    339  1.62    dyoung 	    &m);
    340  1.62    dyoung 	m = NULL;
    341  1.62    dyoung 	if (rc != 0) {
    342  1.62    dyoung 		printf("%s: setopt ttl failed\n", __func__);
    343  1.62    dyoung 		rc = 0;
    344  1.62    dyoung 	}
    345  1.62    dyoung out:
    346  1.62    dyoung 	m_freem(m);
    347  1.62    dyoung 
    348  1.62    dyoung 	if (rc != 0)
    349  1.62    dyoung 		gre_sodestroy(sop);
    350  1.62    dyoung 	else
    351  1.63    dyoung 		*sp = sc->sc_soparm;
    352  1.62    dyoung 
    353  1.62    dyoung 	return rc;
    354  1.62    dyoung }
    355  1.62    dyoung 
    356  1.62    dyoung static void
    357  1.62    dyoung gre_thread1(struct gre_softc *sc, struct lwp *l)
    358  1.62    dyoung {
    359  1.62    dyoung 	int flags, rc, s;
    360  1.62    dyoung 	const struct gre_h *gh;
    361  1.62    dyoung 	struct ifnet *ifp = &sc->sc_if;
    362  1.62    dyoung 	struct mbuf *m;
    363  1.62    dyoung 	struct socket *so = NULL;
    364  1.62    dyoung 	struct uio uio;
    365  1.62    dyoung 	struct gre_soparm sp;
    366  1.62    dyoung 
    367  1.62    dyoung 	GRE_DPRINTF(sc, "%s: enter\n", __func__);
    368  1.62    dyoung 	s = splnet();
    369  1.62    dyoung 
    370  1.62    dyoung 	sc->sc_waitchan = 1;
    371  1.62    dyoung 
    372  1.62    dyoung 	memset(&sp, 0, sizeof(sp));
    373  1.62    dyoung 	memset(&uio, 0, sizeof(uio));
    374  1.62    dyoung 
    375  1.62    dyoung 	ifp->if_flags |= IFF_RUNNING;
    376  1.62    dyoung 
    377  1.62    dyoung 	for (;;) {
    378  1.62    dyoung 		while (sc->sc_waitchan == 0) {
    379  1.62    dyoung 			splx(s);
    380  1.62    dyoung 			GRE_DPRINTF(sc, "%s: sleeping\n", __func__);
    381  1.62    dyoung 			tsleep(&sc->sc_waitchan, PSOCK, "grewait", 0);
    382  1.62    dyoung 			s = splnet();
    383  1.62    dyoung 		}
    384  1.62    dyoung 		sc->sc_waitchan = 0;
    385  1.62    dyoung 		GRE_DPRINTF(sc, "%s: awake\n", __func__);
    386  1.62    dyoung 		if ((ifp->if_flags & IFF_UP) != IFF_UP) {
    387  1.62    dyoung 			GRE_DPRINTF(sc, "%s: not up & running; exiting\n",
    388  1.62    dyoung 			    __func__);
    389  1.62    dyoung 			break;
    390  1.62    dyoung 		}
    391  1.75    dyoung 		if (sc->sc_proto != IPPROTO_UDP) {
    392  1.62    dyoung 			GRE_DPRINTF(sc, "%s: not udp; exiting\n", __func__);
    393  1.62    dyoung 			break;
    394  1.62    dyoung 		}
    395  1.62    dyoung 		/* XXX optimize */
    396  1.69    dyoung 		if (so == NULL || memcmp(&sp, &sc->sc_soparm, sizeof(sp)) != 0){
    397  1.62    dyoung 			GRE_DPRINTF(sc, "%s: parameters changed\n", __func__);
    398  1.62    dyoung 
    399  1.62    dyoung 			if (sp.sp_fp != NULL) {
    400  1.62    dyoung 				FILE_UNUSE(sp.sp_fp, NULL);
    401  1.62    dyoung 				sp.sp_fp = NULL;
    402  1.62    dyoung 				so = NULL;
    403  1.62    dyoung 			} else if (so != NULL)
    404  1.62    dyoung 				gre_sodestroy(&so);
    405  1.62    dyoung 
    406  1.62    dyoung 			if (sc->sc_fp != NULL) {
    407  1.62    dyoung 				so = (struct socket *)sc->sc_fp->f_data;
    408  1.62    dyoung 				gre_upcall_add(so, (caddr_t)sc);
    409  1.63    dyoung 				sp = sc->sc_soparm;
    410  1.62    dyoung 				FILE_USE(sp.sp_fp);
    411  1.62    dyoung 			} else if (gre_socreate1(sc, l, &sp, &so) != 0)
    412  1.62    dyoung 				goto out;
    413  1.62    dyoung 		}
    414  1.62    dyoung 		for (;;) {
    415  1.62    dyoung 			flags = MSG_DONTWAIT;
    416  1.62    dyoung 			uio.uio_resid = 1000000;
    417  1.62    dyoung 			rc = (*so->so_receive)(so, NULL, &uio, &m, NULL,
    418  1.62    dyoung 			    &flags);
    419  1.62    dyoung 			/* TBD Back off if ECONNREFUSED (indicates
    420  1.62    dyoung 			 * ICMP Port Unreachable)?
    421  1.62    dyoung 			 */
    422  1.62    dyoung 			if (rc == EWOULDBLOCK) {
    423  1.62    dyoung 				GRE_DPRINTF(sc, "%s: so_receive EWOULDBLOCK\n",
    424  1.62    dyoung 				    __func__);
    425  1.62    dyoung 				break;
    426  1.62    dyoung 			} else if (rc != 0 || m == NULL) {
    427  1.62    dyoung 				GRE_DPRINTF(sc, "%s: rc %d m %p\n",
    428  1.62    dyoung 				    ifp->if_xname, rc, (void *)m);
    429  1.62    dyoung 				continue;
    430  1.62    dyoung 			} else
    431  1.62    dyoung 				GRE_DPRINTF(sc, "%s: so_receive ok\n",
    432  1.62    dyoung 				    __func__);
    433  1.62    dyoung 			if (m->m_len < sizeof(*gh) &&
    434  1.62    dyoung 			    (m = m_pullup(m, sizeof(*gh))) == NULL) {
    435  1.62    dyoung 				GRE_DPRINTF(sc, "%s: m_pullup failed\n",
    436  1.62    dyoung 				    __func__);
    437  1.62    dyoung 				continue;
    438  1.62    dyoung 			}
    439  1.62    dyoung 			gh = mtod(m, const struct gre_h *);
    440  1.62    dyoung 
    441  1.62    dyoung 			if (gre_input3(sc, m, 0, IPPROTO_GRE, gh) == 0) {
    442  1.62    dyoung 				GRE_DPRINTF(sc, "%s: dropping unsupported\n",
    443  1.62    dyoung 				    __func__);
    444  1.62    dyoung 				ifp->if_ierrors++;
    445  1.62    dyoung 				m_freem(m);
    446  1.62    dyoung 			}
    447  1.62    dyoung 		}
    448  1.62    dyoung 		for (;;) {
    449  1.62    dyoung 			IF_DEQUEUE(&sc->sc_snd, m);
    450  1.62    dyoung 			if (m == NULL)
    451  1.62    dyoung 				break;
    452  1.62    dyoung 			GRE_DPRINTF(sc, "%s: dequeue\n", __func__);
    453  1.62    dyoung 			if ((so->so_state & SS_ISCONNECTED) == 0) {
    454  1.62    dyoung 				GRE_DPRINTF(sc, "%s: not connected\n",
    455  1.62    dyoung 				    __func__);
    456  1.62    dyoung 				m_freem(m);
    457  1.62    dyoung 				continue;
    458  1.62    dyoung 			}
    459  1.62    dyoung 			rc = (*so->so_send)(so, NULL, NULL, m, NULL, 0, l);
    460  1.62    dyoung 			/* XXX handle ENOBUFS? */
    461  1.62    dyoung 			if (rc != 0)
    462  1.62    dyoung 				GRE_DPRINTF(sc, "%s: so_send failed\n",
    463  1.62    dyoung 				    __func__);
    464  1.62    dyoung 		}
    465  1.62    dyoung 		/* Give the software interrupt queues a chance to
    466  1.62    dyoung 		 * run, or else when I send a ping from gre0 to gre1 on
    467  1.62    dyoung 		 * the same host, gre0 will not wake for the reply.
    468  1.62    dyoung 		 */
    469  1.62    dyoung 		splx(s);
    470  1.62    dyoung 		s = splnet();
    471  1.62    dyoung 	}
    472  1.62    dyoung 	if (sp.sp_fp != NULL) {
    473  1.62    dyoung 		GRE_DPRINTF(sc, "%s: removing upcall\n", __func__);
    474  1.62    dyoung 		gre_upcall_remove(so);
    475  1.62    dyoung 		FILE_UNUSE(sp.sp_fp, NULL);
    476  1.62    dyoung 		sp.sp_fp = NULL;
    477  1.66    dyoung 	} else if (so != NULL)
    478  1.62    dyoung 		gre_sodestroy(&so);
    479  1.62    dyoung out:
    480  1.62    dyoung 	GRE_DPRINTF(sc, "%s: stopping\n", __func__);
    481  1.75    dyoung 	if (sc->sc_proto == IPPROTO_UDP)
    482  1.62    dyoung 		ifp->if_flags &= ~IFF_RUNNING;
    483  1.64    dyoung 	while (!IF_IS_EMPTY(&sc->sc_snd)) {
    484  1.64    dyoung 		IF_DEQUEUE(&sc->sc_snd, m);
    485  1.64    dyoung 		m_freem(m);
    486  1.64    dyoung 	}
    487  1.62    dyoung 	gre_stop(&sc->sc_thread);
    488  1.62    dyoung 	/* must not touch sc after this! */
    489  1.62    dyoung 	GRE_DPRINTF(sc, "%s: restore ipl\n", __func__);
    490  1.62    dyoung 	splx(s);
    491  1.62    dyoung }
    492  1.62    dyoung 
    493  1.62    dyoung static void
    494  1.62    dyoung gre_thread(void *arg)
    495  1.62    dyoung {
    496  1.62    dyoung 	struct gre_softc *sc = (struct gre_softc *)arg;
    497  1.62    dyoung 
    498  1.62    dyoung 	gre_thread1(sc, curlwp);
    499  1.62    dyoung 	/* must not touch sc after this! */
    500  1.62    dyoung 	kthread_exit(0);
    501  1.62    dyoung }
    502  1.62    dyoung 
    503  1.62    dyoung int
    504  1.62    dyoung gre_input3(struct gre_softc *sc, struct mbuf *m, int hlen, u_char proto,
    505  1.62    dyoung     const struct gre_h *gh)
    506  1.62    dyoung {
    507  1.62    dyoung 	u_int16_t flags;
    508  1.62    dyoung #if NBPFILTER > 0
    509  1.62    dyoung 	u_int32_t af = AF_INET;		/* af passed to BPF tap */
    510  1.62    dyoung #endif
    511  1.62    dyoung 	int s, isr;
    512  1.62    dyoung 	struct ifqueue *ifq;
    513  1.62    dyoung 
    514  1.62    dyoung 	sc->sc_if.if_ipackets++;
    515  1.62    dyoung 	sc->sc_if.if_ibytes += m->m_pkthdr.len;
    516  1.62    dyoung 
    517  1.62    dyoung 	switch (proto) {
    518  1.62    dyoung 	case IPPROTO_GRE:
    519  1.62    dyoung 		hlen += sizeof(struct gre_h);
    520  1.62    dyoung 
    521  1.62    dyoung 		/* process GRE flags as packet can be of variable len */
    522  1.62    dyoung 		flags = ntohs(gh->flags);
    523  1.62    dyoung 
    524  1.62    dyoung 		/* Checksum & Offset are present */
    525  1.62    dyoung 		if ((flags & GRE_CP) | (flags & GRE_RP))
    526  1.62    dyoung 			hlen += 4;
    527  1.62    dyoung 		/* We don't support routing fields (variable length) */
    528  1.62    dyoung 		if (flags & GRE_RP)
    529  1.62    dyoung 			return (0);
    530  1.62    dyoung 		if (flags & GRE_KP)
    531  1.62    dyoung 			hlen += 4;
    532  1.62    dyoung 		if (flags & GRE_SP)
    533  1.62    dyoung 			hlen += 4;
    534  1.62    dyoung 
    535  1.62    dyoung 		switch (ntohs(gh->ptype)) { /* ethertypes */
    536  1.62    dyoung 		case ETHERTYPE_IP: /* shouldn't need a schednetisr(), as */
    537  1.62    dyoung 			ifq = &ipintrq;          /* we are in ip_input */
    538  1.62    dyoung 			isr = NETISR_IP;
    539  1.62    dyoung 			break;
    540  1.62    dyoung #ifdef NETATALK
    541  1.62    dyoung 		case ETHERTYPE_ATALK:
    542  1.62    dyoung 			ifq = &atintrq1;
    543  1.62    dyoung 			isr = NETISR_ATALK;
    544  1.62    dyoung #if NBPFILTER > 0
    545  1.62    dyoung 			af = AF_APPLETALK;
    546  1.62    dyoung #endif
    547  1.62    dyoung 			break;
    548  1.62    dyoung #endif
    549  1.62    dyoung #ifdef INET6
    550  1.62    dyoung 		case ETHERTYPE_IPV6:
    551  1.62    dyoung 			GRE_DPRINTF(sc, "%s: IPv6 packet\n", __func__);
    552  1.62    dyoung 			ifq = &ip6intrq;
    553  1.62    dyoung 			isr = NETISR_IPV6;
    554  1.62    dyoung #if NBPFILTER > 0
    555  1.62    dyoung 			af = AF_INET6;
    556  1.62    dyoung #endif
    557  1.62    dyoung 			break;
    558  1.62    dyoung #endif
    559  1.62    dyoung 		default:	   /* others not yet supported */
    560  1.62    dyoung 			printf("%s: unhandled ethertype 0x%04x\n", __func__,
    561  1.62    dyoung 			    ntohs(gh->ptype));
    562  1.62    dyoung 			return (0);
    563  1.62    dyoung 		}
    564  1.62    dyoung 		break;
    565  1.62    dyoung 	default:
    566  1.62    dyoung 		/* others not yet supported */
    567  1.62    dyoung 		return (0);
    568  1.62    dyoung 	}
    569  1.62    dyoung 
    570  1.62    dyoung 	if (hlen > m->m_pkthdr.len) {
    571  1.62    dyoung 		m_freem(m);
    572  1.62    dyoung 		sc->sc_if.if_ierrors++;
    573  1.62    dyoung 		return (EINVAL);
    574  1.62    dyoung 	}
    575  1.62    dyoung 	m_adj(m, hlen);
    576  1.62    dyoung 
    577  1.62    dyoung #if NBPFILTER > 0
    578  1.62    dyoung 	if (sc->sc_if.if_bpf != NULL)
    579  1.62    dyoung 		bpf_mtap_af(sc->sc_if.if_bpf, af, m);
    580  1.62    dyoung #endif /*NBPFILTER > 0*/
    581  1.62    dyoung 
    582  1.62    dyoung 	m->m_pkthdr.rcvif = &sc->sc_if;
    583  1.62    dyoung 
    584  1.62    dyoung 	s = splnet();		/* possible */
    585  1.62    dyoung 	if (IF_QFULL(ifq)) {
    586  1.62    dyoung 		IF_DROP(ifq);
    587  1.62    dyoung 		m_freem(m);
    588  1.62    dyoung 	} else {
    589  1.62    dyoung 		IF_ENQUEUE(ifq, m);
    590  1.62    dyoung 	}
    591  1.62    dyoung 	/* we need schednetisr since the address family may change */
    592  1.62    dyoung 	schednetisr(isr);
    593  1.62    dyoung 	splx(s);
    594  1.62    dyoung 
    595  1.62    dyoung 	return (1);	/* packet is done, no further processing needed */
    596  1.62    dyoung }
    597  1.62    dyoung 
    598  1.20    itojun /*
    599   1.1       hwr  * The output routine. Takes a packet and encapsulates it in the protocol
    600  1.75    dyoung  * given by sc->sc_proto. See also RFC 1701 and RFC 2004
    601   1.1       hwr  */
    602  1.59   thorpej static int
    603  1.84    dyoung gre_output(struct ifnet *ifp, struct mbuf *m, const struct sockaddr *dst,
    604  1.74  christos 	   struct rtentry *rt)
    605   1.1       hwr {
    606  1.62    dyoung 	int error = 0, hlen;
    607  1.10   thorpej 	struct gre_softc *sc = ifp->if_softc;
    608  1.62    dyoung 	struct greip *gi;
    609  1.62    dyoung 	struct gre_h *gh;
    610  1.62    dyoung 	struct ip *eip, *ip;
    611  1.56        is 	u_int8_t ip_tos = 0;
    612  1.48    itojun 	u_int16_t etype = 0;
    613  1.20    itojun 	struct mobile_h mob_h;
    614  1.24    martin 
    615  1.39    itojun 	if ((ifp->if_flags & (IFF_UP | IFF_RUNNING)) == 0 ||
    616  1.37    itojun 	    sc->g_src.s_addr == INADDR_ANY || sc->g_dst.s_addr == INADDR_ANY) {
    617  1.37    itojun 		m_freem(m);
    618  1.38    itojun 		error = ENETDOWN;
    619  1.38    itojun 		goto end;
    620  1.37    itojun 	}
    621   1.1       hwr 
    622  1.62    dyoung 	gi = NULL;
    623  1.41    itojun 	ip = NULL;
    624   1.1       hwr 
    625   1.1       hwr #if NBPFILTER >0
    626  1.52  christos 	if (ifp->if_bpf)
    627  1.52  christos 		bpf_mtap_af(ifp->if_bpf, dst->sa_family, m);
    628   1.1       hwr #endif
    629   1.1       hwr 
    630  1.26    martin 	m->m_flags &= ~(M_BCAST|M_MCAST);
    631   1.1       hwr 
    632  1.75    dyoung 	switch (sc->sc_proto) {
    633  1.62    dyoung 	case IPPROTO_MOBILE:
    634   1.3       hwr 		if (dst->sa_family == AF_INET) {
    635   1.3       hwr 			int msiz;
    636   1.3       hwr 
    637  1.62    dyoung 			if (M_UNWRITABLE(m, sizeof(*ip)) &&
    638  1.62    dyoung 			    (m = m_pullup(m, sizeof(*ip))) == NULL) {
    639  1.62    dyoung 				error = ENOBUFS;
    640  1.62    dyoung 				goto end;
    641  1.62    dyoung 			}
    642  1.41    itojun 			ip = mtod(m, struct ip *);
    643   1.3       hwr 
    644   1.8  explorer 			memset(&mob_h, 0, MOB_H_SIZ_L);
    645  1.41    itojun 			mob_h.proto = (ip->ip_p) << 8;
    646  1.41    itojun 			mob_h.odst = ip->ip_dst.s_addr;
    647  1.41    itojun 			ip->ip_dst.s_addr = sc->g_dst.s_addr;
    648   1.3       hwr 
    649   1.3       hwr 			/*
    650   1.8  explorer 			 * If the packet comes from our host, we only change
    651   1.8  explorer 			 * the destination address in the IP header.
    652   1.8  explorer 			 * Else we also need to save and change the source
    653   1.3       hwr 			 */
    654  1.41    itojun 			if (in_hosteq(ip->ip_src, sc->g_src)) {
    655   1.8  explorer 				msiz = MOB_H_SIZ_S;
    656   1.3       hwr 			} else {
    657   1.3       hwr 				mob_h.proto |= MOB_H_SBIT;
    658  1.41    itojun 				mob_h.osrc = ip->ip_src.s_addr;
    659  1.41    itojun 				ip->ip_src.s_addr = sc->g_src.s_addr;
    660   1.8  explorer 				msiz = MOB_H_SIZ_L;
    661   1.3       hwr 			}
    662   1.3       hwr 			HTONS(mob_h.proto);
    663  1.48    itojun 			mob_h.hcrc = gre_in_cksum((u_int16_t *)&mob_h, msiz);
    664   1.3       hwr 
    665  1.62    dyoung 			M_PREPEND(m, msiz, M_DONTWAIT);
    666  1.62    dyoung 			if (m == NULL) {
    667  1.62    dyoung 				error = ENOBUFS;
    668  1.62    dyoung 				goto end;
    669   1.3       hwr 			}
    670  1.62    dyoung 			/* XXX Assuming that ip does not dangle after
    671  1.62    dyoung 			 * M_PREPEND.  In practice, that's true, but
    672  1.62    dyoung 			 * that's in M_PREPEND's contract.
    673  1.62    dyoung 			 */
    674  1.62    dyoung 			memmove(mtod(m, caddr_t), ip, sizeof(*ip));
    675  1.41    itojun 			ip = mtod(m, struct ip *);
    676  1.41    itojun 			memcpy((caddr_t)(ip + 1), &mob_h, (unsigned)msiz);
    677  1.42    itojun 			ip->ip_len = htons(ntohs(ip->ip_len) + msiz);
    678   1.3       hwr 		} else {  /* AF_INET */
    679   1.3       hwr 			IF_DROP(&ifp->if_snd);
    680   1.3       hwr 			m_freem(m);
    681  1.38    itojun 			error = EINVAL;
    682  1.38    itojun 			goto end;
    683   1.3       hwr 		}
    684  1.62    dyoung 		break;
    685  1.62    dyoung 	case IPPROTO_UDP:
    686  1.62    dyoung 	case IPPROTO_GRE:
    687  1.62    dyoung 		GRE_DPRINTF(sc, "%s: dst->sa_family=%d\n", __func__,
    688  1.62    dyoung 		    dst->sa_family);
    689  1.20    itojun 		switch (dst->sa_family) {
    690   1.1       hwr 		case AF_INET:
    691  1.41    itojun 			ip = mtod(m, struct ip *);
    692  1.56        is 			ip_tos = ip->ip_tos;
    693   1.8  explorer 			etype = ETHERTYPE_IP;
    694   1.1       hwr 			break;
    695   1.1       hwr #ifdef NETATALK
    696   1.1       hwr 		case AF_APPLETALK:
    697   1.8  explorer 			etype = ETHERTYPE_ATALK;
    698   1.1       hwr 			break;
    699   1.1       hwr #endif
    700  1.56        is #ifdef INET6
    701  1.56        is 		case AF_INET6:
    702  1.56        is 			etype = ETHERTYPE_IPV6;
    703  1.56        is 			break;
    704  1.56        is #endif
    705   1.1       hwr 		default:
    706   1.1       hwr 			IF_DROP(&ifp->if_snd);
    707   1.1       hwr 			m_freem(m);
    708  1.38    itojun 			error = EAFNOSUPPORT;
    709  1.38    itojun 			goto end;
    710   1.1       hwr 		}
    711  1.62    dyoung 		break;
    712  1.62    dyoung 	default:
    713   1.1       hwr 		IF_DROP(&ifp->if_snd);
    714   1.1       hwr 		m_freem(m);
    715  1.38    itojun 		error = EINVAL;
    716  1.38    itojun 		goto end;
    717   1.1       hwr 	}
    718   1.1       hwr 
    719  1.75    dyoung 	switch (sc->sc_proto) {
    720  1.62    dyoung 	case IPPROTO_GRE:
    721  1.62    dyoung 		hlen = sizeof(struct greip);
    722  1.62    dyoung 		break;
    723  1.62    dyoung 	case IPPROTO_UDP:
    724  1.62    dyoung 		hlen = sizeof(struct gre_h);
    725  1.62    dyoung 		break;
    726  1.62    dyoung 	default:
    727  1.62    dyoung 		hlen = 0;
    728  1.62    dyoung 		break;
    729  1.62    dyoung 	}
    730  1.62    dyoung 
    731  1.62    dyoung 	M_PREPEND(m, hlen, M_DONTWAIT);
    732  1.62    dyoung 
    733  1.62    dyoung 	if (m == NULL) {
    734   1.1       hwr 		IF_DROP(&ifp->if_snd);
    735  1.38    itojun 		error = ENOBUFS;
    736  1.38    itojun 		goto end;
    737   1.1       hwr 	}
    738   1.1       hwr 
    739  1.75    dyoung 	switch (sc->sc_proto) {
    740  1.62    dyoung 	case IPPROTO_UDP:
    741  1.62    dyoung 		gh = mtod(m, struct gre_h *);
    742  1.62    dyoung 		memset(gh, 0, sizeof(*gh));
    743  1.62    dyoung 		gh->ptype = htons(etype);
    744  1.62    dyoung 		/* XXX Need to handle IP ToS.  Look at how I handle IP TTL. */
    745  1.62    dyoung 		break;
    746  1.62    dyoung 	case IPPROTO_GRE:
    747  1.62    dyoung 		gi = mtod(m, struct greip *);
    748  1.62    dyoung 		gh = &gi->gi_g;
    749  1.62    dyoung 		eip = &gi->gi_i;
    750   1.1       hwr 		/* we don't have any GRE flags for now */
    751  1.62    dyoung 		memset(gh, 0, sizeof(*gh));
    752  1.62    dyoung 		gh->ptype = htons(etype);
    753  1.62    dyoung 		eip->ip_src = sc->g_src;
    754  1.62    dyoung 		eip->ip_dst = sc->g_dst;
    755  1.62    dyoung 		eip->ip_hl = (sizeof(struct ip)) >> 2;
    756  1.62    dyoung 		eip->ip_ttl = ip_gre_ttl;
    757  1.62    dyoung 		eip->ip_tos = ip_tos;
    758  1.62    dyoung 		eip->ip_len = htons(m->m_pkthdr.len);
    759  1.75    dyoung 		eip->ip_p = sc->sc_proto;
    760  1.62    dyoung 		break;
    761  1.62    dyoung 	case IPPROTO_MOBILE:
    762  1.62    dyoung 		eip = mtod(m, struct ip *);
    763  1.75    dyoung 		eip->ip_p = sc->sc_proto;
    764  1.62    dyoung 		break;
    765  1.62    dyoung 	default:
    766  1.62    dyoung 		error = EPROTONOSUPPORT;
    767  1.62    dyoung 		m_freem(m);
    768  1.62    dyoung 		goto end;
    769   1.3       hwr 	}
    770   1.1       hwr 
    771   1.1       hwr 	ifp->if_opackets++;
    772   1.8  explorer 	ifp->if_obytes += m->m_pkthdr.len;
    773  1.62    dyoung 
    774   1.1       hwr 	/* send it off */
    775  1.75    dyoung 	if (sc->sc_proto == IPPROTO_UDP) {
    776  1.62    dyoung 		if (IF_QFULL(&sc->sc_snd)) {
    777  1.62    dyoung 			IF_DROP(&sc->sc_snd);
    778  1.62    dyoung 			error = ENOBUFS;
    779  1.62    dyoung 			m_freem(m);
    780  1.62    dyoung 		} else {
    781  1.62    dyoung 			IF_ENQUEUE(&sc->sc_snd, m);
    782  1.62    dyoung 			gre_wakeup(sc);
    783  1.62    dyoung 			error = 0;
    784  1.62    dyoung 		}
    785  1.81     joerg 		goto end;
    786  1.81     joerg 	}
    787  1.81     joerg 	rtcache_check(&sc->route);
    788  1.81     joerg 	if (sc->route.ro_rt == NULL)
    789  1.81     joerg 		goto end;
    790  1.83    dyoung 	if (sc->route.ro_rt->rt_ifp->if_softc == sc)
    791  1.81     joerg 		rtcache_free(&sc->route);
    792  1.81     joerg 	else
    793  1.62    dyoung 		error = ip_output(m, NULL, &sc->route, 0,
    794  1.62    dyoung 		    (struct ip_moptions *)NULL, (struct socket *)NULL);
    795  1.38    itojun   end:
    796   1.8  explorer 	if (error)
    797   1.1       hwr 		ifp->if_oerrors++;
    798   1.8  explorer 	return (error);
    799   1.1       hwr }
    800   1.1       hwr 
    801  1.71    dyoung /* gre_kick must be synchronized with network interrupts in order
    802  1.71    dyoung  * to synchronize access to gre_softc members, so call it with
    803  1.71    dyoung  * interrupt priority level set to IPL_NET or greater.
    804  1.71    dyoung  */
    805  1.62    dyoung static int
    806  1.62    dyoung gre_kick(struct gre_softc *sc)
    807  1.62    dyoung {
    808  1.62    dyoung 	int rc;
    809  1.62    dyoung 	struct ifnet *ifp = &sc->sc_if;
    810  1.62    dyoung 
    811  1.75    dyoung 	if (sc->sc_proto == IPPROTO_UDP && (ifp->if_flags & IFF_UP) == IFF_UP &&
    812  1.62    dyoung 	    !sc->sc_thread) {
    813  1.62    dyoung 		sc->sc_thread = 1;
    814  1.62    dyoung 		rc = kthread_create1(gre_thread, (void *)sc, NULL,
    815  1.62    dyoung 		    ifp->if_xname);
    816  1.62    dyoung 		if (rc != 0)
    817  1.62    dyoung 			gre_stop(&sc->sc_thread);
    818  1.62    dyoung 		return rc;
    819  1.62    dyoung 	} else {
    820  1.62    dyoung 		gre_wakeup(sc);
    821  1.62    dyoung 		return 0;
    822  1.62    dyoung 	}
    823  1.62    dyoung }
    824  1.62    dyoung 
    825  1.62    dyoung static int
    826  1.62    dyoung gre_getname(struct socket *so, int req, struct mbuf *nam, struct lwp *l)
    827  1.62    dyoung {
    828  1.62    dyoung 	int s, error;
    829  1.62    dyoung 
    830  1.62    dyoung 	s = splsoftnet();
    831  1.62    dyoung 	error = (*so->so_proto->pr_usrreq)(so, req, (struct mbuf *)0,
    832  1.62    dyoung 	    nam, (struct mbuf *)0, l);
    833  1.62    dyoung 	splx(s);
    834  1.62    dyoung 	return error;
    835  1.62    dyoung }
    836  1.62    dyoung 
    837  1.62    dyoung static int
    838  1.62    dyoung gre_getsockname(struct socket *so, struct mbuf *nam, struct lwp *l)
    839  1.62    dyoung {
    840  1.62    dyoung 	return gre_getname(so, PRU_SOCKADDR, nam, l);
    841  1.62    dyoung }
    842  1.62    dyoung 
    843  1.62    dyoung static int
    844  1.62    dyoung gre_getpeername(struct socket *so, struct mbuf *nam, struct lwp *l)
    845  1.62    dyoung {
    846  1.62    dyoung 	return gre_getname(so, PRU_PEERADDR, nam, l);
    847  1.62    dyoung }
    848  1.62    dyoung 
    849  1.62    dyoung static int
    850  1.62    dyoung gre_getnames(struct socket *so, struct lwp *l, struct sockaddr_in *src,
    851  1.62    dyoung     struct sockaddr_in *dst)
    852  1.62    dyoung {
    853  1.62    dyoung 	struct mbuf *m;
    854  1.62    dyoung 	struct sockaddr_in *sin;
    855  1.62    dyoung 	int rc;
    856  1.62    dyoung 
    857  1.62    dyoung 	if ((m = gre_getsockmbuf(so)) == NULL)
    858  1.62    dyoung 		return ENOBUFS;
    859  1.62    dyoung 
    860  1.62    dyoung 	sin = mtod(m, struct sockaddr_in *);
    861  1.62    dyoung 
    862  1.62    dyoung 	if ((rc = gre_getsockname(so, m, l)) != 0)
    863  1.62    dyoung 		goto out;
    864  1.62    dyoung 	if (sin->sin_family != AF_INET) {
    865  1.62    dyoung 		rc = EAFNOSUPPORT;
    866  1.62    dyoung 		goto out;
    867  1.62    dyoung 	}
    868  1.62    dyoung 	*src = *sin;
    869  1.62    dyoung 
    870  1.62    dyoung 	if ((rc = gre_getpeername(so, m, l)) != 0)
    871  1.62    dyoung 		goto out;
    872  1.62    dyoung 	if (sin->sin_family != AF_INET) {
    873  1.62    dyoung 		rc = EAFNOSUPPORT;
    874  1.62    dyoung 		goto out;
    875  1.62    dyoung 	}
    876  1.62    dyoung 	*dst = *sin;
    877  1.62    dyoung 
    878  1.62    dyoung out:
    879  1.62    dyoung 	m_freem(m);
    880  1.62    dyoung 	return rc;
    881  1.62    dyoung }
    882  1.62    dyoung 
    883  1.59   thorpej static int
    884   1.8  explorer gre_ioctl(struct ifnet *ifp, u_long cmd, caddr_t data)
    885   1.1       hwr {
    886  1.62    dyoung 	u_char oproto;
    887  1.62    dyoung 	struct file *fp, *ofp;
    888  1.62    dyoung 	struct socket *so;
    889  1.62    dyoung 	struct sockaddr_in dst, src;
    890  1.62    dyoung 	struct proc *p = curproc;	/* XXX */
    891  1.61        ad 	struct lwp *l = curlwp;	/* XXX */
    892   1.8  explorer 	struct ifreq *ifr = (struct ifreq *)data;
    893  1.28    itojun 	struct if_laddrreq *lifr = (struct if_laddrreq *)data;
    894   1.8  explorer 	struct gre_softc *sc = ifp->if_softc;
    895   1.1       hwr 	int s;
    896   1.1       hwr 	struct sockaddr_in si;
    897   1.8  explorer 	struct sockaddr *sa = NULL;
    898  1.80  christos 	int error = 0;
    899   1.1       hwr 
    900  1.61        ad 	switch (cmd) {
    901  1.61        ad 	case SIOCSIFFLAGS:
    902  1.61        ad 	case SIOCSIFMTU:
    903  1.61        ad 	case GRESPROTO:
    904  1.61        ad 	case GRESADDRD:
    905  1.61        ad 	case GRESADDRS:
    906  1.62    dyoung 	case GRESSOCK:
    907  1.62    dyoung 	case GREDSOCK:
    908  1.61        ad 	case SIOCSLIFPHYADDR:
    909  1.61        ad 	case SIOCDIFPHYADDR:
    910  1.70      elad 		if (kauth_authorize_network(l->l_cred, KAUTH_NETWORK_INTERFACE,
    911  1.70      elad 		    KAUTH_REQ_NETWORK_INTERFACE_SETPRIV, ifp, (void *)cmd,
    912  1.70      elad 		    NULL) != 0)
    913  1.70      elad 			return (EPERM);
    914  1.61        ad 		break;
    915  1.61        ad 	default:
    916  1.61        ad 		break;
    917  1.61        ad 	}
    918   1.1       hwr 
    919  1.18   thorpej 	s = splnet();
    920  1.20    itojun 	switch (cmd) {
    921  1.20    itojun 	case SIOCSIFADDR:
    922  1.36    itojun 		ifp->if_flags |= IFF_UP;
    923  1.78    dyoung 		if ((error = gre_kick(sc)) != 0)
    924  1.78    dyoung 			ifp->if_flags &= ~IFF_UP;
    925  1.36    itojun 		break;
    926  1.55     perry 	case SIOCSIFDSTADDR:
    927   1.1       hwr 		break;
    928   1.1       hwr 	case SIOCSIFFLAGS:
    929  1.75    dyoung 		oproto = sc->sc_proto;
    930  1.62    dyoung 		switch (ifr->ifr_flags & (IFF_LINK0|IFF_LINK2)) {
    931  1.62    dyoung 		case IFF_LINK0|IFF_LINK2:
    932  1.75    dyoung 			sc->sc_proto = IPPROTO_UDP;
    933  1.62    dyoung 			if (oproto != IPPROTO_UDP)
    934  1.62    dyoung 				ifp->if_flags &= ~IFF_RUNNING;
    935  1.62    dyoung 			error = gre_kick(sc);
    936  1.62    dyoung 			break;
    937  1.62    dyoung 		case IFF_LINK0:
    938  1.75    dyoung 			sc->sc_proto = IPPROTO_GRE;
    939  1.62    dyoung 			gre_wakeup(sc);
    940  1.62    dyoung 			goto recompute;
    941  1.62    dyoung 		case 0:
    942  1.75    dyoung 			sc->sc_proto = IPPROTO_MOBILE;
    943  1.62    dyoung 			gre_wakeup(sc);
    944  1.62    dyoung 			goto recompute;
    945  1.62    dyoung 		}
    946   1.1       hwr 		break;
    947  1.20    itojun 	case SIOCSIFMTU:
    948  1.27    martin 		if (ifr->ifr_mtu < 576) {
    949   1.1       hwr 			error = EINVAL;
    950   1.1       hwr 			break;
    951   1.1       hwr 		}
    952   1.1       hwr 		ifp->if_mtu = ifr->ifr_mtu;
    953   1.1       hwr 		break;
    954   1.1       hwr 	case SIOCGIFMTU:
    955   1.1       hwr 		ifr->ifr_mtu = sc->sc_if.if_mtu;
    956   1.1       hwr 		break;
    957   1.1       hwr 	case SIOCADDMULTI:
    958   1.1       hwr 	case SIOCDELMULTI:
    959   1.8  explorer 		if (ifr == 0) {
    960   1.1       hwr 			error = EAFNOSUPPORT;
    961   1.1       hwr 			break;
    962   1.1       hwr 		}
    963   1.8  explorer 		switch (ifr->ifr_addr.sa_family) {
    964   1.1       hwr #ifdef INET
    965   1.1       hwr 		case AF_INET:
    966   1.1       hwr 			break;
    967   1.1       hwr #endif
    968  1.56        is #ifdef INET6
    969  1.56        is 		case AF_INET6:
    970  1.56        is 			break;
    971  1.56        is #endif
    972   1.1       hwr 		default:
    973   1.1       hwr 			error = EAFNOSUPPORT;
    974   1.1       hwr 			break;
    975   1.1       hwr 		}
    976   1.1       hwr 		break;
    977   1.1       hwr 	case GRESPROTO:
    978  1.75    dyoung 		oproto = sc->sc_proto;
    979  1.75    dyoung 		sc->sc_proto = ifr->ifr_flags;
    980  1.75    dyoung 		switch (sc->sc_proto) {
    981  1.62    dyoung 		case IPPROTO_UDP:
    982  1.62    dyoung 			ifp->if_flags |= IFF_LINK0|IFF_LINK2;
    983  1.62    dyoung 			if (oproto != IPPROTO_UDP)
    984  1.62    dyoung 				ifp->if_flags &= ~IFF_RUNNING;
    985  1.62    dyoung 			error = gre_kick(sc);
    986  1.62    dyoung 			break;
    987  1.40    itojun 		case IPPROTO_GRE:
    988   1.3       hwr 			ifp->if_flags |= IFF_LINK0;
    989  1.62    dyoung 			ifp->if_flags &= ~IFF_LINK2;
    990  1.62    dyoung 			goto recompute;
    991  1.40    itojun 		case IPPROTO_MOBILE:
    992  1.62    dyoung 			ifp->if_flags &= ~(IFF_LINK0|IFF_LINK2);
    993  1.62    dyoung 			goto recompute;
    994   1.1       hwr 		default:
    995  1.40    itojun 			error = EPROTONOSUPPORT;
    996  1.35    itojun 			break;
    997   1.1       hwr 		}
    998   1.1       hwr 		break;
    999   1.1       hwr 	case GREGPROTO:
   1000  1.75    dyoung 		ifr->ifr_flags = sc->sc_proto;
   1001   1.1       hwr 		break;
   1002   1.1       hwr 	case GRESADDRS:
   1003   1.1       hwr 	case GRESADDRD:
   1004   1.1       hwr 		/*
   1005  1.20    itojun 		 * set tunnel endpoints, compute a less specific route
   1006  1.20    itojun 		 * to the remote end and mark if as up
   1007  1.20    itojun 		 */
   1008   1.1       hwr 		sa = &ifr->ifr_addr;
   1009  1.62    dyoung 		if (cmd == GRESADDRS) {
   1010   1.1       hwr 			sc->g_src = (satosin(sa))->sin_addr;
   1011  1.62    dyoung 			sc->g_srcport = satosin(sa)->sin_port;
   1012  1.62    dyoung 		}
   1013  1.62    dyoung 		if (cmd == GRESADDRD) {
   1014  1.75    dyoung 			if (sc->sc_proto == IPPROTO_UDP &&
   1015  1.62    dyoung 			    satosin(sa)->sin_port == 0) {
   1016  1.62    dyoung 				error = EINVAL;
   1017  1.62    dyoung 				break;
   1018  1.62    dyoung 			}
   1019   1.1       hwr 			sc->g_dst = (satosin(sa))->sin_addr;
   1020  1.62    dyoung 			sc->g_dstport = satosin(sa)->sin_port;
   1021  1.62    dyoung 		}
   1022  1.30    itojun 	recompute:
   1023  1.75    dyoung 		if (sc->sc_proto == IPPROTO_UDP ||
   1024  1.62    dyoung 		    (sc->g_src.s_addr != INADDR_ANY &&
   1025  1.62    dyoung 		     sc->g_dst.s_addr != INADDR_ANY)) {
   1026  1.62    dyoung 			if (sc->sc_fp != NULL) {
   1027  1.62    dyoung 				closef(sc->sc_fp, l);
   1028  1.62    dyoung 				sc->sc_fp = NULL;
   1029  1.62    dyoung 			}
   1030  1.81     joerg 			rtcache_free(&sc->route);
   1031  1.75    dyoung 			if (sc->sc_proto == IPPROTO_UDP)
   1032  1.62    dyoung 				error = gre_kick(sc);
   1033  1.62    dyoung 			else if (gre_compute_route(sc) == 0)
   1034  1.39    itojun 				ifp->if_flags |= IFF_RUNNING;
   1035  1.39    itojun 			else
   1036  1.39    itojun 				ifp->if_flags &= ~IFF_RUNNING;
   1037   1.1       hwr 		}
   1038   1.1       hwr 		break;
   1039   1.1       hwr 	case GREGADDRS:
   1040  1.33    itojun 		memset(&si, 0, sizeof(si));
   1041  1.28    itojun 		si.sin_family = AF_INET;
   1042  1.28    itojun 		si.sin_len = sizeof(struct sockaddr_in);
   1043   1.1       hwr 		si.sin_addr.s_addr = sc->g_src.s_addr;
   1044   1.8  explorer 		sa = sintosa(&si);
   1045   1.1       hwr 		ifr->ifr_addr = *sa;
   1046   1.1       hwr 		break;
   1047   1.1       hwr 	case GREGADDRD:
   1048  1.33    itojun 		memset(&si, 0, sizeof(si));
   1049  1.28    itojun 		si.sin_family = AF_INET;
   1050  1.28    itojun 		si.sin_len = sizeof(struct sockaddr_in);
   1051   1.1       hwr 		si.sin_addr.s_addr = sc->g_dst.s_addr;
   1052   1.8  explorer 		sa = sintosa(&si);
   1053   1.1       hwr 		ifr->ifr_addr = *sa;
   1054  1.28    itojun 		break;
   1055  1.62    dyoung 	case GREDSOCK:
   1056  1.75    dyoung 		if (sc->sc_proto != IPPROTO_UDP)
   1057  1.62    dyoung 			return EINVAL;
   1058  1.63    dyoung 		if (sc->sc_fp != NULL) {
   1059  1.63    dyoung 			closef(sc->sc_fp, l);
   1060  1.63    dyoung 			sc->sc_fp = NULL;
   1061  1.63    dyoung 			error = gre_kick(sc);
   1062  1.63    dyoung 		}
   1063  1.62    dyoung 		break;
   1064  1.62    dyoung 	case GRESSOCK:
   1065  1.75    dyoung 		if (sc->sc_proto != IPPROTO_UDP)
   1066  1.62    dyoung 			return EINVAL;
   1067  1.62    dyoung 		/* getsock() will FILE_USE() the descriptor for us */
   1068  1.62    dyoung 		if ((error = getsock(p->p_fd, (int)ifr->ifr_value, &fp)) != 0)
   1069  1.62    dyoung 			break;
   1070  1.62    dyoung 		so = (struct socket *)fp->f_data;
   1071  1.62    dyoung 		if (so->so_type != SOCK_DGRAM) {
   1072  1.62    dyoung 			FILE_UNUSE(fp, NULL);
   1073  1.62    dyoung 			error = EINVAL;
   1074  1.62    dyoung 			break;
   1075  1.62    dyoung 		}
   1076  1.62    dyoung 		/* check address */
   1077  1.62    dyoung 		if ((error = gre_getnames(so, curlwp, &src, &dst)) != 0) {
   1078  1.62    dyoung 			FILE_UNUSE(fp, NULL);
   1079  1.62    dyoung 			break;
   1080  1.62    dyoung 		}
   1081  1.62    dyoung 
   1082  1.62    dyoung 		fp->f_count++;
   1083  1.62    dyoung 
   1084  1.62    dyoung 		ofp = sc->sc_fp;
   1085  1.62    dyoung 		sc->sc_fp = fp;
   1086  1.62    dyoung 		if ((error = gre_kick(sc)) != 0) {
   1087  1.62    dyoung 			closef(fp, l);
   1088  1.62    dyoung 			sc->sc_fp = ofp;
   1089  1.62    dyoung 			break;
   1090  1.62    dyoung 		}
   1091  1.62    dyoung 		sc->g_src = src.sin_addr;
   1092  1.62    dyoung 		sc->g_srcport = src.sin_port;
   1093  1.62    dyoung 		sc->g_dst = dst.sin_addr;
   1094  1.62    dyoung 		sc->g_dstport = dst.sin_port;
   1095  1.62    dyoung 		if (ofp != NULL)
   1096  1.62    dyoung 			closef(ofp, l);
   1097  1.62    dyoung 		break;
   1098  1.28    itojun 	case SIOCSLIFPHYADDR:
   1099  1.28    itojun 		if (lifr->addr.ss_family != AF_INET ||
   1100  1.31    itojun 		    lifr->dstaddr.ss_family != AF_INET) {
   1101  1.31    itojun 			error = EAFNOSUPPORT;
   1102  1.31    itojun 			break;
   1103  1.31    itojun 		}
   1104  1.28    itojun 		if (lifr->addr.ss_len != sizeof(si) ||
   1105  1.31    itojun 		    lifr->dstaddr.ss_len != sizeof(si)) {
   1106  1.31    itojun 			error = EINVAL;
   1107  1.31    itojun 			break;
   1108  1.31    itojun 		}
   1109  1.62    dyoung 		sc->g_src = satosin(&lifr->addr)->sin_addr;
   1110  1.62    dyoung 		sc->g_dst = satosin(&lifr->dstaddr)->sin_addr;
   1111  1.62    dyoung 		sc->g_srcport = satosin(&lifr->addr)->sin_port;
   1112  1.62    dyoung 		sc->g_dstport = satosin(&lifr->dstaddr)->sin_port;
   1113  1.30    itojun 		goto recompute;
   1114  1.28    itojun 	case SIOCDIFPHYADDR:
   1115  1.28    itojun 		sc->g_src.s_addr = INADDR_ANY;
   1116  1.28    itojun 		sc->g_dst.s_addr = INADDR_ANY;
   1117  1.62    dyoung 		sc->g_srcport = 0;
   1118  1.62    dyoung 		sc->g_dstport = 0;
   1119  1.62    dyoung 		goto recompute;
   1120  1.28    itojun 	case SIOCGLIFPHYADDR:
   1121  1.28    itojun 		if (sc->g_src.s_addr == INADDR_ANY ||
   1122  1.28    itojun 		    sc->g_dst.s_addr == INADDR_ANY) {
   1123  1.28    itojun 			error = EADDRNOTAVAIL;
   1124  1.28    itojun 			break;
   1125  1.28    itojun 		}
   1126  1.33    itojun 		memset(&si, 0, sizeof(si));
   1127  1.28    itojun 		si.sin_family = AF_INET;
   1128  1.28    itojun 		si.sin_len = sizeof(struct sockaddr_in);
   1129  1.62    dyoung 		si.sin_addr = sc->g_src;
   1130  1.75    dyoung 		if (sc->sc_proto == IPPROTO_UDP)
   1131  1.62    dyoung 			si.sin_port = sc->g_srcport;
   1132  1.33    itojun 		memcpy(&lifr->addr, &si, sizeof(si));
   1133  1.62    dyoung 		si.sin_addr = sc->g_dst;
   1134  1.75    dyoung 		if (sc->sc_proto == IPPROTO_UDP)
   1135  1.62    dyoung 			si.sin_port = sc->g_dstport;
   1136  1.33    itojun 		memcpy(&lifr->dstaddr, &si, sizeof(si));
   1137   1.1       hwr 		break;
   1138   1.1       hwr 	default:
   1139   1.1       hwr 		error = EINVAL;
   1140  1.31    itojun 		break;
   1141   1.1       hwr 	}
   1142   1.1       hwr 	splx(s);
   1143   1.8  explorer 	return (error);
   1144   1.1       hwr }
   1145   1.1       hwr 
   1146  1.20    itojun /*
   1147  1.78    dyoung  * Compute a route to our destination.
   1148   1.1       hwr  */
   1149  1.59   thorpej static int
   1150   1.8  explorer gre_compute_route(struct gre_softc *sc)
   1151   1.1       hwr {
   1152   1.1       hwr 	struct route *ro;
   1153   1.1       hwr 
   1154   1.8  explorer 	ro = &sc->route;
   1155  1.20    itojun 
   1156   1.8  explorer 	memset(ro, 0, sizeof(struct route));
   1157  1.73    dyoung 	satosin(&ro->ro_dst)->sin_addr = sc->g_dst;
   1158   1.8  explorer 	ro->ro_dst.sa_family = AF_INET;
   1159   1.8  explorer 	ro->ro_dst.sa_len = sizeof(ro->ro_dst);
   1160   1.8  explorer 
   1161   1.1       hwr #ifdef DIAGNOSTIC
   1162  1.45     grant 	printf("%s: searching for a route to %s", sc->sc_if.if_xname,
   1163  1.84    dyoung 	    inet_ntoa(satocsin(rtcache_getdst(ro))->sin_addr));
   1164   1.1       hwr #endif
   1165   1.1       hwr 
   1166  1.81     joerg 	rtcache_init(ro);
   1167  1.81     joerg 
   1168  1.81     joerg 	if (ro->ro_rt == NULL || ro->ro_rt->rt_ifp->if_softc == sc) {
   1169  1.25    martin #ifdef DIAGNOSTIC
   1170  1.25    martin 		if (ro->ro_rt == NULL)
   1171  1.25    martin 			printf(" - no route found!\n");
   1172  1.25    martin 		else
   1173  1.25    martin 			printf(" - route loops back to ourself!\n");
   1174  1.25    martin #endif
   1175  1.81     joerg 		rtcache_free(ro);
   1176  1.81     joerg 		return EADDRNOTAVAIL;
   1177  1.25    martin 	}
   1178  1.25    martin 
   1179  1.25    martin 	return 0;
   1180   1.1       hwr }
   1181   1.1       hwr 
/*
 * gre_in_cksum: one's-complement checksum over a flat buffer - much
 * like in_cksum, which operates on mbufs.
 *
 *	p	start of the buffer, read as 16-bit words in memory order.
 *	len	buffer length in bytes; a trailing odd byte is summed as
 *		a 16-bit word whose second byte is zero.
 *
 * Returns the complement of the folded 16-bit sum.
 */
u_int16_t
gre_in_cksum(u_int16_t *p, u_int len)
{
	u_int32_t acc = 0;
	u_int pairs = len / 2;
	u_int i;

	for (i = 0; i < pairs; i++)
		acc += p[i];

	if ((len % 2) != 0) {
		/* Pad the last byte to a full word without byte swapping. */
		union {
			u_short w;
			u_char c[2];
		} tail;

		tail.c[0] = *(u_char *)&p[pairs];
		tail.c[1] = 0;
		acc += tail.w;
	}

	/* end-around-carry */
	acc = (acc & 0xffff) + (acc >> 16);
	acc += (acc >> 16);
	return (~acc);
}
   1210  1.54  christos #endif
   1211  1.54  christos 
void	greattach(int count);

/*
 * greattach: attach entry point for the gre pseudo-device.
 *
 * When the kernel is built with INET, initializes the list of gre
 * softcs and registers the interface cloner.  Without INET it does
 * nothing.  `count' is not used.
 */
/* ARGSUSED */
void
greattach(int count)
{
#ifdef INET
	/* The softc list is set up before the cloner is registered. */
	LIST_INIT(&gre_softc_list);
	if_clone_attach(&gre_cloner);
#endif
}
   1223