if_gre.c revision 1.62 1 1.62 dyoung /* $NetBSD: if_gre.c,v 1.62 2006/08/31 17:46:16 dyoung Exp $ */
2 1.4 thorpej
3 1.1 hwr /*
4 1.4 thorpej * Copyright (c) 1998 The NetBSD Foundation, Inc.
5 1.1 hwr * All rights reserved.
6 1.1 hwr *
7 1.1 hwr * This code is derived from software contributed to The NetBSD Foundation
8 1.1 hwr * by Heiko W.Rupp <hwr (at) pilhuhn.de>
9 1.1 hwr *
10 1.56 is * IPv6-over-GRE contributed by Gert Doering <gert (at) greenie.muc.de>
11 1.56 is *
12 1.1 hwr * Redistribution and use in source and binary forms, with or without
13 1.1 hwr * modification, are permitted provided that the following conditions
14 1.1 hwr * are met:
15 1.1 hwr * 1. Redistributions of source code must retain the above copyright
16 1.1 hwr * notice, this list of conditions and the following disclaimer.
17 1.1 hwr * 2. Redistributions in binary form must reproduce the above copyright
18 1.1 hwr * notice, this list of conditions and the following disclaimer in the
19 1.1 hwr * documentation and/or other materials provided with the distribution.
20 1.1 hwr * 3. All advertising materials mentioning features or use of this software
21 1.1 hwr * must display the following acknowledgement:
22 1.1 hwr * This product includes software developed by the NetBSD
23 1.1 hwr * Foundation, Inc. and its contributors.
24 1.1 hwr * 4. Neither the name of The NetBSD Foundation nor the names of its
25 1.1 hwr * contributors may be used to endorse or promote products derived
26 1.1 hwr * from this software without specific prior written permission.
27 1.1 hwr *
28 1.1 hwr * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
29 1.1 hwr * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
30 1.1 hwr * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
31 1.1 hwr * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
32 1.1 hwr * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
33 1.1 hwr * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
34 1.1 hwr * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
35 1.1 hwr * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
36 1.1 hwr * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
37 1.1 hwr * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
38 1.1 hwr * POSSIBILITY OF SUCH DAMAGE.
39 1.1 hwr */
40 1.1 hwr
41 1.1 hwr /*
42 1.1 hwr * Encapsulate L3 protocols into IP
43 1.1 hwr * See RFC 1701 and 1702 for more details.
44 1.1 hwr * If_gre is compatible with Cisco GRE tunnels, so you can
45 1.1 hwr * have a NetBSD box as the other end of a tunnel interface of a Cisco
46 1.1 hwr * router. See gre(4) for more details.
47 1.6 hwr * Also supported: IP in IP encaps (proto 55) as of RFC 2004
48 1.1 hwr */
49 1.22 lukem
50 1.22 lukem #include <sys/cdefs.h>
51 1.62 dyoung __KERNEL_RCSID(0, "$NetBSD: if_gre.c,v 1.62 2006/08/31 17:46:16 dyoung Exp $");
52 1.1 hwr
53 1.62 dyoung #include "opt_gre.h"
54 1.1 hwr #include "opt_inet.h"
55 1.9 drochner #include "opt_ns.h"
56 1.1 hwr #include "bpfilter.h"
57 1.1 hwr
58 1.54 christos #ifdef INET
59 1.1 hwr #include <sys/param.h>
60 1.62 dyoung #include <sys/file.h>
61 1.62 dyoung #include <sys/filedesc.h>
62 1.1 hwr #include <sys/malloc.h>
63 1.1 hwr #include <sys/mbuf.h>
64 1.13 martin #include <sys/proc.h>
65 1.1 hwr #include <sys/protosw.h>
66 1.1 hwr #include <sys/socket.h>
67 1.62 dyoung #include <sys/socketvar.h>
68 1.1 hwr #include <sys/ioctl.h>
69 1.10 thorpej #include <sys/queue.h>
70 1.1 hwr #if __NetBSD__
71 1.1 hwr #include <sys/systm.h>
72 1.62 dyoung #include <sys/sysctl.h>
73 1.60 elad #include <sys/kauth.h>
74 1.1 hwr #endif
75 1.1 hwr
76 1.62 dyoung #include <sys/kthread.h>
77 1.62 dyoung
78 1.1 hwr #include <machine/cpu.h>
79 1.1 hwr
80 1.1 hwr #include <net/ethertypes.h>
81 1.1 hwr #include <net/if.h>
82 1.1 hwr #include <net/if_types.h>
83 1.1 hwr #include <net/netisr.h>
84 1.1 hwr #include <net/route.h>
85 1.1 hwr
86 1.1 hwr #ifdef INET
87 1.1 hwr #include <netinet/in.h>
88 1.1 hwr #include <netinet/in_systm.h>
89 1.1 hwr #include <netinet/in_var.h>
90 1.1 hwr #include <netinet/ip.h>
91 1.1 hwr #include <netinet/ip_var.h>
92 1.1 hwr #else
93 1.4 thorpej #error "Huh? if_gre without inet?"
94 1.1 hwr #endif
95 1.1 hwr
96 1.1 hwr #ifdef NS
97 1.1 hwr #include <netns/ns.h>
98 1.1 hwr #include <netns/ns_if.h>
99 1.1 hwr #endif
100 1.1 hwr
101 1.1 hwr #ifdef NETATALK
102 1.1 hwr #include <netatalk/at.h>
103 1.1 hwr #include <netatalk/at_var.h>
104 1.1 hwr #include <netatalk/at_extern.h>
105 1.1 hwr #endif
106 1.1 hwr
107 1.1 hwr #if NBPFILTER > 0
108 1.1 hwr #include <sys/time.h>
109 1.1 hwr #include <net/bpf.h>
110 1.1 hwr #endif
111 1.1 hwr
112 1.1 hwr #include <net/if_gre.h>
113 1.1 hwr
/*
 * Default MTU of a gre(4) interface.  Working out the ideal GRE MTU
 * is not easy, so that job is left to the administrator; the default
 * is the same one other vendors use.
 */
#define GREMTU 1476

/*
 * GRE_DPRINTF(softc, fmt, ...): debugging printf.  It expands to real
 * code only when the kernel is built with GRE_DEBUG, and then prints
 * only while the interface has IFF_DEBUG set.
 */
#ifndef GRE_DEBUG
#define GRE_DPRINTF(softc, fmt, ...)	do { } while (/*CONSTCOND*/0)
#else
#define GRE_DPRINTF(softc, fmt, ...)					\
	do {								\
		if (((softc)->sc_if.if_flags & IFF_DEBUG) != 0)	\
			printf(fmt, __VA_ARGS__);			\
	} while (/*CONSTCOND*/0)
#endif /* GRE_DEBUG */
130 1.62 dyoung
131 1.11 thorpej struct gre_softc_head gre_softc_list;
132 1.26 martin int ip_gre_ttl = GRE_TTL;
133 1.1 hwr
134 1.59 thorpej static int gre_clone_create(struct if_clone *, int);
135 1.59 thorpej static int gre_clone_destroy(struct ifnet *);
136 1.10 thorpej
137 1.59 thorpej static struct if_clone gre_cloner =
138 1.10 thorpej IF_CLONE_INITIALIZER("gre", gre_clone_create, gre_clone_destroy);
139 1.1 hwr
140 1.59 thorpej static int gre_output(struct ifnet *, struct mbuf *, struct sockaddr *,
141 1.59 thorpej struct rtentry *);
142 1.59 thorpej static int gre_ioctl(struct ifnet *, u_long, caddr_t);
143 1.1 hwr
144 1.59 thorpej static int gre_compute_route(struct gre_softc *sc);
145 1.59 thorpej
146 1.62 dyoung static int gre_getsockname(struct socket *, struct mbuf *, struct lwp *);
147 1.62 dyoung static int gre_getpeername(struct socket *, struct mbuf *, struct lwp *);
148 1.62 dyoung static int gre_getnames(struct socket *, struct lwp *, struct sockaddr_in *,
149 1.62 dyoung struct sockaddr_in *);
150 1.62 dyoung
/*
 * Clear the flag that `running' points at and wake up whoever sleeps
 * on that address (gre_join() does).
 */
static void
gre_stop(int *running)
{
	int *const chan = running;

	*chan = 0;
	wakeup(chan);
}
157 1.62 dyoung
158 1.62 dyoung static void
159 1.62 dyoung gre_join(int *running)
160 1.62 dyoung {
161 1.62 dyoung int s;
162 1.62 dyoung
163 1.62 dyoung s = splnet();
164 1.62 dyoung while (*running != 0) {
165 1.62 dyoung splx(s);
166 1.62 dyoung tsleep(running, PSOCK, "grejoin", 0);
167 1.62 dyoung s = splnet();
168 1.62 dyoung }
169 1.62 dyoung splx(s);
170 1.62 dyoung }
171 1.62 dyoung
172 1.62 dyoung static void
173 1.62 dyoung gre_wakeup(struct gre_softc *sc)
174 1.62 dyoung {
175 1.62 dyoung GRE_DPRINTF(sc, "%s: enter\n", __func__);
176 1.62 dyoung sc->sc_waitchan = 1;
177 1.62 dyoung wakeup(&sc->sc_waitchan);
178 1.62 dyoung }
179 1.62 dyoung
180 1.59 thorpej static int
181 1.59 thorpej gre_clone_create(struct if_clone *ifc, int unit)
182 1.1 hwr {
183 1.8 explorer struct gre_softc *sc;
184 1.1 hwr
185 1.10 thorpej sc = malloc(sizeof(struct gre_softc), M_DEVBUF, M_WAITOK);
186 1.10 thorpej memset(sc, 0, sizeof(struct gre_softc));
187 1.10 thorpej
188 1.50 itojun snprintf(sc->sc_if.if_xname, sizeof(sc->sc_if.if_xname), "%s%d",
189 1.50 itojun ifc->ifc_name, unit);
190 1.10 thorpej sc->sc_if.if_softc = sc;
191 1.51 tron sc->sc_if.if_type = IFT_TUNNEL;
192 1.34 itojun sc->sc_if.if_addrlen = 0;
193 1.10 thorpej sc->sc_if.if_hdrlen = 24; /* IP + GRE */
194 1.15 thorpej sc->sc_if.if_dlt = DLT_NULL;
195 1.20 itojun sc->sc_if.if_mtu = GREMTU;
196 1.10 thorpej sc->sc_if.if_flags = IFF_POINTOPOINT|IFF_MULTICAST;
197 1.10 thorpej sc->sc_if.if_output = gre_output;
198 1.10 thorpej sc->sc_if.if_ioctl = gre_ioctl;
199 1.10 thorpej sc->g_dst.s_addr = sc->g_src.s_addr = INADDR_ANY;
200 1.62 dyoung sc->g_dstport = sc->g_srcport = 0;
201 1.10 thorpej sc->g_proto = IPPROTO_GRE;
202 1.62 dyoung IFQ_SET_READY(&sc->sc_snd);
203 1.62 dyoung IFQ_SET_MAXLEN(&sc->sc_snd, IFQ_MAXLEN);
204 1.35 itojun sc->sc_if.if_flags |= IFF_LINK0;
205 1.10 thorpej if_attach(&sc->sc_if);
206 1.16 thorpej if_alloc_sadl(&sc->sc_if);
207 1.1 hwr #if NBPFILTER > 0
208 1.14 thorpej bpfattach(&sc->sc_if, DLT_NULL, sizeof(u_int32_t));
209 1.1 hwr #endif
210 1.10 thorpej LIST_INSERT_HEAD(&gre_softc_list, sc, sc_list);
211 1.10 thorpej return (0);
212 1.10 thorpej }
213 1.1 hwr
214 1.59 thorpej static int
215 1.59 thorpej gre_clone_destroy(struct ifnet *ifp)
216 1.10 thorpej {
217 1.10 thorpej struct gre_softc *sc = ifp->if_softc;
218 1.10 thorpej
219 1.10 thorpej LIST_REMOVE(sc, sc_list);
220 1.10 thorpej #if NBPFILTER > 0
221 1.10 thorpej bpfdetach(ifp);
222 1.10 thorpej #endif
223 1.10 thorpej if_detach(ifp);
224 1.62 dyoung gre_wakeup(sc);
225 1.62 dyoung gre_join(&sc->sc_thread);
226 1.62 dyoung if (sc->sc_fp != NULL) {
227 1.62 dyoung closef(sc->sc_fp, curlwp);
228 1.62 dyoung sc->sc_fp = NULL;
229 1.62 dyoung }
230 1.10 thorpej free(sc, M_DEVBUF);
231 1.53 peter
232 1.53 peter return (0);
233 1.1 hwr }
234 1.1 hwr
235 1.62 dyoung static void
236 1.62 dyoung gre_receive(struct socket *so, caddr_t arg, int waitflag)
237 1.62 dyoung {
238 1.62 dyoung struct gre_softc *sc = (struct gre_softc *)arg;
239 1.62 dyoung
240 1.62 dyoung GRE_DPRINTF(sc, "%s: enter\n", __func__);
241 1.62 dyoung
242 1.62 dyoung gre_wakeup(sc);
243 1.62 dyoung }
244 1.62 dyoung
245 1.62 dyoung static void
246 1.62 dyoung gre_upcall_add(struct socket *so, caddr_t arg)
247 1.62 dyoung {
248 1.62 dyoung /* XXX What if the kernel already set an upcall? */
249 1.62 dyoung so->so_upcallarg = arg;
250 1.62 dyoung so->so_upcall = gre_receive;
251 1.62 dyoung so->so_rcv.sb_flags |= SB_UPCALL;
252 1.62 dyoung }
253 1.62 dyoung
254 1.62 dyoung static void
255 1.62 dyoung gre_upcall_remove(struct socket *so)
256 1.62 dyoung {
257 1.62 dyoung /* XXX What if the kernel already set an upcall? */
258 1.62 dyoung so->so_rcv.sb_flags &= ~SB_UPCALL;
259 1.62 dyoung so->so_upcallarg = NULL;
260 1.62 dyoung so->so_upcall = NULL;
261 1.62 dyoung }
262 1.62 dyoung
263 1.62 dyoung static void
264 1.62 dyoung gre_sodestroy(struct socket **sop)
265 1.62 dyoung {
266 1.62 dyoung gre_upcall_remove(*sop);
267 1.62 dyoung soshutdown(*sop, SHUT_RDWR);
268 1.62 dyoung soclose(*sop);
269 1.62 dyoung *sop = NULL;
270 1.62 dyoung }
271 1.62 dyoung
272 1.62 dyoung static struct mbuf *
273 1.62 dyoung gre_getsockmbuf(struct socket *so)
274 1.62 dyoung {
275 1.62 dyoung struct mbuf *m;
276 1.62 dyoung
277 1.62 dyoung m = m_get(M_WAIT, MT_SONAME);
278 1.62 dyoung if (m != NULL)
279 1.62 dyoung MCLAIM(m, so->so_mowner);
280 1.62 dyoung return m;
281 1.62 dyoung }
282 1.62 dyoung
283 1.62 dyoung static int
284 1.62 dyoung gre_socreate1(struct gre_softc *sc, struct lwp *l, struct gre_soparm *sp,
285 1.62 dyoung struct socket **sop)
286 1.62 dyoung {
287 1.62 dyoung int rc;
288 1.62 dyoung struct mbuf *m;
289 1.62 dyoung struct sockaddr_in *sin;
290 1.62 dyoung struct socket *so;
291 1.62 dyoung
292 1.62 dyoung GRE_DPRINTF(sc, "%s: enter\n", __func__);
293 1.62 dyoung rc = socreate(AF_INET, sop, SOCK_DGRAM, IPPROTO_UDP, l);
294 1.62 dyoung if (rc != 0) {
295 1.62 dyoung GRE_DPRINTF(sc, "%s: socreate failed\n", __func__);
296 1.62 dyoung return rc;
297 1.62 dyoung }
298 1.62 dyoung
299 1.62 dyoung so = *sop;
300 1.62 dyoung
301 1.62 dyoung gre_upcall_add(so, (caddr_t)sc);
302 1.62 dyoung if ((m = gre_getsockmbuf(so)) == NULL) {
303 1.62 dyoung rc = ENOBUFS;
304 1.62 dyoung goto out;
305 1.62 dyoung }
306 1.62 dyoung sin = mtod(m, struct sockaddr_in *);
307 1.62 dyoung sin->sin_len = m->m_len = sizeof(struct sockaddr_in);
308 1.62 dyoung sin->sin_family = AF_INET;
309 1.62 dyoung sin->sin_addr = sc->g_src;
310 1.62 dyoung sin->sin_port = sc->g_srcport;
311 1.62 dyoung
312 1.62 dyoung GRE_DPRINTF(sc, "%s: bind 0x%08" PRIx32 " port %d\n", __func__,
313 1.62 dyoung sin->sin_addr.s_addr, ntohs(sin->sin_port));
314 1.62 dyoung if ((rc = sobind(so, m, l)) != 0) {
315 1.62 dyoung GRE_DPRINTF(sc, "%s: sobind failed\n", __func__);
316 1.62 dyoung goto out;
317 1.62 dyoung }
318 1.62 dyoung
319 1.62 dyoung if (sc->g_srcport == 0) {
320 1.62 dyoung if (gre_getsockname(so, m, l) != 0) {
321 1.62 dyoung GRE_DPRINTF(sc, "%s: gre_getsockname failed\n",
322 1.62 dyoung __func__);
323 1.62 dyoung goto out;
324 1.62 dyoung }
325 1.62 dyoung sc->g_srcport = sin->sin_port;
326 1.62 dyoung }
327 1.62 dyoung
328 1.62 dyoung sin->sin_addr = sc->g_dst;
329 1.62 dyoung sin->sin_port = sc->g_dstport;
330 1.62 dyoung
331 1.62 dyoung rc = soconnect(so, m, l);
332 1.62 dyoung
333 1.62 dyoung if (rc != 0) {
334 1.62 dyoung GRE_DPRINTF(sc, "%s: soconnect failed\n", __func__);
335 1.62 dyoung goto out;
336 1.62 dyoung }
337 1.62 dyoung
338 1.62 dyoung *mtod(m, int *) = ip_gre_ttl;
339 1.62 dyoung rc = (*so->so_proto->pr_ctloutput)(PRCO_SETOPT, so, IPPROTO_IP, IP_TTL,
340 1.62 dyoung &m);
341 1.62 dyoung m = NULL;
342 1.62 dyoung if (rc != 0) {
343 1.62 dyoung printf("%s: setopt ttl failed\n", __func__);
344 1.62 dyoung rc = 0;
345 1.62 dyoung }
346 1.62 dyoung out:
347 1.62 dyoung m_freem(m);
348 1.62 dyoung
349 1.62 dyoung if (rc != 0)
350 1.62 dyoung gre_sodestroy(sop);
351 1.62 dyoung else
352 1.62 dyoung *sp = sc->sc_sp;
353 1.62 dyoung
354 1.62 dyoung return rc;
355 1.62 dyoung }
356 1.62 dyoung
357 1.62 dyoung static void
358 1.62 dyoung gre_thread1(struct gre_softc *sc, struct lwp *l)
359 1.62 dyoung {
360 1.62 dyoung int flags, rc, s;
361 1.62 dyoung const struct gre_h *gh;
362 1.62 dyoung struct ifnet *ifp = &sc->sc_if;
363 1.62 dyoung struct mbuf *m;
364 1.62 dyoung struct socket *so = NULL;
365 1.62 dyoung struct uio uio;
366 1.62 dyoung struct gre_soparm sp;
367 1.62 dyoung
368 1.62 dyoung GRE_DPRINTF(sc, "%s: enter\n", __func__);
369 1.62 dyoung s = splnet();
370 1.62 dyoung
371 1.62 dyoung sc->sc_waitchan = 1;
372 1.62 dyoung
373 1.62 dyoung memset(&sp, 0, sizeof(sp));
374 1.62 dyoung memset(&uio, 0, sizeof(uio));
375 1.62 dyoung
376 1.62 dyoung ifp->if_flags |= IFF_RUNNING;
377 1.62 dyoung
378 1.62 dyoung for (;;) {
379 1.62 dyoung while (sc->sc_waitchan == 0) {
380 1.62 dyoung splx(s);
381 1.62 dyoung GRE_DPRINTF(sc, "%s: sleeping\n", __func__);
382 1.62 dyoung tsleep(&sc->sc_waitchan, PSOCK, "grewait", 0);
383 1.62 dyoung s = splnet();
384 1.62 dyoung }
385 1.62 dyoung sc->sc_waitchan = 0;
386 1.62 dyoung GRE_DPRINTF(sc, "%s: awake\n", __func__);
387 1.62 dyoung if ((ifp->if_flags & IFF_UP) != IFF_UP) {
388 1.62 dyoung GRE_DPRINTF(sc, "%s: not up & running; exiting\n",
389 1.62 dyoung __func__);
390 1.62 dyoung break;
391 1.62 dyoung }
392 1.62 dyoung if (sc->g_proto != IPPROTO_UDP) {
393 1.62 dyoung GRE_DPRINTF(sc, "%s: not udp; exiting\n", __func__);
394 1.62 dyoung break;
395 1.62 dyoung }
396 1.62 dyoung /* XXX optimize */
397 1.62 dyoung if (memcmp(&sp, &sc->sc_sp, sizeof(sp)) != 0) {
398 1.62 dyoung GRE_DPRINTF(sc, "%s: parameters changed\n", __func__);
399 1.62 dyoung
400 1.62 dyoung if (sp.sp_fp != NULL) {
401 1.62 dyoung FILE_UNUSE(sp.sp_fp, NULL);
402 1.62 dyoung sp.sp_fp = NULL;
403 1.62 dyoung so = NULL;
404 1.62 dyoung } else if (so != NULL)
405 1.62 dyoung gre_sodestroy(&so);
406 1.62 dyoung
407 1.62 dyoung if (sc->sc_fp != NULL) {
408 1.62 dyoung so = (struct socket *)sc->sc_fp->f_data;
409 1.62 dyoung gre_upcall_add(so, (caddr_t)sc);
410 1.62 dyoung sp = sc->sc_sp;
411 1.62 dyoung FILE_USE(sp.sp_fp);
412 1.62 dyoung } else if (gre_socreate1(sc, l, &sp, &so) != 0)
413 1.62 dyoung goto out;
414 1.62 dyoung }
415 1.62 dyoung for (;;) {
416 1.62 dyoung flags = MSG_DONTWAIT;
417 1.62 dyoung uio.uio_resid = 1000000;
418 1.62 dyoung rc = (*so->so_receive)(so, NULL, &uio, &m, NULL,
419 1.62 dyoung &flags);
420 1.62 dyoung /* TBD Back off if ECONNREFUSED (indicates
421 1.62 dyoung * ICMP Port Unreachable)?
422 1.62 dyoung */
423 1.62 dyoung if (rc == EWOULDBLOCK) {
424 1.62 dyoung GRE_DPRINTF(sc, "%s: so_receive EWOULDBLOCK\n",
425 1.62 dyoung __func__);
426 1.62 dyoung break;
427 1.62 dyoung } else if (rc != 0 || m == NULL) {
428 1.62 dyoung GRE_DPRINTF(sc, "%s: rc %d m %p\n",
429 1.62 dyoung ifp->if_xname, rc, (void *)m);
430 1.62 dyoung continue;
431 1.62 dyoung } else
432 1.62 dyoung GRE_DPRINTF(sc, "%s: so_receive ok\n",
433 1.62 dyoung __func__);
434 1.62 dyoung if (m->m_len < sizeof(*gh) &&
435 1.62 dyoung (m = m_pullup(m, sizeof(*gh))) == NULL) {
436 1.62 dyoung GRE_DPRINTF(sc, "%s: m_pullup failed\n",
437 1.62 dyoung __func__);
438 1.62 dyoung continue;
439 1.62 dyoung }
440 1.62 dyoung gh = mtod(m, const struct gre_h *);
441 1.62 dyoung
442 1.62 dyoung if (gre_input3(sc, m, 0, IPPROTO_GRE, gh) == 0) {
443 1.62 dyoung GRE_DPRINTF(sc, "%s: dropping unsupported\n",
444 1.62 dyoung __func__);
445 1.62 dyoung ifp->if_ierrors++;
446 1.62 dyoung m_freem(m);
447 1.62 dyoung }
448 1.62 dyoung }
449 1.62 dyoung for (;;) {
450 1.62 dyoung IF_DEQUEUE(&sc->sc_snd, m);
451 1.62 dyoung if (m == NULL)
452 1.62 dyoung break;
453 1.62 dyoung GRE_DPRINTF(sc, "%s: dequeue\n", __func__);
454 1.62 dyoung if ((so->so_state & SS_ISCONNECTED) == 0) {
455 1.62 dyoung GRE_DPRINTF(sc, "%s: not connected\n",
456 1.62 dyoung __func__);
457 1.62 dyoung m_freem(m);
458 1.62 dyoung continue;
459 1.62 dyoung }
460 1.62 dyoung rc = (*so->so_send)(so, NULL, NULL, m, NULL, 0, l);
461 1.62 dyoung /* XXX handle ENOBUFS? */
462 1.62 dyoung if (rc != 0)
463 1.62 dyoung GRE_DPRINTF(sc, "%s: so_send failed\n",
464 1.62 dyoung __func__);
465 1.62 dyoung }
466 1.62 dyoung /* Give the software interrupt queues a chance to
467 1.62 dyoung * run, or else when I send a ping from gre0 to gre1 on
468 1.62 dyoung * the same host, gre0 will not wake for the reply.
469 1.62 dyoung */
470 1.62 dyoung splx(s);
471 1.62 dyoung s = splnet();
472 1.62 dyoung }
473 1.62 dyoung if (sp.sp_fp != NULL) {
474 1.62 dyoung GRE_DPRINTF(sc, "%s: removing upcall\n", __func__);
475 1.62 dyoung gre_upcall_remove(so);
476 1.62 dyoung FILE_UNUSE(sp.sp_fp, NULL);
477 1.62 dyoung sp.sp_fp = NULL;
478 1.62 dyoung } else
479 1.62 dyoung gre_sodestroy(&so);
480 1.62 dyoung out:
481 1.62 dyoung GRE_DPRINTF(sc, "%s: stopping\n", __func__);
482 1.62 dyoung if (sc->g_proto == IPPROTO_UDP)
483 1.62 dyoung ifp->if_flags &= ~IFF_RUNNING;
484 1.62 dyoung IFQ_PURGE(&sc->sc_snd);
485 1.62 dyoung gre_stop(&sc->sc_thread);
486 1.62 dyoung /* must not touch sc after this! */
487 1.62 dyoung GRE_DPRINTF(sc, "%s: restore ipl\n", __func__);
488 1.62 dyoung splx(s);
489 1.62 dyoung }
490 1.62 dyoung
491 1.62 dyoung static void
492 1.62 dyoung gre_thread(void *arg)
493 1.62 dyoung {
494 1.62 dyoung struct gre_softc *sc = (struct gre_softc *)arg;
495 1.62 dyoung
496 1.62 dyoung gre_thread1(sc, curlwp);
497 1.62 dyoung /* must not touch sc after this! */
498 1.62 dyoung kthread_exit(0);
499 1.62 dyoung }
500 1.62 dyoung
501 1.62 dyoung int
502 1.62 dyoung gre_input3(struct gre_softc *sc, struct mbuf *m, int hlen, u_char proto,
503 1.62 dyoung const struct gre_h *gh)
504 1.62 dyoung {
505 1.62 dyoung u_int16_t flags;
506 1.62 dyoung #if NBPFILTER > 0
507 1.62 dyoung u_int32_t af = AF_INET; /* af passed to BPF tap */
508 1.62 dyoung #endif
509 1.62 dyoung int s, isr;
510 1.62 dyoung struct ifqueue *ifq;
511 1.62 dyoung
512 1.62 dyoung sc->sc_if.if_ipackets++;
513 1.62 dyoung sc->sc_if.if_ibytes += m->m_pkthdr.len;
514 1.62 dyoung
515 1.62 dyoung switch (proto) {
516 1.62 dyoung case IPPROTO_GRE:
517 1.62 dyoung hlen += sizeof(struct gre_h);
518 1.62 dyoung
519 1.62 dyoung /* process GRE flags as packet can be of variable len */
520 1.62 dyoung flags = ntohs(gh->flags);
521 1.62 dyoung
522 1.62 dyoung /* Checksum & Offset are present */
523 1.62 dyoung if ((flags & GRE_CP) | (flags & GRE_RP))
524 1.62 dyoung hlen += 4;
525 1.62 dyoung /* We don't support routing fields (variable length) */
526 1.62 dyoung if (flags & GRE_RP)
527 1.62 dyoung return (0);
528 1.62 dyoung if (flags & GRE_KP)
529 1.62 dyoung hlen += 4;
530 1.62 dyoung if (flags & GRE_SP)
531 1.62 dyoung hlen += 4;
532 1.62 dyoung
533 1.62 dyoung switch (ntohs(gh->ptype)) { /* ethertypes */
534 1.62 dyoung case ETHERTYPE_IP: /* shouldn't need a schednetisr(), as */
535 1.62 dyoung ifq = &ipintrq; /* we are in ip_input */
536 1.62 dyoung isr = NETISR_IP;
537 1.62 dyoung break;
538 1.62 dyoung #ifdef NS
539 1.62 dyoung case ETHERTYPE_NS:
540 1.62 dyoung ifq = &nsintrq;
541 1.62 dyoung isr = NETISR_NS;
542 1.62 dyoung #if NBPFILTER > 0
543 1.62 dyoung af = AF_NS;
544 1.62 dyoung #endif
545 1.62 dyoung break;
546 1.62 dyoung #endif
547 1.62 dyoung #ifdef NETATALK
548 1.62 dyoung case ETHERTYPE_ATALK:
549 1.62 dyoung ifq = &atintrq1;
550 1.62 dyoung isr = NETISR_ATALK;
551 1.62 dyoung #if NBPFILTER > 0
552 1.62 dyoung af = AF_APPLETALK;
553 1.62 dyoung #endif
554 1.62 dyoung break;
555 1.62 dyoung #endif
556 1.62 dyoung #ifdef INET6
557 1.62 dyoung case ETHERTYPE_IPV6:
558 1.62 dyoung GRE_DPRINTF(sc, "%s: IPv6 packet\n", __func__);
559 1.62 dyoung ifq = &ip6intrq;
560 1.62 dyoung isr = NETISR_IPV6;
561 1.62 dyoung #if NBPFILTER > 0
562 1.62 dyoung af = AF_INET6;
563 1.62 dyoung #endif
564 1.62 dyoung break;
565 1.62 dyoung #endif
566 1.62 dyoung default: /* others not yet supported */
567 1.62 dyoung printf("%s: unhandled ethertype 0x%04x\n", __func__,
568 1.62 dyoung ntohs(gh->ptype));
569 1.62 dyoung return (0);
570 1.62 dyoung }
571 1.62 dyoung break;
572 1.62 dyoung default:
573 1.62 dyoung /* others not yet supported */
574 1.62 dyoung return (0);
575 1.62 dyoung }
576 1.62 dyoung
577 1.62 dyoung if (hlen > m->m_pkthdr.len) {
578 1.62 dyoung m_freem(m);
579 1.62 dyoung sc->sc_if.if_ierrors++;
580 1.62 dyoung return (EINVAL);
581 1.62 dyoung }
582 1.62 dyoung m_adj(m, hlen);
583 1.62 dyoung
584 1.62 dyoung #if NBPFILTER > 0
585 1.62 dyoung if (sc->sc_if.if_bpf != NULL)
586 1.62 dyoung bpf_mtap_af(sc->sc_if.if_bpf, af, m);
587 1.62 dyoung #endif /*NBPFILTER > 0*/
588 1.62 dyoung
589 1.62 dyoung m->m_pkthdr.rcvif = &sc->sc_if;
590 1.62 dyoung
591 1.62 dyoung s = splnet(); /* possible */
592 1.62 dyoung if (IF_QFULL(ifq)) {
593 1.62 dyoung IF_DROP(ifq);
594 1.62 dyoung m_freem(m);
595 1.62 dyoung } else {
596 1.62 dyoung IF_ENQUEUE(ifq, m);
597 1.62 dyoung }
598 1.62 dyoung /* we need schednetisr since the address family may change */
599 1.62 dyoung schednetisr(isr);
600 1.62 dyoung splx(s);
601 1.62 dyoung
602 1.62 dyoung return (1); /* packet is done, no further processing needed */
603 1.62 dyoung }
604 1.62 dyoung
605 1.20 itojun /*
606 1.1 hwr * The output routine. Takes a packet and encapsulates it in the protocol
607 1.6 hwr * given by sc->g_proto. See also RFC 1701 and RFC 2004
608 1.1 hwr */
609 1.59 thorpej static int
610 1.8 explorer gre_output(struct ifnet *ifp, struct mbuf *m, struct sockaddr *dst,
611 1.8 explorer struct rtentry *rt)
612 1.1 hwr {
613 1.62 dyoung int error = 0, hlen;
614 1.10 thorpej struct gre_softc *sc = ifp->if_softc;
615 1.62 dyoung struct greip *gi;
616 1.62 dyoung struct gre_h *gh;
617 1.62 dyoung struct ip *eip, *ip;
618 1.56 is u_int8_t ip_tos = 0;
619 1.48 itojun u_int16_t etype = 0;
620 1.20 itojun struct mobile_h mob_h;
621 1.24 martin
622 1.39 itojun if ((ifp->if_flags & (IFF_UP | IFF_RUNNING)) == 0 ||
623 1.37 itojun sc->g_src.s_addr == INADDR_ANY || sc->g_dst.s_addr == INADDR_ANY) {
624 1.37 itojun m_freem(m);
625 1.38 itojun error = ENETDOWN;
626 1.38 itojun goto end;
627 1.37 itojun }
628 1.1 hwr
629 1.62 dyoung gi = NULL;
630 1.41 itojun ip = NULL;
631 1.1 hwr
632 1.1 hwr #if NBPFILTER >0
633 1.52 christos if (ifp->if_bpf)
634 1.52 christos bpf_mtap_af(ifp->if_bpf, dst->sa_family, m);
635 1.1 hwr #endif
636 1.1 hwr
637 1.26 martin m->m_flags &= ~(M_BCAST|M_MCAST);
638 1.1 hwr
639 1.62 dyoung switch (sc->g_proto) {
640 1.62 dyoung case IPPROTO_MOBILE:
641 1.3 hwr if (dst->sa_family == AF_INET) {
642 1.3 hwr int msiz;
643 1.3 hwr
644 1.62 dyoung if (M_UNWRITABLE(m, sizeof(*ip)) &&
645 1.62 dyoung (m = m_pullup(m, sizeof(*ip))) == NULL) {
646 1.62 dyoung error = ENOBUFS;
647 1.62 dyoung goto end;
648 1.62 dyoung }
649 1.41 itojun ip = mtod(m, struct ip *);
650 1.3 hwr
651 1.8 explorer memset(&mob_h, 0, MOB_H_SIZ_L);
652 1.41 itojun mob_h.proto = (ip->ip_p) << 8;
653 1.41 itojun mob_h.odst = ip->ip_dst.s_addr;
654 1.41 itojun ip->ip_dst.s_addr = sc->g_dst.s_addr;
655 1.3 hwr
656 1.3 hwr /*
657 1.8 explorer * If the packet comes from our host, we only change
658 1.8 explorer * the destination address in the IP header.
659 1.8 explorer * Else we also need to save and change the source
660 1.3 hwr */
661 1.41 itojun if (in_hosteq(ip->ip_src, sc->g_src)) {
662 1.8 explorer msiz = MOB_H_SIZ_S;
663 1.3 hwr } else {
664 1.3 hwr mob_h.proto |= MOB_H_SBIT;
665 1.41 itojun mob_h.osrc = ip->ip_src.s_addr;
666 1.41 itojun ip->ip_src.s_addr = sc->g_src.s_addr;
667 1.8 explorer msiz = MOB_H_SIZ_L;
668 1.3 hwr }
669 1.3 hwr HTONS(mob_h.proto);
670 1.48 itojun mob_h.hcrc = gre_in_cksum((u_int16_t *)&mob_h, msiz);
671 1.3 hwr
672 1.62 dyoung M_PREPEND(m, msiz, M_DONTWAIT);
673 1.62 dyoung if (m == NULL) {
674 1.62 dyoung error = ENOBUFS;
675 1.62 dyoung goto end;
676 1.3 hwr }
677 1.62 dyoung /* XXX Assuming that ip does not dangle after
678 1.62 dyoung * M_PREPEND. In practice, that's true, but
679 1.62 dyoung * that's in M_PREPEND's contract.
680 1.62 dyoung */
681 1.62 dyoung memmove(mtod(m, caddr_t), ip, sizeof(*ip));
682 1.41 itojun ip = mtod(m, struct ip *);
683 1.41 itojun memcpy((caddr_t)(ip + 1), &mob_h, (unsigned)msiz);
684 1.42 itojun ip->ip_len = htons(ntohs(ip->ip_len) + msiz);
685 1.3 hwr } else { /* AF_INET */
686 1.3 hwr IF_DROP(&ifp->if_snd);
687 1.3 hwr m_freem(m);
688 1.38 itojun error = EINVAL;
689 1.38 itojun goto end;
690 1.3 hwr }
691 1.62 dyoung break;
692 1.62 dyoung case IPPROTO_UDP:
693 1.62 dyoung case IPPROTO_GRE:
694 1.62 dyoung GRE_DPRINTF(sc, "%s: dst->sa_family=%d\n", __func__,
695 1.62 dyoung dst->sa_family);
696 1.20 itojun switch (dst->sa_family) {
697 1.1 hwr case AF_INET:
698 1.41 itojun ip = mtod(m, struct ip *);
699 1.56 is ip_tos = ip->ip_tos;
700 1.8 explorer etype = ETHERTYPE_IP;
701 1.1 hwr break;
702 1.1 hwr #ifdef NETATALK
703 1.1 hwr case AF_APPLETALK:
704 1.8 explorer etype = ETHERTYPE_ATALK;
705 1.1 hwr break;
706 1.1 hwr #endif
707 1.1 hwr #ifdef NS
708 1.1 hwr case AF_NS:
709 1.8 explorer etype = ETHERTYPE_NS;
710 1.1 hwr break;
711 1.1 hwr #endif
712 1.56 is #ifdef INET6
713 1.56 is case AF_INET6:
714 1.56 is etype = ETHERTYPE_IPV6;
715 1.56 is break;
716 1.56 is #endif
717 1.1 hwr default:
718 1.1 hwr IF_DROP(&ifp->if_snd);
719 1.1 hwr m_freem(m);
720 1.38 itojun error = EAFNOSUPPORT;
721 1.38 itojun goto end;
722 1.1 hwr }
723 1.62 dyoung break;
724 1.62 dyoung default:
725 1.1 hwr IF_DROP(&ifp->if_snd);
726 1.1 hwr m_freem(m);
727 1.38 itojun error = EINVAL;
728 1.38 itojun goto end;
729 1.1 hwr }
730 1.1 hwr
731 1.62 dyoung switch (sc->g_proto) {
732 1.62 dyoung case IPPROTO_GRE:
733 1.62 dyoung hlen = sizeof(struct greip);
734 1.62 dyoung break;
735 1.62 dyoung case IPPROTO_UDP:
736 1.62 dyoung hlen = sizeof(struct gre_h);
737 1.62 dyoung break;
738 1.62 dyoung default:
739 1.62 dyoung hlen = 0;
740 1.62 dyoung break;
741 1.62 dyoung }
742 1.62 dyoung
743 1.62 dyoung M_PREPEND(m, hlen, M_DONTWAIT);
744 1.62 dyoung
745 1.62 dyoung if (m == NULL) {
746 1.1 hwr IF_DROP(&ifp->if_snd);
747 1.38 itojun error = ENOBUFS;
748 1.38 itojun goto end;
749 1.1 hwr }
750 1.1 hwr
751 1.62 dyoung switch (sc->g_proto) {
752 1.62 dyoung case IPPROTO_UDP:
753 1.62 dyoung gh = mtod(m, struct gre_h *);
754 1.62 dyoung memset(gh, 0, sizeof(*gh));
755 1.62 dyoung gh->ptype = htons(etype);
756 1.62 dyoung /* XXX Need to handle IP ToS. Look at how I handle IP TTL. */
757 1.62 dyoung break;
758 1.62 dyoung case IPPROTO_GRE:
759 1.62 dyoung gi = mtod(m, struct greip *);
760 1.62 dyoung gh = &gi->gi_g;
761 1.62 dyoung eip = &gi->gi_i;
762 1.1 hwr /* we don't have any GRE flags for now */
763 1.62 dyoung memset(gh, 0, sizeof(*gh));
764 1.62 dyoung gh->ptype = htons(etype);
765 1.62 dyoung eip->ip_src = sc->g_src;
766 1.62 dyoung eip->ip_dst = sc->g_dst;
767 1.62 dyoung eip->ip_hl = (sizeof(struct ip)) >> 2;
768 1.62 dyoung eip->ip_ttl = ip_gre_ttl;
769 1.62 dyoung eip->ip_tos = ip_tos;
770 1.62 dyoung eip->ip_len = htons(m->m_pkthdr.len);
771 1.62 dyoung eip->ip_p = sc->g_proto;
772 1.62 dyoung break;
773 1.62 dyoung case IPPROTO_MOBILE:
774 1.62 dyoung eip = mtod(m, struct ip *);
775 1.62 dyoung eip->ip_p = sc->g_proto;
776 1.62 dyoung break;
777 1.62 dyoung default:
778 1.62 dyoung error = EPROTONOSUPPORT;
779 1.62 dyoung m_freem(m);
780 1.62 dyoung goto end;
781 1.3 hwr }
782 1.1 hwr
783 1.1 hwr ifp->if_opackets++;
784 1.8 explorer ifp->if_obytes += m->m_pkthdr.len;
785 1.62 dyoung
786 1.1 hwr /* send it off */
787 1.62 dyoung if (sc->g_proto == IPPROTO_UDP) {
788 1.62 dyoung if (IF_QFULL(&sc->sc_snd)) {
789 1.62 dyoung IF_DROP(&sc->sc_snd);
790 1.62 dyoung error = ENOBUFS;
791 1.62 dyoung m_freem(m);
792 1.62 dyoung } else {
793 1.62 dyoung IF_ENQUEUE(&sc->sc_snd, m);
794 1.62 dyoung gre_wakeup(sc);
795 1.62 dyoung error = 0;
796 1.62 dyoung }
797 1.62 dyoung } else {
798 1.62 dyoung error = ip_output(m, NULL, &sc->route, 0,
799 1.62 dyoung (struct ip_moptions *)NULL, (struct socket *)NULL);
800 1.62 dyoung }
801 1.38 itojun end:
802 1.8 explorer if (error)
803 1.1 hwr ifp->if_oerrors++;
804 1.8 explorer return (error);
805 1.1 hwr }
806 1.1 hwr
807 1.62 dyoung /* Must be called at IPL_NET. */
808 1.62 dyoung static int
809 1.62 dyoung gre_kick(struct gre_softc *sc)
810 1.62 dyoung {
811 1.62 dyoung int rc;
812 1.62 dyoung struct ifnet *ifp = &sc->sc_if;
813 1.62 dyoung
814 1.62 dyoung if (sc->g_proto == IPPROTO_UDP && (ifp->if_flags & IFF_UP) == IFF_UP &&
815 1.62 dyoung !sc->sc_thread) {
816 1.62 dyoung sc->sc_thread = 1;
817 1.62 dyoung rc = kthread_create1(gre_thread, (void *)sc, NULL,
818 1.62 dyoung ifp->if_xname);
819 1.62 dyoung if (rc != 0)
820 1.62 dyoung gre_stop(&sc->sc_thread);
821 1.62 dyoung return rc;
822 1.62 dyoung } else {
823 1.62 dyoung gre_wakeup(sc);
824 1.62 dyoung return 0;
825 1.62 dyoung }
826 1.62 dyoung }
827 1.62 dyoung
828 1.62 dyoung static int
829 1.62 dyoung gre_getname(struct socket *so, int req, struct mbuf *nam, struct lwp *l)
830 1.62 dyoung {
831 1.62 dyoung int s, error;
832 1.62 dyoung
833 1.62 dyoung s = splsoftnet();
834 1.62 dyoung error = (*so->so_proto->pr_usrreq)(so, req, (struct mbuf *)0,
835 1.62 dyoung nam, (struct mbuf *)0, l);
836 1.62 dyoung splx(s);
837 1.62 dyoung return error;
838 1.62 dyoung }
839 1.62 dyoung
840 1.62 dyoung static int
841 1.62 dyoung gre_getsockname(struct socket *so, struct mbuf *nam, struct lwp *l)
842 1.62 dyoung {
843 1.62 dyoung return gre_getname(so, PRU_SOCKADDR, nam, l);
844 1.62 dyoung }
845 1.62 dyoung
846 1.62 dyoung static int
847 1.62 dyoung gre_getpeername(struct socket *so, struct mbuf *nam, struct lwp *l)
848 1.62 dyoung {
849 1.62 dyoung return gre_getname(so, PRU_PEERADDR, nam, l);
850 1.62 dyoung }
851 1.62 dyoung
852 1.62 dyoung static int
853 1.62 dyoung gre_getnames(struct socket *so, struct lwp *l, struct sockaddr_in *src,
854 1.62 dyoung struct sockaddr_in *dst)
855 1.62 dyoung {
856 1.62 dyoung struct mbuf *m;
857 1.62 dyoung struct sockaddr_in *sin;
858 1.62 dyoung int rc;
859 1.62 dyoung
860 1.62 dyoung if ((m = gre_getsockmbuf(so)) == NULL)
861 1.62 dyoung return ENOBUFS;
862 1.62 dyoung
863 1.62 dyoung sin = mtod(m, struct sockaddr_in *);
864 1.62 dyoung
865 1.62 dyoung if ((rc = gre_getsockname(so, m, l)) != 0)
866 1.62 dyoung goto out;
867 1.62 dyoung if (sin->sin_family != AF_INET) {
868 1.62 dyoung rc = EAFNOSUPPORT;
869 1.62 dyoung goto out;
870 1.62 dyoung }
871 1.62 dyoung *src = *sin;
872 1.62 dyoung
873 1.62 dyoung if ((rc = gre_getpeername(so, m, l)) != 0)
874 1.62 dyoung goto out;
875 1.62 dyoung if (sin->sin_family != AF_INET) {
876 1.62 dyoung rc = EAFNOSUPPORT;
877 1.62 dyoung goto out;
878 1.62 dyoung }
879 1.62 dyoung *dst = *sin;
880 1.62 dyoung
881 1.62 dyoung out:
882 1.62 dyoung m_freem(m);
883 1.62 dyoung return rc;
884 1.62 dyoung }
885 1.62 dyoung
886 1.59 thorpej static int
887 1.8 explorer gre_ioctl(struct ifnet *ifp, u_long cmd, caddr_t data)
888 1.1 hwr {
889 1.62 dyoung u_char oproto;
890 1.62 dyoung struct file *fp, *ofp;
891 1.62 dyoung struct socket *so;
892 1.62 dyoung struct sockaddr_in dst, src;
893 1.62 dyoung struct proc *p = curproc; /* XXX */
894 1.61 ad struct lwp *l = curlwp; /* XXX */
895 1.8 explorer struct ifreq *ifr = (struct ifreq *)data;
896 1.28 itojun struct if_laddrreq *lifr = (struct if_laddrreq *)data;
897 1.8 explorer struct gre_softc *sc = ifp->if_softc;
898 1.1 hwr int s;
899 1.1 hwr struct sockaddr_in si;
900 1.8 explorer struct sockaddr *sa = NULL;
901 1.1 hwr int error;
902 1.1 hwr
903 1.61 ad switch (cmd) {
904 1.61 ad case SIOCSIFFLAGS:
905 1.61 ad case SIOCSIFMTU:
906 1.61 ad case GRESPROTO:
907 1.61 ad case GRESADDRD:
908 1.61 ad case GRESADDRS:
909 1.62 dyoung case GRESSOCK:
910 1.62 dyoung case GREDSOCK:
911 1.61 ad case SIOCSLIFPHYADDR:
912 1.61 ad case SIOCDIFPHYADDR:
913 1.61 ad if ((error = kauth_authorize_generic(l->l_cred,
914 1.61 ad KAUTH_GENERIC_ISSUSER, &l->l_acflag)) != 0)
915 1.61 ad return (error);
916 1.61 ad break;
917 1.61 ad default:
918 1.61 ad error = 0;
919 1.61 ad break;
920 1.61 ad }
921 1.1 hwr
922 1.18 thorpej s = splnet();
923 1.20 itojun switch (cmd) {
924 1.20 itojun case SIOCSIFADDR:
925 1.36 itojun ifp->if_flags |= IFF_UP;
926 1.62 dyoung error = gre_kick(sc);
927 1.36 itojun break;
928 1.55 perry case SIOCSIFDSTADDR:
929 1.1 hwr break;
930 1.1 hwr case SIOCSIFFLAGS:
931 1.62 dyoung oproto = sc->g_proto;
932 1.62 dyoung switch (ifr->ifr_flags & (IFF_LINK0|IFF_LINK2)) {
933 1.62 dyoung case IFF_LINK0|IFF_LINK2:
934 1.62 dyoung sc->g_proto = IPPROTO_UDP;
935 1.62 dyoung if (oproto != IPPROTO_UDP)
936 1.62 dyoung ifp->if_flags &= ~IFF_RUNNING;
937 1.62 dyoung error = gre_kick(sc);
938 1.62 dyoung break;
939 1.62 dyoung case IFF_LINK0:
940 1.35 itojun sc->g_proto = IPPROTO_GRE;
941 1.62 dyoung gre_wakeup(sc);
942 1.62 dyoung goto recompute;
943 1.62 dyoung case 0:
944 1.35 itojun sc->g_proto = IPPROTO_MOBILE;
945 1.62 dyoung gre_wakeup(sc);
946 1.62 dyoung goto recompute;
947 1.62 dyoung }
948 1.1 hwr break;
949 1.20 itojun case SIOCSIFMTU:
950 1.27 martin if (ifr->ifr_mtu < 576) {
951 1.1 hwr error = EINVAL;
952 1.1 hwr break;
953 1.1 hwr }
954 1.1 hwr ifp->if_mtu = ifr->ifr_mtu;
955 1.1 hwr break;
956 1.1 hwr case SIOCGIFMTU:
957 1.1 hwr ifr->ifr_mtu = sc->sc_if.if_mtu;
958 1.1 hwr break;
959 1.1 hwr case SIOCADDMULTI:
960 1.1 hwr case SIOCDELMULTI:
961 1.8 explorer if (ifr == 0) {
962 1.1 hwr error = EAFNOSUPPORT;
963 1.1 hwr break;
964 1.1 hwr }
965 1.8 explorer switch (ifr->ifr_addr.sa_family) {
966 1.1 hwr #ifdef INET
967 1.1 hwr case AF_INET:
968 1.1 hwr break;
969 1.1 hwr #endif
970 1.56 is #ifdef INET6
971 1.56 is case AF_INET6:
972 1.56 is break;
973 1.56 is #endif
974 1.1 hwr default:
975 1.1 hwr error = EAFNOSUPPORT;
976 1.1 hwr break;
977 1.1 hwr }
978 1.1 hwr break;
979 1.1 hwr case GRESPROTO:
980 1.62 dyoung oproto = sc->g_proto;
981 1.1 hwr sc->g_proto = ifr->ifr_flags;
982 1.1 hwr switch (sc->g_proto) {
983 1.62 dyoung case IPPROTO_UDP:
984 1.62 dyoung ifp->if_flags |= IFF_LINK0|IFF_LINK2;
985 1.62 dyoung if (oproto != IPPROTO_UDP)
986 1.62 dyoung ifp->if_flags &= ~IFF_RUNNING;
987 1.62 dyoung error = gre_kick(sc);
988 1.62 dyoung break;
989 1.40 itojun case IPPROTO_GRE:
990 1.3 hwr ifp->if_flags |= IFF_LINK0;
991 1.62 dyoung ifp->if_flags &= ~IFF_LINK2;
992 1.62 dyoung goto recompute;
993 1.40 itojun case IPPROTO_MOBILE:
994 1.62 dyoung ifp->if_flags &= ~(IFF_LINK0|IFF_LINK2);
995 1.62 dyoung goto recompute;
996 1.1 hwr default:
997 1.40 itojun error = EPROTONOSUPPORT;
998 1.35 itojun break;
999 1.1 hwr }
1000 1.1 hwr break;
1001 1.1 hwr case GREGPROTO:
1002 1.1 hwr ifr->ifr_flags = sc->g_proto;
1003 1.1 hwr break;
1004 1.1 hwr case GRESADDRS:
1005 1.1 hwr case GRESADDRD:
1006 1.1 hwr /*
1007 1.20 itojun * set tunnel endpoints, compute a less specific route
1008 1.20 itojun * to the remote end and mark if as up
1009 1.20 itojun */
1010 1.1 hwr sa = &ifr->ifr_addr;
1011 1.62 dyoung if (cmd == GRESADDRS) {
1012 1.1 hwr sc->g_src = (satosin(sa))->sin_addr;
1013 1.62 dyoung sc->g_srcport = satosin(sa)->sin_port;
1014 1.62 dyoung }
1015 1.62 dyoung if (cmd == GRESADDRD) {
1016 1.62 dyoung if (sc->g_proto == IPPROTO_UDP &&
1017 1.62 dyoung satosin(sa)->sin_port == 0) {
1018 1.62 dyoung error = EINVAL;
1019 1.62 dyoung break;
1020 1.62 dyoung }
1021 1.1 hwr sc->g_dst = (satosin(sa))->sin_addr;
1022 1.62 dyoung sc->g_dstport = satosin(sa)->sin_port;
1023 1.62 dyoung }
1024 1.30 itojun recompute:
1025 1.62 dyoung if (sc->g_proto == IPPROTO_UDP ||
1026 1.62 dyoung (sc->g_src.s_addr != INADDR_ANY &&
1027 1.62 dyoung sc->g_dst.s_addr != INADDR_ANY)) {
1028 1.62 dyoung if (sc->sc_fp != NULL) {
1029 1.62 dyoung closef(sc->sc_fp, l);
1030 1.62 dyoung sc->sc_fp = NULL;
1031 1.62 dyoung }
1032 1.62 dyoung if (sc->route.ro_rt != NULL) {
1033 1.1 hwr RTFREE(sc->route.ro_rt);
1034 1.62 dyoung sc->route.ro_rt = NULL;
1035 1.62 dyoung }
1036 1.62 dyoung if (sc->g_proto == IPPROTO_UDP)
1037 1.62 dyoung error = gre_kick(sc);
1038 1.62 dyoung else if (gre_compute_route(sc) == 0)
1039 1.39 itojun ifp->if_flags |= IFF_RUNNING;
1040 1.39 itojun else
1041 1.39 itojun ifp->if_flags &= ~IFF_RUNNING;
1042 1.1 hwr }
1043 1.1 hwr break;
1044 1.1 hwr case GREGADDRS:
1045 1.33 itojun memset(&si, 0, sizeof(si));
1046 1.28 itojun si.sin_family = AF_INET;
1047 1.28 itojun si.sin_len = sizeof(struct sockaddr_in);
1048 1.1 hwr si.sin_addr.s_addr = sc->g_src.s_addr;
1049 1.8 explorer sa = sintosa(&si);
1050 1.1 hwr ifr->ifr_addr = *sa;
1051 1.1 hwr break;
1052 1.1 hwr case GREGADDRD:
1053 1.33 itojun memset(&si, 0, sizeof(si));
1054 1.28 itojun si.sin_family = AF_INET;
1055 1.28 itojun si.sin_len = sizeof(struct sockaddr_in);
1056 1.1 hwr si.sin_addr.s_addr = sc->g_dst.s_addr;
1057 1.8 explorer sa = sintosa(&si);
1058 1.1 hwr ifr->ifr_addr = *sa;
1059 1.28 itojun break;
1060 1.62 dyoung case GREDSOCK:
1061 1.62 dyoung if (sc->g_proto != IPPROTO_UDP)
1062 1.62 dyoung return EINVAL;
1063 1.62 dyoung closef(sc->sc_fp, l);
1064 1.62 dyoung sc->sc_fp = NULL;
1065 1.62 dyoung error = gre_kick(sc);
1066 1.62 dyoung break;
1067 1.62 dyoung case GRESSOCK:
1068 1.62 dyoung if (sc->g_proto != IPPROTO_UDP)
1069 1.62 dyoung return EINVAL;
1070 1.62 dyoung /* getsock() will FILE_USE() the descriptor for us */
1071 1.62 dyoung if ((error = getsock(p->p_fd, (int)ifr->ifr_value, &fp)) != 0)
1072 1.62 dyoung break;
1073 1.62 dyoung so = (struct socket *)fp->f_data;
1074 1.62 dyoung if (so->so_type != SOCK_DGRAM) {
1075 1.62 dyoung FILE_UNUSE(fp, NULL);
1076 1.62 dyoung error = EINVAL;
1077 1.62 dyoung break;
1078 1.62 dyoung }
1079 1.62 dyoung /* check address */
1080 1.62 dyoung if ((error = gre_getnames(so, curlwp, &src, &dst)) != 0) {
1081 1.62 dyoung FILE_UNUSE(fp, NULL);
1082 1.62 dyoung break;
1083 1.62 dyoung }
1084 1.62 dyoung
1085 1.62 dyoung fp->f_count++;
1086 1.62 dyoung
1087 1.62 dyoung ofp = sc->sc_fp;
1088 1.62 dyoung sc->sc_fp = fp;
1089 1.62 dyoung if ((error = gre_kick(sc)) != 0) {
1090 1.62 dyoung closef(fp, l);
1091 1.62 dyoung sc->sc_fp = ofp;
1092 1.62 dyoung break;
1093 1.62 dyoung }
1094 1.62 dyoung sc->g_src = src.sin_addr;
1095 1.62 dyoung sc->g_srcport = src.sin_port;
1096 1.62 dyoung sc->g_dst = dst.sin_addr;
1097 1.62 dyoung sc->g_dstport = dst.sin_port;
1098 1.62 dyoung if (ofp != NULL)
1099 1.62 dyoung closef(ofp, l);
1100 1.62 dyoung break;
1101 1.28 itojun case SIOCSLIFPHYADDR:
1102 1.28 itojun if (lifr->addr.ss_family != AF_INET ||
1103 1.31 itojun lifr->dstaddr.ss_family != AF_INET) {
1104 1.31 itojun error = EAFNOSUPPORT;
1105 1.31 itojun break;
1106 1.31 itojun }
1107 1.28 itojun if (lifr->addr.ss_len != sizeof(si) ||
1108 1.31 itojun lifr->dstaddr.ss_len != sizeof(si)) {
1109 1.31 itojun error = EINVAL;
1110 1.31 itojun break;
1111 1.31 itojun }
1112 1.62 dyoung sc->g_src = satosin(&lifr->addr)->sin_addr;
1113 1.62 dyoung sc->g_dst = satosin(&lifr->dstaddr)->sin_addr;
1114 1.62 dyoung sc->g_srcport = satosin(&lifr->addr)->sin_port;
1115 1.62 dyoung sc->g_dstport = satosin(&lifr->dstaddr)->sin_port;
1116 1.30 itojun goto recompute;
1117 1.28 itojun case SIOCDIFPHYADDR:
1118 1.28 itojun sc->g_src.s_addr = INADDR_ANY;
1119 1.28 itojun sc->g_dst.s_addr = INADDR_ANY;
1120 1.62 dyoung sc->g_srcport = 0;
1121 1.62 dyoung sc->g_dstport = 0;
1122 1.62 dyoung goto recompute;
1123 1.28 itojun case SIOCGLIFPHYADDR:
1124 1.28 itojun if (sc->g_src.s_addr == INADDR_ANY ||
1125 1.28 itojun sc->g_dst.s_addr == INADDR_ANY) {
1126 1.28 itojun error = EADDRNOTAVAIL;
1127 1.28 itojun break;
1128 1.28 itojun }
1129 1.33 itojun memset(&si, 0, sizeof(si));
1130 1.28 itojun si.sin_family = AF_INET;
1131 1.28 itojun si.sin_len = sizeof(struct sockaddr_in);
1132 1.62 dyoung si.sin_addr = sc->g_src;
1133 1.62 dyoung if (sc->g_proto == IPPROTO_UDP)
1134 1.62 dyoung si.sin_port = sc->g_srcport;
1135 1.33 itojun memcpy(&lifr->addr, &si, sizeof(si));
1136 1.62 dyoung si.sin_addr = sc->g_dst;
1137 1.62 dyoung if (sc->g_proto == IPPROTO_UDP)
1138 1.62 dyoung si.sin_port = sc->g_dstport;
1139 1.33 itojun memcpy(&lifr->dstaddr, &si, sizeof(si));
1140 1.1 hwr break;
1141 1.1 hwr default:
1142 1.1 hwr error = EINVAL;
1143 1.31 itojun break;
1144 1.1 hwr }
1145 1.1 hwr splx(s);
1146 1.8 explorer return (error);
1147 1.1 hwr }
1148 1.1 hwr
1149 1.20 itojun /*
1150 1.1 hwr * computes a route to our destination that is not the one
1151 1.1 hwr * which would be taken by ip_output(), as this one will loop back to
1152 1.1 hwr * us. If the interface is p2p as a--->b, then a routing entry exists
1153 1.1 hwr * If we now send a packet to b (e.g. ping b), this will come down here
1154 1.43 wiz * gets src=a, dst=b tacked on and would from ip_output() sent back to
1155 1.1 hwr * if_gre.
1156 1.1 hwr * Goal here is to compute a route to b that is less specific than
1157 1.1 hwr * a-->b. We know that this one exists as in normal operation we have
1158 1.1 hwr * at least a default route which matches.
1159 1.1 hwr */
1160 1.59 thorpej static int
1161 1.8 explorer gre_compute_route(struct gre_softc *sc)
1162 1.1 hwr {
1163 1.1 hwr struct route *ro;
1164 1.8 explorer u_int32_t a, b, c;
1165 1.1 hwr
1166 1.8 explorer ro = &sc->route;
1167 1.20 itojun
1168 1.8 explorer memset(ro, 0, sizeof(struct route));
1169 1.8 explorer ((struct sockaddr_in *)&ro->ro_dst)->sin_addr = sc->g_dst;
1170 1.8 explorer ro->ro_dst.sa_family = AF_INET;
1171 1.8 explorer ro->ro_dst.sa_len = sizeof(ro->ro_dst);
1172 1.8 explorer
1173 1.1 hwr /*
1174 1.1 hwr * toggle last bit, so our interface is not found, but a less
1175 1.20 itojun * specific route. I'd rather like to specify a shorter mask,
1176 1.20 itojun * but this is not possible. Should work though. XXX
1177 1.1 hwr * there is a simpler way ...
1178 1.20 itojun */
1179 1.8 explorer if ((sc->sc_if.if_flags & IFF_LINK1) == 0) {
1180 1.8 explorer a = ntohl(sc->g_dst.s_addr);
1181 1.8 explorer b = a & 0x01;
1182 1.8 explorer c = a & 0xfffffffe;
1183 1.8 explorer b = b ^ 0x01;
1184 1.8 explorer a = b | c;
1185 1.8 explorer ((struct sockaddr_in *)&ro->ro_dst)->sin_addr.s_addr
1186 1.20 itojun = htonl(a);
1187 1.8 explorer }
1188 1.1 hwr
1189 1.1 hwr #ifdef DIAGNOSTIC
1190 1.45 grant printf("%s: searching for a route to %s", sc->sc_if.if_xname,
1191 1.19 itojun inet_ntoa(((struct sockaddr_in *)&ro->ro_dst)->sin_addr));
1192 1.1 hwr #endif
1193 1.1 hwr
1194 1.1 hwr rtalloc(ro);
1195 1.1 hwr
1196 1.1 hwr /*
1197 1.25 martin * check if this returned a route at all and this route is no
1198 1.25 martin * recursion to ourself
1199 1.25 martin */
1200 1.25 martin if (ro->ro_rt == NULL || ro->ro_rt->rt_ifp->if_softc == sc) {
1201 1.25 martin #ifdef DIAGNOSTIC
1202 1.25 martin if (ro->ro_rt == NULL)
1203 1.25 martin printf(" - no route found!\n");
1204 1.25 martin else
1205 1.25 martin printf(" - route loops back to ourself!\n");
1206 1.25 martin #endif
1207 1.25 martin return EADDRNOTAVAIL;
1208 1.25 martin }
1209 1.25 martin
1210 1.25 martin /*
1211 1.20 itojun * now change it back - else ip_output will just drop
1212 1.20 itojun * the route and search one to this interface ...
1213 1.20 itojun */
1214 1.8 explorer if ((sc->sc_if.if_flags & IFF_LINK1) == 0)
1215 1.8 explorer ((struct sockaddr_in *)&ro->ro_dst)->sin_addr = sc->g_dst;
1216 1.1 hwr
1217 1.1 hwr #ifdef DIAGNOSTIC
1218 1.62 dyoung printf(", choosing %s with gateway %s\n", ro->ro_rt->rt_ifp->if_xname,
1219 1.19 itojun inet_ntoa(((struct sockaddr_in *)(ro->ro_rt->rt_gateway))->sin_addr));
1220 1.1 hwr #endif
1221 1.25 martin
1222 1.25 martin return 0;
1223 1.1 hwr }
1224 1.1 hwr
/*
 * One's-complement checksum over a flat buffer - the counterpart of
 * in_cksum, which works on mbufs.
 *
 * p    start of the buffer, read as 16-bit words in host byte order
 * len  length of the buffer in bytes; a trailing odd byte is summed
 *      as the first byte of a word whose second byte is zero
 *
 * Returns the complement of the folded 16-bit sum.
 */
u_int16_t
gre_in_cksum(u_int16_t *p, u_int len)
{
	const int pairs = len >> 1;
	u_int32_t acc = 0;
	int i;

	for (i = 0; i != pairs; i++)
		acc += p[i];

	if ((len & 1) != 0) {
		union {
			u_short w;
			u_char c[2];
		} tail;

		/* Pad the last, lone byte with a zero byte. */
		tail.c[0] = *(u_char *)&p[pairs];
		tail.c[1] = 0;
		acc += tail.w;
	}

	/* end-around-carry */
	acc = (acc & 0xffff) + (acc >> 16);
	acc += acc >> 16;

	return (~acc);
}
1253 1.54 christos #endif
1254 1.54 christos
void	greattach(int);

/*
 * Attach routine.  When INET is configured, initialise the list of
 * gre softcs and register the gre cloner with if_clone_attach();
 * otherwise do nothing.  `count' is not used.
 */
/* ARGSUSED */
void
greattach(int count)
{

#ifdef INET
	LIST_INIT(&gre_softc_list);
	if_clone_attach(&gre_cloner);
#endif /* INET */
}
1266