if_gre.c revision 1.95 1 1.95 xtraeme /* $NetBSD: if_gre.c,v 1.95 2007/05/29 22:05:01 xtraeme Exp $ */
2 1.4 thorpej
3 1.1 hwr /*
4 1.4 thorpej * Copyright (c) 1998 The NetBSD Foundation, Inc.
5 1.1 hwr * All rights reserved.
6 1.1 hwr *
7 1.1 hwr * This code is derived from software contributed to The NetBSD Foundation
8 1.1 hwr * by Heiko W.Rupp <hwr (at) pilhuhn.de>
9 1.1 hwr *
10 1.56 is * IPv6-over-GRE contributed by Gert Doering <gert (at) greenie.muc.de>
11 1.56 is *
12 1.1 hwr * Redistribution and use in source and binary forms, with or without
13 1.1 hwr * modification, are permitted provided that the following conditions
14 1.1 hwr * are met:
15 1.1 hwr * 1. Redistributions of source code must retain the above copyright
16 1.1 hwr * notice, this list of conditions and the following disclaimer.
17 1.1 hwr * 2. Redistributions in binary form must reproduce the above copyright
18 1.1 hwr * notice, this list of conditions and the following disclaimer in the
19 1.1 hwr * documentation and/or other materials provided with the distribution.
20 1.1 hwr * 3. All advertising materials mentioning features or use of this software
21 1.1 hwr * must display the following acknowledgement:
22 1.1 hwr * This product includes software developed by the NetBSD
23 1.1 hwr * Foundation, Inc. and its contributors.
24 1.1 hwr * 4. Neither the name of The NetBSD Foundation nor the names of its
25 1.1 hwr * contributors may be used to endorse or promote products derived
26 1.1 hwr * from this software without specific prior written permission.
27 1.1 hwr *
28 1.1 hwr * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
29 1.1 hwr * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
30 1.1 hwr * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
31 1.1 hwr * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
32 1.1 hwr * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
33 1.1 hwr * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
34 1.1 hwr * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
35 1.1 hwr * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
36 1.1 hwr * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
37 1.1 hwr * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
38 1.1 hwr * POSSIBILITY OF SUCH DAMAGE.
39 1.1 hwr */
40 1.1 hwr
41 1.1 hwr /*
42 1.1 hwr * Encapsulate L3 protocols into IP
43 1.1 hwr * See RFC 1701 and 1702 for more details.
44 1.1 hwr * If_gre is compatible with Cisco GRE tunnels, so you can
45 1.1 hwr * have a NetBSD box as the other end of a tunnel interface of a Cisco
46 1.1 hwr * router. See gre(4) for more details.
47 1.6 hwr * Also supported: IP in IP encaps (proto 55) as of RFC 2004
48 1.1 hwr */
49 1.22 lukem
50 1.22 lukem #include <sys/cdefs.h>
51 1.95 xtraeme __KERNEL_RCSID(0, "$NetBSD: if_gre.c,v 1.95 2007/05/29 22:05:01 xtraeme Exp $");
52 1.1 hwr
53 1.62 dyoung #include "opt_gre.h"
54 1.1 hwr #include "opt_inet.h"
55 1.94 christos #include "opt_compat_netbsd.h"
56 1.1 hwr #include "bpfilter.h"
57 1.1 hwr
58 1.54 christos #ifdef INET
59 1.1 hwr #include <sys/param.h>
60 1.62 dyoung #include <sys/file.h>
61 1.62 dyoung #include <sys/filedesc.h>
62 1.1 hwr #include <sys/malloc.h>
63 1.1 hwr #include <sys/mbuf.h>
64 1.13 martin #include <sys/proc.h>
65 1.1 hwr #include <sys/protosw.h>
66 1.1 hwr #include <sys/socket.h>
67 1.62 dyoung #include <sys/socketvar.h>
68 1.1 hwr #include <sys/ioctl.h>
69 1.10 thorpej #include <sys/queue.h>
70 1.1 hwr #if __NetBSD__
71 1.1 hwr #include <sys/systm.h>
72 1.62 dyoung #include <sys/sysctl.h>
73 1.60 elad #include <sys/kauth.h>
74 1.1 hwr #endif
75 1.1 hwr
76 1.93 dyoung #include <sys/kernel.h>
77 1.93 dyoung #include <sys/mutex.h>
78 1.93 dyoung #include <sys/condvar.h>
79 1.62 dyoung #include <sys/kthread.h>
80 1.62 dyoung
81 1.1 hwr #include <machine/cpu.h>
82 1.1 hwr
83 1.1 hwr #include <net/ethertypes.h>
84 1.1 hwr #include <net/if.h>
85 1.1 hwr #include <net/if_types.h>
86 1.1 hwr #include <net/netisr.h>
87 1.1 hwr #include <net/route.h>
88 1.1 hwr
89 1.1 hwr #ifdef INET
90 1.1 hwr #include <netinet/in.h>
91 1.1 hwr #include <netinet/in_systm.h>
92 1.1 hwr #include <netinet/in_var.h>
93 1.1 hwr #include <netinet/ip.h>
94 1.1 hwr #include <netinet/ip_var.h>
95 1.1 hwr #else
96 1.4 thorpej #error "Huh? if_gre without inet?"
97 1.1 hwr #endif
98 1.1 hwr
99 1.1 hwr
100 1.1 hwr #ifdef NETATALK
101 1.1 hwr #include <netatalk/at.h>
102 1.1 hwr #include <netatalk/at_var.h>
103 1.1 hwr #include <netatalk/at_extern.h>
104 1.1 hwr #endif
105 1.1 hwr
106 1.1 hwr #if NBPFILTER > 0
107 1.1 hwr #include <sys/time.h>
108 1.1 hwr #include <net/bpf.h>
109 1.1 hwr #endif
110 1.1 hwr
111 1.1 hwr #include <net/if_gre.h>
112 1.1 hwr
113 1.94 christos #if defined(COMPAT_09) || defined(COMPAT_10) || defined(COMPAT_11) || \
114 1.94 christos defined(COMPAT_12) || defined(COMPAT_13) || defined(COMPAT_14) || \
115 1.94 christos defined(COMPAT_15) || defined(COMPAT_16) || defined(COMPAT_20) || \
116 1.94 christos defined(COMPAT_30) || defined(COMPAT_40)
117 1.94 christos #define COMPAT_OIFREQ
118 1.94 christos #include <compat/sys/sockio.h>
119 1.94 christos #endif
/*
 * Default MTU assigned to a newly created gre interface.
 *
 * Computing the exact right MTU for a GRE tunnel is not easy, so the
 * decision is left to the administrator; the default matches what other
 * vendors use.
 */
#define	GREMTU	1476
126 1.1 hwr
/*
 * GRE_DPRINTF(sc, fmt, ...): debug printf.
 *
 * Without GRE_DEBUG it expands to an empty statement.  With GRE_DEBUG it
 * prints only while IFF_DEBUG is set on the softc's interface.  At least
 * one argument must follow the format string.
 */
#ifndef GRE_DEBUG
#define	GRE_DPRINTF(softc_, format_, ...)	do { } while (/*CONSTCOND*/0)
#else
#define	GRE_DPRINTF(softc_, format_, ...)				\
	do {								\
		if (((softc_)->sc_if.if_flags & IFF_DEBUG) != 0)	\
			printf(format_, __VA_ARGS__);			\
	} while (/*CONSTCOND*/0)
#endif /* GRE_DEBUG */
136 1.62 dyoung
137 1.11 thorpej struct gre_softc_head gre_softc_list;
138 1.26 martin int ip_gre_ttl = GRE_TTL;
139 1.1 hwr
140 1.59 thorpej static int gre_clone_create(struct if_clone *, int);
141 1.59 thorpej static int gre_clone_destroy(struct ifnet *);
142 1.10 thorpej
143 1.59 thorpej static struct if_clone gre_cloner =
144 1.10 thorpej IF_CLONE_INITIALIZER("gre", gre_clone_create, gre_clone_destroy);
145 1.1 hwr
146 1.84 dyoung static int gre_output(struct ifnet *, struct mbuf *,
147 1.84 dyoung const struct sockaddr *, struct rtentry *);
148 1.88 christos static int gre_ioctl(struct ifnet *, u_long, void *);
149 1.1 hwr
150 1.59 thorpej static int gre_compute_route(struct gre_softc *sc);
151 1.59 thorpej
152 1.93 dyoung static void gre_closef(struct file **, struct lwp *);
153 1.62 dyoung static int gre_getsockname(struct socket *, struct mbuf *, struct lwp *);
154 1.62 dyoung static int gre_getpeername(struct socket *, struct mbuf *, struct lwp *);
155 1.62 dyoung static int gre_getnames(struct socket *, struct lwp *, struct sockaddr_in *,
156 1.62 dyoung struct sockaddr_in *);
157 1.62 dyoung
158 1.93 dyoung /* Calling thread must hold sc->sc_mtx. */
159 1.62 dyoung static void
160 1.93 dyoung gre_stop(struct gre_softc *sc)
161 1.62 dyoung {
162 1.93 dyoung sc->sc_running = 0;
163 1.93 dyoung cv_signal(&sc->sc_join_cv);
164 1.62 dyoung }
165 1.62 dyoung
166 1.93 dyoung /* Calling thread must hold sc->sc_mtx. */
167 1.62 dyoung static void
168 1.93 dyoung gre_join(struct gre_softc *sc)
169 1.62 dyoung {
170 1.93 dyoung while (sc->sc_running != 0)
171 1.93 dyoung cv_wait(&sc->sc_join_cv, &sc->sc_mtx);
172 1.62 dyoung }
173 1.62 dyoung
174 1.93 dyoung /* Calling thread must hold sc->sc_mtx. */
175 1.62 dyoung static void
176 1.62 dyoung gre_wakeup(struct gre_softc *sc)
177 1.62 dyoung {
178 1.62 dyoung GRE_DPRINTF(sc, "%s: enter\n", __func__);
179 1.93 dyoung sc->sc_haswork = 1;
180 1.93 dyoung cv_signal(&sc->sc_work_cv);
181 1.62 dyoung }
182 1.62 dyoung
183 1.59 thorpej static int
184 1.59 thorpej gre_clone_create(struct if_clone *ifc, int unit)
185 1.1 hwr {
186 1.8 explorer struct gre_softc *sc;
187 1.1 hwr
188 1.10 thorpej sc = malloc(sizeof(struct gre_softc), M_DEVBUF, M_WAITOK);
189 1.10 thorpej memset(sc, 0, sizeof(struct gre_softc));
190 1.93 dyoung mutex_init(&sc->sc_mtx, MUTEX_DRIVER, IPL_NET);
191 1.93 dyoung cv_init(&sc->sc_work_cv, "gre work");
192 1.93 dyoung cv_init(&sc->sc_join_cv, "gre join");
193 1.93 dyoung cv_init(&sc->sc_soparm_cv, "gre soparm");
194 1.10 thorpej
195 1.50 itojun snprintf(sc->sc_if.if_xname, sizeof(sc->sc_if.if_xname), "%s%d",
196 1.50 itojun ifc->ifc_name, unit);
197 1.10 thorpej sc->sc_if.if_softc = sc;
198 1.51 tron sc->sc_if.if_type = IFT_TUNNEL;
199 1.34 itojun sc->sc_if.if_addrlen = 0;
200 1.10 thorpej sc->sc_if.if_hdrlen = 24; /* IP + GRE */
201 1.15 thorpej sc->sc_if.if_dlt = DLT_NULL;
202 1.20 itojun sc->sc_if.if_mtu = GREMTU;
203 1.10 thorpej sc->sc_if.if_flags = IFF_POINTOPOINT|IFF_MULTICAST;
204 1.10 thorpej sc->sc_if.if_output = gre_output;
205 1.10 thorpej sc->sc_if.if_ioctl = gre_ioctl;
206 1.10 thorpej sc->g_dst.s_addr = sc->g_src.s_addr = INADDR_ANY;
207 1.62 dyoung sc->g_dstport = sc->g_srcport = 0;
208 1.75 dyoung sc->sc_proto = IPPROTO_GRE;
209 1.64 dyoung sc->sc_snd.ifq_maxlen = 256;
210 1.35 itojun sc->sc_if.if_flags |= IFF_LINK0;
211 1.10 thorpej if_attach(&sc->sc_if);
212 1.16 thorpej if_alloc_sadl(&sc->sc_if);
213 1.1 hwr #if NBPFILTER > 0
214 1.14 thorpej bpfattach(&sc->sc_if, DLT_NULL, sizeof(u_int32_t));
215 1.1 hwr #endif
216 1.10 thorpej LIST_INSERT_HEAD(&gre_softc_list, sc, sc_list);
217 1.87 dyoung return 0;
218 1.10 thorpej }
219 1.1 hwr
220 1.59 thorpej static int
221 1.59 thorpej gre_clone_destroy(struct ifnet *ifp)
222 1.10 thorpej {
223 1.10 thorpej struct gre_softc *sc = ifp->if_softc;
224 1.10 thorpej
225 1.10 thorpej LIST_REMOVE(sc, sc_list);
226 1.10 thorpej #if NBPFILTER > 0
227 1.10 thorpej bpfdetach(ifp);
228 1.10 thorpej #endif
229 1.93 dyoung if_detach(ifp);
230 1.93 dyoung mutex_enter(&sc->sc_mtx);
231 1.62 dyoung gre_wakeup(sc);
232 1.93 dyoung gre_join(sc);
233 1.93 dyoung mutex_exit(&sc->sc_mtx);
234 1.85 dyoung rtcache_free(&sc->route);
235 1.93 dyoung
236 1.93 dyoung cv_destroy(&sc->sc_soparm_cv);
237 1.93 dyoung cv_destroy(&sc->sc_join_cv);
238 1.93 dyoung cv_destroy(&sc->sc_work_cv);
239 1.93 dyoung mutex_destroy(&sc->sc_mtx);
240 1.10 thorpej free(sc, M_DEVBUF);
241 1.53 peter
242 1.87 dyoung return 0;
243 1.1 hwr }
244 1.1 hwr
/*
 * Socket upcall installed by gre_upcall_add(): wake the worker thread
 * of the softc passed as the upcall argument.  The socket and the wait
 * flag are not used.
 */
static void
gre_receive(struct socket *so, void *arg, int waitflag)
{
	struct gre_softc *sc = arg;

	GRE_DPRINTF(sc, "%s: enter\n", __func__);

	gre_wakeup(sc);
}
254 1.62 dyoung
255 1.62 dyoung static void
256 1.88 christos gre_upcall_add(struct socket *so, void *arg)
257 1.62 dyoung {
258 1.62 dyoung /* XXX What if the kernel already set an upcall? */
259 1.62 dyoung so->so_upcallarg = arg;
260 1.62 dyoung so->so_upcall = gre_receive;
261 1.62 dyoung so->so_rcv.sb_flags |= SB_UPCALL;
262 1.62 dyoung }
263 1.62 dyoung
264 1.62 dyoung static void
265 1.62 dyoung gre_upcall_remove(struct socket *so)
266 1.62 dyoung {
267 1.62 dyoung /* XXX What if the kernel already set an upcall? */
268 1.62 dyoung so->so_rcv.sb_flags &= ~SB_UPCALL;
269 1.62 dyoung so->so_upcallarg = NULL;
270 1.62 dyoung so->so_upcall = NULL;
271 1.62 dyoung }
272 1.62 dyoung
273 1.62 dyoung static void
274 1.62 dyoung gre_sodestroy(struct socket **sop)
275 1.62 dyoung {
276 1.62 dyoung gre_upcall_remove(*sop);
277 1.62 dyoung soshutdown(*sop, SHUT_RDWR);
278 1.62 dyoung soclose(*sop);
279 1.62 dyoung *sop = NULL;
280 1.62 dyoung }
281 1.62 dyoung
282 1.62 dyoung static struct mbuf *
283 1.74 christos gre_getsockmbuf(struct socket *so)
284 1.62 dyoung {
285 1.62 dyoung struct mbuf *m;
286 1.62 dyoung
287 1.62 dyoung m = m_get(M_WAIT, MT_SONAME);
288 1.62 dyoung if (m != NULL)
289 1.62 dyoung MCLAIM(m, so->so_mowner);
290 1.62 dyoung return m;
291 1.62 dyoung }
292 1.62 dyoung
293 1.62 dyoung static int
294 1.62 dyoung gre_socreate1(struct gre_softc *sc, struct lwp *l, struct gre_soparm *sp,
295 1.62 dyoung struct socket **sop)
296 1.62 dyoung {
297 1.62 dyoung int rc;
298 1.62 dyoung struct mbuf *m;
299 1.62 dyoung struct sockaddr_in *sin;
300 1.62 dyoung struct socket *so;
301 1.62 dyoung
302 1.62 dyoung GRE_DPRINTF(sc, "%s: enter\n", __func__);
303 1.62 dyoung rc = socreate(AF_INET, sop, SOCK_DGRAM, IPPROTO_UDP, l);
304 1.62 dyoung if (rc != 0) {
305 1.62 dyoung GRE_DPRINTF(sc, "%s: socreate failed\n", __func__);
306 1.62 dyoung return rc;
307 1.62 dyoung }
308 1.62 dyoung
309 1.62 dyoung so = *sop;
310 1.62 dyoung
311 1.90 dyoung gre_upcall_add(so, sc);
312 1.62 dyoung if ((m = gre_getsockmbuf(so)) == NULL) {
313 1.62 dyoung rc = ENOBUFS;
314 1.62 dyoung goto out;
315 1.62 dyoung }
316 1.62 dyoung sin = mtod(m, struct sockaddr_in *);
317 1.62 dyoung sin->sin_len = m->m_len = sizeof(struct sockaddr_in);
318 1.62 dyoung sin->sin_family = AF_INET;
319 1.62 dyoung sin->sin_addr = sc->g_src;
320 1.62 dyoung sin->sin_port = sc->g_srcport;
321 1.62 dyoung
322 1.62 dyoung GRE_DPRINTF(sc, "%s: bind 0x%08" PRIx32 " port %d\n", __func__,
323 1.62 dyoung sin->sin_addr.s_addr, ntohs(sin->sin_port));
324 1.62 dyoung if ((rc = sobind(so, m, l)) != 0) {
325 1.62 dyoung GRE_DPRINTF(sc, "%s: sobind failed\n", __func__);
326 1.62 dyoung goto out;
327 1.62 dyoung }
328 1.62 dyoung
329 1.62 dyoung if (sc->g_srcport == 0) {
330 1.69 dyoung if ((rc = gre_getsockname(so, m, l)) != 0) {
331 1.62 dyoung GRE_DPRINTF(sc, "%s: gre_getsockname failed\n",
332 1.62 dyoung __func__);
333 1.62 dyoung goto out;
334 1.62 dyoung }
335 1.62 dyoung sc->g_srcport = sin->sin_port;
336 1.62 dyoung }
337 1.62 dyoung
338 1.62 dyoung sin->sin_addr = sc->g_dst;
339 1.62 dyoung sin->sin_port = sc->g_dstport;
340 1.62 dyoung
341 1.68 dyoung if ((rc = soconnect(so, m, l)) != 0) {
342 1.62 dyoung GRE_DPRINTF(sc, "%s: soconnect failed\n", __func__);
343 1.62 dyoung goto out;
344 1.62 dyoung }
345 1.62 dyoung
346 1.62 dyoung *mtod(m, int *) = ip_gre_ttl;
347 1.76 dyoung m->m_len = sizeof(int);
348 1.62 dyoung rc = (*so->so_proto->pr_ctloutput)(PRCO_SETOPT, so, IPPROTO_IP, IP_TTL,
349 1.62 dyoung &m);
350 1.62 dyoung m = NULL;
351 1.62 dyoung if (rc != 0) {
352 1.62 dyoung printf("%s: setopt ttl failed\n", __func__);
353 1.62 dyoung rc = 0;
354 1.62 dyoung }
355 1.62 dyoung out:
356 1.62 dyoung m_freem(m);
357 1.62 dyoung
358 1.62 dyoung if (rc != 0)
359 1.62 dyoung gre_sodestroy(sop);
360 1.62 dyoung else
361 1.63 dyoung *sp = sc->sc_soparm;
362 1.62 dyoung
363 1.62 dyoung return rc;
364 1.62 dyoung }
365 1.62 dyoung
366 1.62 dyoung static void
367 1.62 dyoung gre_thread1(struct gre_softc *sc, struct lwp *l)
368 1.62 dyoung {
369 1.93 dyoung int flags, rc;
370 1.62 dyoung const struct gre_h *gh;
371 1.62 dyoung struct ifnet *ifp = &sc->sc_if;
372 1.62 dyoung struct mbuf *m;
373 1.62 dyoung struct socket *so = NULL;
374 1.62 dyoung struct uio uio;
375 1.62 dyoung struct gre_soparm sp;
376 1.93 dyoung struct file *fp = NULL;
377 1.62 dyoung
378 1.62 dyoung GRE_DPRINTF(sc, "%s: enter\n", __func__);
379 1.93 dyoung mutex_enter(&sc->sc_mtx);
380 1.62 dyoung
381 1.93 dyoung sc->sc_haswork = 1;
382 1.62 dyoung
383 1.62 dyoung memset(&sp, 0, sizeof(sp));
384 1.62 dyoung memset(&uio, 0, sizeof(uio));
385 1.62 dyoung
386 1.62 dyoung ifp->if_flags |= IFF_RUNNING;
387 1.62 dyoung
388 1.62 dyoung for (;;) {
389 1.93 dyoung while (sc->sc_haswork == 0) {
390 1.62 dyoung GRE_DPRINTF(sc, "%s: sleeping\n", __func__);
391 1.93 dyoung cv_wait(&sc->sc_work_cv, &sc->sc_mtx);
392 1.62 dyoung }
393 1.93 dyoung sc->sc_haswork = 0;
394 1.62 dyoung GRE_DPRINTF(sc, "%s: awake\n", __func__);
395 1.62 dyoung if ((ifp->if_flags & IFF_UP) != IFF_UP) {
396 1.62 dyoung GRE_DPRINTF(sc, "%s: not up & running; exiting\n",
397 1.62 dyoung __func__);
398 1.62 dyoung break;
399 1.62 dyoung }
400 1.75 dyoung if (sc->sc_proto != IPPROTO_UDP) {
401 1.62 dyoung GRE_DPRINTF(sc, "%s: not udp; exiting\n", __func__);
402 1.62 dyoung break;
403 1.62 dyoung }
404 1.62 dyoung /* XXX optimize */
405 1.93 dyoung if (so == NULL || sc->sc_fp != NULL ||
406 1.93 dyoung memcmp(&sp, &sc->sc_soparm, sizeof(sp)) != 0) {
407 1.62 dyoung GRE_DPRINTF(sc, "%s: parameters changed\n", __func__);
408 1.62 dyoung
409 1.93 dyoung if (fp != NULL) {
410 1.93 dyoung gre_closef(&fp, curlwp);
411 1.62 dyoung so = NULL;
412 1.62 dyoung } else if (so != NULL)
413 1.62 dyoung gre_sodestroy(&so);
414 1.62 dyoung
415 1.62 dyoung if (sc->sc_fp != NULL) {
416 1.93 dyoung fp = sc->sc_fp;
417 1.93 dyoung sc->sc_fp = NULL;
418 1.93 dyoung so = (struct socket *)fp->f_data;
419 1.90 dyoung gre_upcall_add(so, sc);
420 1.63 dyoung sp = sc->sc_soparm;
421 1.62 dyoung } else if (gre_socreate1(sc, l, &sp, &so) != 0)
422 1.62 dyoung goto out;
423 1.62 dyoung }
424 1.93 dyoung cv_signal(&sc->sc_soparm_cv);
425 1.62 dyoung for (;;) {
426 1.62 dyoung flags = MSG_DONTWAIT;
427 1.62 dyoung uio.uio_resid = 1000000;
428 1.62 dyoung rc = (*so->so_receive)(so, NULL, &uio, &m, NULL,
429 1.62 dyoung &flags);
430 1.62 dyoung /* TBD Back off if ECONNREFUSED (indicates
431 1.62 dyoung * ICMP Port Unreachable)?
432 1.62 dyoung */
433 1.62 dyoung if (rc == EWOULDBLOCK) {
434 1.62 dyoung GRE_DPRINTF(sc, "%s: so_receive EWOULDBLOCK\n",
435 1.62 dyoung __func__);
436 1.62 dyoung break;
437 1.62 dyoung } else if (rc != 0 || m == NULL) {
438 1.62 dyoung GRE_DPRINTF(sc, "%s: rc %d m %p\n",
439 1.62 dyoung ifp->if_xname, rc, (void *)m);
440 1.62 dyoung continue;
441 1.62 dyoung } else
442 1.62 dyoung GRE_DPRINTF(sc, "%s: so_receive ok\n",
443 1.62 dyoung __func__);
444 1.62 dyoung if (m->m_len < sizeof(*gh) &&
445 1.62 dyoung (m = m_pullup(m, sizeof(*gh))) == NULL) {
446 1.62 dyoung GRE_DPRINTF(sc, "%s: m_pullup failed\n",
447 1.62 dyoung __func__);
448 1.62 dyoung continue;
449 1.62 dyoung }
450 1.62 dyoung gh = mtod(m, const struct gre_h *);
451 1.62 dyoung
452 1.93 dyoung if (gre_input3(sc, m, 0, gh, 1) == 0) {
453 1.62 dyoung GRE_DPRINTF(sc, "%s: dropping unsupported\n",
454 1.62 dyoung __func__);
455 1.62 dyoung m_freem(m);
456 1.62 dyoung }
457 1.62 dyoung }
458 1.62 dyoung for (;;) {
459 1.62 dyoung IF_DEQUEUE(&sc->sc_snd, m);
460 1.62 dyoung if (m == NULL)
461 1.62 dyoung break;
462 1.62 dyoung GRE_DPRINTF(sc, "%s: dequeue\n", __func__);
463 1.62 dyoung if ((so->so_state & SS_ISCONNECTED) == 0) {
464 1.62 dyoung GRE_DPRINTF(sc, "%s: not connected\n",
465 1.62 dyoung __func__);
466 1.62 dyoung m_freem(m);
467 1.62 dyoung continue;
468 1.62 dyoung }
469 1.62 dyoung rc = (*so->so_send)(so, NULL, NULL, m, NULL, 0, l);
470 1.62 dyoung /* XXX handle ENOBUFS? */
471 1.62 dyoung if (rc != 0)
472 1.62 dyoung GRE_DPRINTF(sc, "%s: so_send failed\n",
473 1.62 dyoung __func__);
474 1.62 dyoung }
475 1.62 dyoung }
476 1.93 dyoung if (fp != NULL) {
477 1.62 dyoung GRE_DPRINTF(sc, "%s: removing upcall\n", __func__);
478 1.62 dyoung gre_upcall_remove(so);
479 1.66 dyoung } else if (so != NULL)
480 1.62 dyoung gre_sodestroy(&so);
481 1.62 dyoung out:
482 1.62 dyoung GRE_DPRINTF(sc, "%s: stopping\n", __func__);
483 1.93 dyoung if (fp != NULL)
484 1.93 dyoung gre_closef(&fp, curlwp);
485 1.75 dyoung if (sc->sc_proto == IPPROTO_UDP)
486 1.62 dyoung ifp->if_flags &= ~IFF_RUNNING;
487 1.64 dyoung while (!IF_IS_EMPTY(&sc->sc_snd)) {
488 1.64 dyoung IF_DEQUEUE(&sc->sc_snd, m);
489 1.64 dyoung m_freem(m);
490 1.64 dyoung }
491 1.93 dyoung gre_stop(sc);
492 1.62 dyoung /* must not touch sc after this! */
493 1.62 dyoung GRE_DPRINTF(sc, "%s: restore ipl\n", __func__);
494 1.93 dyoung mutex_exit(&sc->sc_mtx);
495 1.62 dyoung }
496 1.62 dyoung
497 1.62 dyoung static void
498 1.62 dyoung gre_thread(void *arg)
499 1.62 dyoung {
500 1.62 dyoung struct gre_softc *sc = (struct gre_softc *)arg;
501 1.62 dyoung
502 1.62 dyoung gre_thread1(sc, curlwp);
503 1.62 dyoung /* must not touch sc after this! */
504 1.62 dyoung kthread_exit(0);
505 1.62 dyoung }
506 1.62 dyoung
507 1.93 dyoung /* Calling thread must hold sc->sc_mtx. */
508 1.62 dyoung int
509 1.89 dyoung gre_input3(struct gre_softc *sc, struct mbuf *m, int hlen,
510 1.93 dyoung const struct gre_h *gh, int mtx_held)
511 1.62 dyoung {
512 1.62 dyoung u_int16_t flags;
513 1.62 dyoung #if NBPFILTER > 0
514 1.62 dyoung u_int32_t af = AF_INET; /* af passed to BPF tap */
515 1.62 dyoung #endif
516 1.93 dyoung int isr;
517 1.62 dyoung struct ifqueue *ifq;
518 1.62 dyoung
519 1.62 dyoung sc->sc_if.if_ipackets++;
520 1.62 dyoung sc->sc_if.if_ibytes += m->m_pkthdr.len;
521 1.62 dyoung
522 1.89 dyoung hlen += sizeof(struct gre_h);
523 1.62 dyoung
524 1.89 dyoung /* process GRE flags as packet can be of variable len */
525 1.89 dyoung flags = ntohs(gh->flags);
526 1.62 dyoung
527 1.89 dyoung /* Checksum & Offset are present */
528 1.89 dyoung if ((flags & GRE_CP) | (flags & GRE_RP))
529 1.89 dyoung hlen += 4;
530 1.89 dyoung /* We don't support routing fields (variable length) */
531 1.89 dyoung if (flags & GRE_RP) {
532 1.89 dyoung sc->sc_if.if_ierrors++;
533 1.89 dyoung return 0;
534 1.89 dyoung }
535 1.89 dyoung if (flags & GRE_KP)
536 1.89 dyoung hlen += 4;
537 1.89 dyoung if (flags & GRE_SP)
538 1.89 dyoung hlen += 4;
539 1.89 dyoung
540 1.89 dyoung switch (ntohs(gh->ptype)) { /* ethertypes */
541 1.89 dyoung case ETHERTYPE_IP: /* shouldn't need a schednetisr(), as */
542 1.89 dyoung ifq = &ipintrq; /* we are in ip_input */
543 1.89 dyoung isr = NETISR_IP;
544 1.89 dyoung break;
545 1.62 dyoung #ifdef NETATALK
546 1.89 dyoung case ETHERTYPE_ATALK:
547 1.89 dyoung ifq = &atintrq1;
548 1.89 dyoung isr = NETISR_ATALK;
549 1.62 dyoung #if NBPFILTER > 0
550 1.89 dyoung af = AF_APPLETALK;
551 1.62 dyoung #endif
552 1.89 dyoung break;
553 1.62 dyoung #endif
554 1.62 dyoung #ifdef INET6
555 1.89 dyoung case ETHERTYPE_IPV6:
556 1.89 dyoung GRE_DPRINTF(sc, "%s: IPv6 packet\n", __func__);
557 1.89 dyoung ifq = &ip6intrq;
558 1.89 dyoung isr = NETISR_IPV6;
559 1.62 dyoung #if NBPFILTER > 0
560 1.89 dyoung af = AF_INET6;
561 1.62 dyoung #endif
562 1.89 dyoung break;
563 1.62 dyoung #endif
564 1.89 dyoung default: /* others not yet supported */
565 1.90 dyoung GRE_DPRINTF(sc, "%s: unhandled ethertype 0x%04x\n", __func__,
566 1.89 dyoung ntohs(gh->ptype));
567 1.89 dyoung sc->sc_if.if_noproto++;
568 1.87 dyoung return 0;
569 1.62 dyoung }
570 1.62 dyoung
571 1.62 dyoung if (hlen > m->m_pkthdr.len) {
572 1.62 dyoung m_freem(m);
573 1.62 dyoung sc->sc_if.if_ierrors++;
574 1.87 dyoung return EINVAL;
575 1.62 dyoung }
576 1.62 dyoung m_adj(m, hlen);
577 1.62 dyoung
578 1.62 dyoung #if NBPFILTER > 0
579 1.62 dyoung if (sc->sc_if.if_bpf != NULL)
580 1.62 dyoung bpf_mtap_af(sc->sc_if.if_bpf, af, m);
581 1.62 dyoung #endif /*NBPFILTER > 0*/
582 1.62 dyoung
583 1.62 dyoung m->m_pkthdr.rcvif = &sc->sc_if;
584 1.62 dyoung
585 1.93 dyoung if (!mtx_held)
586 1.93 dyoung mutex_enter(&sc->sc_mtx);
587 1.62 dyoung if (IF_QFULL(ifq)) {
588 1.62 dyoung IF_DROP(ifq);
589 1.62 dyoung m_freem(m);
590 1.62 dyoung } else {
591 1.62 dyoung IF_ENQUEUE(ifq, m);
592 1.62 dyoung }
593 1.62 dyoung /* we need schednetisr since the address family may change */
594 1.62 dyoung schednetisr(isr);
595 1.93 dyoung if (!mtx_held)
596 1.93 dyoung mutex_exit(&sc->sc_mtx);
597 1.62 dyoung
598 1.87 dyoung return 1; /* packet is done, no further processing needed */
599 1.62 dyoung }
600 1.62 dyoung
601 1.20 itojun /*
602 1.1 hwr * The output routine. Takes a packet and encapsulates it in the protocol
603 1.75 dyoung * given by sc->sc_proto. See also RFC 1701 and RFC 2004
604 1.1 hwr */
605 1.59 thorpej static int
606 1.84 dyoung gre_output(struct ifnet *ifp, struct mbuf *m, const struct sockaddr *dst,
607 1.74 christos struct rtentry *rt)
608 1.1 hwr {
609 1.89 dyoung int error = 0, hlen, msiz;
610 1.10 thorpej struct gre_softc *sc = ifp->if_softc;
611 1.62 dyoung struct greip *gi;
612 1.62 dyoung struct gre_h *gh;
613 1.62 dyoung struct ip *eip, *ip;
614 1.56 is u_int8_t ip_tos = 0;
615 1.48 itojun u_int16_t etype = 0;
616 1.20 itojun struct mobile_h mob_h;
617 1.24 martin
618 1.39 itojun if ((ifp->if_flags & (IFF_UP | IFF_RUNNING)) == 0 ||
619 1.37 itojun sc->g_src.s_addr == INADDR_ANY || sc->g_dst.s_addr == INADDR_ANY) {
620 1.37 itojun m_freem(m);
621 1.38 itojun error = ENETDOWN;
622 1.38 itojun goto end;
623 1.37 itojun }
624 1.1 hwr
625 1.62 dyoung gi = NULL;
626 1.41 itojun ip = NULL;
627 1.1 hwr
628 1.1 hwr #if NBPFILTER >0
629 1.52 christos if (ifp->if_bpf)
630 1.52 christos bpf_mtap_af(ifp->if_bpf, dst->sa_family, m);
631 1.1 hwr #endif
632 1.1 hwr
633 1.26 martin m->m_flags &= ~(M_BCAST|M_MCAST);
634 1.1 hwr
635 1.75 dyoung switch (sc->sc_proto) {
636 1.62 dyoung case IPPROTO_MOBILE:
637 1.89 dyoung if (dst->sa_family != AF_INET) {
638 1.89 dyoung IF_DROP(&ifp->if_snd);
639 1.89 dyoung m_freem(m);
640 1.89 dyoung error = EINVAL;
641 1.89 dyoung goto end;
642 1.89 dyoung }
643 1.89 dyoung
644 1.89 dyoung if (M_UNWRITABLE(m, sizeof(*ip)) &&
645 1.89 dyoung (m = m_pullup(m, sizeof(*ip))) == NULL) {
646 1.89 dyoung error = ENOBUFS;
647 1.89 dyoung goto end;
648 1.89 dyoung }
649 1.89 dyoung ip = mtod(m, struct ip *);
650 1.3 hwr
651 1.89 dyoung memset(&mob_h, 0, MOB_H_SIZ_L);
652 1.89 dyoung mob_h.proto = (ip->ip_p) << 8;
653 1.89 dyoung mob_h.odst = ip->ip_dst.s_addr;
654 1.89 dyoung ip->ip_dst.s_addr = sc->g_dst.s_addr;
655 1.3 hwr
656 1.89 dyoung /*
657 1.89 dyoung * If the packet comes from our host, we only change
658 1.89 dyoung * the destination address in the IP header.
659 1.89 dyoung * Else we also need to save and change the source
660 1.89 dyoung */
661 1.89 dyoung if (in_hosteq(ip->ip_src, sc->g_src)) {
662 1.89 dyoung msiz = MOB_H_SIZ_S;
663 1.89 dyoung } else {
664 1.89 dyoung mob_h.proto |= MOB_H_SBIT;
665 1.89 dyoung mob_h.osrc = ip->ip_src.s_addr;
666 1.89 dyoung ip->ip_src.s_addr = sc->g_src.s_addr;
667 1.89 dyoung msiz = MOB_H_SIZ_L;
668 1.89 dyoung }
669 1.89 dyoung HTONS(mob_h.proto);
670 1.89 dyoung mob_h.hcrc = gre_in_cksum((u_int16_t *)&mob_h, msiz);
671 1.3 hwr
672 1.89 dyoung M_PREPEND(m, msiz, M_DONTWAIT);
673 1.89 dyoung if (m == NULL) {
674 1.89 dyoung error = ENOBUFS;
675 1.38 itojun goto end;
676 1.3 hwr }
677 1.89 dyoung /* XXX Assuming that ip does not dangle after
678 1.89 dyoung * M_PREPEND. In practice, that's true, but
679 1.90 dyoung * that's not in M_PREPEND's contract.
680 1.89 dyoung */
681 1.89 dyoung memmove(mtod(m, void *), ip, sizeof(*ip));
682 1.89 dyoung ip = mtod(m, struct ip *);
683 1.90 dyoung memcpy(ip + 1, &mob_h, (size_t)msiz);
684 1.89 dyoung ip->ip_len = htons(ntohs(ip->ip_len) + msiz);
685 1.62 dyoung break;
686 1.62 dyoung case IPPROTO_UDP:
687 1.62 dyoung case IPPROTO_GRE:
688 1.62 dyoung GRE_DPRINTF(sc, "%s: dst->sa_family=%d\n", __func__,
689 1.62 dyoung dst->sa_family);
690 1.20 itojun switch (dst->sa_family) {
691 1.1 hwr case AF_INET:
692 1.41 itojun ip = mtod(m, struct ip *);
693 1.56 is ip_tos = ip->ip_tos;
694 1.8 explorer etype = ETHERTYPE_IP;
695 1.1 hwr break;
696 1.1 hwr #ifdef NETATALK
697 1.1 hwr case AF_APPLETALK:
698 1.8 explorer etype = ETHERTYPE_ATALK;
699 1.1 hwr break;
700 1.1 hwr #endif
701 1.56 is #ifdef INET6
702 1.56 is case AF_INET6:
703 1.56 is etype = ETHERTYPE_IPV6;
704 1.56 is break;
705 1.56 is #endif
706 1.1 hwr default:
707 1.1 hwr IF_DROP(&ifp->if_snd);
708 1.1 hwr m_freem(m);
709 1.38 itojun error = EAFNOSUPPORT;
710 1.38 itojun goto end;
711 1.1 hwr }
712 1.62 dyoung break;
713 1.62 dyoung default:
714 1.1 hwr IF_DROP(&ifp->if_snd);
715 1.1 hwr m_freem(m);
716 1.38 itojun error = EINVAL;
717 1.38 itojun goto end;
718 1.1 hwr }
719 1.1 hwr
720 1.75 dyoung switch (sc->sc_proto) {
721 1.62 dyoung case IPPROTO_GRE:
722 1.62 dyoung hlen = sizeof(struct greip);
723 1.62 dyoung break;
724 1.62 dyoung case IPPROTO_UDP:
725 1.62 dyoung hlen = sizeof(struct gre_h);
726 1.62 dyoung break;
727 1.62 dyoung default:
728 1.62 dyoung hlen = 0;
729 1.62 dyoung break;
730 1.62 dyoung }
731 1.62 dyoung
732 1.62 dyoung M_PREPEND(m, hlen, M_DONTWAIT);
733 1.62 dyoung
734 1.62 dyoung if (m == NULL) {
735 1.1 hwr IF_DROP(&ifp->if_snd);
736 1.38 itojun error = ENOBUFS;
737 1.38 itojun goto end;
738 1.1 hwr }
739 1.1 hwr
740 1.75 dyoung switch (sc->sc_proto) {
741 1.62 dyoung case IPPROTO_UDP:
742 1.62 dyoung gh = mtod(m, struct gre_h *);
743 1.62 dyoung memset(gh, 0, sizeof(*gh));
744 1.62 dyoung gh->ptype = htons(etype);
745 1.62 dyoung /* XXX Need to handle IP ToS. Look at how I handle IP TTL. */
746 1.62 dyoung break;
747 1.62 dyoung case IPPROTO_GRE:
748 1.62 dyoung gi = mtod(m, struct greip *);
749 1.62 dyoung gh = &gi->gi_g;
750 1.62 dyoung eip = &gi->gi_i;
751 1.1 hwr /* we don't have any GRE flags for now */
752 1.62 dyoung memset(gh, 0, sizeof(*gh));
753 1.62 dyoung gh->ptype = htons(etype);
754 1.62 dyoung eip->ip_src = sc->g_src;
755 1.62 dyoung eip->ip_dst = sc->g_dst;
756 1.62 dyoung eip->ip_hl = (sizeof(struct ip)) >> 2;
757 1.62 dyoung eip->ip_ttl = ip_gre_ttl;
758 1.62 dyoung eip->ip_tos = ip_tos;
759 1.62 dyoung eip->ip_len = htons(m->m_pkthdr.len);
760 1.75 dyoung eip->ip_p = sc->sc_proto;
761 1.62 dyoung break;
762 1.62 dyoung case IPPROTO_MOBILE:
763 1.62 dyoung eip = mtod(m, struct ip *);
764 1.75 dyoung eip->ip_p = sc->sc_proto;
765 1.62 dyoung break;
766 1.62 dyoung default:
767 1.62 dyoung error = EPROTONOSUPPORT;
768 1.62 dyoung m_freem(m);
769 1.62 dyoung goto end;
770 1.3 hwr }
771 1.1 hwr
772 1.1 hwr ifp->if_opackets++;
773 1.8 explorer ifp->if_obytes += m->m_pkthdr.len;
774 1.62 dyoung
775 1.1 hwr /* send it off */
776 1.75 dyoung if (sc->sc_proto == IPPROTO_UDP) {
777 1.62 dyoung if (IF_QFULL(&sc->sc_snd)) {
778 1.62 dyoung IF_DROP(&sc->sc_snd);
779 1.62 dyoung error = ENOBUFS;
780 1.62 dyoung m_freem(m);
781 1.62 dyoung } else {
782 1.62 dyoung IF_ENQUEUE(&sc->sc_snd, m);
783 1.62 dyoung gre_wakeup(sc);
784 1.62 dyoung error = 0;
785 1.62 dyoung }
786 1.81 joerg goto end;
787 1.81 joerg }
788 1.86 dyoung if (sc->route.ro_rt == NULL)
789 1.86 dyoung rtcache_init(&sc->route);
790 1.86 dyoung else
791 1.86 dyoung rtcache_check(&sc->route);
792 1.91 dyoung if (sc->route.ro_rt == NULL) {
793 1.91 dyoung m_freem(m);
794 1.81 joerg goto end;
795 1.91 dyoung }
796 1.91 dyoung if (sc->route.ro_rt->rt_ifp->if_softc == sc) {
797 1.92 dyoung rtcache_clear(&sc->route);
798 1.91 dyoung m_freem(m);
799 1.91 dyoung } else
800 1.92 dyoung error = ip_output(m, NULL, &sc->route, 0, NULL, NULL);
801 1.38 itojun end:
802 1.8 explorer if (error)
803 1.1 hwr ifp->if_oerrors++;
804 1.87 dyoung return error;
805 1.1 hwr }
806 1.1 hwr
807 1.93 dyoung /* Calling thread must hold sc->sc_mtx. */
808 1.62 dyoung static int
809 1.62 dyoung gre_kick(struct gre_softc *sc)
810 1.62 dyoung {
811 1.62 dyoung int rc;
812 1.62 dyoung struct ifnet *ifp = &sc->sc_if;
813 1.62 dyoung
814 1.75 dyoung if (sc->sc_proto == IPPROTO_UDP && (ifp->if_flags & IFF_UP) == IFF_UP &&
815 1.93 dyoung !sc->sc_running) {
816 1.93 dyoung sc->sc_running = 1;
817 1.93 dyoung mutex_exit(&sc->sc_mtx);
818 1.90 dyoung rc = kthread_create1(gre_thread, sc, NULL, ifp->if_xname);
819 1.93 dyoung mutex_enter(&sc->sc_mtx);
820 1.62 dyoung if (rc != 0)
821 1.93 dyoung gre_stop(sc);
822 1.62 dyoung return rc;
823 1.62 dyoung } else {
824 1.62 dyoung gre_wakeup(sc);
825 1.62 dyoung return 0;
826 1.62 dyoung }
827 1.62 dyoung }
828 1.62 dyoung
829 1.93 dyoung /* Calling thread must hold sc->sc_mtx. */
830 1.62 dyoung static int
831 1.62 dyoung gre_getname(struct socket *so, int req, struct mbuf *nam, struct lwp *l)
832 1.62 dyoung {
833 1.93 dyoung return (*so->so_proto->pr_usrreq)(so, req, NULL, nam, NULL, l);
834 1.62 dyoung }
835 1.62 dyoung
836 1.93 dyoung /* Calling thread must hold sc->sc_mtx. */
837 1.62 dyoung static int
838 1.62 dyoung gre_getsockname(struct socket *so, struct mbuf *nam, struct lwp *l)
839 1.62 dyoung {
840 1.62 dyoung return gre_getname(so, PRU_SOCKADDR, nam, l);
841 1.62 dyoung }
842 1.62 dyoung
843 1.93 dyoung /* Calling thread must hold sc->sc_mtx. */
844 1.62 dyoung static int
845 1.62 dyoung gre_getpeername(struct socket *so, struct mbuf *nam, struct lwp *l)
846 1.62 dyoung {
847 1.62 dyoung return gre_getname(so, PRU_PEERADDR, nam, l);
848 1.62 dyoung }
849 1.62 dyoung
850 1.93 dyoung /* Calling thread must hold sc->sc_mtx. */
851 1.62 dyoung static int
852 1.62 dyoung gre_getnames(struct socket *so, struct lwp *l, struct sockaddr_in *src,
853 1.62 dyoung struct sockaddr_in *dst)
854 1.62 dyoung {
855 1.62 dyoung struct mbuf *m;
856 1.62 dyoung struct sockaddr_in *sin;
857 1.62 dyoung int rc;
858 1.62 dyoung
859 1.62 dyoung if ((m = gre_getsockmbuf(so)) == NULL)
860 1.62 dyoung return ENOBUFS;
861 1.62 dyoung
862 1.62 dyoung sin = mtod(m, struct sockaddr_in *);
863 1.62 dyoung
864 1.62 dyoung if ((rc = gre_getsockname(so, m, l)) != 0)
865 1.62 dyoung goto out;
866 1.62 dyoung if (sin->sin_family != AF_INET) {
867 1.62 dyoung rc = EAFNOSUPPORT;
868 1.62 dyoung goto out;
869 1.62 dyoung }
870 1.62 dyoung *src = *sin;
871 1.62 dyoung
872 1.62 dyoung if ((rc = gre_getpeername(so, m, l)) != 0)
873 1.62 dyoung goto out;
874 1.62 dyoung if (sin->sin_family != AF_INET) {
875 1.62 dyoung rc = EAFNOSUPPORT;
876 1.62 dyoung goto out;
877 1.62 dyoung }
878 1.62 dyoung *dst = *sin;
879 1.62 dyoung
880 1.62 dyoung out:
881 1.62 dyoung m_freem(m);
882 1.62 dyoung return rc;
883 1.62 dyoung }
884 1.62 dyoung
885 1.93 dyoung static void
886 1.93 dyoung gre_closef(struct file **fpp, struct lwp *l)
887 1.93 dyoung {
888 1.93 dyoung struct file *fp = *fpp;
889 1.93 dyoung
890 1.93 dyoung simple_lock(&fp->f_slock);
891 1.93 dyoung FILE_USE(fp);
892 1.93 dyoung closef(fp, l);
893 1.93 dyoung *fpp = NULL;
894 1.93 dyoung }
895 1.93 dyoung
896 1.59 thorpej static int
897 1.88 christos gre_ioctl(struct ifnet *ifp, u_long cmd, void *data)
898 1.1 hwr {
899 1.62 dyoung u_char oproto;
900 1.93 dyoung struct file *fp;
901 1.62 dyoung struct socket *so;
902 1.62 dyoung struct sockaddr_in dst, src;
903 1.62 dyoung struct proc *p = curproc; /* XXX */
904 1.61 ad struct lwp *l = curlwp; /* XXX */
905 1.94 christos struct ifreq *ifr;
906 1.28 itojun struct if_laddrreq *lifr = (struct if_laddrreq *)data;
907 1.8 explorer struct gre_softc *sc = ifp->if_softc;
908 1.1 hwr struct sockaddr_in si;
909 1.8 explorer struct sockaddr *sa = NULL;
910 1.80 christos int error = 0;
911 1.94 christos u_long ocmd = cmd;
912 1.94 christos #ifdef COMPAT_OIFREQ
913 1.95 xtraeme struct oifreq *oifr = NULL;
914 1.94 christos struct ifreq ifrb;
915 1.94 christos
916 1.94 christos cmd = cvtcmd(cmd);
917 1.94 christos if (cmd != ocmd) {
918 1.94 christos oifr = data;
919 1.94 christos data = ifr = &ifrb;
920 1.94 christos ifreqo2n(oifr, ifr);
921 1.94 christos } else
922 1.94 christos #endif
923 1.94 christos ifr = data;
924 1.94 christos
925 1.61 ad switch (cmd) {
926 1.61 ad case SIOCSIFFLAGS:
927 1.61 ad case SIOCSIFMTU:
928 1.61 ad case GRESPROTO:
929 1.61 ad case GRESADDRD:
930 1.61 ad case GRESADDRS:
931 1.62 dyoung case GRESSOCK:
932 1.62 dyoung case GREDSOCK:
933 1.61 ad case SIOCSLIFPHYADDR:
934 1.61 ad case SIOCDIFPHYADDR:
935 1.70 elad if (kauth_authorize_network(l->l_cred, KAUTH_NETWORK_INTERFACE,
936 1.70 elad KAUTH_REQ_NETWORK_INTERFACE_SETPRIV, ifp, (void *)cmd,
937 1.70 elad NULL) != 0)
938 1.87 dyoung return EPERM;
939 1.61 ad break;
940 1.61 ad default:
941 1.61 ad break;
942 1.61 ad }
943 1.1 hwr
944 1.93 dyoung mutex_enter(&sc->sc_mtx);
945 1.20 itojun switch (cmd) {
946 1.20 itojun case SIOCSIFADDR:
947 1.36 itojun ifp->if_flags |= IFF_UP;
948 1.78 dyoung if ((error = gre_kick(sc)) != 0)
949 1.78 dyoung ifp->if_flags &= ~IFF_UP;
950 1.36 itojun break;
951 1.55 perry case SIOCSIFDSTADDR:
952 1.1 hwr break;
953 1.1 hwr case SIOCSIFFLAGS:
954 1.75 dyoung oproto = sc->sc_proto;
955 1.62 dyoung switch (ifr->ifr_flags & (IFF_LINK0|IFF_LINK2)) {
956 1.62 dyoung case IFF_LINK0|IFF_LINK2:
957 1.75 dyoung sc->sc_proto = IPPROTO_UDP;
958 1.62 dyoung if (oproto != IPPROTO_UDP)
959 1.62 dyoung ifp->if_flags &= ~IFF_RUNNING;
960 1.62 dyoung error = gre_kick(sc);
961 1.62 dyoung break;
962 1.62 dyoung case IFF_LINK0:
963 1.75 dyoung sc->sc_proto = IPPROTO_GRE;
964 1.62 dyoung gre_wakeup(sc);
965 1.62 dyoung goto recompute;
966 1.62 dyoung case 0:
967 1.75 dyoung sc->sc_proto = IPPROTO_MOBILE;
968 1.62 dyoung gre_wakeup(sc);
969 1.62 dyoung goto recompute;
970 1.62 dyoung }
971 1.1 hwr break;
972 1.20 itojun case SIOCSIFMTU:
973 1.27 martin if (ifr->ifr_mtu < 576) {
974 1.1 hwr error = EINVAL;
975 1.1 hwr break;
976 1.1 hwr }
977 1.1 hwr ifp->if_mtu = ifr->ifr_mtu;
978 1.1 hwr break;
979 1.1 hwr case SIOCGIFMTU:
980 1.1 hwr ifr->ifr_mtu = sc->sc_if.if_mtu;
981 1.1 hwr break;
982 1.1 hwr case SIOCADDMULTI:
983 1.1 hwr case SIOCDELMULTI:
984 1.8 explorer if (ifr == 0) {
985 1.1 hwr error = EAFNOSUPPORT;
986 1.1 hwr break;
987 1.1 hwr }
988 1.8 explorer switch (ifr->ifr_addr.sa_family) {
989 1.1 hwr #ifdef INET
990 1.1 hwr case AF_INET:
991 1.1 hwr break;
992 1.1 hwr #endif
993 1.56 is #ifdef INET6
994 1.56 is case AF_INET6:
995 1.56 is break;
996 1.56 is #endif
997 1.1 hwr default:
998 1.1 hwr error = EAFNOSUPPORT;
999 1.1 hwr break;
1000 1.1 hwr }
1001 1.1 hwr break;
1002 1.1 hwr case GRESPROTO:
1003 1.75 dyoung oproto = sc->sc_proto;
1004 1.75 dyoung sc->sc_proto = ifr->ifr_flags;
1005 1.75 dyoung switch (sc->sc_proto) {
1006 1.62 dyoung case IPPROTO_UDP:
1007 1.62 dyoung ifp->if_flags |= IFF_LINK0|IFF_LINK2;
1008 1.62 dyoung if (oproto != IPPROTO_UDP)
1009 1.62 dyoung ifp->if_flags &= ~IFF_RUNNING;
1010 1.62 dyoung error = gre_kick(sc);
1011 1.62 dyoung break;
1012 1.40 itojun case IPPROTO_GRE:
1013 1.3 hwr ifp->if_flags |= IFF_LINK0;
1014 1.62 dyoung ifp->if_flags &= ~IFF_LINK2;
1015 1.62 dyoung goto recompute;
1016 1.40 itojun case IPPROTO_MOBILE:
1017 1.62 dyoung ifp->if_flags &= ~(IFF_LINK0|IFF_LINK2);
1018 1.62 dyoung goto recompute;
1019 1.1 hwr default:
1020 1.40 itojun error = EPROTONOSUPPORT;
1021 1.35 itojun break;
1022 1.1 hwr }
1023 1.1 hwr break;
1024 1.1 hwr case GREGPROTO:
1025 1.75 dyoung ifr->ifr_flags = sc->sc_proto;
1026 1.1 hwr break;
1027 1.1 hwr case GRESADDRS:
1028 1.1 hwr case GRESADDRD:
1029 1.1 hwr /*
1030 1.20 itojun * set tunnel endpoints, compute a less specific route
1031 1.20 itojun * to the remote end and mark if as up
1032 1.20 itojun */
1033 1.1 hwr sa = &ifr->ifr_addr;
1034 1.62 dyoung if (cmd == GRESADDRS) {
1035 1.1 hwr sc->g_src = (satosin(sa))->sin_addr;
1036 1.62 dyoung sc->g_srcport = satosin(sa)->sin_port;
1037 1.62 dyoung }
1038 1.62 dyoung if (cmd == GRESADDRD) {
1039 1.75 dyoung if (sc->sc_proto == IPPROTO_UDP &&
1040 1.62 dyoung satosin(sa)->sin_port == 0) {
1041 1.62 dyoung error = EINVAL;
1042 1.62 dyoung break;
1043 1.62 dyoung }
1044 1.1 hwr sc->g_dst = (satosin(sa))->sin_addr;
1045 1.62 dyoung sc->g_dstport = satosin(sa)->sin_port;
1046 1.62 dyoung }
1047 1.30 itojun recompute:
1048 1.75 dyoung if (sc->sc_proto == IPPROTO_UDP ||
1049 1.62 dyoung (sc->g_src.s_addr != INADDR_ANY &&
1050 1.62 dyoung sc->g_dst.s_addr != INADDR_ANY)) {
1051 1.81 joerg rtcache_free(&sc->route);
1052 1.75 dyoung if (sc->sc_proto == IPPROTO_UDP)
1053 1.62 dyoung error = gre_kick(sc);
1054 1.62 dyoung else if (gre_compute_route(sc) == 0)
1055 1.39 itojun ifp->if_flags |= IFF_RUNNING;
1056 1.39 itojun else
1057 1.39 itojun ifp->if_flags &= ~IFF_RUNNING;
1058 1.1 hwr }
1059 1.1 hwr break;
1060 1.1 hwr case GREGADDRS:
1061 1.33 itojun memset(&si, 0, sizeof(si));
1062 1.28 itojun si.sin_family = AF_INET;
1063 1.28 itojun si.sin_len = sizeof(struct sockaddr_in);
1064 1.1 hwr si.sin_addr.s_addr = sc->g_src.s_addr;
1065 1.8 explorer sa = sintosa(&si);
1066 1.1 hwr ifr->ifr_addr = *sa;
1067 1.1 hwr break;
1068 1.1 hwr case GREGADDRD:
1069 1.33 itojun memset(&si, 0, sizeof(si));
1070 1.28 itojun si.sin_family = AF_INET;
1071 1.28 itojun si.sin_len = sizeof(struct sockaddr_in);
1072 1.1 hwr si.sin_addr.s_addr = sc->g_dst.s_addr;
1073 1.8 explorer sa = sintosa(&si);
1074 1.1 hwr ifr->ifr_addr = *sa;
1075 1.28 itojun break;
1076 1.62 dyoung case GREDSOCK:
1077 1.93 dyoung if (sc->sc_proto != IPPROTO_UDP) {
1078 1.93 dyoung error = EINVAL;
1079 1.93 dyoung break;
1080 1.63 dyoung }
1081 1.93 dyoung ifp->if_flags &= ~IFF_UP;
1082 1.93 dyoung gre_wakeup(sc);
1083 1.62 dyoung break;
1084 1.62 dyoung case GRESSOCK:
1085 1.93 dyoung if (sc->sc_proto != IPPROTO_UDP) {
1086 1.93 dyoung error = EINVAL;
1087 1.93 dyoung break;
1088 1.93 dyoung }
1089 1.93 dyoung /* getsock() will FILE_USE() and unlock the descriptor for us */
1090 1.62 dyoung if ((error = getsock(p->p_fd, (int)ifr->ifr_value, &fp)) != 0)
1091 1.62 dyoung break;
1092 1.62 dyoung so = (struct socket *)fp->f_data;
1093 1.62 dyoung if (so->so_type != SOCK_DGRAM) {
1094 1.62 dyoung FILE_UNUSE(fp, NULL);
1095 1.62 dyoung error = EINVAL;
1096 1.62 dyoung break;
1097 1.62 dyoung }
1098 1.62 dyoung /* check address */
1099 1.62 dyoung if ((error = gre_getnames(so, curlwp, &src, &dst)) != 0) {
1100 1.62 dyoung FILE_UNUSE(fp, NULL);
1101 1.62 dyoung break;
1102 1.62 dyoung }
1103 1.62 dyoung
1104 1.93 dyoung /* Increase reference count. Now that our reference
1105 1.93 dyoung * to the file descriptor is counted, this thread
1106 1.93 dyoung * can release our "use" of the descriptor, but it
1107 1.93 dyoung * will not be destroyed by some other thread's
1108 1.93 dyoung * action. This thread needs to release its use,
1109 1.93 dyoung * too, because one and only one thread can have
1110 1.93 dyoung * use of the descriptor at once. The kernel thread
1111 1.93 dyoung * will pick up the use if it needs it.
1112 1.93 dyoung */
1113 1.93 dyoung
1114 1.62 dyoung fp->f_count++;
1115 1.93 dyoung FILE_UNUSE(fp, NULL);
1116 1.93 dyoung
1117 1.93 dyoung while (sc->sc_fp != NULL && error == 0) {
1118 1.93 dyoung error = cv_timedwait_sig(&sc->sc_soparm_cv, &sc->sc_mtx,
1119 1.93 dyoung MAX(1, hz / 2));
1120 1.93 dyoung }
1121 1.93 dyoung if (error == 0) {
1122 1.93 dyoung sc->sc_fp = fp;
1123 1.93 dyoung ifp->if_flags |= IFF_UP;
1124 1.93 dyoung }
1125 1.62 dyoung
1126 1.93 dyoung if (error != 0 || (error = gre_kick(sc)) != 0) {
1127 1.93 dyoung gre_closef(&fp, l);
1128 1.62 dyoung break;
1129 1.62 dyoung }
1130 1.93 dyoung /* fp does not any longer belong to this thread. */
1131 1.62 dyoung sc->g_src = src.sin_addr;
1132 1.62 dyoung sc->g_srcport = src.sin_port;
1133 1.62 dyoung sc->g_dst = dst.sin_addr;
1134 1.62 dyoung sc->g_dstport = dst.sin_port;
1135 1.62 dyoung break;
1136 1.28 itojun case SIOCSLIFPHYADDR:
1137 1.28 itojun if (lifr->addr.ss_family != AF_INET ||
1138 1.31 itojun lifr->dstaddr.ss_family != AF_INET) {
1139 1.31 itojun error = EAFNOSUPPORT;
1140 1.31 itojun break;
1141 1.31 itojun }
1142 1.28 itojun if (lifr->addr.ss_len != sizeof(si) ||
1143 1.31 itojun lifr->dstaddr.ss_len != sizeof(si)) {
1144 1.31 itojun error = EINVAL;
1145 1.31 itojun break;
1146 1.31 itojun }
1147 1.62 dyoung sc->g_src = satosin(&lifr->addr)->sin_addr;
1148 1.62 dyoung sc->g_dst = satosin(&lifr->dstaddr)->sin_addr;
1149 1.62 dyoung sc->g_srcport = satosin(&lifr->addr)->sin_port;
1150 1.62 dyoung sc->g_dstport = satosin(&lifr->dstaddr)->sin_port;
1151 1.30 itojun goto recompute;
1152 1.28 itojun case SIOCDIFPHYADDR:
1153 1.28 itojun sc->g_src.s_addr = INADDR_ANY;
1154 1.28 itojun sc->g_dst.s_addr = INADDR_ANY;
1155 1.62 dyoung sc->g_srcport = 0;
1156 1.62 dyoung sc->g_dstport = 0;
1157 1.62 dyoung goto recompute;
1158 1.28 itojun case SIOCGLIFPHYADDR:
1159 1.28 itojun if (sc->g_src.s_addr == INADDR_ANY ||
1160 1.28 itojun sc->g_dst.s_addr == INADDR_ANY) {
1161 1.28 itojun error = EADDRNOTAVAIL;
1162 1.28 itojun break;
1163 1.28 itojun }
1164 1.33 itojun memset(&si, 0, sizeof(si));
1165 1.28 itojun si.sin_family = AF_INET;
1166 1.28 itojun si.sin_len = sizeof(struct sockaddr_in);
1167 1.62 dyoung si.sin_addr = sc->g_src;
1168 1.75 dyoung if (sc->sc_proto == IPPROTO_UDP)
1169 1.62 dyoung si.sin_port = sc->g_srcport;
1170 1.33 itojun memcpy(&lifr->addr, &si, sizeof(si));
1171 1.62 dyoung si.sin_addr = sc->g_dst;
1172 1.75 dyoung if (sc->sc_proto == IPPROTO_UDP)
1173 1.62 dyoung si.sin_port = sc->g_dstport;
1174 1.33 itojun memcpy(&lifr->dstaddr, &si, sizeof(si));
1175 1.1 hwr break;
1176 1.1 hwr default:
1177 1.1 hwr error = EINVAL;
1178 1.31 itojun break;
1179 1.1 hwr }
1180 1.94 christos #ifdef COMPAT_OIFREQ
1181 1.94 christos if (cmd != ocmd)
1182 1.94 christos ifreqn2o(oifr, ifr);
1183 1.94 christos #endif
1184 1.93 dyoung mutex_exit(&sc->sc_mtx);
1185 1.87 dyoung return error;
1186 1.1 hwr }
1187 1.1 hwr
1188 1.20 itojun /*
1189 1.78 dyoung * Compute a route to our destination.
1190 1.1 hwr */
1191 1.59 thorpej static int
1192 1.8 explorer gre_compute_route(struct gre_softc *sc)
1193 1.1 hwr {
1194 1.1 hwr struct route *ro;
1195 1.92 dyoung union {
1196 1.92 dyoung struct sockaddr dst;
1197 1.92 dyoung struct sockaddr_in dst4;
1198 1.92 dyoung } u;
1199 1.1 hwr
1200 1.8 explorer ro = &sc->route;
1201 1.20 itojun
1202 1.92 dyoung memset(ro, 0, sizeof(*ro));
1203 1.92 dyoung sockaddr_in_init(&u.dst4, &sc->g_dst, 0);
1204 1.92 dyoung rtcache_setdst(ro, &u.dst);
1205 1.8 explorer
1206 1.81 joerg rtcache_init(ro);
1207 1.81 joerg
1208 1.81 joerg if (ro->ro_rt == NULL || ro->ro_rt->rt_ifp->if_softc == sc) {
1209 1.90 dyoung GRE_DPRINTF(sc, "%s: route to %s %s\n", sc->sc_if.if_xname,
1210 1.92 dyoung inet_ntoa(u.dst4.sin_addr),
1211 1.90 dyoung (ro->ro_rt == NULL)
1212 1.90 dyoung ? "does not exist"
1213 1.90 dyoung : "loops back to ourself");
1214 1.81 joerg rtcache_free(ro);
1215 1.81 joerg return EADDRNOTAVAIL;
1216 1.25 martin }
1217 1.25 martin
1218 1.25 martin return 0;
1219 1.1 hwr }
1220 1.1 hwr
/*
 * do a checksum of a buffer - much like in_cksum, which operates on
 * mbufs.
 *
 * p   - start of the buffer, read as host-order 16-bit words.
 * len - buffer length in bytes; an odd trailing byte is padded with
 *       a zero byte to form the last word.
 *
 * Returns the one's complement of the one's-complement sum of the
 * words.  The sum is accumulated in 64 bits and folded until no carry
 * remains, so it cannot wrap for any length representable in `len'.
 */
u_int16_t
gre_in_cksum(u_int16_t *p, u_int len)
{
	u_int64_t sum = 0;
	u_int nwords = len >> 1;

	while (nwords-- != 0)
		sum += *p++;

	if (len & 1) {
		union {
			u_int16_t w;
			u_int8_t c[2];
		} u;
		u.c[0] = *(u_int8_t *)p;
		u.c[1] = 0;
		sum += u.w;
	}

	/* end-around-carry */
	while ((sum >> 16) != 0)
		sum = (sum >> 16) + (sum & 0xffff);
	return (u_int16_t)~sum;
}
1249 1.54 christos #endif
1250 1.54 christos
void	greattach(int);

/*
 * Pseudo-device attach routine.  When INET is configured, set up the
 * list of gre softcs and register the interface cloner; otherwise do
 * nothing.  The `count' argument is not used.
 */
/* ARGSUSED */
void
greattach(int count)
{
#ifdef INET
	LIST_INIT(&gre_softc_list);
	if_clone_attach(&gre_cloner);
#endif
}
1262