if_gre.c revision 1.88.2.6 1 1.88.2.6 ad /* $NetBSD: if_gre.c,v 1.88.2.6 2007/06/09 23:58:11 ad Exp $ */
2 1.4 thorpej
3 1.1 hwr /*
4 1.4 thorpej * Copyright (c) 1998 The NetBSD Foundation, Inc.
5 1.1 hwr * All rights reserved.
6 1.1 hwr *
7 1.1 hwr * This code is derived from software contributed to The NetBSD Foundation
8 1.1 hwr * by Heiko W.Rupp <hwr (at) pilhuhn.de>
9 1.1 hwr *
10 1.56 is * IPv6-over-GRE contributed by Gert Doering <gert (at) greenie.muc.de>
11 1.56 is *
12 1.1 hwr * Redistribution and use in source and binary forms, with or without
13 1.1 hwr * modification, are permitted provided that the following conditions
14 1.1 hwr * are met:
15 1.1 hwr * 1. Redistributions of source code must retain the above copyright
16 1.1 hwr * notice, this list of conditions and the following disclaimer.
17 1.1 hwr * 2. Redistributions in binary form must reproduce the above copyright
18 1.1 hwr * notice, this list of conditions and the following disclaimer in the
19 1.1 hwr * documentation and/or other materials provided with the distribution.
20 1.1 hwr * 3. All advertising materials mentioning features or use of this software
21 1.1 hwr * must display the following acknowledgement:
22 1.1 hwr * This product includes software developed by the NetBSD
23 1.1 hwr * Foundation, Inc. and its contributors.
24 1.1 hwr * 4. Neither the name of The NetBSD Foundation nor the names of its
25 1.1 hwr * contributors may be used to endorse or promote products derived
26 1.1 hwr * from this software without specific prior written permission.
27 1.1 hwr *
28 1.1 hwr * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
29 1.1 hwr * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
30 1.1 hwr * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
31 1.1 hwr * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
32 1.1 hwr * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
33 1.1 hwr * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
34 1.1 hwr * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
35 1.1 hwr * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
36 1.1 hwr * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
37 1.1 hwr * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
38 1.1 hwr * POSSIBILITY OF SUCH DAMAGE.
39 1.1 hwr */
40 1.1 hwr
41 1.1 hwr /*
42 1.1 hwr * Encapsulate L3 protocols into IP
43 1.1 hwr * See RFC 1701 and 1702 for more details.
44 1.1 hwr * If_gre is compatible with Cisco GRE tunnels, so you can
45 1.1 hwr * have a NetBSD box as the other end of a tunnel interface of a Cisco
46 1.1 hwr * router. See gre(4) for more details.
47 1.6 hwr * Also supported: IP in IP encaps (proto 55) as of RFC 2004
48 1.1 hwr */
49 1.22 lukem
50 1.22 lukem #include <sys/cdefs.h>
51 1.88.2.6 ad __KERNEL_RCSID(0, "$NetBSD: if_gre.c,v 1.88.2.6 2007/06/09 23:58:11 ad Exp $");
52 1.1 hwr
53 1.62 dyoung #include "opt_gre.h"
54 1.1 hwr #include "opt_inet.h"
55 1.1 hwr #include "bpfilter.h"
56 1.1 hwr
57 1.54 christos #ifdef INET
58 1.1 hwr #include <sys/param.h>
59 1.62 dyoung #include <sys/file.h>
60 1.62 dyoung #include <sys/filedesc.h>
61 1.1 hwr #include <sys/malloc.h>
62 1.1 hwr #include <sys/mbuf.h>
63 1.13 martin #include <sys/proc.h>
64 1.1 hwr #include <sys/protosw.h>
65 1.1 hwr #include <sys/socket.h>
66 1.62 dyoung #include <sys/socketvar.h>
67 1.1 hwr #include <sys/ioctl.h>
68 1.10 thorpej #include <sys/queue.h>
69 1.1 hwr #if __NetBSD__
70 1.1 hwr #include <sys/systm.h>
71 1.62 dyoung #include <sys/sysctl.h>
72 1.60 elad #include <sys/kauth.h>
73 1.1 hwr #endif
74 1.1 hwr
75 1.88.2.5 ad #include <sys/kernel.h>
76 1.88.2.5 ad #include <sys/mutex.h>
77 1.88.2.5 ad #include <sys/condvar.h>
78 1.62 dyoung #include <sys/kthread.h>
79 1.62 dyoung
80 1.1 hwr #include <machine/cpu.h>
81 1.1 hwr
82 1.1 hwr #include <net/ethertypes.h>
83 1.1 hwr #include <net/if.h>
84 1.1 hwr #include <net/if_types.h>
85 1.1 hwr #include <net/netisr.h>
86 1.1 hwr #include <net/route.h>
87 1.1 hwr
88 1.1 hwr #ifdef INET
89 1.1 hwr #include <netinet/in.h>
90 1.1 hwr #include <netinet/in_systm.h>
91 1.1 hwr #include <netinet/in_var.h>
92 1.1 hwr #include <netinet/ip.h>
93 1.1 hwr #include <netinet/ip_var.h>
94 1.1 hwr #else
95 1.4 thorpej #error "Huh? if_gre without inet?"
96 1.1 hwr #endif
97 1.1 hwr
98 1.1 hwr
99 1.1 hwr #ifdef NETATALK
100 1.1 hwr #include <netatalk/at.h>
101 1.1 hwr #include <netatalk/at_var.h>
102 1.1 hwr #include <netatalk/at_extern.h>
103 1.1 hwr #endif
104 1.1 hwr
105 1.1 hwr #if NBPFILTER > 0
106 1.1 hwr #include <sys/time.h>
107 1.1 hwr #include <net/bpf.h>
108 1.1 hwr #endif
109 1.1 hwr
110 1.1 hwr #include <net/if_gre.h>
111 1.1 hwr
112 1.88.2.6 ad #include <compat/sys/sockio.h>
113 1.20 itojun /*
114 1.27 martin * It is not easy to calculate the right value for a GRE MTU.
115 1.27 martin * We leave this task to the admin and use the same default that
116 1.27 martin * other vendors use.
117 1.20 itojun */
/* Default MTU; gre_clone_create() stores it in sc_if.if_mtu for every new interface. */
118 1.27 martin #define GREMTU 1476
119 1.1 hwr
/*
 * GRE_DPRINTF(sc, fmt, ...): debug trace helper.
 *
 * With GRE_DEBUG defined, the message is printed only when the interface
 * embedded in the softc has IFF_DEBUG set.  Without GRE_DEBUG the macro
 * expands to an empty statement and none of its arguments are evaluated.
 * At least one argument has to follow the format string.
 */
#ifndef GRE_DEBUG
#define	GRE_DPRINTF(softc, fmt, ...)	do { } while (/*CONSTCOND*/0)
#else
#define	GRE_DPRINTF(softc, fmt, ...)					\
	do {								\
		if (((softc)->sc_if.if_flags & IFF_DEBUG) != 0)		\
			printf(fmt, __VA_ARGS__);			\
	} while (/*CONSTCOND*/0)
#endif /* GRE_DEBUG */
129 1.62 dyoung
/* Every gre softc: gre_clone_create() inserts here, gre_clone_destroy() removes. */
130 1.11 thorpej struct gre_softc_head gre_softc_list;
/*
 * TTL for encapsulated traffic: copied into the outer IP header by
 * gre_output() and set as the IP_TTL socket option by gre_socreate1().
 */
131 1.26 martin int ip_gre_ttl = GRE_TTL;
132 1.1 hwr
/* Interface cloner hooks: create/destroy one greN instance. */
133 1.59 thorpej static int gre_clone_create(struct if_clone *, int);
134 1.59 thorpej static int gre_clone_destroy(struct ifnet *);
135 1.10 thorpej
/* Cloner descriptor for interfaces named "gre<unit>". */
136 1.59 thorpej static struct if_clone gre_cloner =
137 1.10 thorpej IF_CLONE_INITIALIZER("gre", gre_clone_create, gre_clone_destroy);
138 1.1 hwr
/* ifnet entry points installed in sc_if by gre_clone_create(). */
139 1.84 dyoung static int gre_output(struct ifnet *, struct mbuf *,
140 1.84 dyoung const struct sockaddr *, struct rtentry *);
141 1.88 christos static int gre_ioctl(struct ifnet *, u_long, void *);
142 1.1 hwr
143 1.59 thorpej static int gre_compute_route(struct gre_softc *sc);
144 1.59 thorpej
/* Helpers for the UDP-encapsulation socket; defined later in this file. */
145 1.88.2.5 ad static void gre_closef(struct file **, struct lwp *);
146 1.62 dyoung static int gre_getsockname(struct socket *, struct mbuf *, struct lwp *);
147 1.62 dyoung static int gre_getpeername(struct socket *, struct mbuf *, struct lwp *);
148 1.62 dyoung static int gre_getnames(struct socket *, struct lwp *, struct sockaddr_in *,
149 1.62 dyoung struct sockaddr_in *);
150 1.62 dyoung
151 1.88.2.5 ad /* Calling thread must hold sc->sc_mtx. */
152 1.62 dyoung static void
153 1.88.2.5 ad gre_stop(struct gre_softc *sc)
154 1.62 dyoung {
155 1.88.2.5 ad sc->sc_running = 0;
156 1.88.2.5 ad cv_signal(&sc->sc_join_cv);
157 1.62 dyoung }
158 1.62 dyoung
159 1.88.2.5 ad /* Calling thread must hold sc->sc_mtx. */
160 1.62 dyoung static void
161 1.88.2.5 ad gre_join(struct gre_softc *sc)
162 1.62 dyoung {
163 1.88.2.5 ad while (sc->sc_running != 0)
164 1.88.2.5 ad cv_wait(&sc->sc_join_cv, &sc->sc_mtx);
165 1.62 dyoung }
166 1.62 dyoung
167 1.88.2.5 ad /* Calling thread must hold sc->sc_mtx. */
168 1.62 dyoung static void
169 1.62 dyoung gre_wakeup(struct gre_softc *sc)
170 1.62 dyoung {
171 1.62 dyoung GRE_DPRINTF(sc, "%s: enter\n", __func__);
172 1.88.2.5 ad sc->sc_haswork = 1;
173 1.88.2.5 ad cv_signal(&sc->sc_work_cv);
174 1.62 dyoung }
175 1.62 dyoung
176 1.59 thorpej static int
177 1.59 thorpej gre_clone_create(struct if_clone *ifc, int unit)
178 1.1 hwr {
179 1.8 explorer struct gre_softc *sc;
180 1.1 hwr
181 1.10 thorpej sc = malloc(sizeof(struct gre_softc), M_DEVBUF, M_WAITOK);
182 1.10 thorpej memset(sc, 0, sizeof(struct gre_softc));
183 1.88.2.5 ad mutex_init(&sc->sc_mtx, MUTEX_DRIVER, IPL_NET);
184 1.88.2.5 ad cv_init(&sc->sc_work_cv, "gre work");
185 1.88.2.5 ad cv_init(&sc->sc_join_cv, "gre join");
186 1.88.2.5 ad cv_init(&sc->sc_soparm_cv, "gre soparm");
187 1.10 thorpej
188 1.50 itojun snprintf(sc->sc_if.if_xname, sizeof(sc->sc_if.if_xname), "%s%d",
189 1.50 itojun ifc->ifc_name, unit);
190 1.10 thorpej sc->sc_if.if_softc = sc;
191 1.51 tron sc->sc_if.if_type = IFT_TUNNEL;
192 1.34 itojun sc->sc_if.if_addrlen = 0;
193 1.10 thorpej sc->sc_if.if_hdrlen = 24; /* IP + GRE */
194 1.15 thorpej sc->sc_if.if_dlt = DLT_NULL;
195 1.20 itojun sc->sc_if.if_mtu = GREMTU;
196 1.10 thorpej sc->sc_if.if_flags = IFF_POINTOPOINT|IFF_MULTICAST;
197 1.10 thorpej sc->sc_if.if_output = gre_output;
198 1.10 thorpej sc->sc_if.if_ioctl = gre_ioctl;
199 1.10 thorpej sc->g_dst.s_addr = sc->g_src.s_addr = INADDR_ANY;
200 1.62 dyoung sc->g_dstport = sc->g_srcport = 0;
201 1.75 dyoung sc->sc_proto = IPPROTO_GRE;
202 1.64 dyoung sc->sc_snd.ifq_maxlen = 256;
203 1.35 itojun sc->sc_if.if_flags |= IFF_LINK0;
204 1.10 thorpej if_attach(&sc->sc_if);
205 1.16 thorpej if_alloc_sadl(&sc->sc_if);
206 1.1 hwr #if NBPFILTER > 0
207 1.14 thorpej bpfattach(&sc->sc_if, DLT_NULL, sizeof(u_int32_t));
208 1.1 hwr #endif
209 1.10 thorpej LIST_INSERT_HEAD(&gre_softc_list, sc, sc_list);
210 1.87 dyoung return 0;
211 1.10 thorpej }
212 1.1 hwr
213 1.59 thorpej static int
214 1.59 thorpej gre_clone_destroy(struct ifnet *ifp)
215 1.10 thorpej {
216 1.10 thorpej struct gre_softc *sc = ifp->if_softc;
217 1.10 thorpej
218 1.10 thorpej LIST_REMOVE(sc, sc_list);
219 1.10 thorpej #if NBPFILTER > 0
220 1.10 thorpej bpfdetach(ifp);
221 1.10 thorpej #endif
222 1.88.2.5 ad if_detach(ifp);
223 1.88.2.5 ad mutex_enter(&sc->sc_mtx);
224 1.62 dyoung gre_wakeup(sc);
225 1.88.2.5 ad gre_join(sc);
226 1.88.2.5 ad mutex_exit(&sc->sc_mtx);
227 1.85 dyoung rtcache_free(&sc->route);
228 1.88.2.5 ad
229 1.88.2.5 ad cv_destroy(&sc->sc_soparm_cv);
230 1.88.2.5 ad cv_destroy(&sc->sc_join_cv);
231 1.88.2.5 ad cv_destroy(&sc->sc_work_cv);
232 1.88.2.5 ad mutex_destroy(&sc->sc_mtx);
233 1.10 thorpej free(sc, M_DEVBUF);
234 1.53 peter
235 1.87 dyoung return 0;
236 1.1 hwr }
237 1.1 hwr
/*
 * gre_receive: socket upcall installed by gre_upcall_add().
 *
 * 'arg' is the softc registered as so_upcallarg; 'so' and 'waitflag' are
 * not used.  All this does is hand off to the worker via gre_wakeup().
 *
 * NOTE(review): gre_wakeup() documents that sc_mtx must be held; nothing
 * here takes it - confirm what the upcall context guarantees.
 */
static void
gre_receive(struct socket *so, void *arg, int waitflag)
{
	struct gre_softc *sc = arg;

	GRE_DPRINTF(sc, "%s: enter\n", __func__);
	gre_wakeup(sc);
}
247 1.62 dyoung
248 1.62 dyoung static void
249 1.88 christos gre_upcall_add(struct socket *so, void *arg)
250 1.62 dyoung {
251 1.62 dyoung /* XXX What if the kernel already set an upcall? */
252 1.62 dyoung so->so_upcallarg = arg;
253 1.62 dyoung so->so_upcall = gre_receive;
254 1.62 dyoung so->so_rcv.sb_flags |= SB_UPCALL;
255 1.62 dyoung }
256 1.62 dyoung
257 1.62 dyoung static void
258 1.62 dyoung gre_upcall_remove(struct socket *so)
259 1.62 dyoung {
260 1.62 dyoung /* XXX What if the kernel already set an upcall? */
261 1.62 dyoung so->so_rcv.sb_flags &= ~SB_UPCALL;
262 1.62 dyoung so->so_upcallarg = NULL;
263 1.62 dyoung so->so_upcall = NULL;
264 1.62 dyoung }
265 1.62 dyoung
266 1.62 dyoung static void
267 1.62 dyoung gre_sodestroy(struct socket **sop)
268 1.62 dyoung {
269 1.62 dyoung gre_upcall_remove(*sop);
270 1.62 dyoung soshutdown(*sop, SHUT_RDWR);
271 1.62 dyoung soclose(*sop);
272 1.62 dyoung *sop = NULL;
273 1.62 dyoung }
274 1.62 dyoung
275 1.62 dyoung static struct mbuf *
276 1.74 christos gre_getsockmbuf(struct socket *so)
277 1.62 dyoung {
278 1.62 dyoung struct mbuf *m;
279 1.62 dyoung
280 1.62 dyoung m = m_get(M_WAIT, MT_SONAME);
281 1.62 dyoung if (m != NULL)
282 1.62 dyoung MCLAIM(m, so->so_mowner);
283 1.62 dyoung return m;
284 1.62 dyoung }
285 1.62 dyoung
286 1.62 dyoung static int
287 1.62 dyoung gre_socreate1(struct gre_softc *sc, struct lwp *l, struct gre_soparm *sp,
288 1.62 dyoung struct socket **sop)
289 1.62 dyoung {
290 1.62 dyoung int rc;
291 1.62 dyoung struct mbuf *m;
292 1.62 dyoung struct sockaddr_in *sin;
293 1.62 dyoung struct socket *so;
294 1.62 dyoung
295 1.62 dyoung GRE_DPRINTF(sc, "%s: enter\n", __func__);
296 1.62 dyoung rc = socreate(AF_INET, sop, SOCK_DGRAM, IPPROTO_UDP, l);
297 1.62 dyoung if (rc != 0) {
298 1.62 dyoung GRE_DPRINTF(sc, "%s: socreate failed\n", __func__);
299 1.62 dyoung return rc;
300 1.62 dyoung }
301 1.62 dyoung
302 1.62 dyoung so = *sop;
303 1.62 dyoung
304 1.88.2.3 ad gre_upcall_add(so, sc);
305 1.62 dyoung if ((m = gre_getsockmbuf(so)) == NULL) {
306 1.62 dyoung rc = ENOBUFS;
307 1.62 dyoung goto out;
308 1.62 dyoung }
309 1.62 dyoung sin = mtod(m, struct sockaddr_in *);
310 1.62 dyoung sin->sin_len = m->m_len = sizeof(struct sockaddr_in);
311 1.62 dyoung sin->sin_family = AF_INET;
312 1.62 dyoung sin->sin_addr = sc->g_src;
313 1.62 dyoung sin->sin_port = sc->g_srcport;
314 1.62 dyoung
315 1.62 dyoung GRE_DPRINTF(sc, "%s: bind 0x%08" PRIx32 " port %d\n", __func__,
316 1.62 dyoung sin->sin_addr.s_addr, ntohs(sin->sin_port));
317 1.62 dyoung if ((rc = sobind(so, m, l)) != 0) {
318 1.62 dyoung GRE_DPRINTF(sc, "%s: sobind failed\n", __func__);
319 1.62 dyoung goto out;
320 1.62 dyoung }
321 1.62 dyoung
322 1.62 dyoung if (sc->g_srcport == 0) {
323 1.69 dyoung if ((rc = gre_getsockname(so, m, l)) != 0) {
324 1.62 dyoung GRE_DPRINTF(sc, "%s: gre_getsockname failed\n",
325 1.62 dyoung __func__);
326 1.62 dyoung goto out;
327 1.62 dyoung }
328 1.62 dyoung sc->g_srcport = sin->sin_port;
329 1.62 dyoung }
330 1.62 dyoung
331 1.62 dyoung sin->sin_addr = sc->g_dst;
332 1.62 dyoung sin->sin_port = sc->g_dstport;
333 1.62 dyoung
334 1.68 dyoung if ((rc = soconnect(so, m, l)) != 0) {
335 1.62 dyoung GRE_DPRINTF(sc, "%s: soconnect failed\n", __func__);
336 1.62 dyoung goto out;
337 1.62 dyoung }
338 1.62 dyoung
339 1.62 dyoung *mtod(m, int *) = ip_gre_ttl;
340 1.76 dyoung m->m_len = sizeof(int);
341 1.62 dyoung rc = (*so->so_proto->pr_ctloutput)(PRCO_SETOPT, so, IPPROTO_IP, IP_TTL,
342 1.62 dyoung &m);
343 1.62 dyoung m = NULL;
344 1.62 dyoung if (rc != 0) {
345 1.62 dyoung printf("%s: setopt ttl failed\n", __func__);
346 1.62 dyoung rc = 0;
347 1.62 dyoung }
348 1.62 dyoung out:
349 1.62 dyoung m_freem(m);
350 1.62 dyoung
351 1.62 dyoung if (rc != 0)
352 1.62 dyoung gre_sodestroy(sop);
353 1.62 dyoung else
354 1.63 dyoung *sp = sc->sc_soparm;
355 1.62 dyoung
356 1.62 dyoung return rc;
357 1.62 dyoung }
358 1.62 dyoung
/*
 * gre_thread1: body of the per-interface worker thread used for
 * GRE-over-UDP (entered from gre_thread()).
 *
 * sc_mtx is taken on entry and released on return; cv_wait() is handed
 * that mutex while the thread sleeps.  Each pass of the outer loop:
 *   - sleeps until sc_haswork is set (see gre_wakeup()), then clears it;
 *   - leaves the loop if the interface is not IFF_UP or sc_proto is no
 *     longer IPPROTO_UDP;
 *   - (re)establishes the socket when there is none yet, when a file was
 *     handed over in sc_fp, or when sc_soparm differs from the cached copy;
 *   - signals sc_soparm_cv;
 *   - drains the socket with non-blocking so_receive calls, feeding each
 *     packet to gre_input3();
 *   - drains sc_snd, sending each queued packet with so_send.
 * On the way out it releases the socket/file, clears IFF_RUNNING when
 * sc_proto is still UDP, flushes sc_snd and calls gre_stop().
 *
 * 'l' is the lwp passed to socreate/sobind/soconnect/so_send.
 */
359 1.62 dyoung static void
360 1.62 dyoung gre_thread1(struct gre_softc *sc, struct lwp *l)
361 1.62 dyoung {
362 1.88.2.5 ad int flags, rc;
363 1.62 dyoung const struct gre_h *gh;
364 1.62 dyoung struct ifnet *ifp = &sc->sc_if;
365 1.62 dyoung struct mbuf *m;
/* so: socket currently in use; fp: file that owns it, or NULL when we created the socket. */
366 1.62 dyoung struct socket *so = NULL;
367 1.62 dyoung struct uio uio;
/* sp: socket parameters the current socket was set up with. */
368 1.62 dyoung struct gre_soparm sp;
369 1.88.2.5 ad struct file *fp = NULL;
370 1.62 dyoung
371 1.62 dyoung GRE_DPRINTF(sc, "%s: enter\n", __func__);
372 1.88.2.5 ad mutex_enter(&sc->sc_mtx);
373 1.62 dyoung
/* Pretend there is work so the first pass does not sleep. */
374 1.88.2.5 ad sc->sc_haswork = 1;
375 1.62 dyoung
376 1.62 dyoung memset(&sp, 0, sizeof(sp));
377 1.62 dyoung memset(&uio, 0, sizeof(uio));
378 1.62 dyoung
379 1.62 dyoung ifp->if_flags |= IFF_RUNNING;
380 1.62 dyoung
381 1.62 dyoung for (;;) {
382 1.88.2.5 ad while (sc->sc_haswork == 0) {
383 1.62 dyoung GRE_DPRINTF(sc, "%s: sleeping\n", __func__);
384 1.88.2.5 ad cv_wait(&sc->sc_work_cv, &sc->sc_mtx);
385 1.62 dyoung }
386 1.88.2.5 ad sc->sc_haswork = 0;
387 1.62 dyoung GRE_DPRINTF(sc, "%s: awake\n", __func__);
/* Exit conditions: interface brought down, or encapsulation switched away from UDP. */
388 1.62 dyoung if ((ifp->if_flags & IFF_UP) != IFF_UP) {
389 1.62 dyoung GRE_DPRINTF(sc, "%s: not up & running; exiting\n",
390 1.62 dyoung __func__);
391 1.62 dyoung break;
392 1.62 dyoung }
393 1.75 dyoung if (sc->sc_proto != IPPROTO_UDP) {
394 1.62 dyoung GRE_DPRINTF(sc, "%s: not udp; exiting\n", __func__);
395 1.62 dyoung break;
396 1.62 dyoung }
397 1.62 dyoung /* XXX optimize */
398 1.88.2.5 ad if (so == NULL || sc->sc_fp != NULL ||
399 1.88.2.5 ad memcmp(&sp, &sc->sc_soparm, sizeof(sp)) != 0) {
400 1.62 dyoung GRE_DPRINTF(sc, "%s: parameters changed\n", __func__);
401 1.62 dyoung
/* Drop the old socket: close the owning file if there is one, else destroy our own socket. */
402 1.88.2.5 ad if (fp != NULL) {
403 1.88.2.5 ad gre_closef(&fp, curlwp);
404 1.62 dyoung so = NULL;
405 1.62 dyoung } else if (so != NULL)
406 1.62 dyoung gre_sodestroy(&so);
407 1.62 dyoung
/* Prefer a file handed over through sc_fp (taking it over); otherwise create a socket. */
408 1.62 dyoung if (sc->sc_fp != NULL) {
409 1.88.2.5 ad fp = sc->sc_fp;
410 1.88.2.5 ad sc->sc_fp = NULL;
411 1.88.2.5 ad so = (struct socket *)fp->f_data;
412 1.88.2.3 ad gre_upcall_add(so, sc);
413 1.63 dyoung sp = sc->sc_soparm;
414 1.62 dyoung } else if (gre_socreate1(sc, l, &sp, &so) != 0)
415 1.62 dyoung goto out;
416 1.62 dyoung }
417 1.88.2.5 ad cv_signal(&sc->sc_soparm_cv);
/* Receive side: pull packets off the socket until it would block. */
418 1.62 dyoung for (;;) {
419 1.62 dyoung flags = MSG_DONTWAIT;
420 1.62 dyoung uio.uio_resid = 1000000;
421 1.62 dyoung rc = (*so->so_receive)(so, NULL, &uio, &m, NULL,
422 1.62 dyoung &flags);
423 1.62 dyoung /* TBD Back off if ECONNREFUSED (indicates
424 1.62 dyoung * ICMP Port Unreachable)?
425 1.62 dyoung */
426 1.62 dyoung if (rc == EWOULDBLOCK) {
427 1.62 dyoung GRE_DPRINTF(sc, "%s: so_receive EWOULDBLOCK\n",
428 1.62 dyoung __func__);
429 1.62 dyoung break;
/* NOTE(review): any other error just retries; a persistent error would keep this loop spinning - confirm. */
430 1.62 dyoung } else if (rc != 0 || m == NULL) {
431 1.62 dyoung GRE_DPRINTF(sc, "%s: rc %d m %p\n",
432 1.62 dyoung ifp->if_xname, rc, (void *)m);
433 1.62 dyoung continue;
434 1.62 dyoung } else
435 1.62 dyoung GRE_DPRINTF(sc, "%s: so_receive ok\n",
436 1.62 dyoung __func__);
/* Make the GRE header contiguous before reading it. */
437 1.62 dyoung if (m->m_len < sizeof(*gh) &&
438 1.62 dyoung (m = m_pullup(m, sizeof(*gh))) == NULL) {
439 1.62 dyoung GRE_DPRINTF(sc, "%s: m_pullup failed\n",
440 1.62 dyoung __func__);
441 1.62 dyoung continue;
442 1.62 dyoung }
443 1.62 dyoung gh = mtod(m, const struct gre_h *);
444 1.62 dyoung
/* hlen 0: no outer IP header in front of the GRE header; mtx_held 1: we hold sc_mtx. A 0 return leaves m ours to free. */
445 1.88.2.5 ad if (gre_input3(sc, m, 0, gh, 1) == 0) {
446 1.62 dyoung GRE_DPRINTF(sc, "%s: dropping unsupported\n",
447 1.62 dyoung __func__);
448 1.62 dyoung m_freem(m);
449 1.62 dyoung }
450 1.62 dyoung }
/* Transmit side: send everything gre_output() queued on sc_snd. */
451 1.62 dyoung for (;;) {
452 1.62 dyoung IF_DEQUEUE(&sc->sc_snd, m);
453 1.62 dyoung if (m == NULL)
454 1.62 dyoung break;
455 1.62 dyoung GRE_DPRINTF(sc, "%s: dequeue\n", __func__);
456 1.62 dyoung if ((so->so_state & SS_ISCONNECTED) == 0) {
457 1.62 dyoung GRE_DPRINTF(sc, "%s: not connected\n",
458 1.62 dyoung __func__);
459 1.62 dyoung m_freem(m);
460 1.62 dyoung continue;
461 1.62 dyoung }
462 1.62 dyoung rc = (*so->so_send)(so, NULL, NULL, m, NULL, 0, l);
463 1.62 dyoung /* XXX handle ENOBUFS? */
464 1.62 dyoung if (rc != 0)
465 1.62 dyoung GRE_DPRINTF(sc, "%s: so_send failed\n",
466 1.62 dyoung __func__);
467 1.62 dyoung }
468 1.62 dyoung }
/* Normal exit: for a file-backed socket only remove our upcall here (the file is closed below); otherwise destroy our own socket. */
469 1.88.2.5 ad if (fp != NULL) {
470 1.62 dyoung GRE_DPRINTF(sc, "%s: removing upcall\n", __func__);
471 1.62 dyoung gre_upcall_remove(so);
472 1.66 dyoung } else if (so != NULL)
473 1.62 dyoung gre_sodestroy(&so);
474 1.62 dyoung out:
475 1.62 dyoung GRE_DPRINTF(sc, "%s: stopping\n", __func__);
476 1.88.2.5 ad if (fp != NULL)
477 1.88.2.5 ad gre_closef(&fp, curlwp);
478 1.75 dyoung if (sc->sc_proto == IPPROTO_UDP)
479 1.62 dyoung ifp->if_flags &= ~IFF_RUNNING;
/* Discard anything still queued for transmission. */
480 1.64 dyoung while (!IF_IS_EMPTY(&sc->sc_snd)) {
481 1.64 dyoung IF_DEQUEUE(&sc->sc_snd, m);
482 1.64 dyoung m_freem(m);
483 1.64 dyoung }
/* Clears sc_running and signals sc_join_cv; sc_mtx is still held until the mutex_exit() below. */
484 1.88.2.5 ad gre_stop(sc);
485 1.62 dyoung /* must not touch sc after this! */
486 1.62 dyoung GRE_DPRINTF(sc, "%s: restore ipl\n", __func__);
487 1.88.2.5 ad mutex_exit(&sc->sc_mtx);
488 1.62 dyoung }
489 1.62 dyoung
490 1.62 dyoung static void
491 1.62 dyoung gre_thread(void *arg)
492 1.62 dyoung {
493 1.62 dyoung struct gre_softc *sc = (struct gre_softc *)arg;
494 1.62 dyoung
495 1.62 dyoung gre_thread1(sc, curlwp);
496 1.62 dyoung /* must not touch sc after this! */
497 1.62 dyoung kthread_exit(0);
498 1.62 dyoung }
499 1.62 dyoung
500 1.88.2.5 ad /* Calling thread must hold sc->sc_mtx. */
501 1.62 dyoung int
502 1.88.2.3 ad gre_input3(struct gre_softc *sc, struct mbuf *m, int hlen,
503 1.88.2.5 ad const struct gre_h *gh, int mtx_held)
504 1.62 dyoung {
505 1.62 dyoung u_int16_t flags;
506 1.62 dyoung #if NBPFILTER > 0
507 1.62 dyoung u_int32_t af = AF_INET; /* af passed to BPF tap */
508 1.62 dyoung #endif
509 1.88.2.5 ad int isr;
510 1.62 dyoung struct ifqueue *ifq;
511 1.62 dyoung
512 1.62 dyoung sc->sc_if.if_ipackets++;
513 1.62 dyoung sc->sc_if.if_ibytes += m->m_pkthdr.len;
514 1.62 dyoung
515 1.88.2.3 ad hlen += sizeof(struct gre_h);
516 1.62 dyoung
517 1.88.2.3 ad /* process GRE flags as packet can be of variable len */
518 1.88.2.3 ad flags = ntohs(gh->flags);
519 1.62 dyoung
520 1.88.2.3 ad /* Checksum & Offset are present */
521 1.88.2.3 ad if ((flags & GRE_CP) | (flags & GRE_RP))
522 1.88.2.3 ad hlen += 4;
523 1.88.2.3 ad /* We don't support routing fields (variable length) */
524 1.88.2.3 ad if (flags & GRE_RP) {
525 1.88.2.3 ad sc->sc_if.if_ierrors++;
526 1.88.2.3 ad return 0;
527 1.88.2.3 ad }
528 1.88.2.3 ad if (flags & GRE_KP)
529 1.88.2.3 ad hlen += 4;
530 1.88.2.3 ad if (flags & GRE_SP)
531 1.88.2.3 ad hlen += 4;
532 1.88.2.3 ad
533 1.88.2.3 ad switch (ntohs(gh->ptype)) { /* ethertypes */
534 1.88.2.3 ad case ETHERTYPE_IP: /* shouldn't need a schednetisr(), as */
535 1.88.2.3 ad ifq = &ipintrq; /* we are in ip_input */
536 1.88.2.3 ad isr = NETISR_IP;
537 1.88.2.3 ad break;
538 1.62 dyoung #ifdef NETATALK
539 1.88.2.3 ad case ETHERTYPE_ATALK:
540 1.88.2.3 ad ifq = &atintrq1;
541 1.88.2.3 ad isr = NETISR_ATALK;
542 1.62 dyoung #if NBPFILTER > 0
543 1.88.2.3 ad af = AF_APPLETALK;
544 1.62 dyoung #endif
545 1.88.2.3 ad break;
546 1.62 dyoung #endif
547 1.62 dyoung #ifdef INET6
548 1.88.2.3 ad case ETHERTYPE_IPV6:
549 1.88.2.3 ad GRE_DPRINTF(sc, "%s: IPv6 packet\n", __func__);
550 1.88.2.3 ad ifq = &ip6intrq;
551 1.88.2.3 ad isr = NETISR_IPV6;
552 1.62 dyoung #if NBPFILTER > 0
553 1.88.2.3 ad af = AF_INET6;
554 1.62 dyoung #endif
555 1.62 dyoung break;
556 1.88.2.3 ad #endif
557 1.88.2.3 ad default: /* others not yet supported */
558 1.88.2.3 ad GRE_DPRINTF(sc, "%s: unhandled ethertype 0x%04x\n", __func__,
559 1.88.2.3 ad ntohs(gh->ptype));
560 1.88.2.3 ad sc->sc_if.if_noproto++;
561 1.87 dyoung return 0;
562 1.62 dyoung }
563 1.62 dyoung
564 1.62 dyoung if (hlen > m->m_pkthdr.len) {
565 1.62 dyoung m_freem(m);
566 1.62 dyoung sc->sc_if.if_ierrors++;
567 1.87 dyoung return EINVAL;
568 1.62 dyoung }
569 1.62 dyoung m_adj(m, hlen);
570 1.62 dyoung
571 1.62 dyoung #if NBPFILTER > 0
572 1.62 dyoung if (sc->sc_if.if_bpf != NULL)
573 1.62 dyoung bpf_mtap_af(sc->sc_if.if_bpf, af, m);
574 1.62 dyoung #endif /*NBPFILTER > 0*/
575 1.62 dyoung
576 1.62 dyoung m->m_pkthdr.rcvif = &sc->sc_if;
577 1.62 dyoung
578 1.88.2.5 ad if (!mtx_held)
579 1.88.2.5 ad mutex_enter(&sc->sc_mtx);
580 1.62 dyoung if (IF_QFULL(ifq)) {
581 1.62 dyoung IF_DROP(ifq);
582 1.62 dyoung m_freem(m);
583 1.62 dyoung } else {
584 1.62 dyoung IF_ENQUEUE(ifq, m);
585 1.62 dyoung }
586 1.62 dyoung /* we need schednetisr since the address family may change */
587 1.62 dyoung schednetisr(isr);
588 1.88.2.5 ad if (!mtx_held)
589 1.88.2.5 ad mutex_exit(&sc->sc_mtx);
590 1.62 dyoung
591 1.87 dyoung return 1; /* packet is done, no further processing needed */
592 1.62 dyoung }
593 1.62 dyoung
594 1.20 itojun /*
595 1.1 hwr * The output routine. Takes a packet and encapsulates it in the protocol
596 1.75 dyoung * given by sc->sc_proto. See also RFC 1701 and RFC 2004
597 1.1 hwr */
/*
 * gre_output: if_output routine of a gre interface.
 *
 *   ifp  the gre interface
 *   m    packet to transmit
 *   dst  destination address; only dst->sa_family is examined
 *   rt   unused in this function
 *
 * Depending on sc->sc_proto the packet is wrapped as
 *   IPPROTO_MOBILE: a mobile-IP header is inserted after the existing IP
 *                   header, whose addresses are rewritten;
 *   IPPROTO_GRE:    an outer IP header plus GRE header is prepended;
 *   IPPROTO_UDP:    only a GRE header is prepended and the packet is
 *                   queued on sc_snd for the worker thread to send.
 * MOBILE and GRE packets are sent with ip_output() over the cached route.
 *
 * Returns 0 or an errno value (ENETDOWN, EINVAL, ENOBUFS, EAFNOSUPPORT,
 * EPROTONOSUPPORT, or whatever ip_output() returns); if_oerrors is bumped
 * for any non-zero result.  On every path visible here the mbuf is either
 * freed, handed on, or already NULL after a failed m_pullup/M_PREPEND.
 */
598 1.59 thorpej static int
599 1.84 dyoung gre_output(struct ifnet *ifp, struct mbuf *m, const struct sockaddr *dst,
600 1.74 christos struct rtentry *rt)
601 1.1 hwr {
602 1.88.2.3 ad int error = 0, hlen, msiz;
603 1.10 thorpej struct gre_softc *sc = ifp->if_softc;
604 1.62 dyoung struct greip *gi;
605 1.62 dyoung struct gre_h *gh;
606 1.62 dyoung struct ip *eip, *ip;
607 1.56 is u_int8_t ip_tos = 0;
608 1.48 itojun u_int16_t etype = 0;
609 1.20 itojun struct mobile_h mob_h;
610 1.24 martin
/*
 * Refuse to send while the tunnel is down or has no endpoints.
 * NOTE(review): the flag test is true only when NEITHER IFF_UP nor
 * IFF_RUNNING is set - confirm that requiring both was not intended.
 */
611 1.39 itojun if ((ifp->if_flags & (IFF_UP | IFF_RUNNING)) == 0 ||
612 1.37 itojun sc->g_src.s_addr == INADDR_ANY || sc->g_dst.s_addr == INADDR_ANY) {
613 1.37 itojun m_freem(m);
614 1.38 itojun error = ENETDOWN;
615 1.38 itojun goto end;
616 1.37 itojun }
617 1.1 hwr
618 1.62 dyoung gi = NULL;
619 1.41 itojun ip = NULL;
620 1.1 hwr
/* Let BPF listeners see the packet before encapsulation. */
621 1.1 hwr #if NBPFILTER >0
622 1.52 christos if (ifp->if_bpf)
623 1.52 christos bpf_mtap_af(ifp->if_bpf, dst->sa_family, m);
624 1.1 hwr #endif
625 1.1 hwr
626 1.26 martin m->m_flags &= ~(M_BCAST|M_MCAST);
627 1.1 hwr
/* Stage 1: per-encapsulation preparation (MOBILE does all of its header work here). */
628 1.75 dyoung switch (sc->sc_proto) {
629 1.62 dyoung case IPPROTO_MOBILE:
630 1.88.2.3 ad if (dst->sa_family != AF_INET) {
631 1.3 hwr IF_DROP(&ifp->if_snd);
632 1.3 hwr m_freem(m);
633 1.38 itojun error = EINVAL;
634 1.38 itojun goto end;
635 1.3 hwr }
636 1.88.2.3 ad
/* The IP header is modified in place, so it must be contiguous and writable. */
637 1.88.2.3 ad if (M_UNWRITABLE(m, sizeof(*ip)) &&
638 1.88.2.3 ad (m = m_pullup(m, sizeof(*ip))) == NULL) {
639 1.88.2.3 ad error = ENOBUFS;
640 1.88.2.3 ad goto end;
641 1.88.2.3 ad }
642 1.88.2.3 ad ip = mtod(m, struct ip *);
643 1.88.2.3 ad
/* Save the original protocol and destination in the mobile header, then retarget the packet at the tunnel peer. */
644 1.88.2.3 ad memset(&mob_h, 0, MOB_H_SIZ_L);
645 1.88.2.3 ad mob_h.proto = (ip->ip_p) << 8;
646 1.88.2.3 ad mob_h.odst = ip->ip_dst.s_addr;
647 1.88.2.3 ad ip->ip_dst.s_addr = sc->g_dst.s_addr;
648 1.88.2.3 ad
649 1.88.2.3 ad /*
650 1.88.2.3 ad * If the packet comes from our host, we only change
651 1.88.2.3 ad * the destination address in the IP header.
652 1.88.2.3 ad * Else we also need to save and change the source
653 1.88.2.3 ad */
654 1.88.2.3 ad if (in_hosteq(ip->ip_src, sc->g_src)) {
655 1.88.2.3 ad msiz = MOB_H_SIZ_S;
656 1.88.2.3 ad } else {
657 1.88.2.3 ad mob_h.proto |= MOB_H_SBIT;
658 1.88.2.3 ad mob_h.osrc = ip->ip_src.s_addr;
659 1.88.2.3 ad ip->ip_src.s_addr = sc->g_src.s_addr;
660 1.88.2.3 ad msiz = MOB_H_SIZ_L;
661 1.88.2.3 ad }
662 1.88.2.3 ad HTONS(mob_h.proto);
663 1.88.2.3 ad mob_h.hcrc = gre_in_cksum((u_int16_t *)&mob_h, msiz);
664 1.88.2.3 ad
/* Open msiz bytes at the front, slide the IP header down into them and drop the mobile header in right behind it. */
665 1.88.2.3 ad M_PREPEND(m, msiz, M_DONTWAIT);
666 1.88.2.3 ad if (m == NULL) {
667 1.88.2.3 ad error = ENOBUFS;
668 1.88.2.3 ad goto end;
669 1.88.2.3 ad }
670 1.88.2.3 ad /* XXX Assuming that ip does not dangle after
671 1.88.2.3 ad * M_PREPEND. In practice, that's true, but
672 1.88.2.3 ad * that's not in M_PREPEND's contract.
673 1.88.2.3 ad */
674 1.88.2.3 ad memmove(mtod(m, void *), ip, sizeof(*ip));
675 1.88.2.3 ad ip = mtod(m, struct ip *);
676 1.88.2.3 ad memcpy(ip + 1, &mob_h, (size_t)msiz);
677 1.88.2.3 ad ip->ip_len = htons(ntohs(ip->ip_len) + msiz);
678 1.62 dyoung break;
679 1.62 dyoung case IPPROTO_UDP:
680 1.62 dyoung case IPPROTO_GRE:
681 1.62 dyoung GRE_DPRINTF(sc, "%s: dst->sa_family=%d\n", __func__,
682 1.62 dyoung dst->sa_family);
/* Map the payload's address family to the ethertype carried in the GRE header. */
683 1.20 itojun switch (dst->sa_family) {
684 1.1 hwr case AF_INET:
/* For IPv4 payloads the inner ToS is remembered and later copied to the outer header (GRE case). */
685 1.41 itojun ip = mtod(m, struct ip *);
686 1.56 is ip_tos = ip->ip_tos;
687 1.8 explorer etype = ETHERTYPE_IP;
688 1.1 hwr break;
689 1.1 hwr #ifdef NETATALK
690 1.1 hwr case AF_APPLETALK:
691 1.8 explorer etype = ETHERTYPE_ATALK;
692 1.1 hwr break;
693 1.1 hwr #endif
694 1.56 is #ifdef INET6
695 1.56 is case AF_INET6:
696 1.56 is etype = ETHERTYPE_IPV6;
697 1.56 is break;
698 1.56 is #endif
699 1.1 hwr default:
700 1.1 hwr IF_DROP(&ifp->if_snd);
701 1.1 hwr m_freem(m);
702 1.38 itojun error = EAFNOSUPPORT;
703 1.38 itojun goto end;
704 1.1 hwr }
705 1.62 dyoung break;
706 1.62 dyoung default:
707 1.1 hwr IF_DROP(&ifp->if_snd);
708 1.1 hwr m_freem(m);
709 1.38 itojun error = EINVAL;
710 1.38 itojun goto end;
711 1.1 hwr }
712 1.1 hwr
/* Stage 2: size of the header still to be prepended (0 for MOBILE, which was handled above). */
713 1.75 dyoung switch (sc->sc_proto) {
714 1.62 dyoung case IPPROTO_GRE:
715 1.62 dyoung hlen = sizeof(struct greip);
716 1.62 dyoung break;
717 1.62 dyoung case IPPROTO_UDP:
718 1.62 dyoung hlen = sizeof(struct gre_h);
719 1.62 dyoung break;
720 1.62 dyoung default:
721 1.62 dyoung hlen = 0;
722 1.62 dyoung break;
723 1.62 dyoung }
724 1.62 dyoung
725 1.62 dyoung M_PREPEND(m, hlen, M_DONTWAIT);
726 1.62 dyoung
727 1.62 dyoung if (m == NULL) {
728 1.1 hwr IF_DROP(&ifp->if_snd);
729 1.38 itojun error = ENOBUFS;
730 1.38 itojun goto end;
731 1.1 hwr }
732 1.1 hwr
/* Stage 3: fill in the freshly prepended header(s). */
733 1.75 dyoung switch (sc->sc_proto) {
734 1.62 dyoung case IPPROTO_UDP:
735 1.62 dyoung gh = mtod(m, struct gre_h *);
736 1.62 dyoung memset(gh, 0, sizeof(*gh));
737 1.62 dyoung gh->ptype = htons(etype);
738 1.62 dyoung /* XXX Need to handle IP ToS. Look at how I handle IP TTL. */
739 1.62 dyoung break;
740 1.62 dyoung case IPPROTO_GRE:
741 1.62 dyoung gi = mtod(m, struct greip *);
742 1.62 dyoung gh = &gi->gi_g;
743 1.62 dyoung eip = &gi->gi_i;
744 1.1 hwr /* we don't have any GRE flags for now */
745 1.62 dyoung memset(gh, 0, sizeof(*gh));
746 1.62 dyoung gh->ptype = htons(etype);
747 1.62 dyoung eip->ip_src = sc->g_src;
748 1.62 dyoung eip->ip_dst = sc->g_dst;
749 1.62 dyoung eip->ip_hl = (sizeof(struct ip)) >> 2;
750 1.62 dyoung eip->ip_ttl = ip_gre_ttl;
751 1.62 dyoung eip->ip_tos = ip_tos;
752 1.62 dyoung eip->ip_len = htons(m->m_pkthdr.len);
753 1.75 dyoung eip->ip_p = sc->sc_proto;
754 1.62 dyoung break;
755 1.62 dyoung case IPPROTO_MOBILE:
756 1.62 dyoung eip = mtod(m, struct ip *);
757 1.75 dyoung eip->ip_p = sc->sc_proto;
758 1.62 dyoung break;
759 1.62 dyoung default:
760 1.62 dyoung error = EPROTONOSUPPORT;
761 1.62 dyoung m_freem(m);
762 1.62 dyoung goto end;
763 1.3 hwr }
764 1.1 hwr
765 1.1 hwr ifp->if_opackets++;
766 1.8 explorer ifp->if_obytes += m->m_pkthdr.len;
767 1.62 dyoung
768 1.1 hwr /* send it off */
/*
 * UDP encapsulation: hand the packet to the worker thread via sc_snd.
 * NOTE(review): gre_wakeup() documents that sc_mtx must be held and the
 * worker dequeues sc_snd under sc_mtx, but no mutex is taken in this
 * function - confirm the locking expected of if_output callers.
 */
769 1.75 dyoung if (sc->sc_proto == IPPROTO_UDP) {
770 1.62 dyoung if (IF_QFULL(&sc->sc_snd)) {
771 1.62 dyoung IF_DROP(&sc->sc_snd);
772 1.62 dyoung error = ENOBUFS;
773 1.62 dyoung m_freem(m);
774 1.62 dyoung } else {
775 1.62 dyoung IF_ENQUEUE(&sc->sc_snd, m);
776 1.62 dyoung gre_wakeup(sc);
777 1.62 dyoung error = 0;
778 1.62 dyoung }
779 1.81 joerg goto end;
780 1.81 joerg }
/* GRE / MOBILE: make sure the cached route to the tunnel peer is usable. */
781 1.86 dyoung if (sc->route.ro_rt == NULL)
782 1.86 dyoung rtcache_init(&sc->route);
783 1.86 dyoung else
784 1.86 dyoung rtcache_check(&sc->route);
/* No route: the packet is dropped, and error is left at 0 so the caller sees success. */
785 1.88.2.5 ad if (sc->route.ro_rt == NULL) {
786 1.88.2.5 ad m_freem(m);
787 1.81 joerg goto end;
788 1.88.2.5 ad }
/* A route that points back at this very interface is discarded and the packet dropped (also with error 0). */
789 1.88.2.5 ad if (sc->route.ro_rt->rt_ifp->if_softc == sc) {
790 1.88.2.5 ad rtcache_clear(&sc->route);
791 1.88.2.5 ad m_freem(m);
792 1.88.2.5 ad } else
793 1.88.2.5 ad error = ip_output(m, NULL, &sc->route, 0, NULL, NULL);
794 1.38 itojun end:
795 1.8 explorer if (error)
796 1.1 hwr ifp->if_oerrors++;
797 1.87 dyoung return error;
798 1.1 hwr }
799 1.1 hwr
800 1.88.2.5 ad /* Calling thread must hold sc->sc_mtx. */
801 1.62 dyoung static int
802 1.62 dyoung gre_kick(struct gre_softc *sc)
803 1.62 dyoung {
804 1.62 dyoung int rc;
805 1.62 dyoung struct ifnet *ifp = &sc->sc_if;
806 1.62 dyoung
807 1.75 dyoung if (sc->sc_proto == IPPROTO_UDP && (ifp->if_flags & IFF_UP) == IFF_UP &&
808 1.88.2.5 ad !sc->sc_running) {
809 1.88.2.5 ad sc->sc_running = 1;
810 1.88.2.5 ad rc = kthread_create(PRI_NONE, 0, NULL, gre_thread, sc,
811 1.88.2.1 ad NULL, ifp->if_xname);
812 1.62 dyoung if (rc != 0)
813 1.88.2.5 ad gre_stop(sc);
814 1.62 dyoung return rc;
815 1.62 dyoung } else {
816 1.62 dyoung gre_wakeup(sc);
817 1.62 dyoung return 0;
818 1.62 dyoung }
819 1.62 dyoung }
820 1.62 dyoung
821 1.88.2.5 ad /* Calling thread must hold sc->sc_mtx. */
822 1.62 dyoung static int
823 1.62 dyoung gre_getname(struct socket *so, int req, struct mbuf *nam, struct lwp *l)
824 1.62 dyoung {
825 1.88.2.5 ad return (*so->so_proto->pr_usrreq)(so, req, NULL, nam, NULL, l);
826 1.62 dyoung }
827 1.62 dyoung
828 1.88.2.5 ad /* Calling thread must hold sc->sc_mtx. */
829 1.62 dyoung static int
830 1.62 dyoung gre_getsockname(struct socket *so, struct mbuf *nam, struct lwp *l)
831 1.62 dyoung {
832 1.62 dyoung return gre_getname(so, PRU_SOCKADDR, nam, l);
833 1.62 dyoung }
834 1.62 dyoung
835 1.88.2.5 ad /* Calling thread must hold sc->sc_mtx. */
836 1.62 dyoung static int
837 1.62 dyoung gre_getpeername(struct socket *so, struct mbuf *nam, struct lwp *l)
838 1.62 dyoung {
839 1.62 dyoung return gre_getname(so, PRU_PEERADDR, nam, l);
840 1.62 dyoung }
841 1.62 dyoung
842 1.88.2.5 ad /* Calling thread must hold sc->sc_mtx. */
843 1.62 dyoung static int
844 1.62 dyoung gre_getnames(struct socket *so, struct lwp *l, struct sockaddr_in *src,
845 1.62 dyoung struct sockaddr_in *dst)
846 1.62 dyoung {
847 1.62 dyoung struct mbuf *m;
848 1.62 dyoung struct sockaddr_in *sin;
849 1.62 dyoung int rc;
850 1.62 dyoung
851 1.62 dyoung if ((m = gre_getsockmbuf(so)) == NULL)
852 1.62 dyoung return ENOBUFS;
853 1.62 dyoung
854 1.62 dyoung sin = mtod(m, struct sockaddr_in *);
855 1.62 dyoung
856 1.62 dyoung if ((rc = gre_getsockname(so, m, l)) != 0)
857 1.62 dyoung goto out;
858 1.62 dyoung if (sin->sin_family != AF_INET) {
859 1.62 dyoung rc = EAFNOSUPPORT;
860 1.62 dyoung goto out;
861 1.62 dyoung }
862 1.62 dyoung *src = *sin;
863 1.62 dyoung
864 1.62 dyoung if ((rc = gre_getpeername(so, m, l)) != 0)
865 1.62 dyoung goto out;
866 1.62 dyoung if (sin->sin_family != AF_INET) {
867 1.62 dyoung rc = EAFNOSUPPORT;
868 1.62 dyoung goto out;
869 1.62 dyoung }
870 1.62 dyoung *dst = *sin;
871 1.62 dyoung
872 1.62 dyoung out:
873 1.62 dyoung m_freem(m);
874 1.62 dyoung return rc;
875 1.62 dyoung }
876 1.62 dyoung
877 1.88.2.5 ad static void
878 1.88.2.5 ad gre_closef(struct file **fpp, struct lwp *l)
879 1.88.2.5 ad {
880 1.88.2.5 ad struct file *fp = *fpp;
881 1.88.2.5 ad
882 1.88.2.6 ad mutex_enter(&fp->f_lock);
883 1.88.2.5 ad FILE_USE(fp);
884 1.88.2.5 ad closef(fp, l);
885 1.88.2.5 ad *fpp = NULL;
886 1.88.2.5 ad }
887 1.88.2.5 ad
888 1.59 thorpej static int
889 1.88 christos gre_ioctl(struct ifnet *ifp, u_long cmd, void *data)
890 1.1 hwr {
891 1.62 dyoung u_char oproto;
892 1.88.2.5 ad struct file *fp;
893 1.62 dyoung struct socket *so;
894 1.62 dyoung struct sockaddr_in dst, src;
895 1.62 dyoung struct proc *p = curproc; /* XXX */
896 1.61 ad struct lwp *l = curlwp; /* XXX */
897 1.88.2.6 ad struct ifreq *ifr;
898 1.28 itojun struct if_laddrreq *lifr = (struct if_laddrreq *)data;
899 1.8 explorer struct gre_softc *sc = ifp->if_softc;
900 1.1 hwr struct sockaddr_in si;
901 1.8 explorer struct sockaddr *sa = NULL;
902 1.80 christos int error = 0;
903 1.88.2.6 ad #ifdef COMPAT_OIFREQ
904 1.88.2.6 ad u_long ocmd = cmd;
905 1.88.2.6 ad struct oifreq *oifr = NULL;
906 1.88.2.6 ad struct ifreq ifrb;
907 1.88.2.6 ad
908 1.88.2.6 ad cmd = cvtcmd(cmd);
909 1.88.2.6 ad if (cmd != ocmd) {
910 1.88.2.6 ad oifr = data;
911 1.88.2.6 ad data = ifr = &ifrb;
912 1.88.2.6 ad ifreqo2n(oifr, ifr);
913 1.88.2.6 ad } else
914 1.88.2.6 ad #endif
915 1.88.2.6 ad ifr = data;
916 1.88.2.6 ad
917 1.61 ad switch (cmd) {
918 1.61 ad case SIOCSIFFLAGS:
919 1.61 ad case SIOCSIFMTU:
920 1.61 ad case GRESPROTO:
921 1.61 ad case GRESADDRD:
922 1.61 ad case GRESADDRS:
923 1.62 dyoung case GRESSOCK:
924 1.62 dyoung case GREDSOCK:
925 1.61 ad case SIOCSLIFPHYADDR:
926 1.61 ad case SIOCDIFPHYADDR:
927 1.70 elad if (kauth_authorize_network(l->l_cred, KAUTH_NETWORK_INTERFACE,
928 1.70 elad KAUTH_REQ_NETWORK_INTERFACE_SETPRIV, ifp, (void *)cmd,
929 1.70 elad NULL) != 0)
930 1.87 dyoung return EPERM;
931 1.61 ad break;
932 1.61 ad default:
933 1.61 ad break;
934 1.61 ad }
935 1.1 hwr
936 1.88.2.5 ad mutex_enter(&sc->sc_mtx);
937 1.20 itojun switch (cmd) {
938 1.20 itojun case SIOCSIFADDR:
939 1.36 itojun ifp->if_flags |= IFF_UP;
940 1.78 dyoung if ((error = gre_kick(sc)) != 0)
941 1.78 dyoung ifp->if_flags &= ~IFF_UP;
942 1.36 itojun break;
943 1.55 perry case SIOCSIFDSTADDR:
944 1.1 hwr break;
945 1.1 hwr case SIOCSIFFLAGS:
946 1.75 dyoung oproto = sc->sc_proto;
947 1.62 dyoung switch (ifr->ifr_flags & (IFF_LINK0|IFF_LINK2)) {
948 1.62 dyoung case IFF_LINK0|IFF_LINK2:
949 1.75 dyoung sc->sc_proto = IPPROTO_UDP;
950 1.62 dyoung if (oproto != IPPROTO_UDP)
951 1.62 dyoung ifp->if_flags &= ~IFF_RUNNING;
952 1.62 dyoung error = gre_kick(sc);
953 1.62 dyoung break;
954 1.62 dyoung case IFF_LINK0:
955 1.75 dyoung sc->sc_proto = IPPROTO_GRE;
956 1.62 dyoung gre_wakeup(sc);
957 1.62 dyoung goto recompute;
958 1.62 dyoung case 0:
959 1.75 dyoung sc->sc_proto = IPPROTO_MOBILE;
960 1.62 dyoung gre_wakeup(sc);
961 1.62 dyoung goto recompute;
962 1.62 dyoung }
963 1.1 hwr break;
964 1.20 itojun case SIOCSIFMTU:
965 1.27 martin if (ifr->ifr_mtu < 576) {
966 1.1 hwr error = EINVAL;
967 1.1 hwr break;
968 1.1 hwr }
969 1.1 hwr ifp->if_mtu = ifr->ifr_mtu;
970 1.1 hwr break;
971 1.1 hwr case SIOCGIFMTU:
972 1.1 hwr ifr->ifr_mtu = sc->sc_if.if_mtu;
973 1.1 hwr break;
974 1.1 hwr case SIOCADDMULTI:
975 1.1 hwr case SIOCDELMULTI:
976 1.8 explorer if (ifr == 0) {
977 1.1 hwr error = EAFNOSUPPORT;
978 1.1 hwr break;
979 1.1 hwr }
980 1.8 explorer switch (ifr->ifr_addr.sa_family) {
981 1.1 hwr #ifdef INET
982 1.1 hwr case AF_INET:
983 1.1 hwr break;
984 1.1 hwr #endif
985 1.56 is #ifdef INET6
986 1.56 is case AF_INET6:
987 1.56 is break;
988 1.56 is #endif
989 1.1 hwr default:
990 1.1 hwr error = EAFNOSUPPORT;
991 1.1 hwr break;
992 1.1 hwr }
993 1.1 hwr break;
994 1.1 hwr case GRESPROTO:
995 1.75 dyoung oproto = sc->sc_proto;
996 1.75 dyoung sc->sc_proto = ifr->ifr_flags;
997 1.75 dyoung switch (sc->sc_proto) {
998 1.62 dyoung case IPPROTO_UDP:
999 1.62 dyoung ifp->if_flags |= IFF_LINK0|IFF_LINK2;
1000 1.62 dyoung if (oproto != IPPROTO_UDP)
1001 1.62 dyoung ifp->if_flags &= ~IFF_RUNNING;
1002 1.62 dyoung error = gre_kick(sc);
1003 1.62 dyoung break;
1004 1.40 itojun case IPPROTO_GRE:
1005 1.3 hwr ifp->if_flags |= IFF_LINK0;
1006 1.62 dyoung ifp->if_flags &= ~IFF_LINK2;
1007 1.62 dyoung goto recompute;
1008 1.40 itojun case IPPROTO_MOBILE:
1009 1.62 dyoung ifp->if_flags &= ~(IFF_LINK0|IFF_LINK2);
1010 1.62 dyoung goto recompute;
1011 1.1 hwr default:
1012 1.40 itojun error = EPROTONOSUPPORT;
1013 1.35 itojun break;
1014 1.1 hwr }
1015 1.1 hwr break;
1016 1.1 hwr case GREGPROTO:
1017 1.75 dyoung ifr->ifr_flags = sc->sc_proto;
1018 1.1 hwr break;
1019 1.1 hwr case GRESADDRS:
1020 1.1 hwr case GRESADDRD:
1021 1.1 hwr /*
1022 1.20 itojun * set tunnel endpoints, compute a less specific route
1023 1.20 itojun * to the remote end and mark if as up
1024 1.20 itojun */
1025 1.1 hwr sa = &ifr->ifr_addr;
1026 1.62 dyoung if (cmd == GRESADDRS) {
1027 1.1 hwr sc->g_src = (satosin(sa))->sin_addr;
1028 1.62 dyoung sc->g_srcport = satosin(sa)->sin_port;
1029 1.62 dyoung }
1030 1.62 dyoung if (cmd == GRESADDRD) {
1031 1.75 dyoung if (sc->sc_proto == IPPROTO_UDP &&
1032 1.62 dyoung satosin(sa)->sin_port == 0) {
1033 1.62 dyoung error = EINVAL;
1034 1.62 dyoung break;
1035 1.62 dyoung }
1036 1.1 hwr sc->g_dst = (satosin(sa))->sin_addr;
1037 1.62 dyoung sc->g_dstport = satosin(sa)->sin_port;
1038 1.62 dyoung }
1039 1.30 itojun recompute:
1040 1.75 dyoung if (sc->sc_proto == IPPROTO_UDP ||
1041 1.62 dyoung (sc->g_src.s_addr != INADDR_ANY &&
1042 1.62 dyoung sc->g_dst.s_addr != INADDR_ANY)) {
1043 1.81 joerg rtcache_free(&sc->route);
1044 1.75 dyoung if (sc->sc_proto == IPPROTO_UDP)
1045 1.62 dyoung error = gre_kick(sc);
1046 1.62 dyoung else if (gre_compute_route(sc) == 0)
1047 1.39 itojun ifp->if_flags |= IFF_RUNNING;
1048 1.39 itojun else
1049 1.39 itojun ifp->if_flags &= ~IFF_RUNNING;
1050 1.1 hwr }
1051 1.1 hwr break;
1052 1.1 hwr case GREGADDRS:
1053 1.33 itojun memset(&si, 0, sizeof(si));
1054 1.28 itojun si.sin_family = AF_INET;
1055 1.28 itojun si.sin_len = sizeof(struct sockaddr_in);
1056 1.1 hwr si.sin_addr.s_addr = sc->g_src.s_addr;
1057 1.8 explorer sa = sintosa(&si);
1058 1.1 hwr ifr->ifr_addr = *sa;
1059 1.1 hwr break;
1060 1.1 hwr case GREGADDRD:
1061 1.33 itojun memset(&si, 0, sizeof(si));
1062 1.28 itojun si.sin_family = AF_INET;
1063 1.28 itojun si.sin_len = sizeof(struct sockaddr_in);
1064 1.1 hwr si.sin_addr.s_addr = sc->g_dst.s_addr;
1065 1.8 explorer sa = sintosa(&si);
1066 1.1 hwr ifr->ifr_addr = *sa;
1067 1.28 itojun break;
1068 1.62 dyoung case GREDSOCK:
1069 1.88.2.5 ad if (sc->sc_proto != IPPROTO_UDP) {
1070 1.88.2.5 ad error = EINVAL;
1071 1.88.2.5 ad break;
1072 1.63 dyoung }
1073 1.88.2.5 ad ifp->if_flags &= ~IFF_UP;
1074 1.88.2.5 ad gre_wakeup(sc);
1075 1.62 dyoung break;
1076 1.62 dyoung case GRESSOCK:
1077 1.88.2.5 ad if (sc->sc_proto != IPPROTO_UDP) {
1078 1.88.2.5 ad error = EINVAL;
1079 1.88.2.5 ad break;
1080 1.88.2.5 ad }
1081 1.88.2.5 ad /* getsock() will FILE_USE() and unlock the descriptor for us */
1082 1.62 dyoung if ((error = getsock(p->p_fd, (int)ifr->ifr_value, &fp)) != 0)
1083 1.62 dyoung break;
1084 1.62 dyoung so = (struct socket *)fp->f_data;
1085 1.62 dyoung if (so->so_type != SOCK_DGRAM) {
1086 1.62 dyoung FILE_UNUSE(fp, NULL);
1087 1.62 dyoung error = EINVAL;
1088 1.62 dyoung break;
1089 1.62 dyoung }
1090 1.62 dyoung /* check address */
1091 1.62 dyoung if ((error = gre_getnames(so, curlwp, &src, &dst)) != 0) {
1092 1.62 dyoung FILE_UNUSE(fp, NULL);
1093 1.62 dyoung break;
1094 1.62 dyoung }
1095 1.62 dyoung
1096 1.88.2.5 ad /* Increase reference count. Now that our reference
1097 1.88.2.5 ad * to the file descriptor is counted, this thread
1098 1.88.2.5 ad * can release our "use" of the descriptor, but it
1099 1.88.2.5 ad * will not be destroyed by some other thread's
1100 1.88.2.5 ad * action. This thread needs to release its use,
1101 1.88.2.5 ad * too, because one and only one thread can have
1102 1.88.2.5 ad * use of the descriptor at once. The kernel thread
1103 1.88.2.5 ad * will pick up the use if it needs it.
1104 1.88.2.5 ad */
1105 1.88.2.5 ad
1106 1.62 dyoung fp->f_count++;
1107 1.88.2.5 ad FILE_UNUSE(fp, NULL);
1108 1.88.2.5 ad
1109 1.88.2.5 ad while (sc->sc_fp != NULL && error == 0) {
1110 1.88.2.5 ad error = cv_timedwait_sig(&sc->sc_soparm_cv, &sc->sc_mtx,
1111 1.88.2.5 ad MAX(1, hz / 2));
1112 1.88.2.5 ad }
1113 1.88.2.5 ad if (error == 0) {
1114 1.88.2.5 ad sc->sc_fp = fp;
1115 1.88.2.5 ad ifp->if_flags |= IFF_UP;
1116 1.88.2.5 ad }
1117 1.62 dyoung
1118 1.88.2.5 ad if (error != 0 || (error = gre_kick(sc)) != 0) {
1119 1.88.2.5 ad gre_closef(&fp, l);
1120 1.62 dyoung break;
1121 1.62 dyoung }
1122 1.88.2.5 ad /* fp does not any longer belong to this thread. */
1123 1.62 dyoung sc->g_src = src.sin_addr;
1124 1.62 dyoung sc->g_srcport = src.sin_port;
1125 1.62 dyoung sc->g_dst = dst.sin_addr;
1126 1.62 dyoung sc->g_dstport = dst.sin_port;
1127 1.62 dyoung break;
1128 1.28 itojun case SIOCSLIFPHYADDR:
1129 1.28 itojun if (lifr->addr.ss_family != AF_INET ||
1130 1.31 itojun lifr->dstaddr.ss_family != AF_INET) {
1131 1.31 itojun error = EAFNOSUPPORT;
1132 1.31 itojun break;
1133 1.31 itojun }
1134 1.28 itojun if (lifr->addr.ss_len != sizeof(si) ||
1135 1.31 itojun lifr->dstaddr.ss_len != sizeof(si)) {
1136 1.31 itojun error = EINVAL;
1137 1.31 itojun break;
1138 1.31 itojun }
1139 1.62 dyoung sc->g_src = satosin(&lifr->addr)->sin_addr;
1140 1.62 dyoung sc->g_dst = satosin(&lifr->dstaddr)->sin_addr;
1141 1.62 dyoung sc->g_srcport = satosin(&lifr->addr)->sin_port;
1142 1.62 dyoung sc->g_dstport = satosin(&lifr->dstaddr)->sin_port;
1143 1.30 itojun goto recompute;
1144 1.28 itojun case SIOCDIFPHYADDR:
1145 1.28 itojun sc->g_src.s_addr = INADDR_ANY;
1146 1.28 itojun sc->g_dst.s_addr = INADDR_ANY;
1147 1.62 dyoung sc->g_srcport = 0;
1148 1.62 dyoung sc->g_dstport = 0;
1149 1.62 dyoung goto recompute;
1150 1.28 itojun case SIOCGLIFPHYADDR:
1151 1.28 itojun if (sc->g_src.s_addr == INADDR_ANY ||
1152 1.28 itojun sc->g_dst.s_addr == INADDR_ANY) {
1153 1.28 itojun error = EADDRNOTAVAIL;
1154 1.28 itojun break;
1155 1.28 itojun }
1156 1.33 itojun memset(&si, 0, sizeof(si));
1157 1.28 itojun si.sin_family = AF_INET;
1158 1.28 itojun si.sin_len = sizeof(struct sockaddr_in);
1159 1.62 dyoung si.sin_addr = sc->g_src;
1160 1.75 dyoung if (sc->sc_proto == IPPROTO_UDP)
1161 1.62 dyoung si.sin_port = sc->g_srcport;
1162 1.33 itojun memcpy(&lifr->addr, &si, sizeof(si));
1163 1.62 dyoung si.sin_addr = sc->g_dst;
1164 1.75 dyoung if (sc->sc_proto == IPPROTO_UDP)
1165 1.62 dyoung si.sin_port = sc->g_dstport;
1166 1.33 itojun memcpy(&lifr->dstaddr, &si, sizeof(si));
1167 1.1 hwr break;
1168 1.1 hwr default:
1169 1.1 hwr error = EINVAL;
1170 1.31 itojun break;
1171 1.1 hwr }
1172 1.88.2.6 ad #ifdef COMPAT_OIFREQ
1173 1.88.2.6 ad if (cmd != ocmd)
1174 1.88.2.6 ad ifreqn2o(oifr, ifr);
1175 1.88.2.6 ad #endif
1176 1.88.2.5 ad mutex_exit(&sc->sc_mtx);
1177 1.87 dyoung return error;
1178 1.1 hwr }
1179 1.1 hwr
1180 1.20 itojun /*
1181 1.78 dyoung * Compute a route to our destination.
1182 1.1 hwr */
1183 1.59 thorpej static int
1184 1.8 explorer gre_compute_route(struct gre_softc *sc)
1185 1.1 hwr {
1186 1.1 hwr struct route *ro;
1187 1.88.2.5 ad union {
1188 1.88.2.5 ad struct sockaddr dst;
1189 1.88.2.5 ad struct sockaddr_in dst4;
1190 1.88.2.5 ad } u;
1191 1.1 hwr
1192 1.8 explorer ro = &sc->route;
1193 1.20 itojun
1194 1.88.2.5 ad memset(ro, 0, sizeof(*ro));
1195 1.88.2.5 ad sockaddr_in_init(&u.dst4, &sc->g_dst, 0);
1196 1.88.2.5 ad rtcache_setdst(ro, &u.dst);
1197 1.8 explorer
1198 1.81 joerg rtcache_init(ro);
1199 1.81 joerg
1200 1.81 joerg if (ro->ro_rt == NULL || ro->ro_rt->rt_ifp->if_softc == sc) {
1201 1.88.2.3 ad GRE_DPRINTF(sc, "%s: route to %s %s\n", sc->sc_if.if_xname,
1202 1.88.2.5 ad inet_ntoa(u.dst4.sin_addr),
1203 1.88.2.3 ad (ro->ro_rt == NULL)
1204 1.88.2.3 ad ? "does not exist"
1205 1.88.2.3 ad : "loops back to ourself");
1206 1.81 joerg rtcache_free(ro);
1207 1.81 joerg return EADDRNOTAVAIL;
1208 1.25 martin }
1209 1.25 martin
1210 1.25 martin return 0;
1211 1.1 hwr }
1212 1.1 hwr
/*
 * Checksum a flat buffer -- the counterpart of in_cksum, which operates
 * on mbufs.
 *
 * p:   start of the buffer, read as native 16-bit words.
 * len: length of the buffer in bytes.
 *
 * The 16-bit words are added into a 32-bit accumulator.  A trailing odd
 * byte is treated as the first byte of a 16-bit word whose second byte
 * is zero.  The carries are then folded back into the low 16 bits and
 * the complement of the result is returned.
 */
u_int16_t
gre_in_cksum(u_int16_t *p, u_int len)
{
	u_int32_t acc = 0;
	int nwords = len >> 1;
	int i;

	for (i = 0; i < nwords; i++)
		acc += p[i];

	if ((len & 1) != 0) {
		/* Pad the last byte to a full word in memory order. */
		union {
			u_short w;
			u_char c[2];
		} tail;

		tail.c[0] = ((u_char *)p)[len - 1];
		tail.c[1] = 0;
		acc += tail.w;
	}

	/* end-around-carry */
	acc = (acc & 0xffff) + (acc >> 16);
	acc += (acc >> 16);
	return ~acc;
}
1241 1.54 christos #endif
1242 1.54 christos
void greattach(int);

/*
 * Attach routine for the gre driver.
 *
 * When the kernel is built with INET, the list of gre softcs is
 * initialized and gre_cloner is registered through if_clone_attach().
 * Without INET this function does nothing.  The `count' argument is
 * not used.
 */
/* ARGSUSED */
void
greattach(int count)
{
#if defined(INET)
	LIST_INIT(&gre_softc_list);
	if_clone_attach(&gre_cloner);
#endif
}
1254