if_gre.c revision 1.139 1 1.139 dyoung /* $NetBSD: if_gre.c,v 1.139 2008/11/07 00:20:13 dyoung Exp $ */
2 1.4 thorpej
3 1.1 hwr /*
4 1.125 ad * Copyright (c) 1998, 2008 The NetBSD Foundation, Inc.
5 1.1 hwr * All rights reserved.
6 1.1 hwr *
7 1.1 hwr * This code is derived from software contributed to The NetBSD Foundation
8 1.1 hwr * by Heiko W.Rupp <hwr (at) pilhuhn.de>
9 1.1 hwr *
10 1.56 is * IPv6-over-GRE contributed by Gert Doering <gert (at) greenie.muc.de>
11 1.56 is *
12 1.134 dyoung * GRE over UDP/IPv4/IPv6 sockets contributed by David Young <dyoung (at) NetBSD.org>
13 1.134 dyoung *
14 1.1 hwr * Redistribution and use in source and binary forms, with or without
15 1.1 hwr * modification, are permitted provided that the following conditions
16 1.1 hwr * are met:
17 1.1 hwr * 1. Redistributions of source code must retain the above copyright
18 1.1 hwr * notice, this list of conditions and the following disclaimer.
19 1.1 hwr * 2. Redistributions in binary form must reproduce the above copyright
20 1.1 hwr * notice, this list of conditions and the following disclaimer in the
21 1.1 hwr * documentation and/or other materials provided with the distribution.
22 1.1 hwr *
23 1.1 hwr * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
24 1.1 hwr * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
25 1.1 hwr * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
26 1.1 hwr * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
27 1.1 hwr * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
28 1.1 hwr * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
29 1.1 hwr * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
30 1.1 hwr * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
31 1.1 hwr * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
32 1.1 hwr * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
33 1.1 hwr * POSSIBILITY OF SUCH DAMAGE.
34 1.134 dyoung *
35 1.134 dyoung * This material is based upon work partially supported by NSF
36 1.134 dyoung * under Contract No. NSF CNS-0626584.
37 1.1 hwr */
38 1.1 hwr
39 1.1 hwr /*
40 1.1 hwr * Encapsulate L3 protocols into IP
41 1.1 hwr * See RFC 1701 and 1702 for more details.
42 1.1 hwr * If_gre is compatible with Cisco GRE tunnels, so you can
43 1.1 hwr * have a NetBSD box as the other end of a tunnel interface of a Cisco
44 1.1 hwr * router. See gre(4) for more details.
45 1.1 hwr */
46 1.22 lukem
47 1.22 lukem #include <sys/cdefs.h>
48 1.139 dyoung __KERNEL_RCSID(0, "$NetBSD: if_gre.c,v 1.139 2008/11/07 00:20:13 dyoung Exp $");
49 1.1 hwr
50 1.62 dyoung #include "opt_gre.h"
51 1.1 hwr #include "opt_inet.h"
52 1.1 hwr #include "bpfilter.h"
53 1.1 hwr
54 1.54 christos #ifdef INET
55 1.1 hwr #include <sys/param.h>
56 1.62 dyoung #include <sys/file.h>
57 1.62 dyoung #include <sys/filedesc.h>
58 1.1 hwr #include <sys/malloc.h>
59 1.111 dyoung #include <sys/mallocvar.h>
60 1.1 hwr #include <sys/mbuf.h>
61 1.13 martin #include <sys/proc.h>
62 1.111 dyoung #include <sys/domain.h>
63 1.1 hwr #include <sys/protosw.h>
64 1.1 hwr #include <sys/socket.h>
65 1.62 dyoung #include <sys/socketvar.h>
66 1.1 hwr #include <sys/ioctl.h>
67 1.10 thorpej #include <sys/queue.h>
68 1.118 ad #include <sys/intr.h>
69 1.1 hwr #if __NetBSD__
70 1.1 hwr #include <sys/systm.h>
71 1.62 dyoung #include <sys/sysctl.h>
72 1.60 elad #include <sys/kauth.h>
73 1.1 hwr #endif
74 1.1 hwr
75 1.93 dyoung #include <sys/kernel.h>
76 1.93 dyoung #include <sys/mutex.h>
77 1.93 dyoung #include <sys/condvar.h>
78 1.62 dyoung #include <sys/kthread.h>
79 1.62 dyoung
80 1.117 ad #include <sys/cpu.h>
81 1.1 hwr
82 1.1 hwr #include <net/ethertypes.h>
83 1.1 hwr #include <net/if.h>
84 1.1 hwr #include <net/if_types.h>
85 1.1 hwr #include <net/netisr.h>
86 1.1 hwr #include <net/route.h>
87 1.1 hwr
88 1.1 hwr #ifdef INET
89 1.1 hwr #include <netinet/in.h>
90 1.1 hwr #include <netinet/in_systm.h>
91 1.1 hwr #include <netinet/in_var.h>
92 1.1 hwr #include <netinet/ip.h>
93 1.1 hwr #include <netinet/ip_var.h>
94 1.1 hwr #else
95 1.4 thorpej #error "Huh? if_gre without inet?"
96 1.1 hwr #endif
97 1.1 hwr
98 1.1 hwr
99 1.1 hwr #ifdef NETATALK
100 1.1 hwr #include <netatalk/at.h>
101 1.1 hwr #include <netatalk/at_var.h>
102 1.1 hwr #include <netatalk/at_extern.h>
103 1.1 hwr #endif
104 1.1 hwr
105 1.1 hwr #if NBPFILTER > 0
106 1.1 hwr #include <sys/time.h>
107 1.1 hwr #include <net/bpf.h>
108 1.1 hwr #endif
109 1.1 hwr
110 1.1 hwr #include <net/if_gre.h>
111 1.1 hwr
112 1.101 skd #include <compat/sys/socket.h>
113 1.94 christos #include <compat/sys/sockio.h>
/*
 * It is not easy to calculate the right value for a GRE MTU.
 * We leave this task to the admin and use the same default that
 * other vendors use.
 */
#define GREMTU 1476

/*
 * GRE_DPRINTF(sc, fmt, ...): debug trace.
 *
 * With GRE_DEBUG defined, prints "<function>.<line>: " followed by the
 * formatted message whenever the global gre_debug is non-zero or the
 * interface of `sc' has IFF_DEBUG set.  Without GRE_DEBUG it expands to an
 * empty statement and evaluates none of its arguments.
 *
 * Both variants take (__sc, ...) so that a call with only a format string
 * and no further arguments is a valid variadic-macro invocation in either
 * configuration.
 */
#ifdef GRE_DEBUG
int gre_debug = 0;
#define GRE_DPRINTF(__sc, ...)						\
	do {								\
		if (__predict_false(gre_debug ||			\
		    ((__sc)->sc_if.if_flags & IFF_DEBUG) != 0)) {	\
			printf("%s.%d: ", __func__, __LINE__);		\
			printf(__VA_ARGS__);				\
		}							\
	} while (/*CONSTCOND*/0)
#else
#define GRE_DPRINTF(__sc, ...)	do { } while (/*CONSTCOND*/0)
#endif /* GRE_DEBUG */
134 1.62 dyoung
135 1.26 martin int ip_gre_ttl = GRE_TTL;
136 1.111 dyoung MALLOC_DEFINE(M_GRE_BUFQ, "gre_bufq", "gre mbuf queue");
137 1.1 hwr
138 1.111 dyoung static int gre_clone_create(struct if_clone *, int);
139 1.111 dyoung static int gre_clone_destroy(struct ifnet *);
140 1.10 thorpej
141 1.59 thorpej static struct if_clone gre_cloner =
142 1.10 thorpej IF_CLONE_INITIALIZER("gre", gre_clone_create, gre_clone_destroy);
143 1.1 hwr
144 1.111 dyoung static int gre_input(struct gre_softc *, struct mbuf *, int,
145 1.111 dyoung const struct gre_h *);
146 1.115 dyoung static bool gre_is_nullconf(const struct gre_soparm *);
147 1.111 dyoung static int gre_output(struct ifnet *, struct mbuf *,
148 1.84 dyoung const struct sockaddr *, struct rtentry *);
149 1.111 dyoung static int gre_ioctl(struct ifnet *, u_long, void *);
150 1.62 dyoung static int gre_getsockname(struct socket *, struct mbuf *, struct lwp *);
151 1.62 dyoung static int gre_getpeername(struct socket *, struct mbuf *, struct lwp *);
152 1.111 dyoung static int gre_getnames(struct socket *, struct lwp *,
153 1.111 dyoung struct sockaddr_storage *, struct sockaddr_storage *);
154 1.115 dyoung static void gre_clearconf(struct gre_soparm *, bool);
155 1.112 dyoung static int gre_soreceive(struct socket *, struct mbuf **);
156 1.133 dyoung static int gre_sosend(struct socket *, struct mbuf *);
157 1.132 dyoung static struct socket *gre_reconf(struct gre_softc *, const struct gre_soparm *);
158 1.132 dyoung
159 1.132 dyoung static bool gre_fp_send(struct gre_softc *, enum gre_msg, file_t *);
160 1.132 dyoung static bool gre_fp_recv(struct gre_softc *);
161 1.132 dyoung static void gre_fp_recvloop(void *);
162 1.111 dyoung
/*
 * Round len0 to the nearest power of two.
 *
 * - 0 maps to 1.
 * - An exact power of two maps to itself (including 1).
 * - A value exactly halfway between two powers (e.g. 3, 6, 24) rounds up.
 * - If the next power of two does not fit in a size_t, the largest power
 *   of two not exceeding len0 is returned instead.
 */
static int
nearest_pow2(size_t len0)
{
	size_t len, mid;

	if (len0 == 0)
		return 1;

	/* Strip low-order set bits until only the most significant is left. */
	for (len = len0; (len & (len - 1)) != 0; len &= len - 1)
		;

	/*
	 * len0 already is a power of two.  Without this check, len0 == 1
	 * would yield mid == 1 below and be rounded up to 2.
	 */
	if (len == len0)
		return len;

	/* avoid overflow */
	if ((len << 1) < len)
		return len;

	/* Midpoint between len and 2 * len, i.e. 1.5 * len. */
	mid = len | (len >> 1);

	return (len0 >= mid) ? len << 1 : len;
}
183 1.111 dyoung
184 1.111 dyoung static struct gre_bufq *
185 1.111 dyoung gre_bufq_init(struct gre_bufq *bq, size_t len0)
186 1.111 dyoung {
187 1.111 dyoung size_t len;
188 1.111 dyoung
189 1.111 dyoung len = nearest_pow2(len0);
190 1.111 dyoung
191 1.111 dyoung memset(bq, 0, sizeof(*bq));
192 1.111 dyoung bq->bq_buf = malloc(len * sizeof(struct mbuf *), M_GRE_BUFQ, M_WAITOK);
193 1.111 dyoung bq->bq_len = len;
194 1.111 dyoung bq->bq_lenmask = len - 1;
195 1.111 dyoung
196 1.111 dyoung return bq;
197 1.111 dyoung }
198 1.111 dyoung
199 1.111 dyoung static bool
200 1.111 dyoung gre_bufq_empty(struct gre_bufq *bq)
201 1.111 dyoung {
202 1.111 dyoung return bq->bq_prodidx == bq->bq_considx;
203 1.111 dyoung }
204 1.111 dyoung
205 1.111 dyoung static struct mbuf *
206 1.111 dyoung gre_bufq_dequeue(struct gre_bufq *bq)
207 1.111 dyoung {
208 1.111 dyoung struct mbuf *m;
209 1.111 dyoung
210 1.111 dyoung if (gre_bufq_empty(bq))
211 1.111 dyoung return NULL;
212 1.111 dyoung
213 1.111 dyoung m = bq->bq_buf[bq->bq_considx];
214 1.111 dyoung bq->bq_considx = (bq->bq_considx + 1) & bq->bq_lenmask;
215 1.111 dyoung
216 1.111 dyoung return m;
217 1.111 dyoung }
218 1.111 dyoung
219 1.111 dyoung static void
220 1.111 dyoung gre_bufq_purge(struct gre_bufq *bq)
221 1.111 dyoung {
222 1.111 dyoung struct mbuf *m;
223 1.111 dyoung
224 1.111 dyoung while ((m = gre_bufq_dequeue(bq)) != NULL)
225 1.111 dyoung m_freem(m);
226 1.111 dyoung }
227 1.111 dyoung
228 1.111 dyoung static int
229 1.111 dyoung gre_bufq_enqueue(struct gre_bufq *bq, struct mbuf *m)
230 1.111 dyoung {
231 1.111 dyoung int next;
232 1.111 dyoung
233 1.111 dyoung next = (bq->bq_prodidx + 1) & bq->bq_lenmask;
234 1.111 dyoung
235 1.111 dyoung if (next == bq->bq_considx) {
236 1.111 dyoung bq->bq_drops++;
237 1.111 dyoung return ENOBUFS;
238 1.111 dyoung }
239 1.111 dyoung
240 1.111 dyoung bq->bq_buf[bq->bq_prodidx] = m;
241 1.111 dyoung bq->bq_prodidx = next;
242 1.111 dyoung return 0;
243 1.111 dyoung }
244 1.111 dyoung
245 1.111 dyoung static void
246 1.111 dyoung greintr(void *arg)
247 1.111 dyoung {
248 1.111 dyoung struct gre_softc *sc = (struct gre_softc *)arg;
249 1.132 dyoung struct socket *so = sc->sc_soparm.sp_so;
250 1.112 dyoung int rc;
251 1.112 dyoung struct mbuf *m;
252 1.111 dyoung
253 1.132 dyoung KASSERT(so != NULL);
254 1.112 dyoung
255 1.112 dyoung sc->sc_send_ev.ev_count++;
256 1.132 dyoung GRE_DPRINTF(sc, "enter\n");
257 1.112 dyoung while ((m = gre_bufq_dequeue(&sc->sc_snd)) != NULL) {
258 1.112 dyoung /* XXX handle ENOBUFS? */
259 1.133 dyoung if ((rc = gre_sosend(so, m)) != 0)
260 1.132 dyoung GRE_DPRINTF(sc, "gre_sosend failed %d\n", rc);
261 1.112 dyoung }
262 1.111 dyoung }
263 1.111 dyoung
264 1.111 dyoung /* Caller must hold sc->sc_mtx. */
265 1.111 dyoung static void
266 1.111 dyoung gre_wait(struct gre_softc *sc)
267 1.111 dyoung {
268 1.111 dyoung sc->sc_waiters++;
269 1.111 dyoung cv_wait(&sc->sc_condvar, &sc->sc_mtx);
270 1.111 dyoung sc->sc_waiters--;
271 1.111 dyoung }
272 1.62 dyoung
273 1.62 dyoung static void
274 1.132 dyoung gre_fp_wait(struct gre_softc *sc)
275 1.62 dyoung {
276 1.132 dyoung sc->sc_fp_waiters++;
277 1.132 dyoung cv_wait(&sc->sc_fp_condvar, &sc->sc_mtx);
278 1.132 dyoung sc->sc_fp_waiters--;
279 1.62 dyoung }
280 1.62 dyoung
281 1.111 dyoung static void
282 1.111 dyoung gre_evcnt_detach(struct gre_softc *sc)
283 1.111 dyoung {
284 1.111 dyoung evcnt_detach(&sc->sc_unsupp_ev);
285 1.111 dyoung evcnt_detach(&sc->sc_pullup_ev);
286 1.111 dyoung evcnt_detach(&sc->sc_error_ev);
287 1.111 dyoung evcnt_detach(&sc->sc_block_ev);
288 1.111 dyoung evcnt_detach(&sc->sc_recv_ev);
289 1.111 dyoung
290 1.111 dyoung evcnt_detach(&sc->sc_oflow_ev);
291 1.111 dyoung evcnt_detach(&sc->sc_send_ev);
292 1.111 dyoung }
293 1.111 dyoung
294 1.111 dyoung static void
295 1.111 dyoung gre_evcnt_attach(struct gre_softc *sc)
296 1.111 dyoung {
297 1.111 dyoung evcnt_attach_dynamic(&sc->sc_recv_ev, EVCNT_TYPE_MISC,
298 1.111 dyoung NULL, sc->sc_if.if_xname, "recv");
299 1.111 dyoung evcnt_attach_dynamic(&sc->sc_block_ev, EVCNT_TYPE_MISC,
300 1.111 dyoung &sc->sc_recv_ev, sc->sc_if.if_xname, "would block");
301 1.111 dyoung evcnt_attach_dynamic(&sc->sc_error_ev, EVCNT_TYPE_MISC,
302 1.111 dyoung &sc->sc_recv_ev, sc->sc_if.if_xname, "error");
303 1.111 dyoung evcnt_attach_dynamic(&sc->sc_pullup_ev, EVCNT_TYPE_MISC,
304 1.112 dyoung &sc->sc_recv_ev, sc->sc_if.if_xname, "pullup failed");
305 1.111 dyoung evcnt_attach_dynamic(&sc->sc_unsupp_ev, EVCNT_TYPE_MISC,
306 1.111 dyoung &sc->sc_recv_ev, sc->sc_if.if_xname, "unsupported");
307 1.111 dyoung
308 1.111 dyoung evcnt_attach_dynamic(&sc->sc_send_ev, EVCNT_TYPE_MISC,
309 1.111 dyoung NULL, sc->sc_if.if_xname, "send");
310 1.111 dyoung evcnt_attach_dynamic(&sc->sc_oflow_ev, EVCNT_TYPE_MISC,
311 1.112 dyoung &sc->sc_send_ev, sc->sc_if.if_xname, "overflow");
312 1.62 dyoung }
313 1.62 dyoung
314 1.59 thorpej static int
315 1.59 thorpej gre_clone_create(struct if_clone *ifc, int unit)
316 1.1 hwr {
317 1.132 dyoung int rc;
318 1.8 explorer struct gre_softc *sc;
319 1.132 dyoung struct gre_soparm *sp;
320 1.1 hwr
321 1.111 dyoung sc = malloc(sizeof(struct gre_softc), M_DEVBUF, M_WAITOK|M_ZERO);
322 1.111 dyoung mutex_init(&sc->sc_mtx, MUTEX_DRIVER, IPL_SOFTNET);
323 1.111 dyoung cv_init(&sc->sc_condvar, "gre wait");
324 1.132 dyoung cv_init(&sc->sc_fp_condvar, "gre fp");
325 1.10 thorpej
326 1.136 christos if_initname(&sc->sc_if, ifc->ifc_name, unit);
327 1.10 thorpej sc->sc_if.if_softc = sc;
328 1.51 tron sc->sc_if.if_type = IFT_TUNNEL;
329 1.34 itojun sc->sc_if.if_addrlen = 0;
330 1.111 dyoung sc->sc_if.if_hdrlen = sizeof(struct ip) + sizeof(struct gre_h);
331 1.15 thorpej sc->sc_if.if_dlt = DLT_NULL;
332 1.20 itojun sc->sc_if.if_mtu = GREMTU;
333 1.10 thorpej sc->sc_if.if_flags = IFF_POINTOPOINT|IFF_MULTICAST;
334 1.10 thorpej sc->sc_if.if_output = gre_output;
335 1.10 thorpej sc->sc_if.if_ioctl = gre_ioctl;
336 1.132 dyoung sp = &sc->sc_soparm;
337 1.132 dyoung sockaddr_copy(sstosa(&sp->sp_dst), sizeof(sp->sp_dst),
338 1.132 dyoung sintocsa(&in_any));
339 1.132 dyoung sockaddr_copy(sstosa(&sp->sp_src), sizeof(sp->sp_src),
340 1.132 dyoung sintocsa(&in_any));
341 1.132 dyoung sp->sp_proto = IPPROTO_GRE;
342 1.132 dyoung sp->sp_type = SOCK_RAW;
343 1.132 dyoung
344 1.132 dyoung sc->sc_fd = -1;
345 1.132 dyoung
346 1.132 dyoung rc = kthread_create(PRI_NONE, KTHREAD_MPSAFE, NULL, gre_fp_recvloop, sc,
347 1.132 dyoung NULL, sc->sc_if.if_xname);
348 1.132 dyoung
349 1.132 dyoung if (rc != 0)
350 1.132 dyoung return -1;
351 1.111 dyoung
352 1.111 dyoung gre_evcnt_attach(sc);
353 1.111 dyoung
354 1.111 dyoung gre_bufq_init(&sc->sc_snd, 17);
355 1.35 itojun sc->sc_if.if_flags |= IFF_LINK0;
356 1.10 thorpej if_attach(&sc->sc_if);
357 1.16 thorpej if_alloc_sadl(&sc->sc_if);
358 1.1 hwr #if NBPFILTER > 0
359 1.124 matt bpfattach(&sc->sc_if, DLT_NULL, sizeof(uint32_t));
360 1.1 hwr #endif
361 1.111 dyoung sc->sc_state = GRE_S_IDLE;
362 1.87 dyoung return 0;
363 1.10 thorpej }
364 1.1 hwr
365 1.59 thorpej static int
366 1.59 thorpej gre_clone_destroy(struct ifnet *ifp)
367 1.10 thorpej {
368 1.119 dyoung int s;
369 1.10 thorpej struct gre_softc *sc = ifp->if_softc;
370 1.10 thorpej
371 1.132 dyoung GRE_DPRINTF(sc, "\n");
372 1.111 dyoung
373 1.10 thorpej #if NBPFILTER > 0
374 1.10 thorpej bpfdetach(ifp);
375 1.10 thorpej #endif
376 1.122 dyoung s = splnet();
377 1.93 dyoung if_detach(ifp);
378 1.111 dyoung
379 1.119 dyoung /* Some LWPs may still wait in gre_ioctl_lock(), however,
380 1.119 dyoung * no new LWP will enter gre_ioctl_lock(), because ifunit()
381 1.119 dyoung * cannot locate the interface any longer.
382 1.119 dyoung */
383 1.93 dyoung mutex_enter(&sc->sc_mtx);
384 1.132 dyoung GRE_DPRINTF(sc, "\n");
385 1.111 dyoung while (sc->sc_state != GRE_S_IDLE)
386 1.111 dyoung gre_wait(sc);
387 1.132 dyoung GRE_DPRINTF(sc, "\n");
388 1.111 dyoung sc->sc_state = GRE_S_DIE;
389 1.111 dyoung cv_broadcast(&sc->sc_condvar);
390 1.132 dyoung while (sc->sc_waiters > 0)
391 1.132 dyoung cv_wait(&sc->sc_condvar, &sc->sc_mtx);
392 1.119 dyoung /* At this point, no other LWP will access the gre_softc, so
393 1.119 dyoung * we can release the mutex.
394 1.119 dyoung */
395 1.93 dyoung mutex_exit(&sc->sc_mtx);
396 1.132 dyoung GRE_DPRINTF(sc, "\n");
397 1.119 dyoung /* Note that we must not hold the mutex while we call gre_reconf(). */
398 1.132 dyoung gre_reconf(sc, NULL);
399 1.132 dyoung
400 1.132 dyoung mutex_enter(&sc->sc_mtx);
401 1.132 dyoung sc->sc_msg = GRE_M_STOP;
402 1.132 dyoung cv_signal(&sc->sc_fp_condvar);
403 1.132 dyoung while (sc->sc_fp_waiters > 0)
404 1.132 dyoung cv_wait(&sc->sc_fp_condvar, &sc->sc_mtx);
405 1.132 dyoung mutex_exit(&sc->sc_mtx);
406 1.132 dyoung
407 1.119 dyoung splx(s);
408 1.93 dyoung
409 1.111 dyoung cv_destroy(&sc->sc_condvar);
410 1.135 dyoung cv_destroy(&sc->sc_fp_condvar);
411 1.93 dyoung mutex_destroy(&sc->sc_mtx);
412 1.111 dyoung gre_evcnt_detach(sc);
413 1.10 thorpej free(sc, M_DEVBUF);
414 1.53 peter
415 1.87 dyoung return 0;
416 1.1 hwr }
417 1.1 hwr
418 1.62 dyoung static void
419 1.88 christos gre_receive(struct socket *so, void *arg, int waitflag)
420 1.62 dyoung {
421 1.62 dyoung struct gre_softc *sc = (struct gre_softc *)arg;
422 1.112 dyoung int rc;
423 1.112 dyoung const struct gre_h *gh;
424 1.112 dyoung struct mbuf *m;
425 1.62 dyoung
426 1.132 dyoung GRE_DPRINTF(sc, "enter\n");
427 1.112 dyoung
428 1.112 dyoung sc->sc_recv_ev.ev_count++;
429 1.112 dyoung
430 1.112 dyoung rc = gre_soreceive(so, &m);
431 1.112 dyoung /* TBD Back off if ECONNREFUSED (indicates
432 1.112 dyoung * ICMP Port Unreachable)?
433 1.112 dyoung */
434 1.112 dyoung if (rc == EWOULDBLOCK) {
435 1.132 dyoung GRE_DPRINTF(sc, "EWOULDBLOCK\n");
436 1.112 dyoung sc->sc_block_ev.ev_count++;
437 1.112 dyoung return;
438 1.112 dyoung } else if (rc != 0 || m == NULL) {
439 1.112 dyoung GRE_DPRINTF(sc, "%s: rc %d m %p\n",
440 1.112 dyoung sc->sc_if.if_xname, rc, (void *)m);
441 1.112 dyoung sc->sc_error_ev.ev_count++;
442 1.112 dyoung return;
443 1.112 dyoung }
444 1.121 dyoung if (m->m_len < sizeof(*gh) && (m = m_pullup(m, sizeof(*gh))) == NULL) {
445 1.132 dyoung GRE_DPRINTF(sc, "m_pullup failed\n");
446 1.112 dyoung sc->sc_pullup_ev.ev_count++;
447 1.112 dyoung return;
448 1.112 dyoung }
449 1.112 dyoung gh = mtod(m, const struct gre_h *);
450 1.112 dyoung
451 1.112 dyoung if (gre_input(sc, m, 0, gh) == 0) {
452 1.112 dyoung sc->sc_unsupp_ev.ev_count++;
453 1.132 dyoung GRE_DPRINTF(sc, "dropping unsupported\n");
454 1.112 dyoung m_freem(m);
455 1.112 dyoung }
456 1.62 dyoung }
457 1.62 dyoung
458 1.62 dyoung static void
459 1.88 christos gre_upcall_add(struct socket *so, void *arg)
460 1.62 dyoung {
461 1.62 dyoung /* XXX What if the kernel already set an upcall? */
462 1.102 dyoung KASSERT((so->so_rcv.sb_flags & SB_UPCALL) == 0);
463 1.62 dyoung so->so_upcallarg = arg;
464 1.62 dyoung so->so_upcall = gre_receive;
465 1.62 dyoung so->so_rcv.sb_flags |= SB_UPCALL;
466 1.62 dyoung }
467 1.62 dyoung
468 1.62 dyoung static void
469 1.62 dyoung gre_upcall_remove(struct socket *so)
470 1.62 dyoung {
471 1.62 dyoung so->so_rcv.sb_flags &= ~SB_UPCALL;
472 1.62 dyoung so->so_upcallarg = NULL;
473 1.62 dyoung so->so_upcall = NULL;
474 1.62 dyoung }
475 1.62 dyoung
476 1.62 dyoung static int
477 1.132 dyoung gre_socreate(struct gre_softc *sc, const struct gre_soparm *sp, int *fdout)
478 1.62 dyoung {
479 1.111 dyoung const struct protosw *pr;
480 1.111 dyoung int fd, rc;
481 1.62 dyoung struct mbuf *m;
482 1.111 dyoung struct sockaddr *sa;
483 1.132 dyoung struct socket *so;
484 1.111 dyoung sa_family_t af;
485 1.138 plunky int val;
486 1.62 dyoung
487 1.132 dyoung GRE_DPRINTF(sc, "enter\n");
488 1.111 dyoung
489 1.111 dyoung af = sp->sp_src.ss_family;
490 1.132 dyoung rc = fsocreate(af, NULL, sp->sp_type, sp->sp_proto, curlwp, &fd);
491 1.62 dyoung if (rc != 0) {
492 1.132 dyoung GRE_DPRINTF(sc, "fsocreate failed\n");
493 1.62 dyoung return rc;
494 1.62 dyoung }
495 1.127 dyoung
496 1.128 dyoung if ((rc = fd_getsock(fd, &so)) != 0)
497 1.125 ad return rc;
498 1.127 dyoung
499 1.120 dyoung if ((m = getsombuf(so, MT_SONAME)) == NULL) {
500 1.62 dyoung rc = ENOBUFS;
501 1.62 dyoung goto out;
502 1.62 dyoung }
503 1.111 dyoung sa = mtod(m, struct sockaddr *);
504 1.132 dyoung sockaddr_copy(sa, MIN(MLEN, sizeof(sp->sp_src)), sstocsa(&sp->sp_src));
505 1.111 dyoung m->m_len = sp->sp_src.ss_len;
506 1.62 dyoung
507 1.127 dyoung if ((rc = sobind(so, m, curlwp)) != 0) {
508 1.132 dyoung GRE_DPRINTF(sc, "sobind failed\n");
509 1.62 dyoung goto out;
510 1.62 dyoung }
511 1.62 dyoung
512 1.132 dyoung sockaddr_copy(sa, MIN(MLEN, sizeof(sp->sp_dst)), sstocsa(&sp->sp_dst));
513 1.111 dyoung m->m_len = sp->sp_dst.ss_len;
514 1.62 dyoung
515 1.132 dyoung solock(so);
516 1.127 dyoung if ((rc = soconnect(so, m, curlwp)) != 0) {
517 1.132 dyoung GRE_DPRINTF(sc, "soconnect failed\n");
518 1.132 dyoung sounlock(so);
519 1.62 dyoung goto out;
520 1.62 dyoung }
521 1.132 dyoung sounlock(so);
522 1.62 dyoung
523 1.138 plunky m = NULL;
524 1.138 plunky
525 1.111 dyoung /* XXX convert to a (new) SOL_SOCKET call */
526 1.138 plunky pr = so->so_proto;
527 1.138 plunky KASSERT(pr != NULL);
528 1.138 plunky rc = so_setsockopt(curlwp, so, IPPROTO_IP, IP_TTL,
529 1.138 plunky &ip_gre_ttl, sizeof(ip_gre_ttl));
530 1.138 plunky if (rc != 0) {
531 1.138 plunky GRE_DPRINTF(sc, "so_setsockopt ttl failed\n");
532 1.138 plunky rc = 0;
533 1.138 plunky }
534 1.138 plunky val = 1;
535 1.138 plunky rc = so_setsockopt(curlwp, so, SOL_SOCKET, SO_NOHEADER,
536 1.138 plunky &val, sizeof(val));
537 1.138 plunky if (rc != 0) {
538 1.138 plunky GRE_DPRINTF(sc, "so_setsockopt SO_NOHEADER failed\n");
539 1.62 dyoung rc = 0;
540 1.62 dyoung }
541 1.62 dyoung out:
542 1.62 dyoung m_freem(m);
543 1.62 dyoung
544 1.62 dyoung if (rc != 0)
545 1.125 ad fd_close(fd);
546 1.125 ad else {
547 1.125 ad fd_putfile(fd);
548 1.111 dyoung *fdout = fd;
549 1.125 ad }
550 1.62 dyoung
551 1.62 dyoung return rc;
552 1.62 dyoung }
553 1.62 dyoung
554 1.111 dyoung static int
555 1.133 dyoung gre_sosend(struct socket *so, struct mbuf *top)
556 1.111 dyoung {
557 1.111 dyoung struct mbuf **mp;
558 1.111 dyoung struct proc *p;
559 1.111 dyoung long space, resid;
560 1.130 ad int error;
561 1.133 dyoung struct lwp * const l = curlwp;
562 1.111 dyoung
563 1.111 dyoung p = l->l_proc;
564 1.111 dyoung
565 1.111 dyoung resid = top->m_pkthdr.len;
566 1.111 dyoung if (p)
567 1.126 ad l->l_ru.ru_msgsnd++;
568 1.130 ad #define snderr(errno) { error = errno; goto release; }
569 1.111 dyoung
570 1.130 ad solock(so);
571 1.111 dyoung if ((error = sblock(&so->so_snd, M_NOWAIT)) != 0)
572 1.111 dyoung goto out;
573 1.111 dyoung if (so->so_state & SS_CANTSENDMORE)
574 1.111 dyoung snderr(EPIPE);
575 1.111 dyoung if (so->so_error) {
576 1.111 dyoung error = so->so_error;
577 1.111 dyoung so->so_error = 0;
578 1.111 dyoung goto release;
579 1.111 dyoung }
580 1.111 dyoung if ((so->so_state & SS_ISCONNECTED) == 0) {
581 1.111 dyoung if (so->so_proto->pr_flags & PR_CONNREQUIRED) {
582 1.111 dyoung if ((so->so_state & SS_ISCONFIRMING) == 0)
583 1.111 dyoung snderr(ENOTCONN);
584 1.111 dyoung } else
585 1.111 dyoung snderr(EDESTADDRREQ);
586 1.111 dyoung }
587 1.111 dyoung space = sbspace(&so->so_snd);
588 1.111 dyoung if (resid > so->so_snd.sb_hiwat)
589 1.111 dyoung snderr(EMSGSIZE);
590 1.111 dyoung if (space < resid)
591 1.111 dyoung snderr(EWOULDBLOCK);
592 1.111 dyoung mp = ⊤
593 1.111 dyoung /*
594 1.111 dyoung * Data is prepackaged in "top".
595 1.111 dyoung */
596 1.111 dyoung if (so->so_state & SS_CANTSENDMORE)
597 1.111 dyoung snderr(EPIPE);
598 1.111 dyoung error = (*so->so_proto->pr_usrreq)(so, PRU_SEND, top, NULL, NULL, l);
599 1.111 dyoung top = NULL;
600 1.111 dyoung mp = ⊤
601 1.111 dyoung release:
602 1.111 dyoung sbunlock(&so->so_snd);
603 1.111 dyoung out:
604 1.130 ad sounlock(so);
605 1.111 dyoung if (top != NULL)
606 1.111 dyoung m_freem(top);
607 1.111 dyoung return error;
608 1.111 dyoung }
609 1.111 dyoung
610 1.111 dyoung /* This is a stripped-down version of soreceive() that will never
611 1.111 dyoung * block. It will support SOCK_DGRAM sockets. It may also support
612 1.111 dyoung * SOCK_SEQPACKET sockets.
613 1.111 dyoung */
/*
 * Dequeue one record from so->so_rcv and hand its data mbufs back as a
 * chain through *mp0 (which is set to NULL before anything else happens).
 * A leading MT_SONAME mbuf (PR_ADDR protocols) and any MT_CONTROL mbufs
 * are freed rather than returned.
 *
 * Returns 0 or an errno value; EWOULDBLOCK when the receive buffer is
 * empty and no other condition applies.  The receive buffer lock is
 * requested with M_NOWAIT, and the function returns that call's error
 * directly if it fails.
 *
 * The protocol must be PR_ATOMIC (asserted below).
 */
614 1.111 dyoung static int
615 1.111 dyoung gre_soreceive(struct socket *so, struct mbuf **mp0)
616 1.102 dyoung {
617 1.112 dyoung struct mbuf *m, **mp;
618 1.130 ad int flags, len, error, type;
619 1.111 dyoung const struct protosw *pr;
620 1.112 dyoung struct mbuf *nextrecord;
621 1.111 dyoung
622 1.111 dyoung KASSERT(mp0 != NULL);
623 1.111 dyoung
624 1.111 dyoung flags = MSG_DONTWAIT;
625 1.111 dyoung pr = so->so_proto;
626 1.111 dyoung mp = mp0;
627 1.111 dyoung type = 0;
628 1.111 dyoung
629 1.111 dyoung *mp = NULL;
630 1.111 dyoung
631 1.111 dyoung KASSERT(pr->pr_flags & PR_ATOMIC);
632 1.111 dyoung
633 1.111 dyoung if (so->so_state & SS_ISCONFIRMING)
634 1.127 dyoung (*pr->pr_usrreq)(so, PRU_RCVD, NULL, NULL, NULL, curlwp);
635 1.111 dyoung restart:
/* `error' gets its first value here; it is 0 past this point on success. */
636 1.130 ad if ((error = sblock(&so->so_rcv, M_NOWAIT)) != 0) {
637 1.111 dyoung return error;
638 1.130 ad }
639 1.111 dyoung m = so->so_rcv.sb_mb;
640 1.111 dyoung /*
641 1.111 dyoung * If we have less data than requested, do not block awaiting more.
642 1.111 dyoung */
643 1.111 dyoung if (m == NULL) {
644 1.111 dyoung #ifdef DIAGNOSTIC
645 1.111 dyoung if (so->so_rcv.sb_cc)
646 1.111 dyoung panic("receive 1");
647 1.111 dyoung #endif
648 1.111 dyoung if (so->so_error) {
649 1.111 dyoung error = so->so_error;
650 1.111 dyoung so->so_error = 0;
651 1.111 dyoung } else if (so->so_state & SS_CANTRCVMORE)
652 1.111 dyoung ;
653 1.111 dyoung else if ((so->so_state & (SS_ISCONNECTED|SS_ISCONNECTING)) == 0
654 1.111 dyoung && (so->so_proto->pr_flags & PR_CONNREQUIRED))
655 1.111 dyoung error = ENOTCONN;
656 1.111 dyoung else
657 1.111 dyoung error = EWOULDBLOCK;
658 1.111 dyoung goto release;
659 1.111 dyoung }
660 1.111 dyoung /*
661 1.111 dyoung * On entry here, m points to the first record of the socket buffer.
662 1.111 dyoung * While we process the initial mbufs containing address and control
663 1.111 dyoung * info, we save a copy of m->m_nextpkt into nextrecord.
664 1.111 dyoung */
665 1.127 dyoung if (curlwp != NULL)
666 1.127 dyoung curlwp->l_ru.ru_msgrcv++;
667 1.111 dyoung KASSERT(m == so->so_rcv.sb_mb);
668 1.111 dyoung SBLASTRECORDCHK(&so->so_rcv, "soreceive 1");
669 1.111 dyoung SBLASTMBUFCHK(&so->so_rcv, "soreceive 1");
670 1.111 dyoung nextrecord = m->m_nextpkt;
/* Discard the sender address mbuf; the caller has no use for it. */
671 1.111 dyoung if (pr->pr_flags & PR_ADDR) {
672 1.111 dyoung #ifdef DIAGNOSTIC
673 1.111 dyoung if (m->m_type != MT_SONAME)
674 1.111 dyoung panic("receive 1a");
675 1.111 dyoung #endif
676 1.111 dyoung sbfree(&so->so_rcv, m);
677 1.111 dyoung MFREE(m, so->so_rcv.sb_mb);
678 1.111 dyoung m = so->so_rcv.sb_mb;
679 1.111 dyoung }
/* Discard control mbufs as well. */
680 1.111 dyoung while (m != NULL && m->m_type == MT_CONTROL && error == 0) {
681 1.111 dyoung sbfree(&so->so_rcv, m);
682 1.111 dyoung /*
683 1.111 dyoung * Dispose of any SCM_RIGHTS message that went
684 1.111 dyoung * through the read path rather than recv.
685 1.111 dyoung */
686 1.111 dyoung if (pr->pr_domain->dom_dispose &&
687 1.111 dyoung mtod(m, struct cmsghdr *)->cmsg_type == SCM_RIGHTS)
688 1.111 dyoung (*pr->pr_domain->dom_dispose)(m);
689 1.111 dyoung MFREE(m, so->so_rcv.sb_mb);
690 1.111 dyoung m = so->so_rcv.sb_mb;
691 1.111 dyoung }
692 1.111 dyoung
693 1.111 dyoung /*
694 1.111 dyoung * If m is non-NULL, we have some data to read. From now on,
695 1.111 dyoung * make sure to keep sb_lastrecord consistent when working on
696 1.111 dyoung * the last packet on the chain (nextrecord == NULL) and we
697 1.111 dyoung * change m->m_nextpkt.
698 1.111 dyoung */
699 1.111 dyoung if (m != NULL) {
700 1.111 dyoung m->m_nextpkt = nextrecord;
701 1.111 dyoung /*
702 1.111 dyoung * If nextrecord == NULL (this is a single chain),
703 1.111 dyoung * then sb_lastrecord may not be valid here if m
704 1.111 dyoung * was changed earlier.
705 1.111 dyoung */
706 1.111 dyoung if (nextrecord == NULL) {
707 1.111 dyoung KASSERT(so->so_rcv.sb_mb == m);
708 1.111 dyoung so->so_rcv.sb_lastrecord = m;
709 1.111 dyoung }
710 1.111 dyoung type = m->m_type;
711 1.111 dyoung if (type == MT_OOBDATA)
712 1.111 dyoung flags |= MSG_OOB;
713 1.111 dyoung } else {
714 1.111 dyoung KASSERT(so->so_rcv.sb_mb == m);
715 1.111 dyoung so->so_rcv.sb_mb = nextrecord;
716 1.111 dyoung SB_EMPTY_FIXUP(&so->so_rcv);
717 1.111 dyoung }
718 1.111 dyoung SBLASTRECORDCHK(&so->so_rcv, "soreceive 2");
719 1.111 dyoung SBLASTMBUFCHK(&so->so_rcv, "soreceive 2");
720 1.111 dyoung
/* Unlink the record's data mbufs one by one and append them to *mp0. */
721 1.111 dyoung while (m != NULL) {
722 1.111 dyoung if (m->m_type == MT_OOBDATA) {
723 1.111 dyoung if (type != MT_OOBDATA)
724 1.111 dyoung break;
725 1.111 dyoung } else if (type == MT_OOBDATA)
726 1.111 dyoung break;
727 1.111 dyoung #ifdef DIAGNOSTIC
728 1.111 dyoung else if (m->m_type != MT_DATA && m->m_type != MT_HEADER)
729 1.111 dyoung panic("receive 3");
730 1.111 dyoung #endif
731 1.111 dyoung so->so_state &= ~SS_RCVATMARK;
732 1.111 dyoung if (so->so_oobmark != 0 && so->so_oobmark < m->m_len)
733 1.111 dyoung break;
734 1.111 dyoung len = m->m_len;
735 1.111 dyoung /*
736 1.111 dyoung * mp is set, just pass back the mbufs.
737 1.111 dyoung * Sockbuf must be consistent here (points to current mbuf,
738 1.111 dyoung * it points to next record) when we drop priority;
739 1.111 dyoung * we must note any additions to the sockbuf when we
740 1.111 dyoung * block interrupts again.
741 1.111 dyoung */
742 1.111 dyoung if (m->m_flags & M_EOR)
743 1.111 dyoung flags |= MSG_EOR;
744 1.111 dyoung nextrecord = m->m_nextpkt;
745 1.111 dyoung sbfree(&so->so_rcv, m);
746 1.111 dyoung *mp = m;
747 1.111 dyoung mp = &m->m_next;
748 1.111 dyoung so->so_rcv.sb_mb = m = m->m_next;
749 1.111 dyoung *mp = NULL;
750 1.111 dyoung /*
751 1.111 dyoung * If m != NULL, we also know that
752 1.111 dyoung * so->so_rcv.sb_mb != NULL.
753 1.102 dyoung */
754 1.111 dyoung KASSERT(so->so_rcv.sb_mb == m);
755 1.111 dyoung if (m) {
756 1.111 dyoung m->m_nextpkt = nextrecord;
757 1.111 dyoung if (nextrecord == NULL)
758 1.111 dyoung so->so_rcv.sb_lastrecord = m;
759 1.111 dyoung } else {
760 1.111 dyoung so->so_rcv.sb_mb = nextrecord;
761 1.111 dyoung SB_EMPTY_FIXUP(&so->so_rcv);
762 1.111 dyoung }
763 1.111 dyoung SBLASTRECORDCHK(&so->so_rcv, "soreceive 3");
764 1.111 dyoung SBLASTMBUFCHK(&so->so_rcv, "soreceive 3");
765 1.111 dyoung if (so->so_oobmark) {
766 1.111 dyoung so->so_oobmark -= len;
767 1.111 dyoung if (so->so_oobmark == 0) {
768 1.111 dyoung so->so_state |= SS_RCVATMARK;
769 1.111 dyoung break;
770 1.111 dyoung }
771 1.102 dyoung }
772 1.111 dyoung if (flags & MSG_EOR)
773 1.111 dyoung break;
774 1.111 dyoung }
775 1.111 dyoung
/*
 * The loop stopped before the record was exhausted: report ENOMEM and
 * drop what is left of the record.
 *
 * NOTE(review): at this point mp is either still mp0 with nothing moved,
 * or the address of the last moved mbuf's m_next, which the loop has just
 * set to NULL.  So *mp looks to be NULL on every path here, m_freem(*mp)
 * frees nothing, and mbufs already linked into *mp0 are returned to the
 * caller together with the error.  Confirm whether *mp0 was intended.
 */
776 1.111 dyoung if (m != NULL) {
777 1.111 dyoung m_freem(*mp);
778 1.111 dyoung *mp = NULL;
779 1.111 dyoung error = ENOMEM;
780 1.111 dyoung (void) sbdroprecord(&so->so_rcv);
781 1.111 dyoung } else {
782 1.111 dyoung /*
783 1.111 dyoung * First part is an inline SB_EMPTY_FIXUP(). Second
784 1.111 dyoung * part makes sure sb_lastrecord is up-to-date if
785 1.111 dyoung * there is still data in the socket buffer.
786 1.111 dyoung */
787 1.111 dyoung so->so_rcv.sb_mb = nextrecord;
788 1.111 dyoung if (so->so_rcv.sb_mb == NULL) {
789 1.111 dyoung so->so_rcv.sb_mbtail = NULL;
790 1.111 dyoung so->so_rcv.sb_lastrecord = NULL;
791 1.111 dyoung } else if (nextrecord->m_nextpkt == NULL)
792 1.111 dyoung so->so_rcv.sb_lastrecord = nextrecord;
793 1.111 dyoung }
794 1.111 dyoung SBLASTRECORDCHK(&so->so_rcv, "soreceive 4");
795 1.111 dyoung SBLASTMBUFCHK(&so->so_rcv, "soreceive 4");
796 1.111 dyoung if (pr->pr_flags & PR_WANTRCVD && so->so_pcb)
797 1.111 dyoung (*pr->pr_usrreq)(so, PRU_RCVD, NULL,
798 1.127 dyoung (struct mbuf *)(long)flags, NULL, curlwp);
/*
 * Nothing was collected and no end-of-record was seen: unlock and try the
 * next record, unless the socket can receive no more.
 */
799 1.111 dyoung if (*mp0 == NULL && (flags & MSG_EOR) == 0 &&
800 1.111 dyoung (so->so_state & SS_CANTRCVMORE) == 0) {
801 1.111 dyoung sbunlock(&so->so_rcv);
802 1.111 dyoung goto restart;
803 1.111 dyoung }
804 1.111 dyoung
805 1.111 dyoung release:
806 1.111 dyoung sbunlock(&so->so_rcv);
807 1.111 dyoung return error;
808 1.111 dyoung }
809 1.102 dyoung
810 1.102 dyoung static struct socket *
811 1.132 dyoung gre_reconf(struct gre_softc *sc, const struct gre_soparm *newsoparm)
812 1.102 dyoung {
813 1.102 dyoung struct ifnet *ifp = &sc->sc_if;
814 1.102 dyoung
815 1.132 dyoung GRE_DPRINTF(sc, "enter\n");
816 1.102 dyoung
817 1.102 dyoung shutdown:
818 1.132 dyoung if (sc->sc_soparm.sp_so != NULL) {
819 1.132 dyoung GRE_DPRINTF(sc, "\n");
820 1.132 dyoung gre_upcall_remove(sc->sc_soparm.sp_so);
821 1.118 ad softint_disestablish(sc->sc_si);
822 1.111 dyoung sc->sc_si = NULL;
823 1.132 dyoung gre_fp_send(sc, GRE_M_DELFP, NULL);
824 1.115 dyoung gre_clearconf(&sc->sc_soparm, false);
825 1.111 dyoung }
826 1.111 dyoung
827 1.114 dyoung if (newsoparm != NULL) {
828 1.132 dyoung GRE_DPRINTF(sc, "\n");
829 1.114 dyoung sc->sc_soparm = *newsoparm;
830 1.129 dyoung newsoparm = NULL;
831 1.114 dyoung }
832 1.102 dyoung
833 1.132 dyoung if (sc->sc_soparm.sp_so != NULL) {
834 1.132 dyoung GRE_DPRINTF(sc, "\n");
835 1.118 ad sc->sc_si = softint_establish(SOFTINT_NET, greintr, sc);
836 1.132 dyoung gre_upcall_add(sc->sc_soparm.sp_so, sc);
837 1.111 dyoung if ((ifp->if_flags & IFF_UP) == 0) {
838 1.132 dyoung GRE_DPRINTF(sc, "down\n");
839 1.111 dyoung goto shutdown;
840 1.111 dyoung }
841 1.102 dyoung }
842 1.111 dyoung
843 1.132 dyoung GRE_DPRINTF(sc, "\n");
844 1.132 dyoung if (sc->sc_soparm.sp_so != NULL)
845 1.102 dyoung sc->sc_if.if_flags |= IFF_RUNNING;
846 1.111 dyoung else {
847 1.111 dyoung gre_bufq_purge(&sc->sc_snd);
848 1.102 dyoung sc->sc_if.if_flags &= ~IFF_RUNNING;
849 1.111 dyoung }
850 1.132 dyoung return sc->sc_soparm.sp_so;
851 1.102 dyoung }
852 1.102 dyoung
853 1.111 dyoung static int
854 1.111 dyoung gre_input(struct gre_softc *sc, struct mbuf *m, int hlen,
855 1.111 dyoung const struct gre_h *gh)
856 1.62 dyoung {
857 1.124 matt uint16_t flags;
858 1.124 matt uint32_t af; /* af passed to BPF tap */
859 1.111 dyoung int isr, s;
860 1.62 dyoung struct ifqueue *ifq;
861 1.62 dyoung
862 1.62 dyoung sc->sc_if.if_ipackets++;
863 1.62 dyoung sc->sc_if.if_ibytes += m->m_pkthdr.len;
864 1.62 dyoung
865 1.89 dyoung hlen += sizeof(struct gre_h);
866 1.62 dyoung
867 1.89 dyoung /* process GRE flags as packet can be of variable len */
868 1.89 dyoung flags = ntohs(gh->flags);
869 1.62 dyoung
870 1.89 dyoung /* Checksum & Offset are present */
871 1.89 dyoung if ((flags & GRE_CP) | (flags & GRE_RP))
872 1.89 dyoung hlen += 4;
873 1.89 dyoung /* We don't support routing fields (variable length) */
874 1.89 dyoung if (flags & GRE_RP) {
875 1.89 dyoung sc->sc_if.if_ierrors++;
876 1.89 dyoung return 0;
877 1.89 dyoung }
878 1.89 dyoung if (flags & GRE_KP)
879 1.89 dyoung hlen += 4;
880 1.89 dyoung if (flags & GRE_SP)
881 1.89 dyoung hlen += 4;
882 1.89 dyoung
883 1.89 dyoung switch (ntohs(gh->ptype)) { /* ethertypes */
884 1.111 dyoung case ETHERTYPE_IP:
885 1.111 dyoung ifq = &ipintrq;
886 1.89 dyoung isr = NETISR_IP;
887 1.113 dyoung af = AF_INET;
888 1.89 dyoung break;
889 1.62 dyoung #ifdef NETATALK
890 1.89 dyoung case ETHERTYPE_ATALK:
891 1.89 dyoung ifq = &atintrq1;
892 1.89 dyoung isr = NETISR_ATALK;
893 1.89 dyoung af = AF_APPLETALK;
894 1.89 dyoung break;
895 1.62 dyoung #endif
896 1.62 dyoung #ifdef INET6
897 1.89 dyoung case ETHERTYPE_IPV6:
898 1.89 dyoung ifq = &ip6intrq;
899 1.89 dyoung isr = NETISR_IPV6;
900 1.89 dyoung af = AF_INET6;
901 1.89 dyoung break;
902 1.62 dyoung #endif
903 1.89 dyoung default: /* others not yet supported */
904 1.132 dyoung GRE_DPRINTF(sc, "unhandled ethertype 0x%04x\n",
905 1.89 dyoung ntohs(gh->ptype));
906 1.89 dyoung sc->sc_if.if_noproto++;
907 1.87 dyoung return 0;
908 1.62 dyoung }
909 1.62 dyoung
910 1.62 dyoung if (hlen > m->m_pkthdr.len) {
911 1.62 dyoung m_freem(m);
912 1.62 dyoung sc->sc_if.if_ierrors++;
913 1.87 dyoung return EINVAL;
914 1.62 dyoung }
915 1.62 dyoung m_adj(m, hlen);
916 1.62 dyoung
917 1.62 dyoung #if NBPFILTER > 0
918 1.62 dyoung if (sc->sc_if.if_bpf != NULL)
919 1.62 dyoung bpf_mtap_af(sc->sc_if.if_bpf, af, m);
920 1.62 dyoung #endif /*NBPFILTER > 0*/
921 1.62 dyoung
922 1.62 dyoung m->m_pkthdr.rcvif = &sc->sc_if;
923 1.62 dyoung
924 1.111 dyoung s = splnet();
925 1.62 dyoung if (IF_QFULL(ifq)) {
926 1.62 dyoung IF_DROP(ifq);
927 1.62 dyoung m_freem(m);
928 1.62 dyoung } else {
929 1.62 dyoung IF_ENQUEUE(ifq, m);
930 1.62 dyoung }
931 1.62 dyoung /* we need schednetisr since the address family may change */
932 1.62 dyoung schednetisr(isr);
933 1.111 dyoung splx(s);
934 1.62 dyoung
935 1.87 dyoung return 1; /* packet is done, no further processing needed */
936 1.62 dyoung }
937 1.62 dyoung
938 1.20 itojun /*
939 1.1 hwr * The output routine. Takes a packet and encapsulates it in the protocol
940 1.111 dyoung * given by sc->sc_soparm.sp_proto. See also RFC 1701 and RFC 2004
941 1.1 hwr */
942 1.59 thorpej static int
943 1.84 dyoung gre_output(struct ifnet *ifp, struct mbuf *m, const struct sockaddr *dst,
944 1.74 christos struct rtentry *rt)
945 1.1 hwr {
946 1.111 dyoung int error = 0;
947 1.10 thorpej struct gre_softc *sc = ifp->if_softc;
948 1.62 dyoung struct gre_h *gh;
949 1.111 dyoung struct ip *ip;
950 1.124 matt uint8_t ip_tos = 0;
951 1.124 matt uint16_t etype = 0;
952 1.24 martin
953 1.111 dyoung if ((ifp->if_flags & (IFF_UP|IFF_RUNNING)) != (IFF_UP|IFF_RUNNING)) {
954 1.37 itojun m_freem(m);
955 1.38 itojun error = ENETDOWN;
956 1.38 itojun goto end;
957 1.37 itojun }
958 1.1 hwr
959 1.113 dyoung #if NBPFILTER > 0
960 1.113 dyoung if (ifp->if_bpf != NULL)
961 1.52 christos bpf_mtap_af(ifp->if_bpf, dst->sa_family, m);
962 1.1 hwr #endif
963 1.1 hwr
964 1.26 martin m->m_flags &= ~(M_BCAST|M_MCAST);
965 1.1 hwr
966 1.132 dyoung GRE_DPRINTF(sc, "dst->sa_family=%d\n", dst->sa_family);
967 1.111 dyoung switch (dst->sa_family) {
968 1.111 dyoung case AF_INET:
969 1.89 dyoung ip = mtod(m, struct ip *);
970 1.111 dyoung ip_tos = ip->ip_tos;
971 1.111 dyoung etype = htons(ETHERTYPE_IP);
972 1.62 dyoung break;
973 1.1 hwr #ifdef NETATALK
974 1.111 dyoung case AF_APPLETALK:
975 1.111 dyoung etype = htons(ETHERTYPE_ATALK);
976 1.111 dyoung break;
977 1.1 hwr #endif
978 1.56 is #ifdef INET6
979 1.111 dyoung case AF_INET6:
980 1.111 dyoung etype = htons(ETHERTYPE_IPV6);
981 1.111 dyoung break;
982 1.56 is #endif
983 1.62 dyoung default:
984 1.1 hwr IF_DROP(&ifp->if_snd);
985 1.1 hwr m_freem(m);
986 1.111 dyoung error = EAFNOSUPPORT;
987 1.38 itojun goto end;
988 1.1 hwr }
989 1.1 hwr
990 1.111 dyoung M_PREPEND(m, sizeof(*gh), M_DONTWAIT);
991 1.62 dyoung
992 1.62 dyoung if (m == NULL) {
993 1.1 hwr IF_DROP(&ifp->if_snd);
994 1.38 itojun error = ENOBUFS;
995 1.38 itojun goto end;
996 1.1 hwr }
997 1.1 hwr
998 1.111 dyoung gh = mtod(m, struct gre_h *);
999 1.111 dyoung gh->flags = 0;
1000 1.111 dyoung gh->ptype = etype;
1001 1.111 dyoung /* XXX Need to handle IP ToS. Look at how I handle IP TTL. */
1002 1.1 hwr
1003 1.1 hwr ifp->if_opackets++;
1004 1.8 explorer ifp->if_obytes += m->m_pkthdr.len;
1005 1.62 dyoung
1006 1.1 hwr /* send it off */
1007 1.111 dyoung if ((error = gre_bufq_enqueue(&sc->sc_snd, m)) != 0) {
1008 1.111 dyoung sc->sc_oflow_ev.ev_count++;
1009 1.111 dyoung m_freem(m);
1010 1.112 dyoung } else
1011 1.118 ad softint_schedule(sc->sc_si);
1012 1.38 itojun end:
1013 1.8 explorer if (error)
1014 1.1 hwr ifp->if_oerrors++;
1015 1.87 dyoung return error;
1016 1.1 hwr }
1017 1.1 hwr
1018 1.62 dyoung static int
1019 1.62 dyoung gre_getname(struct socket *so, int req, struct mbuf *nam, struct lwp *l)
1020 1.62 dyoung {
1021 1.93 dyoung return (*so->so_proto->pr_usrreq)(so, req, NULL, nam, NULL, l);
1022 1.62 dyoung }
1023 1.62 dyoung
1024 1.62 dyoung static int
1025 1.62 dyoung gre_getsockname(struct socket *so, struct mbuf *nam, struct lwp *l)
1026 1.62 dyoung {
1027 1.62 dyoung return gre_getname(so, PRU_SOCKADDR, nam, l);
1028 1.62 dyoung }
1029 1.62 dyoung
1030 1.62 dyoung static int
1031 1.62 dyoung gre_getpeername(struct socket *so, struct mbuf *nam, struct lwp *l)
1032 1.62 dyoung {
1033 1.62 dyoung return gre_getname(so, PRU_PEERADDR, nam, l);
1034 1.62 dyoung }
1035 1.62 dyoung
1036 1.62 dyoung static int
1037 1.111 dyoung gre_getnames(struct socket *so, struct lwp *l, struct sockaddr_storage *src,
1038 1.111 dyoung struct sockaddr_storage *dst)
1039 1.62 dyoung {
1040 1.62 dyoung struct mbuf *m;
1041 1.111 dyoung struct sockaddr_storage *ss;
1042 1.62 dyoung int rc;
1043 1.62 dyoung
1044 1.120 dyoung if ((m = getsombuf(so, MT_SONAME)) == NULL)
1045 1.62 dyoung return ENOBUFS;
1046 1.62 dyoung
1047 1.111 dyoung ss = mtod(m, struct sockaddr_storage *);
1048 1.62 dyoung
1049 1.130 ad solock(so);
1050 1.62 dyoung if ((rc = gre_getsockname(so, m, l)) != 0)
1051 1.62 dyoung goto out;
1052 1.111 dyoung *src = *ss;
1053 1.62 dyoung
1054 1.62 dyoung if ((rc = gre_getpeername(so, m, l)) != 0)
1055 1.62 dyoung goto out;
1056 1.111 dyoung *dst = *ss;
1057 1.62 dyoung out:
1058 1.130 ad sounlock(so);
1059 1.62 dyoung m_freem(m);
1060 1.62 dyoung return rc;
1061 1.62 dyoung }
1062 1.62 dyoung
1063 1.93 dyoung static void
1064 1.132 dyoung gre_fp_recvloop(void *arg)
1065 1.132 dyoung {
1066 1.132 dyoung struct gre_softc *sc = arg;
1067 1.132 dyoung
1068 1.132 dyoung mutex_enter(&sc->sc_mtx);
1069 1.132 dyoung while (gre_fp_recv(sc))
1070 1.132 dyoung ;
1071 1.132 dyoung mutex_exit(&sc->sc_mtx);
1072 1.132 dyoung kthread_exit(0);
1073 1.132 dyoung }
1074 1.132 dyoung
1075 1.132 dyoung static bool
1076 1.132 dyoung gre_fp_recv(struct gre_softc *sc)
1077 1.93 dyoung {
1078 1.132 dyoung int fd, ofd, rc;
1079 1.132 dyoung file_t *fp;
1080 1.132 dyoung
1081 1.132 dyoung fp = sc->sc_fp;
1082 1.132 dyoung ofd = sc->sc_fd;
1083 1.132 dyoung fd = -1;
1084 1.132 dyoung
1085 1.132 dyoung switch (sc->sc_msg) {
1086 1.132 dyoung case GRE_M_STOP:
1087 1.132 dyoung cv_signal(&sc->sc_fp_condvar);
1088 1.132 dyoung return false;
1089 1.132 dyoung case GRE_M_SETFP:
1090 1.132 dyoung mutex_exit(&sc->sc_mtx);
1091 1.132 dyoung rc = fd_dup(fp, 0, &fd, 0);
1092 1.132 dyoung mutex_enter(&sc->sc_mtx);
1093 1.132 dyoung if (rc != 0) {
1094 1.132 dyoung sc->sc_msg = GRE_M_ERR;
1095 1.132 dyoung break;
1096 1.132 dyoung }
1097 1.132 dyoung /*FALLTHROUGH*/
1098 1.132 dyoung case GRE_M_DELFP:
1099 1.132 dyoung mutex_exit(&sc->sc_mtx);
1100 1.132 dyoung if (ofd != -1 && fd_getfile(ofd) != NULL)
1101 1.132 dyoung fd_close(ofd);
1102 1.132 dyoung mutex_enter(&sc->sc_mtx);
1103 1.132 dyoung sc->sc_fd = fd;
1104 1.132 dyoung sc->sc_msg = GRE_M_OK;
1105 1.132 dyoung break;
1106 1.132 dyoung default:
1107 1.132 dyoung gre_fp_wait(sc);
1108 1.132 dyoung return true;
1109 1.132 dyoung }
1110 1.132 dyoung cv_signal(&sc->sc_fp_condvar);
1111 1.132 dyoung return true;
1112 1.132 dyoung }
1113 1.132 dyoung
1114 1.132 dyoung static bool
1115 1.132 dyoung gre_fp_send(struct gre_softc *sc, enum gre_msg msg, file_t *fp)
1116 1.132 dyoung {
1117 1.132 dyoung bool rc;
1118 1.93 dyoung
1119 1.132 dyoung mutex_enter(&sc->sc_mtx);
1120 1.132 dyoung while (sc->sc_msg != GRE_M_NONE)
1121 1.132 dyoung gre_fp_wait(sc);
1122 1.132 dyoung sc->sc_fp = fp;
1123 1.132 dyoung sc->sc_msg = msg;
1124 1.132 dyoung cv_signal(&sc->sc_fp_condvar);
1125 1.132 dyoung while (sc->sc_msg != GRE_M_STOP && sc->sc_msg != GRE_M_OK &&
1126 1.132 dyoung sc->sc_msg != GRE_M_ERR)
1127 1.132 dyoung gre_fp_wait(sc);
1128 1.132 dyoung rc = (sc->sc_msg != GRE_M_ERR);
1129 1.132 dyoung sc->sc_msg = GRE_M_NONE;
1130 1.132 dyoung cv_signal(&sc->sc_fp_condvar);
1131 1.132 dyoung mutex_exit(&sc->sc_mtx);
1132 1.132 dyoung return rc;
1133 1.93 dyoung }
1134 1.93 dyoung
1135 1.59 thorpej static int
1136 1.111 dyoung gre_ssock(struct ifnet *ifp, struct gre_soparm *sp, int fd)
1137 1.1 hwr {
1138 1.132 dyoung int error = 0;
1139 1.111 dyoung const struct protosw *pr;
1140 1.125 ad file_t *fp;
1141 1.111 dyoung struct gre_softc *sc = ifp->if_softc;
1142 1.62 dyoung struct socket *so;
1143 1.111 dyoung struct sockaddr_storage dst, src;
1144 1.111 dyoung
1145 1.137 ad if ((fp = fd_getfile(fd)) == NULL)
1146 1.137 ad return EBADF;
1147 1.137 ad if (fp->f_type != DTYPE_SOCKET) {
1148 1.137 ad fd_putfile(fd);
1149 1.137 ad return ENOTSOCK;
1150 1.137 ad }
1151 1.111 dyoung
1152 1.132 dyoung GRE_DPRINTF(sc, "\n");
1153 1.111 dyoung
1154 1.111 dyoung so = (struct socket *)fp->f_data;
1155 1.111 dyoung pr = so->so_proto;
1156 1.132 dyoung
1157 1.132 dyoung GRE_DPRINTF(sc, "type %d, proto %d\n", pr->pr_type, pr->pr_protocol);
1158 1.132 dyoung
1159 1.111 dyoung if ((pr->pr_flags & PR_ATOMIC) == 0 ||
1160 1.111 dyoung (sp->sp_type != 0 && pr->pr_type != sp->sp_type) ||
1161 1.111 dyoung (sp->sp_proto != 0 && pr->pr_protocol != 0 &&
1162 1.111 dyoung pr->pr_protocol != sp->sp_proto)) {
1163 1.111 dyoung error = EINVAL;
1164 1.132 dyoung goto err;
1165 1.111 dyoung }
1166 1.111 dyoung
1167 1.132 dyoung GRE_DPRINTF(sc, "\n");
1168 1.111 dyoung
1169 1.111 dyoung /* check address */
1170 1.127 dyoung if ((error = gre_getnames(so, curlwp, &src, &dst)) != 0)
1171 1.132 dyoung goto err;
1172 1.111 dyoung
1173 1.132 dyoung GRE_DPRINTF(sc, "\n");
1174 1.111 dyoung
1175 1.132 dyoung if (!gre_fp_send(sc, GRE_M_SETFP, fp)) {
1176 1.132 dyoung error = EBUSY;
1177 1.132 dyoung goto err;
1178 1.132 dyoung }
1179 1.111 dyoung
1180 1.132 dyoung GRE_DPRINTF(sc, "\n");
1181 1.111 dyoung
1182 1.111 dyoung sp->sp_src = src;
1183 1.111 dyoung sp->sp_dst = dst;
1184 1.111 dyoung
1185 1.132 dyoung sp->sp_so = so;
1186 1.111 dyoung
1187 1.132 dyoung err:
1188 1.132 dyoung fd_putfile(fd);
1189 1.111 dyoung return error;
1190 1.111 dyoung }
1191 1.111 dyoung
1192 1.111 dyoung static bool
1193 1.111 dyoung sockaddr_is_anyaddr(const struct sockaddr *sa)
1194 1.111 dyoung {
1195 1.111 dyoung socklen_t anylen, salen;
1196 1.111 dyoung const void *anyaddr, *addr;
1197 1.111 dyoung
1198 1.111 dyoung if ((anyaddr = sockaddr_anyaddr(sa, &anylen)) == NULL ||
1199 1.111 dyoung (addr = sockaddr_const_addr(sa, &salen)) == NULL)
1200 1.111 dyoung return false;
1201 1.111 dyoung
1202 1.111 dyoung if (salen > anylen)
1203 1.111 dyoung return false;
1204 1.111 dyoung
1205 1.111 dyoung return memcmp(anyaddr, addr, MIN(anylen, salen)) == 0;
1206 1.111 dyoung }
1207 1.111 dyoung
1208 1.115 dyoung static bool
1209 1.111 dyoung gre_is_nullconf(const struct gre_soparm *sp)
1210 1.111 dyoung {
1211 1.111 dyoung return sockaddr_is_anyaddr(sstocsa(&sp->sp_src)) ||
1212 1.111 dyoung sockaddr_is_anyaddr(sstocsa(&sp->sp_dst));
1213 1.111 dyoung }
1214 1.111 dyoung
1215 1.111 dyoung static void
1216 1.115 dyoung gre_clearconf(struct gre_soparm *sp, bool force)
1217 1.111 dyoung {
1218 1.111 dyoung if (sp->sp_bysock || force) {
1219 1.111 dyoung sockaddr_copy(sstosa(&sp->sp_src), sizeof(sp->sp_src),
1220 1.111 dyoung sockaddr_any(sstosa(&sp->sp_src)));
1221 1.111 dyoung sockaddr_copy(sstosa(&sp->sp_dst), sizeof(sp->sp_dst),
1222 1.111 dyoung sockaddr_any(sstosa(&sp->sp_dst)));
1223 1.132 dyoung sp->sp_bysock = false;
1224 1.111 dyoung }
1225 1.132 dyoung sp->sp_so = NULL; /* XXX */
1226 1.111 dyoung }
1227 1.111 dyoung
1228 1.111 dyoung static int
1229 1.119 dyoung gre_ioctl_lock(struct gre_softc *sc)
1230 1.119 dyoung {
1231 1.119 dyoung mutex_enter(&sc->sc_mtx);
1232 1.119 dyoung
1233 1.119 dyoung while (sc->sc_state == GRE_S_IOCTL)
1234 1.119 dyoung gre_wait(sc);
1235 1.119 dyoung
1236 1.119 dyoung if (sc->sc_state != GRE_S_IDLE) {
1237 1.119 dyoung cv_signal(&sc->sc_condvar);
1238 1.119 dyoung mutex_exit(&sc->sc_mtx);
1239 1.132 dyoung GRE_DPRINTF(sc, "\n");
1240 1.119 dyoung return ENXIO;
1241 1.119 dyoung }
1242 1.119 dyoung
1243 1.119 dyoung sc->sc_state = GRE_S_IOCTL;
1244 1.119 dyoung
1245 1.119 dyoung mutex_exit(&sc->sc_mtx);
1246 1.119 dyoung return 0;
1247 1.119 dyoung }
1248 1.119 dyoung
1249 1.119 dyoung static void
1250 1.119 dyoung gre_ioctl_unlock(struct gre_softc *sc)
1251 1.119 dyoung {
1252 1.119 dyoung mutex_enter(&sc->sc_mtx);
1253 1.119 dyoung
1254 1.119 dyoung KASSERT(sc->sc_state == GRE_S_IOCTL);
1255 1.119 dyoung sc->sc_state = GRE_S_IDLE;
1256 1.119 dyoung cv_signal(&sc->sc_condvar);
1257 1.119 dyoung
1258 1.119 dyoung mutex_exit(&sc->sc_mtx);
1259 1.119 dyoung }
1260 1.119 dyoung
/*
 * gre_ioctl: ioctl handler for the gre interface.
 *
 * Commands that change configuration are first authorized through
 * kauth_authorize_network(); a refusal returns EPERM.  The softc is then
 * claimed with gre_ioctl_lock() and the rest of the handler runs at
 * splnet(), both of which are undone at the `out' label.
 *
 * All edits are made to sp0, a private copy of sc->sc_soparm whose
 * sp_so has been cleared; sp points at that copy.  The copy only reaches
 * the softc when it is passed to gre_reconf() at `sendconf'.
 *
 * Labels inside the GRESADDRS/GRESADDRD case are shared by other cases:
 *   checkaddr  reject the request with EINVAL if sockaddr_any() returns
 *              NULL for either endpoint.
 *   mksocket   if the interface is down or the configuration is null,
 *              skip straight to sendconf; otherwise create a socket with
 *              gre_socreate().
 *   setsock    adopt descriptor fd with gre_ssock(); the descriptor is
 *              closed afterwards for every command except GRESSOCK.
 *   sendconf   clear IFF_RUNNING and hand sp to gre_reconf().
 *
 * Returns 0 on success or an errno value.
 */
1261 1.119 dyoung static int
1262 1.111 dyoung gre_ioctl(struct ifnet *ifp, const u_long cmd, void *data)
1263 1.111 dyoung {
1264 1.94 christos struct ifreq *ifr;
1265 1.28 itojun struct if_laddrreq *lifr = (struct if_laddrreq *)data;
1266 1.8 explorer struct gre_softc *sc = ifp->if_softc;
1267 1.111 dyoung struct gre_soparm *sp;
1268 1.119 dyoung int fd, error = 0, oproto, otype, s;
1269 1.111 dyoung struct gre_soparm sp0;
1270 1.107 dyoung
1271 1.107 dyoung ifr = data;
1272 1.107 dyoung
1273 1.132 dyoung GRE_DPRINTF(sc, "cmd %lu\n", cmd);
1274 1.111 dyoung
	/* Configuration-changing commands need interface-set privilege. */
1275 1.61 ad switch (cmd) {
1276 1.61 ad case SIOCSIFFLAGS:
1277 1.61 ad case SIOCSIFMTU:
1278 1.61 ad case GRESPROTO:
1279 1.61 ad case GRESADDRD:
1280 1.61 ad case GRESADDRS:
1281 1.62 dyoung case GRESSOCK:
1282 1.62 dyoung case GREDSOCK:
1283 1.61 ad case SIOCSLIFPHYADDR:
1284 1.61 ad case SIOCDIFPHYADDR:
1285 1.127 dyoung if (kauth_authorize_network(curlwp->l_cred,
1286 1.127 dyoung KAUTH_NETWORK_INTERFACE,
1287 1.70 elad KAUTH_REQ_NETWORK_INTERFACE_SETPRIV, ifp, (void *)cmd,
1288 1.70 elad NULL) != 0)
1289 1.87 dyoung return EPERM;
1290 1.61 ad break;
1291 1.61 ad default:
1292 1.61 ad break;
1293 1.61 ad }
1294 1.1 hwr
	/* Claim the softc; this fails with ENXIO if it is not idle. */
1295 1.119 dyoung if ((error = gre_ioctl_lock(sc)) != 0) {
1296 1.132 dyoung GRE_DPRINTF(sc, "\n");
1297 1.119 dyoung return error;
1298 1.111 dyoung }
1299 1.119 dyoung s = splnet();
1300 1.111 dyoung
	/* Edit a private copy; it carries no socket until gre_ssock() sets one. */
1301 1.111 dyoung sp0 = sc->sc_soparm;
1302 1.132 dyoung sp0.sp_so = NULL;
1303 1.111 dyoung sp = &sp0;
1304 1.111 dyoung
1305 1.132 dyoung GRE_DPRINTF(sc, "\n");
1306 1.111 dyoung
1307 1.20 itojun switch (cmd) {
1308 1.139 dyoung case SIOCINITIFADDR:
1309 1.132 dyoung GRE_DPRINTF(sc, "\n");
	/* Nothing to do if already up; otherwise mark up and try to start. */
1310 1.111 dyoung if ((ifp->if_flags & IFF_UP) != 0)
1311 1.111 dyoung break;
1312 1.115 dyoung gre_clearconf(sp, false);
1313 1.36 itojun ifp->if_flags |= IFF_UP;
1314 1.111 dyoung goto mksocket;
1315 1.55 perry case SIOCSIFDSTADDR:
1316 1.1 hwr break;
1317 1.1 hwr case SIOCSIFFLAGS:
1318 1.139 dyoung if ((error = ifioctl_common(ifp, cmd, data)) != 0)
1319 1.139 dyoung break;
1320 1.111 dyoung oproto = sp->sp_proto;
1321 1.111 dyoung otype = sp->sp_type;
	/*
	 * The IFF_LINK0/IFF_LINK2 combination selects the socket protocol
	 * and type; having neither flag set is rejected with EINVAL.
	 */
1322 1.62 dyoung switch (ifr->ifr_flags & (IFF_LINK0|IFF_LINK2)) {
1323 1.62 dyoung case IFF_LINK0|IFF_LINK2:
1324 1.111 dyoung sp->sp_proto = IPPROTO_UDP;
1325 1.111 dyoung sp->sp_type = SOCK_DGRAM;
1326 1.111 dyoung break;
1327 1.111 dyoung case IFF_LINK2:
1328 1.111 dyoung sp->sp_proto = 0;
1329 1.111 dyoung sp->sp_type = 0;
1330 1.62 dyoung break;
1331 1.62 dyoung case IFF_LINK0:
1332 1.111 dyoung sp->sp_proto = IPPROTO_GRE;
1333 1.111 dyoung sp->sp_type = SOCK_RAW;
1334 1.111 dyoung break;
1335 1.111 dyoung default:
1336 1.132 dyoung GRE_DPRINTF(sc, "\n");
1337 1.111 dyoung error = EINVAL;
1338 1.111 dyoung goto out;
1339 1.111 dyoung }
1340 1.132 dyoung GRE_DPRINTF(sc, "\n");
1341 1.115 dyoung gre_clearconf(sp, false);
	/* Up, running, and proto/type unchanged or unspecified: done. */
1342 1.111 dyoung if ((ifp->if_flags & (IFF_UP|IFF_RUNNING)) ==
1343 1.111 dyoung (IFF_UP|IFF_RUNNING) &&
1344 1.111 dyoung (oproto == sp->sp_proto || sp->sp_proto == 0) &&
1345 1.111 dyoung (otype == sp->sp_type || sp->sp_type == 0))
1346 1.111 dyoung break;
1347 1.111 dyoung switch (sp->sp_proto) {
1348 1.111 dyoung case IPPROTO_UDP:
1349 1.111 dyoung case IPPROTO_GRE:
1350 1.111 dyoung goto mksocket;
1351 1.111 dyoung default:
1352 1.111 dyoung break;
1353 1.62 dyoung }
1354 1.1 hwr break;
1355 1.20 itojun case SIOCSIFMTU:
1356 1.111 dyoung /* XXX determine MTU automatically by probing w/
1357 1.111 dyoung * XXX do-not-fragment packets?
1358 1.111 dyoung */
1359 1.27 martin if (ifr->ifr_mtu < 576) {
1360 1.1 hwr error = EINVAL;
1361 1.1 hwr break;
1362 1.1 hwr }
1363 1.123 dyoung /*FALLTHROUGH*/
1364 1.1 hwr case SIOCGIFMTU:
	/* ENETRESET from the common handler is not treated as an error. */
1365 1.123 dyoung if ((error = ifioctl_common(ifp, cmd, data)) == ENETRESET)
1366 1.123 dyoung error = 0;
1367 1.1 hwr break;
1368 1.1 hwr case SIOCADDMULTI:
1369 1.1 hwr case SIOCDELMULTI:
	/* Only the address family is checked; no membership state is kept here. */
1370 1.106 dyoung if (ifr == NULL) {
1371 1.1 hwr error = EAFNOSUPPORT;
1372 1.1 hwr break;
1373 1.1 hwr }
1374 1.106 dyoung switch (ifreq_getaddr(cmd, ifr)->sa_family) {
1375 1.1 hwr #ifdef INET
1376 1.1 hwr case AF_INET:
1377 1.1 hwr break;
1378 1.1 hwr #endif
1379 1.56 is #ifdef INET6
1380 1.56 is case AF_INET6:
1381 1.56 is break;
1382 1.56 is #endif
1383 1.1 hwr default:
1384 1.1 hwr error = EAFNOSUPPORT;
1385 1.1 hwr break;
1386 1.1 hwr }
1387 1.1 hwr break;
1388 1.1 hwr case GRESPROTO:
1389 1.115 dyoung gre_clearconf(sp, false);
1390 1.111 dyoung oproto = sp->sp_proto;
1391 1.111 dyoung otype = sp->sp_type;
1392 1.111 dyoung sp->sp_proto = ifr->ifr_flags;
	/* Mirror the requested protocol in the IFF_LINK0/IFF_LINK2 flags. */
1393 1.111 dyoung switch (sp->sp_proto) {
1394 1.62 dyoung case IPPROTO_UDP:
1395 1.62 dyoung ifp->if_flags |= IFF_LINK0|IFF_LINK2;
1396 1.111 dyoung sp->sp_type = SOCK_DGRAM;
1397 1.62 dyoung break;
1398 1.40 itojun case IPPROTO_GRE:
1399 1.3 hwr ifp->if_flags |= IFF_LINK0;
1400 1.62 dyoung ifp->if_flags &= ~IFF_LINK2;
1401 1.111 dyoung sp->sp_type = SOCK_RAW;
1402 1.111 dyoung break;
1403 1.111 dyoung case 0:
1404 1.111 dyoung ifp->if_flags &= ~IFF_LINK0;
1405 1.111 dyoung ifp->if_flags |= IFF_LINK2;
1406 1.111 dyoung sp->sp_type = 0;
1407 1.111 dyoung break;
1408 1.1 hwr default:
	/* This break leaves only the inner switch; error stays set. */
1409 1.40 itojun error = EPROTONOSUPPORT;
1410 1.35 itojun break;
1411 1.1 hwr }
1412 1.111 dyoung if ((oproto == sp->sp_proto || sp->sp_proto == 0) &&
1413 1.111 dyoung (otype == sp->sp_type || sp->sp_type == 0))
1414 1.111 dyoung break;
1415 1.111 dyoung switch (sp->sp_proto) {
1416 1.111 dyoung case IPPROTO_UDP:
1417 1.111 dyoung case IPPROTO_GRE:
1418 1.111 dyoung goto mksocket;
1419 1.111 dyoung default:
1420 1.111 dyoung break;
1421 1.111 dyoung }
1422 1.1 hwr break;
1423 1.1 hwr case GREGPROTO:
1424 1.111 dyoung ifr->ifr_flags = sp->sp_proto;
1425 1.1 hwr break;
1426 1.1 hwr case GRESADDRS:
1427 1.1 hwr case GRESADDRD:
1428 1.115 dyoung gre_clearconf(sp, false);
1429 1.132 dyoung /* set tunnel endpoints and mark interface as up */
1430 1.111 dyoung switch (cmd) {
1431 1.111 dyoung case GRESADDRS:
1432 1.111 dyoung sockaddr_copy(sstosa(&sp->sp_src),
1433 1.111 dyoung sizeof(sp->sp_src), ifreq_getaddr(cmd, ifr));
1434 1.111 dyoung break;
1435 1.111 dyoung case GRESADDRD:
1436 1.111 dyoung sockaddr_copy(sstosa(&sp->sp_dst),
1437 1.111 dyoung sizeof(sp->sp_dst), ifreq_getaddr(cmd, ifr));
1438 1.93 dyoung break;
1439 1.63 dyoung }
	/* Also entered from SIOCSLIFPHYADDR. */
1440 1.111 dyoung checkaddr:
1441 1.111 dyoung if (sockaddr_any(sstosa(&sp->sp_src)) == NULL ||
1442 1.111 dyoung sockaddr_any(sstosa(&sp->sp_dst)) == NULL) {
1443 1.93 dyoung error = EINVAL;
1444 1.93 dyoung break;
1445 1.93 dyoung }
1446 1.111 dyoung /* let gre_socreate() check the rest */
	/* Also entered from SIOCINITIFADDR, SIOCSIFFLAGS, GRESPROTO, GREDSOCK and SIOCDIFPHYADDR. */
1447 1.111 dyoung mksocket:
1448 1.132 dyoung GRE_DPRINTF(sc, "\n");
1449 1.111 dyoung /* If we're administratively down, or the configuration
1450 1.111 dyoung * is empty, there's no use creating a socket.
1451 1.111 dyoung */
1452 1.111 dyoung if ((ifp->if_flags & IFF_UP) == 0 || gre_is_nullconf(sp))
1453 1.111 dyoung goto sendconf;
1454 1.111 dyoung
1455 1.132 dyoung GRE_DPRINTF(sc, "\n");
1456 1.127 dyoung fd = 0;
1457 1.127 dyoung error = gre_socreate(sc, sp, &fd);
1458 1.111 dyoung if (error != 0)
1459 1.62 dyoung break;
1460 1.62 dyoung
	/* Also entered from GRESSOCK, with fd supplied by the caller. */
1461 1.111 dyoung setsock:
1462 1.132 dyoung GRE_DPRINTF(sc, "\n");
1463 1.93 dyoung
1464 1.111 dyoung error = gre_ssock(ifp, sp, fd);
1465 1.93 dyoung
	/*
	 * For every command but GRESSOCK the descriptor is closed here,
	 * whether or not gre_ssock() succeeded.  NOTE(review): presumably
	 * because in those cases fd came from gre_socreate() above rather
	 * than from the caller -- confirm.
	 */
1466 1.111 dyoung if (cmd != GRESSOCK) {
1467 1.132 dyoung GRE_DPRINTF(sc, "\n");
1468 1.125 ad /* XXX v. dodgy */
1469 1.125 ad if (fd_getfile(fd) != NULL)
1470 1.125 ad fd_close(fd);
1471 1.93 dyoung }
1472 1.111 dyoung
1473 1.93 dyoung if (error == 0) {
	/* Jumped to from mksocket when no socket is to be created. */
1474 1.111 dyoung sendconf:
1475 1.132 dyoung GRE_DPRINTF(sc, "\n");
1476 1.111 dyoung ifp->if_flags &= ~IFF_RUNNING;
1477 1.132 dyoung gre_reconf(sc, sp);
1478 1.93 dyoung }
1479 1.62 dyoung
1480 1.62 dyoung break;
1481 1.111 dyoung case GREGADDRS:
1482 1.111 dyoung ifreq_setaddr(cmd, ifr, sstosa(&sp->sp_src));
1483 1.111 dyoung break;
1484 1.111 dyoung case GREGADDRD:
1485 1.111 dyoung ifreq_setaddr(cmd, ifr, sstosa(&sp->sp_dst));
1486 1.111 dyoung break;
1487 1.111 dyoung case GREDSOCK:
1488 1.132 dyoung GRE_DPRINTF(sc, "\n");
	/* A socket-derived configuration also takes the interface down. */
1489 1.111 dyoung if (sp->sp_bysock)
1490 1.111 dyoung ifp->if_flags &= ~IFF_UP;
1491 1.115 dyoung gre_clearconf(sp, false);
1492 1.111 dyoung goto mksocket;
1493 1.111 dyoung case GRESSOCK:
1494 1.132 dyoung GRE_DPRINTF(sc, "\n");
	/* Discard the old endpoints; the supplied socket defines the new ones. */
1495 1.115 dyoung gre_clearconf(sp, true);
1496 1.111 dyoung fd = (int)ifr->ifr_value;
1497 1.132 dyoung sp->sp_bysock = true;
1498 1.111 dyoung ifp->if_flags |= IFF_UP;
1499 1.111 dyoung goto setsock;
1500 1.28 itojun case SIOCSLIFPHYADDR:
1501 1.132 dyoung GRE_DPRINTF(sc, "\n");
	/* Both endpoints must belong to the same address family. */
1502 1.111 dyoung if (lifr->addr.ss_family != lifr->dstaddr.ss_family) {
1503 1.31 itojun error = EAFNOSUPPORT;
1504 1.31 itojun break;
1505 1.31 itojun }
1506 1.111 dyoung sockaddr_copy(sstosa(&sp->sp_src), sizeof(sp->sp_src),
1507 1.111 dyoung sstosa(&lifr->addr));
1508 1.111 dyoung sockaddr_copy(sstosa(&sp->sp_dst), sizeof(sp->sp_dst),
1509 1.111 dyoung sstosa(&lifr->dstaddr));
1510 1.132 dyoung GRE_DPRINTF(sc, "\n");
1511 1.111 dyoung goto checkaddr;
1512 1.28 itojun case SIOCDIFPHYADDR:
1513 1.132 dyoung GRE_DPRINTF(sc, "\n");
	/* Forced clear plus IFF_UP off: mksocket falls through to sendconf. */
1514 1.115 dyoung gre_clearconf(sp, true);
1515 1.111 dyoung ifp->if_flags &= ~IFF_UP;
1516 1.111 dyoung goto mksocket;
1517 1.28 itojun case SIOCGLIFPHYADDR:
1518 1.132 dyoung GRE_DPRINTF(sc, "\n");
1519 1.111 dyoung if (gre_is_nullconf(sp)) {
1520 1.28 itojun error = EADDRNOTAVAIL;
1521 1.28 itojun break;
1522 1.28 itojun }
1523 1.111 dyoung sockaddr_copy(sstosa(&lifr->addr), sizeof(lifr->addr),
1524 1.111 dyoung sstosa(&sp->sp_src));
1525 1.111 dyoung sockaddr_copy(sstosa(&lifr->dstaddr), sizeof(lifr->dstaddr),
1526 1.111 dyoung sstosa(&sp->sp_dst));
1527 1.132 dyoung GRE_DPRINTF(sc, "\n");
1528 1.1 hwr break;
1529 1.1 hwr default:
1530 1.139 dyoung error = ifioctl_common(ifp, cmd, data);
1531 1.31 itojun break;
1532 1.1 hwr }
	/* Common exit: restore the interrupt level and release the softc. */
1533 1.111 dyoung out:
1534 1.132 dyoung GRE_DPRINTF(sc, "\n");
1535 1.119 dyoung splx(s);
1536 1.119 dyoung gre_ioctl_unlock(sc);
1537 1.87 dyoung return error;
1538 1.1 hwr }
1539 1.1 hwr
1540 1.54 christos #endif
1541 1.54 christos
1542 1.59 thorpej void greattach(int);
1543 1.54 christos
/*
 * greattach: pseudo-device attach hook.  When the kernel is built with
 * INET, registers the gre interface cloner; otherwise does nothing.
 * `count' is not used.
 */
/* ARGSUSED */
void
greattach(int count)
{
#ifdef INET
	if_clone_attach(&gre_cloner);
#endif /* INET */
}
1552