if_ethersubr.c revision 1.303 1 1.303 christos /* $NetBSD: if_ethersubr.c,v 1.303 2021/11/08 16:50:05 christos Exp $ */
2 1.44 itojun
3 1.44 itojun /*
4 1.44 itojun * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
5 1.44 itojun * All rights reserved.
6 1.120 perry *
7 1.44 itojun * Redistribution and use in source and binary forms, with or without
8 1.44 itojun * modification, are permitted provided that the following conditions
9 1.44 itojun * are met:
10 1.44 itojun * 1. Redistributions of source code must retain the above copyright
11 1.44 itojun * notice, this list of conditions and the following disclaimer.
12 1.44 itojun * 2. Redistributions in binary form must reproduce the above copyright
13 1.44 itojun * notice, this list of conditions and the following disclaimer in the
14 1.44 itojun * documentation and/or other materials provided with the distribution.
15 1.44 itojun * 3. Neither the name of the project nor the names of its contributors
16 1.44 itojun * may be used to endorse or promote products derived from this software
17 1.44 itojun * without specific prior written permission.
18 1.120 perry *
19 1.44 itojun * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
20 1.44 itojun * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21 1.44 itojun * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22 1.44 itojun * ARE DISCLAIMED. IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
23 1.44 itojun * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24 1.44 itojun * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25 1.44 itojun * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26 1.44 itojun * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27 1.44 itojun * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 1.44 itojun * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 1.44 itojun * SUCH DAMAGE.
30 1.44 itojun */
31 1.9 cgd
32 1.1 cgd /*
33 1.8 mycroft * Copyright (c) 1982, 1989, 1993
34 1.8 mycroft * The Regents of the University of California. All rights reserved.
35 1.1 cgd *
36 1.1 cgd * Redistribution and use in source and binary forms, with or without
37 1.1 cgd * modification, are permitted provided that the following conditions
38 1.1 cgd * are met:
39 1.1 cgd * 1. Redistributions of source code must retain the above copyright
40 1.1 cgd * notice, this list of conditions and the following disclaimer.
41 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
42 1.1 cgd * notice, this list of conditions and the following disclaimer in the
43 1.1 cgd * documentation and/or other materials provided with the distribution.
44 1.113 agc * 3. Neither the name of the University nor the names of its contributors
45 1.1 cgd * may be used to endorse or promote products derived from this software
46 1.1 cgd * without specific prior written permission.
47 1.1 cgd *
48 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
49 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
50 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
51 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
52 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
53 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
54 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
55 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
56 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
57 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
58 1.1 cgd * SUCH DAMAGE.
59 1.1 cgd *
60 1.27 fvdl * @(#)if_ethersubr.c 8.2 (Berkeley) 4/4/96
61 1.1 cgd */
62 1.90 lukem
63 1.90 lukem #include <sys/cdefs.h>
64 1.303 christos __KERNEL_RCSID(0, "$NetBSD: if_ethersubr.c,v 1.303 2021/11/08 16:50:05 christos Exp $");
65 1.1 cgd
66 1.212 pooka #ifdef _KERNEL_OPT
67 1.33 jonathan #include "opt_inet.h"
68 1.33 jonathan #include "opt_atalk.h"
69 1.112 martin #include "opt_mbuftrace.h"
70 1.182 kefren #include "opt_mpls.h"
71 1.30 matt #include "opt_gateway.h"
72 1.135 pavel #include "opt_pppoe.h"
73 1.206 ozaki #include "opt_net_mpsafe.h"
74 1.212 pooka #endif
75 1.212 pooka
76 1.59 thorpej #include "vlan.h"
77 1.81 martin #include "pppoe.h"
78 1.78 thorpej #include "bridge.h"
79 1.93 martin #include "arp.h"
80 1.121 yamt #include "agr.h"
81 1.30 matt
82 1.200 joerg #include <sys/sysctl.h>
83 1.4 mycroft #include <sys/mbuf.h>
84 1.211 ozaki #include <sys/mutex.h>
85 1.4 mycroft #include <sys/ioctl.h>
86 1.4 mycroft #include <sys/errno.h>
87 1.158 dyoung #include <sys/device.h>
88 1.284 riastrad #include <sys/entropy.h>
89 1.207 riastrad #include <sys/rndsource.h>
90 1.216 ozaki #include <sys/cpu.h>
91 1.231 ozaki #include <sys/kmem.h>
92 1.297 yamaguch #include <sys/hook.h>
93 1.8 mycroft
94 1.4 mycroft #include <net/if.h>
95 1.4 mycroft #include <net/netisr.h>
96 1.4 mycroft #include <net/route.h>
97 1.4 mycroft #include <net/if_llc.h>
98 1.4 mycroft #include <net/if_dl.h>
99 1.8 mycroft #include <net/if_types.h>
100 1.211 ozaki #include <net/pktqueue.h>
101 1.93 martin
102 1.158 dyoung #include <net/if_media.h>
103 1.158 dyoung #include <dev/mii/mii.h>
104 1.158 dyoung #include <dev/mii/miivar.h>
105 1.158 dyoung
106 1.93 martin #if NARP == 0
107 1.93 martin /*
108 1.102 jmmv * XXX there should really be a way to issue this warning from within config(8)
109 1.93 martin */
110 1.111 martin #error You have included NETATALK or a pseudo-device in your configuration that depends on the presence of ethernet interfaces, but have no such interfaces configured. Check if you really need pseudo-device bridge, pppoe, vlan or options NETATALK.
111 1.93 martin #endif
112 1.1 cgd
113 1.69 thorpej #include <net/bpf.h>
114 1.69 thorpej
115 1.22 is #include <net/if_ether.h>
116 1.59 thorpej #include <net/if_vlanvar.h>
117 1.22 is
118 1.81 martin #if NPPPOE > 0
119 1.81 martin #include <net/if_pppoe.h>
120 1.81 martin #endif
121 1.81 martin
122 1.121 yamt #if NAGR > 0
123 1.121 yamt #include <net/agr/ieee8023_slowprotocols.h> /* XXX */
124 1.121 yamt #include <net/agr/ieee8023ad.h>
125 1.121 yamt #include <net/agr/if_agrvar.h>
126 1.121 yamt #endif
127 1.121 yamt
128 1.293 yamaguch #include <net/lagg/if_laggvar.h>
129 1.293 yamaguch
130 1.78 thorpej #if NBRIDGE > 0
131 1.78 thorpej #include <net/if_bridgevar.h>
132 1.78 thorpej #endif
133 1.78 thorpej
134 1.15 phil #include <netinet/in.h>
135 1.1 cgd #ifdef INET
136 1.4 mycroft #include <netinet/in_var.h>
137 1.1 cgd #endif
138 1.22 is #include <netinet/if_inarp.h>
139 1.1 cgd
140 1.44 itojun #ifdef INET6
141 1.44 itojun #ifndef INET
142 1.44 itojun #include <netinet/in.h>
143 1.44 itojun #endif
144 1.44 itojun #include <netinet6/in6_var.h>
145 1.44 itojun #include <netinet6/nd6.h>
146 1.44 itojun #endif
147 1.44 itojun
148 1.133 liamjfoy #include "carp.h"
149 1.133 liamjfoy #if NCARP > 0
150 1.133 liamjfoy #include <netinet/ip_carp.h>
151 1.133 liamjfoy #endif
152 1.133 liamjfoy
153 1.23 christos #ifdef NETATALK
154 1.23 christos #include <netatalk/at.h>
155 1.23 christos #include <netatalk/at_var.h>
156 1.23 christos #include <netatalk/at_extern.h>
157 1.23 christos
158 1.23 christos #define llc_snap_org_code llc_un.type_snap.org_code
159 1.23 christos #define llc_snap_ether_type llc_un.type_snap.ether_type
160 1.23 christos
161 1.23 christos extern u_char at_org_code[3];
162 1.23 christos extern u_char aarp_org_code[3];
163 1.23 christos #endif /* NETATALK */
164 1.23 christos
165 1.182 kefren #ifdef MPLS
166 1.182 kefren #include <netmpls/mpls.h>
167 1.182 kefren #include <netmpls/mpls_var.h>
168 1.182 kefren #endif
169 1.182 kefren
/* Compile-time checks on the sizes of the on-wire address and header structures. */
170 1.292 roy CTASSERT(sizeof(struct ether_addr) == 6);
171 1.292 roy CTASSERT(sizeof(struct ether_header) == 14);
172 1.292 roy
/*
 * State for rate-limiting the "discarding oversize frame" message that
 * ether_input() prints under DIAGNOSTIC.  The counters are handed to
 * ppsratecheck() while bigpktpps_lock is held.
 */
173 1.278 msaitoh #ifdef DIAGNOSTIC
174 1.123 matt static struct timeval bigpktppslim_last;
175 1.123 matt static int bigpktppslim = 2; /* XXX */
176 1.123 matt static int bigpktpps_count;
177 1.203 ozaki static kmutex_t bigpktpps_lock __cacheline_aligned;
178 1.278 msaitoh #endif
179 1.123 matt
/* All-ones destination address; copied into edst for M_BCAST packets. */
180 1.118 yamt const uint8_t etherbroadcastaddr[ETHER_ADDR_LEN] =
181 1.118 yamt { 0xff, 0xff, 0xff, 0xff, 0xff, 0xff };
/* Multicast address 01:80:c2:00:00:02 (not referenced in the code visible here). */
182 1.121 yamt const uint8_t ethermulticastaddr_slowprotocols[ETHER_ADDR_LEN] =
183 1.121 yamt { 0x01, 0x80, 0xc2, 0x00, 0x00, 0x02 };
/*
 * Record an errno in the local variable `error' and jump to the local
 * label `bad'.  Expands to a bare brace block, so it must not be used as
 * the body of an `if' that is followed by an `else'.
 */
184 1.8 mycroft #define senderr(e) { error = (e); goto bad;}
185 1.1 cgd
/* NOTE(review): presumably the RPS hash function used for input pktqueues; its users are outside this part of the file -- confirm. */
186 1.301 knakahar static pktq_rps_hash_func_t ether_pktq_rps_hash_p;
187 1.301 knakahar
/*
 * Hook called by ether_input() for interfaces of type IFT_IEEE8023ADLAG;
 * ether_input() asserts that it is non-NULL before calling it.
 */
188 1.293 yamaguch /* if_lagg(4) support */
189 1.293 yamaguch struct mbuf *(*lagg_input_ethernet_p)(struct ifnet *, struct mbuf *);
190 1.293 yamaguch
191 1.261 maxv static int ether_output(struct ifnet *, struct mbuf *,
192 1.261 maxv const struct sockaddr *, const struct rtentry *);
193 1.42 thorpej
194 1.1 cgd /*
195 1.1 cgd * Ethernet output routine.
196 1.1 cgd * Encapsulate a packet of type family for the local net.
197 1.22 is * Assumes that ifp is actually pointer to ethercom structure.
 *
 * The destination MAC address and the ethertype are chosen according to
 * dst->sa_family.  An ether_header is then prepended, the PFIL_OUT hooks
 * are run, and the frame is handed to bridge_output() (when
 * ifp->if_bridge is set) or to ifq_enqueue().
 *
 * Returns 0 or an errno value.  Several exits return directly without
 * passing through the `bad' label: a non-zero result from arpresolve()
 * or nd6_resolve() (EWOULDBLOCK is reported as 0), aarpresolve()
 * returning 0, ar_tha() returning NULL, and the pfil result.  Only the
 * senderr() paths count an output error and free the mbuf here.
198 1.1 cgd */
199 1.42 thorpej static int
200 1.178 dyoung ether_output(struct ifnet * const ifp0, struct mbuf * const m0,
201 1.256 maxv const struct sockaddr * const dst, const struct rtentry *rt)
202 1.1 cgd {
203 1.256 maxv uint8_t esrc[ETHER_ADDR_LEN], edst[ETHER_ADDR_LEN];
204 1.162 matt uint16_t etype = 0;
205 1.122 christos int error = 0, hdrcmplt = 0;
206 1.29 mrg struct mbuf *m = m0;
207 1.151 dyoung struct mbuf *mcopy = NULL;
208 1.29 mrg struct ether_header *eh;
209 1.133 liamjfoy struct ifnet *ifp = ifp0;
210 1.24 christos #ifdef INET
211 1.22 is struct arphdr *ah;
212 1.260 maxv #endif
213 1.23 christos #ifdef NETATALK
214 1.23 christos struct at_ifaddr *aa;
215 1.260 maxv #endif
216 1.1 cgd
217 1.104 matt #ifdef MBUFTRACE
218 1.116 jonathan m_claimm(m, ifp->if_mowner);
219 1.104 matt #endif
220 1.133 liamjfoy
221 1.133 liamjfoy #if NCARP > 0
222 1.133 liamjfoy if (ifp->if_type == IFT_CARP) {
223 1.133 liamjfoy struct ifaddr *ifa;
224 1.227 ozaki int s = pserialize_read_enter();
225 1.133 liamjfoy
226 1.133 liamjfoy /* loop back if this is going to the carp interface */
227 1.133 liamjfoy if (dst != NULL && ifp0->if_link_state == LINK_STATE_UP &&
228 1.227 ozaki (ifa = ifa_ifwithaddr(dst)) != NULL) {
229 1.227 ozaki if (ifa->ifa_ifp == ifp0) {
230 1.227 ozaki pserialize_read_exit(s);
231 1.227 ozaki return looutput(ifp0, m, dst, rt);
232 1.227 ozaki }
233 1.227 ozaki }
234 1.227 ozaki pserialize_read_exit(s);
235 1.133 liamjfoy
/*
 * From here on ifp is the device stored in if_carpdev, while ifp0
 * still refers to the carp interface the caller passed in.
 */
236 1.133 liamjfoy ifp = ifp->if_carpdev;
237 1.133 liamjfoy /* ac = (struct arpcom *)ifp; */
238 1.133 liamjfoy
/* The carp interface itself must be up and running as well. */
239 1.247 msaitoh if ((ifp0->if_flags & (IFF_UP | IFF_RUNNING)) !=
240 1.247 msaitoh (IFF_UP | IFF_RUNNING))
241 1.133 liamjfoy senderr(ENETDOWN);
242 1.133 liamjfoy }
243 1.260 maxv #endif
244 1.133 liamjfoy
/* The transmitting interface must be both up and running. */
245 1.247 msaitoh if ((ifp->if_flags & (IFF_UP | IFF_RUNNING)) != (IFF_UP | IFF_RUNNING))
246 1.8 mycroft senderr(ENETDOWN);
247 1.72 thorpej
/* Select the destination address (edst) and ethertype per address family. */
248 1.1 cgd switch (dst->sa_family) {
249 1.1 cgd
250 1.1 cgd #ifdef INET
251 1.1 cgd case AF_INET:
252 1.261 maxv if (m->m_flags & M_BCAST) {
253 1.256 maxv memcpy(edst, etherbroadcastaddr, sizeof(edst));
254 1.261 maxv } else if (m->m_flags & M_MCAST) {
255 1.145 dyoung ETHER_MAP_IP_MULTICAST(&satocsin(dst)->sin_addr, edst);
256 1.261 maxv } else {
/*
 * Unicast: ask arpresolve() for the address.  Any non-zero result
 * ends processing here; EWOULDBLOCK is reported to the caller as 0.
 */
257 1.281 kardel error = arpresolve(ifp0, rt, m, dst, edst, sizeof(edst));
258 1.260 maxv if (error)
259 1.260 maxv return (error == EWOULDBLOCK) ? 0 : error;
260 1.224 knakahar }
261 1.3 hpeyerl /* If broadcasting on a simplex interface, loopback a copy */
262 1.3 hpeyerl if ((m->m_flags & M_BCAST) && (ifp->if_flags & IFF_SIMPLEX))
263 1.266 maxv mcopy = m_copypacket(m, M_DONTWAIT);
264 1.17 mycroft etype = htons(ETHERTYPE_IP);
265 1.8 mycroft break;
266 1.22 is
267 1.22 is case AF_ARP:
268 1.22 is ah = mtod(m, struct arphdr *);
269 1.261 maxv if (m->m_flags & M_BCAST) {
270 1.256 maxv memcpy(edst, etherbroadcastaddr, sizeof(edst));
271 1.261 maxv } else {
272 1.147 christos void *tha = ar_tha(ah);
273 1.131 mrg
274 1.173 christos if (tha == NULL) {
275 1.258 maxv /* fake with ARPHRD_IEEE1394 */
276 1.236 maxv m_freem(m);
277 1.173 christos return 0;
278 1.173 christos }
279 1.146 dyoung memcpy(edst, tha, sizeof(edst));
280 1.131 mrg }
281 1.120 perry
/* Set the hardware type field of the ARP header to Ethernet. */
282 1.22 is ah->ar_hrd = htons(ARPHRD_ETHER);
283 1.22 is
/* Reverse-ARP operations get their own ethertype; everything else is plain ARP. */
284 1.107 itojun switch (ntohs(ah->ar_op)) {
285 1.22 is case ARPOP_REVREQUEST:
286 1.22 is case ARPOP_REVREPLY:
287 1.22 is etype = htons(ETHERTYPE_REVARP);
288 1.22 is break;
289 1.22 is
290 1.22 is case ARPOP_REQUEST:
291 1.22 is case ARPOP_REPLY:
292 1.22 is default:
293 1.22 is etype = htons(ETHERTYPE_ARP);
294 1.22 is }
295 1.22 is break;
296 1.1 cgd #endif
297 1.256 maxv
298 1.44 itojun #ifdef INET6
299 1.44 itojun case AF_INET6:
300 1.261 maxv if (m->m_flags & M_BCAST) {
301 1.256 maxv memcpy(edst, etherbroadcastaddr, sizeof(edst));
302 1.261 maxv } else if (m->m_flags & M_MCAST) {
303 1.238 ozaki ETHER_MAP_IPV6_MULTICAST(&satocsin6(dst)->sin6_addr,
304 1.238 ozaki edst);
305 1.238 ozaki } else {
/* Same convention as the AF_INET case: non-zero ends processing, EWOULDBLOCK maps to 0. */
306 1.281 kardel error = nd6_resolve(ifp0, rt, m, dst, edst,
307 1.238 ozaki sizeof(edst));
308 1.261 maxv if (error)
309 1.261 maxv return (error == EWOULDBLOCK) ? 0 : error;
310 1.51 itojun }
311 1.44 itojun etype = htons(ETHERTYPE_IPV6);
312 1.44 itojun break;
313 1.44 itojun #endif
314 1.256 maxv
315 1.23 christos #ifdef NETATALK
316 1.250 maxv case AF_APPLETALK: {
317 1.227 ozaki struct ifaddr *ifa;
318 1.227 ozaki int s;
319 1.227 ozaki
/* The whole AppleTalk path runs under the kernel lock; every exit below releases it. */
320 1.224 knakahar KERNEL_LOCK(1, NULL);
321 1.256 maxv
/* A zero return from aarpresolve() ends processing here with success. */
322 1.226 rjs if (!aarpresolve(ifp, m, (const struct sockaddr_at *)dst, edst)) {
323 1.224 knakahar KERNEL_UNLOCK_ONE(NULL);
324 1.261 maxv return 0;
325 1.23 christos }
326 1.256 maxv
327 1.23 christos /*
328 1.23 christos * ifaddr is the first thing in at_ifaddr
329 1.23 christos */
330 1.227 ozaki s = pserialize_read_enter();
331 1.227 ozaki ifa = at_ifawithnet((const struct sockaddr_at *)dst, ifp);
332 1.227 ozaki if (ifa == NULL) {
333 1.227 ozaki pserialize_read_exit(s);
334 1.227 ozaki KERNEL_UNLOCK_ONE(NULL);
335 1.260 maxv senderr(EADDRNOTAVAIL);
336 1.224 knakahar }
337 1.227 ozaki aa = (struct at_ifaddr *)ifa;
338 1.120 perry
339 1.23 christos /*
340 1.23 christos * In the phase 2 case, we need to prepend an mbuf for the
341 1.265 maxv * llc header.
342 1.23 christos */
343 1.23 christos if (aa->aa_flags & AFA_PHASE2) {
344 1.23 christos struct llc llc;
345 1.23 christos
346 1.43 bouyer M_PREPEND(m, sizeof(struct llc), M_DONTWAIT);
347 1.256 maxv if (m == NULL) {
348 1.260 maxv pserialize_read_exit(s);
349 1.256 maxv KERNEL_UNLOCK_ONE(NULL);
350 1.256 maxv senderr(ENOBUFS);
351 1.256 maxv }
352 1.256 maxv
/*
 * Build the LLC/SNAP header locally and copy it to the front of the
 * packet.  etype stays 0 on this path, so the length is used as the
 * type field further down.
 */
353 1.23 christos llc.llc_dsap = llc.llc_ssap = LLC_SNAP_LSAP;
354 1.23 christos llc.llc_control = LLC_UI;
355 1.146 dyoung memcpy(llc.llc_snap_org_code, at_org_code,
356 1.23 christos sizeof(llc.llc_snap_org_code));
357 1.38 kim llc.llc_snap_ether_type = htons(ETHERTYPE_ATALK);
358 1.147 christos memcpy(mtod(m, void *), &llc, sizeof(struct llc));
359 1.23 christos } else {
360 1.38 kim etype = htons(ETHERTYPE_ATALK);
361 1.23 christos }
362 1.227 ozaki pserialize_read_exit(s);
363 1.224 knakahar KERNEL_UNLOCK_ONE(NULL);
364 1.23 christos break;
365 1.250 maxv }
366 1.23 christos #endif /* NETATALK */
367 1.256 maxv
368 1.31 thorpej case pseudo_AF_HDRCMPLT:
/* dst->sa_data holds an ether_header; take the source address from it too. */
369 1.31 thorpej hdrcmplt = 1;
370 1.146 dyoung memcpy(esrc,
371 1.146 dyoung ((const struct ether_header *)dst->sa_data)->ether_shost,
372 1.146 dyoung sizeof(esrc));
373 1.31 thorpej /* FALLTHROUGH */
374 1.31 thorpej
375 1.1 cgd case AF_UNSPEC:
/* dst->sa_data holds an ether_header supplying destination and type. */
376 1.250 maxv memcpy(edst,
377 1.146 dyoung ((const struct ether_header *)dst->sa_data)->ether_dhost,
378 1.146 dyoung sizeof(edst));
379 1.8 mycroft /* AF_UNSPEC doesn't swap the byte order of the ether_type. */
380 1.145 dyoung etype = ((const struct ether_header *)dst->sa_data)->ether_type;
381 1.8 mycroft break;
382 1.1 cgd
383 1.1 cgd default:
384 1.21 christos printf("%s: can't handle af%d\n", ifp->if_xname,
385 1.261 maxv dst->sa_family);
386 1.8 mycroft senderr(EAFNOSUPPORT);
387 1.1 cgd }
388 1.1 cgd
389 1.182 kefren #ifdef MPLS
390 1.210 ozaki {
391 1.210 ozaki struct m_tag *mtag;
392 1.271 maxv mtag = m_tag_find(m, PACKET_TAG_MPLS);
393 1.210 ozaki if (mtag != NULL) {
394 1.210 ozaki /* Having the tag itself indicates it's MPLS */
395 1.184 dyoung etype = htons(ETHERTYPE_MPLS);
396 1.210 ozaki m_tag_delete(m, mtag);
397 1.210 ozaki }
398 1.184 dyoung }
399 1.182 kefren #endif
400 1.182 kefren
/* Deliver the copy made for broadcasts on a simplex interface. */
401 1.1 cgd if (mcopy)
402 1.145 dyoung (void)looutput(ifp, mcopy, dst, rt);
403 1.16 mycroft
404 1.256 maxv KASSERT((m->m_flags & M_PKTHDR) != 0);
405 1.256 maxv
406 1.256 maxv /*
407 1.256 maxv * If no ether type is set, this must be a 802.2 formatted packet.
408 1.50 matt */
409 1.50 matt if (etype == 0)
410 1.50 matt etype = htons(m->m_pkthdr.len);
411 1.256 maxv
412 1.1 cgd /*
413 1.256 maxv * Add local net header. If no space in first mbuf, allocate another.
414 1.1 cgd */
415 1.256 maxv M_PREPEND(m, sizeof(struct ether_header), M_DONTWAIT);
416 1.256 maxv if (m == NULL)
417 1.8 mycroft senderr(ENOBUFS);
418 1.256 maxv
419 1.1 cgd eh = mtod(m, struct ether_header *);
420 1.96 thorpej /* Note: etype is already in network byte order. */
421 1.256 maxv memcpy(&eh->ether_type, &etype, sizeof(eh->ether_type));
422 1.250 maxv memcpy(eh->ether_dhost, edst, sizeof(edst));
/* Source address: the caller-supplied one (HDRCMPLT) or the interface's link-layer address. */
423 1.261 maxv if (hdrcmplt) {
424 1.146 dyoung memcpy(eh->ether_shost, esrc, sizeof(eh->ether_shost));
425 1.261 maxv } else {
426 1.153 dyoung memcpy(eh->ether_shost, CLLADDR(ifp->if_sadl),
427 1.31 thorpej sizeof(eh->ether_shost));
428 1.261 maxv }
429 1.77 thorpej
430 1.133 liamjfoy #if NCARP > 0
/*
 * Frames sent on behalf of a carp interface carry that interface's
 * link-layer address as source; this overrides the choice made above.
 */
431 1.133 liamjfoy if (ifp0 != ifp && ifp0->if_type == IFT_CARP) {
432 1.153 dyoung memcpy(eh->ether_shost, CLLADDR(ifp0->if_sadl),
433 1.133 liamjfoy sizeof(eh->ether_shost));
434 1.134 liamjfoy }
435 1.256 maxv #endif
436 1.133 liamjfoy
/* Run the output packet-filter hooks; m == NULL afterwards means there is nothing left to send. */
437 1.195 rmind if ((error = pfil_run_hooks(ifp->if_pfil, &m, ifp, PFIL_OUT)) != 0)
438 1.261 maxv return error;
439 1.77 thorpej if (m == NULL)
440 1.261 maxv return 0;
441 1.77 thorpej
442 1.78 thorpej #if NBRIDGE > 0
443 1.78 thorpej /*
444 1.78 thorpej * Bridges require special output handling.
445 1.78 thorpej */
446 1.78 thorpej if (ifp->if_bridge)
447 1.256 maxv return bridge_output(ifp, m, NULL, NULL);
448 1.78 thorpej #endif
449 1.78 thorpej
450 1.133 liamjfoy #if NCARP > 0
/* Also account the output bytes on the carp interface itself. */
451 1.133 liamjfoy if (ifp != ifp0)
452 1.282 thorpej if_statadd(ifp0, if_obytes, m->m_pkthdr.len + ETHER_HDR_LEN);
453 1.256 maxv #endif
454 1.133 liamjfoy
455 1.77 thorpej #ifdef ALTQ
456 1.224 knakahar KERNEL_LOCK(1, NULL);
457 1.77 thorpej /*
458 1.77 thorpej * If ALTQ is enabled on the parent interface, do
459 1.77 thorpej * classification; the queueing discipline might not
460 1.77 thorpej * require classification, but might require the
461 1.77 thorpej * address family/header pointer in the pktattr.
462 1.77 thorpej */
463 1.77 thorpej if (ALTQ_IS_ENABLED(&ifp->if_snd))
464 1.220 knakahar altq_etherclassify(&ifp->if_snd, m);
465 1.224 knakahar KERNEL_UNLOCK_ONE(NULL);
466 1.77 thorpej #endif
467 1.221 knakahar return ifq_enqueue(ifp, m);
468 1.1 cgd
469 1.1 cgd bad:
/* senderr() exit: count the failure on ifp and release the mbuf if one is still held. */
470 1.288 ozaki if_statinc(ifp, if_oerrors);
471 1.1 cgd if (m)
472 1.1 cgd m_freem(m);
473 1.261 maxv return error;
474 1.1 cgd }
475 1.76 thorpej
476 1.76 thorpej #ifdef ALTQ
477 1.76 thorpej /*
478 1.76 thorpej * This routine is a slight hack to allow a packet to be classified
479 1.76 thorpej * if the Ethernet headers are present. It will go away when ALTQ's
480 1.76 thorpej * classification engine understands link headers.
481 1.261 maxv *
482 1.261 maxv * XXX: We may need to do m_pullups here. First to ensure struct ether_header
483 1.261 maxv * is indeed contiguous, then to read the LLC and so on.
484 1.76 thorpej */
485 1.76 thorpej void
486 1.220 knakahar altq_etherclassify(struct ifaltq *ifq, struct mbuf *m)
487 1.76 thorpej {
488 1.76 thorpej struct ether_header *eh;
489 1.255 maxv struct mbuf *mtop = m;
490 1.162 matt uint16_t ether_type;
491 1.76 thorpej int hlen, af, hdrsize;
492 1.147 christos void *hdr;
493 1.76 thorpej
494 1.255 maxv KASSERT((mtop->m_flags & M_PKTHDR) != 0);
495 1.255 maxv
496 1.76 thorpej hlen = ETHER_HDR_LEN;
497 1.76 thorpej eh = mtod(m, struct ether_header *);
498 1.76 thorpej
499 1.76 thorpej ether_type = htons(eh->ether_type);
500 1.76 thorpej
501 1.76 thorpej if (ether_type < ETHERMTU) {
502 1.76 thorpej /* LLC/SNAP */
503 1.76 thorpej struct llc *llc = (struct llc *)(eh + 1);
504 1.76 thorpej hlen += 8;
505 1.76 thorpej
506 1.76 thorpej if (m->m_len < hlen ||
507 1.76 thorpej llc->llc_dsap != LLC_SNAP_LSAP ||
508 1.76 thorpej llc->llc_ssap != LLC_SNAP_LSAP ||
509 1.76 thorpej llc->llc_control != LLC_UI) {
510 1.76 thorpej /* Not SNAP. */
511 1.76 thorpej goto bad;
512 1.76 thorpej }
513 1.76 thorpej
514 1.76 thorpej ether_type = htons(llc->llc_un.type_snap.ether_type);
515 1.76 thorpej }
516 1.76 thorpej
517 1.76 thorpej switch (ether_type) {
518 1.76 thorpej case ETHERTYPE_IP:
519 1.76 thorpej af = AF_INET;
520 1.76 thorpej hdrsize = 20; /* sizeof(struct ip) */
521 1.76 thorpej break;
522 1.76 thorpej
523 1.76 thorpej case ETHERTYPE_IPV6:
524 1.76 thorpej af = AF_INET6;
525 1.76 thorpej hdrsize = 40; /* sizeof(struct ip6_hdr) */
526 1.76 thorpej break;
527 1.76 thorpej
528 1.76 thorpej default:
529 1.76 thorpej af = AF_UNSPEC;
530 1.76 thorpej hdrsize = 0;
531 1.76 thorpej break;
532 1.76 thorpej }
533 1.76 thorpej
534 1.95 itojun while (m->m_len <= hlen) {
535 1.95 itojun hlen -= m->m_len;
536 1.95 itojun m = m->m_next;
537 1.255 maxv if (m == NULL)
538 1.255 maxv goto bad;
539 1.95 itojun }
540 1.255 maxv
541 1.76 thorpej if (m->m_len < (hlen + hdrsize)) {
542 1.76 thorpej /*
543 1.95 itojun * protocol header not in a single mbuf.
544 1.95 itojun * We can't cope with this situation right
545 1.76 thorpej * now (but it shouldn't ever happen, really, anyhow).
546 1.76 thorpej */
547 1.92 itojun #ifdef DEBUG
548 1.78 thorpej printf("altq_etherclassify: headers span multiple mbufs: "
549 1.78 thorpej "%d < %d\n", m->m_len, (hlen + hdrsize));
550 1.92 itojun #endif
551 1.76 thorpej goto bad;
552 1.76 thorpej }
553 1.76 thorpej
554 1.76 thorpej m->m_data += hlen;
555 1.76 thorpej m->m_len -= hlen;
556 1.76 thorpej
557 1.147 christos hdr = mtod(m, void *);
558 1.76 thorpej
559 1.255 maxv if (ALTQ_NEEDS_CLASSIFY(ifq)) {
560 1.255 maxv mtop->m_pkthdr.pattr_class =
561 1.76 thorpej (*ifq->altq_classify)(ifq->altq_clfier, m, af);
562 1.255 maxv }
563 1.255 maxv mtop->m_pkthdr.pattr_af = af;
564 1.255 maxv mtop->m_pkthdr.pattr_hdr = hdr;
565 1.76 thorpej
566 1.76 thorpej m->m_data -= hlen;
567 1.76 thorpej m->m_len += hlen;
568 1.76 thorpej
569 1.76 thorpej return;
570 1.76 thorpej
571 1.250 maxv bad:
572 1.255 maxv mtop->m_pkthdr.pattr_class = NULL;
573 1.255 maxv mtop->m_pkthdr.pattr_hdr = NULL;
574 1.255 maxv mtop->m_pkthdr.pattr_af = AF_UNSPEC;
575 1.76 thorpej }
576 1.76 thorpej #endif /* ALTQ */
577 1.1 cgd
578 1.286 ozaki #if defined (LLC) || defined (NETATALK)
579 1.286 ozaki static void
580 1.286 ozaki ether_input_llc(struct ifnet *ifp, struct mbuf *m, struct ether_header *eh)
581 1.286 ozaki {
582 1.286 ozaki struct ifqueue *inq = NULL;
583 1.286 ozaki int isr = 0;
584 1.286 ozaki struct llc *l;
585 1.286 ozaki
586 1.286 ozaki if (m->m_len < sizeof(*eh) + sizeof(struct llc))
587 1.286 ozaki goto drop;
588 1.286 ozaki
589 1.286 ozaki l = (struct llc *)(eh+1);
590 1.286 ozaki switch (l->llc_dsap) {
591 1.286 ozaki #ifdef NETATALK
592 1.286 ozaki case LLC_SNAP_LSAP:
593 1.286 ozaki switch (l->llc_control) {
594 1.286 ozaki case LLC_UI:
595 1.286 ozaki if (l->llc_ssap != LLC_SNAP_LSAP)
596 1.286 ozaki goto drop;
597 1.286 ozaki
598 1.286 ozaki if (memcmp(&(l->llc_snap_org_code)[0],
599 1.286 ozaki at_org_code, sizeof(at_org_code)) == 0 &&
600 1.286 ozaki ntohs(l->llc_snap_ether_type) ==
601 1.286 ozaki ETHERTYPE_ATALK) {
602 1.286 ozaki inq = &atintrq2;
603 1.286 ozaki m_adj(m, sizeof(struct ether_header)
604 1.286 ozaki + sizeof(struct llc));
605 1.286 ozaki isr = NETISR_ATALK;
606 1.286 ozaki break;
607 1.286 ozaki }
608 1.286 ozaki
609 1.286 ozaki if (memcmp(&(l->llc_snap_org_code)[0],
610 1.286 ozaki aarp_org_code,
611 1.286 ozaki sizeof(aarp_org_code)) == 0 &&
612 1.286 ozaki ntohs(l->llc_snap_ether_type) ==
613 1.286 ozaki ETHERTYPE_AARP) {
614 1.286 ozaki m_adj(m, sizeof(struct ether_header)
615 1.286 ozaki + sizeof(struct llc));
616 1.286 ozaki aarpinput(ifp, m); /* XXX queue? */
617 1.286 ozaki return;
618 1.286 ozaki }
619 1.286 ozaki
620 1.286 ozaki default:
621 1.286 ozaki goto drop;
622 1.286 ozaki }
623 1.286 ozaki break;
624 1.286 ozaki #endif
625 1.286 ozaki default:
626 1.286 ozaki goto drop;
627 1.286 ozaki }
628 1.286 ozaki
629 1.286 ozaki KASSERT(inq != NULL);
630 1.286 ozaki IFQ_ENQUEUE_ISR(inq, m, isr);
631 1.286 ozaki return;
632 1.286 ozaki
633 1.286 ozaki drop:
634 1.286 ozaki m_freem(m);
635 1.287 ozaki if_statinc(ifp, if_ierrors); /* XXX should have a dedicated counter? */
636 1.286 ozaki return;
637 1.286 ozaki }
638 1.286 ozaki #endif /* defined (LLC) || defined (NETATALK) */
639 1.286 ozaki
640 1.1 cgd /*
641 1.1 cgd * Process a received Ethernet packet;
642 1.42 thorpej * the packet is in the mbuf chain m with
643 1.42 thorpej * the ether header.
644 1.1 cgd */
645 1.133 liamjfoy void
646 1.58 matt ether_input(struct ifnet *ifp, struct mbuf *m)
647 1.1 cgd {
648 1.91 thorpej struct ethercom *ec = (struct ethercom *) ifp;
649 1.199 rmind pktqueue_t *pktq = NULL;
650 1.199 rmind struct ifqueue *inq = NULL;
651 1.162 matt uint16_t etype;
652 1.42 thorpej struct ether_header *eh;
653 1.187 matt size_t ehlen;
654 1.204 tls static int earlypkts;
655 1.198 msaitoh int isr = 0;
656 1.294 yamaguch #if NAGR > 0
657 1.294 yamaguch void *agrprivate;
658 1.294 yamaguch #endif
659 1.1 cgd
660 1.216 ozaki KASSERT(!cpu_intr_p());
661 1.253 maxv KASSERT((m->m_flags & M_PKTHDR) != 0);
662 1.216 ozaki
663 1.287 ozaki if ((ifp->if_flags & IFF_UP) == 0)
664 1.287 ozaki goto drop;
665 1.290 roy
666 1.291 roy #ifdef MBUFTRACE
667 1.291 roy m_claimm(m, &ec->ec_rx_mowner);
668 1.291 roy #endif
669 1.291 roy
670 1.292 roy if (__predict_false(m->m_len < sizeof(*eh))) {
671 1.303 christos if ((m = m_pullup(m, sizeof(*eh))) == NULL) {
672 1.303 christos if_statinc(ifp, if_ierrors);
673 1.303 christos return;
674 1.303 christos }
675 1.267 maxv }
676 1.42 thorpej
677 1.42 thorpej eh = mtod(m, struct ether_header *);
678 1.63 thorpej etype = ntohs(eh->ether_type);
679 1.187 matt ehlen = sizeof(*eh);
680 1.63 thorpej
681 1.284 riastrad if (__predict_false(earlypkts < 100 ||
682 1.284 riastrad entropy_epoch() == (unsigned)-1)) {
683 1.204 tls rnd_add_data(NULL, eh, ehlen, 0);
684 1.204 tls earlypkts++;
685 1.204 tls }
686 1.204 tls
687 1.63 thorpej /*
688 1.258 maxv * Determine if the packet is within its size limits. For MPLS the
689 1.258 maxv * header length is variable, so we skip the check.
690 1.63 thorpej */
691 1.182 kefren if (etype != ETHERTYPE_MPLS && m->m_pkthdr.len >
692 1.83 thorpej ETHER_MAX_FRAME(ifp, etype, m->m_flags & M_HASFCS)) {
693 1.278 msaitoh #ifdef DIAGNOSTIC
694 1.203 ozaki mutex_enter(&bigpktpps_lock);
695 1.123 matt if (ppsratecheck(&bigpktppslim_last, &bigpktpps_count,
696 1.261 maxv bigpktppslim)) {
697 1.123 matt printf("%s: discarding oversize frame (len=%d)\n",
698 1.123 matt ifp->if_xname, m->m_pkthdr.len);
699 1.123 matt }
700 1.203 ozaki mutex_exit(&bigpktpps_lock);
701 1.278 msaitoh #endif
702 1.287 ozaki goto drop;
703 1.63 thorpej }
704 1.77 thorpej
705 1.84 thorpej if (ETHER_IS_MULTICAST(eh->ether_dhost)) {
706 1.84 thorpej /*
707 1.84 thorpej * If this is not a simplex interface, drop the packet
708 1.84 thorpej * if it came from us.
709 1.84 thorpej */
710 1.84 thorpej if ((ifp->if_flags & IFF_SIMPLEX) == 0 &&
711 1.153 dyoung memcmp(CLLADDR(ifp->if_sadl), eh->ether_shost,
712 1.84 thorpej ETHER_ADDR_LEN) == 0) {
713 1.287 ozaki goto drop;
714 1.84 thorpej }
715 1.84 thorpej
716 1.84 thorpej if (memcmp(etherbroadcastaddr,
717 1.84 thorpej eh->ether_dhost, ETHER_ADDR_LEN) == 0)
718 1.84 thorpej m->m_flags |= M_BCAST;
719 1.84 thorpej else
720 1.84 thorpej m->m_flags |= M_MCAST;
721 1.282 thorpej if_statinc(ifp, if_imcasts);
722 1.84 thorpej }
723 1.84 thorpej
724 1.79 thorpej /* If the CRC is still on the packet, trim it off. */
725 1.79 thorpej if (m->m_flags & M_HASFCS) {
726 1.79 thorpej m_adj(m, -ETHER_CRC_LEN);
727 1.79 thorpej m->m_flags &= ~M_HASFCS;
728 1.79 thorpej }
729 1.79 thorpej
730 1.282 thorpej if_statadd(ifp, if_ibytes, m->m_pkthdr.len);
731 1.78 thorpej
732 1.201 ozaki #if NCARP > 0
733 1.201 ozaki if (__predict_false(ifp->if_carp && ifp->if_type != IFT_CARP)) {
734 1.201 ozaki /*
735 1.261 maxv * Clear M_PROMISC, in case the packet comes from a
736 1.261 maxv * vlan.
737 1.201 ozaki */
738 1.137 rpaulo m->m_flags &= ~M_PROMISC;
739 1.201 ozaki if (carp_input(m, (uint8_t *)&eh->ether_shost,
740 1.201 ozaki (uint8_t *)&eh->ether_dhost, eh->ether_type) == 0)
741 1.137 rpaulo return;
742 1.201 ozaki }
743 1.253 maxv #endif
744 1.250 maxv
745 1.247 msaitoh if ((m->m_flags & (M_BCAST | M_MCAST | M_PROMISC)) == 0 &&
746 1.201 ozaki (ifp->if_flags & IFF_PROMISC) != 0 &&
747 1.201 ozaki memcmp(CLLADDR(ifp->if_sadl), eh->ether_dhost,
748 1.261 maxv ETHER_ADDR_LEN) != 0) {
749 1.201 ozaki m->m_flags |= M_PROMISC;
750 1.70 bouyer }
751 1.78 thorpej
752 1.106 bouyer if ((m->m_flags & M_PROMISC) == 0) {
753 1.195 rmind if (pfil_run_hooks(ifp->if_pfil, &m, ifp, PFIL_IN) != 0)
754 1.106 bouyer return;
755 1.106 bouyer if (m == NULL)
756 1.106 bouyer return;
757 1.78 thorpej
758 1.106 bouyer eh = mtod(m, struct ether_header *);
759 1.106 bouyer etype = ntohs(eh->ether_type);
760 1.106 bouyer }
761 1.70 bouyer
762 1.172 darran #if NAGR > 0
763 1.294 yamaguch if (ifp->if_type != IFT_IEEE8023ADLAG) {
764 1.294 yamaguch agrprivate = ifp->if_lagg;
765 1.294 yamaguch } else {
766 1.294 yamaguch agrprivate = NULL;
767 1.294 yamaguch }
768 1.294 yamaguch if (agrprivate != NULL &&
769 1.172 darran __predict_true(etype != ETHERTYPE_SLOWPROTOCOLS)) {
770 1.172 darran m->m_flags &= ~M_PROMISC;
771 1.172 darran agr_input(ifp, m);
772 1.172 darran return;
773 1.172 darran }
774 1.253 maxv #endif
775 1.172 darran
776 1.293 yamaguch /* Handle input from a lagg(4) port */
777 1.293 yamaguch if (ifp->if_type == IFT_IEEE8023ADLAG) {
778 1.293 yamaguch KASSERT(lagg_input_ethernet_p != NULL);
779 1.293 yamaguch m = (*lagg_input_ethernet_p)(ifp, m);
780 1.293 yamaguch if (m == NULL)
781 1.293 yamaguch return;
782 1.293 yamaguch }
783 1.293 yamaguch
784 1.91 thorpej /*
785 1.91 thorpej * If VLANs are configured on the interface, check to
786 1.91 thorpej * see if the device performed the decapsulation and
787 1.91 thorpej * provided us with the tag.
788 1.91 thorpej */
789 1.244 knakahar if (ec->ec_nvlans && vlan_has_tag(m)) {
790 1.70 bouyer #if NVLAN > 0
791 1.70 bouyer /*
792 1.70 bouyer * vlan_input() will either recursively call ether_input()
793 1.70 bouyer * or drop the packet.
794 1.70 bouyer */
795 1.91 thorpej vlan_input(ifp, m);
796 1.287 ozaki return;
797 1.91 thorpej #else
798 1.287 ozaki goto drop;
799 1.70 bouyer #endif
800 1.61 thorpej }
801 1.1 cgd
802 1.59 thorpej /*
803 1.59 thorpej * Handle protocols that expect to have the Ethernet header
804 1.59 thorpej * (and possibly FCS) intact.
805 1.59 thorpej */
806 1.59 thorpej switch (etype) {
807 1.187 matt case ETHERTYPE_VLAN: {
808 1.187 matt struct ether_vlan_header *evl = (void *)eh;
809 1.253 maxv
810 1.187 matt /*
811 1.187 matt * If there is a tag of 0, then the VLAN header was probably
812 1.187 matt * just being used to store the priority. Extract the ether
813 1.250 maxv * type, and if IP or IPV6, let them deal with it.
814 1.187 matt */
815 1.254 maxv if (m->m_len >= sizeof(*evl) &&
816 1.302 ryo EVL_VLANOFTAG(ntohs(evl->evl_tag)) == 0) {
817 1.187 matt etype = ntohs(evl->evl_proto);
818 1.187 matt ehlen = sizeof(*evl);
819 1.253 maxv if ((m->m_flags & M_PROMISC) == 0 &&
820 1.253 maxv (etype == ETHERTYPE_IP ||
821 1.253 maxv etype == ETHERTYPE_IPV6))
822 1.187 matt break;
823 1.187 matt }
824 1.253 maxv
825 1.59 thorpej #if NVLAN > 0
826 1.59 thorpej /*
827 1.59 thorpej * vlan_input() will either recursively call ether_input()
828 1.59 thorpej * or drop the packet.
829 1.59 thorpej */
830 1.287 ozaki if (ec->ec_nvlans != 0) {
831 1.63 thorpej vlan_input(ifp, m);
832 1.287 ozaki return;
833 1.287 ozaki } else
834 1.253 maxv #endif
835 1.287 ozaki goto drop;
836 1.187 matt }
837 1.253 maxv
838 1.81 martin #if NPPPOE > 0
839 1.81 martin case ETHERTYPE_PPPOEDISC:
840 1.218 ozaki pppoedisc_input(ifp, m);
841 1.218 ozaki return;
842 1.253 maxv
843 1.81 martin case ETHERTYPE_PPPOE:
844 1.218 ozaki pppoe_input(ifp, m);
845 1.81 martin return;
846 1.253 maxv #endif
847 1.253 maxv
848 1.121 yamt case ETHERTYPE_SLOWPROTOCOLS: {
849 1.121 yamt uint8_t subtype;
850 1.121 yamt
851 1.287 ozaki if (m->m_pkthdr.len < sizeof(*eh) + sizeof(subtype))
852 1.287 ozaki goto drop;
853 1.253 maxv
854 1.121 yamt m_copydata(m, sizeof(*eh), sizeof(subtype), &subtype);
855 1.121 yamt switch (subtype) {
856 1.121 yamt #if NAGR > 0
857 1.121 yamt case SLOWPROTOCOLS_SUBTYPE_LACP:
858 1.294 yamaguch if (agrprivate != NULL) {
859 1.121 yamt ieee8023ad_lacp_input(ifp, m);
860 1.121 yamt return;
861 1.121 yamt }
862 1.121 yamt break;
863 1.121 yamt
864 1.121 yamt case SLOWPROTOCOLS_SUBTYPE_MARKER:
865 1.294 yamaguch if (agrprivate != NULL) {
866 1.121 yamt ieee8023ad_marker_input(ifp, m);
867 1.121 yamt return;
868 1.121 yamt }
869 1.121 yamt break;
870 1.261 maxv #endif
871 1.253 maxv
872 1.121 yamt default:
873 1.121 yamt if (subtype == 0 || subtype > 10) {
874 1.121 yamt /* illegal value */
875 1.303 christos goto error;
876 1.121 yamt }
877 1.121 yamt /* unknown subtype */
878 1.121 yamt break;
879 1.121 yamt }
880 1.121 yamt }
881 1.273 mrg /* FALLTHROUGH */
882 1.59 thorpej default:
883 1.287 ozaki if (m->m_flags & M_PROMISC)
884 1.287 ozaki goto drop;
885 1.59 thorpej }
886 1.42 thorpej
887 1.45 thorpej /* If the CRC is still on the packet, trim it off. */
888 1.79 thorpej if (m->m_flags & M_HASFCS) {
889 1.45 thorpej m_adj(m, -ETHER_CRC_LEN);
890 1.79 thorpej m->m_flags &= ~M_HASFCS;
891 1.79 thorpej }
892 1.42 thorpej
893 1.286 ozaki /* etype represents the size of the payload in this case */
894 1.286 ozaki if (etype <= ETHERMTU + sizeof(struct ether_header)) {
895 1.286 ozaki KASSERT(ehlen == sizeof(*eh));
896 1.286 ozaki #if defined (LLC) || defined (NETATALK)
897 1.286 ozaki ether_input_llc(ifp, m, eh);
898 1.286 ozaki return;
899 1.286 ozaki #else
900 1.303 christos goto error;
901 1.286 ozaki #endif
902 1.286 ozaki }
903 1.139 is
904 1.286 ozaki /* Strip off the Ethernet header. */
905 1.286 ozaki m_adj(m, ehlen);
906 1.286 ozaki
907 1.286 ozaki switch (etype) {
908 1.1 cgd #ifdef INET
909 1.286 ozaki case ETHERTYPE_IP:
910 1.30 matt #ifdef GATEWAY
911 1.286 ozaki if (ipflow_fastforward(m))
912 1.286 ozaki return;
913 1.30 matt #endif
914 1.286 ozaki pktq = ip_pktq;
915 1.286 ozaki break;
916 1.1 cgd
917 1.286 ozaki case ETHERTYPE_ARP:
918 1.286 ozaki isr = NETISR_ARP;
919 1.286 ozaki inq = &arpintrq;
920 1.286 ozaki break;
921 1.7 glass
922 1.286 ozaki case ETHERTYPE_REVARP:
923 1.286 ozaki revarpinput(m); /* XXX queue? */
924 1.286 ozaki return;
925 1.1 cgd #endif
926 1.253 maxv
927 1.44 itojun #ifdef INET6
928 1.286 ozaki case ETHERTYPE_IPV6:
929 1.287 ozaki if (__predict_false(!in6_present))
930 1.287 ozaki goto drop;
931 1.250 maxv #ifdef GATEWAY
932 1.286 ozaki if (ip6flow_fastforward(&m))
933 1.286 ozaki return;
934 1.148 liamjfoy #endif
935 1.286 ozaki pktq = ip6_pktq;
936 1.286 ozaki break;
937 1.44 itojun #endif
938 1.253 maxv
939 1.23 christos #ifdef NETATALK
940 1.286 ozaki case ETHERTYPE_ATALK:
941 1.286 ozaki isr = NETISR_ATALK;
942 1.286 ozaki inq = &atintrq1;
943 1.286 ozaki break;
944 1.253 maxv
945 1.286 ozaki case ETHERTYPE_AARP:
946 1.286 ozaki aarpinput(ifp, m); /* XXX queue? */
947 1.286 ozaki return;
948 1.253 maxv #endif
949 1.253 maxv
950 1.182 kefren #ifdef MPLS
951 1.286 ozaki case ETHERTYPE_MPLS:
952 1.286 ozaki isr = NETISR_MPLS;
953 1.286 ozaki inq = &mplsintrq;
954 1.286 ozaki break;
955 1.182 kefren #endif
956 1.253 maxv
957 1.286 ozaki default:
958 1.287 ozaki goto drop;
959 1.1 cgd }
960 1.1 cgd
961 1.199 rmind if (__predict_true(pktq)) {
962 1.301 knakahar const uint32_t h = pktq_rps_hash(ðer_pktq_rps_hash_p, m);
963 1.199 rmind if (__predict_false(!pktq_enqueue(pktq, m, h))) {
964 1.199 rmind m_freem(m);
965 1.199 rmind }
966 1.199 rmind return;
967 1.199 rmind }
968 1.199 rmind
969 1.199 rmind if (__predict_false(!inq)) {
970 1.199 rmind /* Should not happen. */
971 1.303 christos goto error;
972 1.199 rmind }
973 1.228 ozaki
974 1.285 ozaki IFQ_ENQUEUE_ISR(inq, m, isr);
975 1.287 ozaki return;
976 1.287 ozaki
977 1.287 ozaki drop:
978 1.287 ozaki m_freem(m);
979 1.303 christos if_statinc(ifp, if_iqdrops); /* XXX should have a dedicated counter? */
980 1.303 christos return;
981 1.303 christos error:
982 1.303 christos m_freem(m);
983 1.287 ozaki if_statinc(ifp, if_ierrors); /* XXX should have a dedicated counter? */
984 1.303 christos return;
985 1.1 cgd }
986 1.1 cgd
987 1.1 cgd /*
988 1.1 cgd * Convert Ethernet address to printable (loggable) representation.
989 1.1 cgd */
990 1.1 cgd char *
991 1.58 matt ether_sprintf(const u_char *ap)
992 1.1 cgd {
993 1.129 christos static char etherbuf[3 * ETHER_ADDR_LEN];
994 1.129 christos return ether_snprintf(etherbuf, sizeof(etherbuf), ap);
995 1.129 christos }
996 1.129 christos
997 1.129 christos char *
998 1.129 christos ether_snprintf(char *buf, size_t len, const u_char *ap)
999 1.129 christos {
1000 1.129 christos char *cp = buf;
1001 1.129 christos size_t i;
1002 1.1 cgd
1003 1.129 christos for (i = 0; i < len / 3; i++) {
1004 1.124 christos *cp++ = hexdigits[*ap >> 4];
1005 1.124 christos *cp++ = hexdigits[*ap++ & 0xf];
1006 1.1 cgd *cp++ = ':';
1007 1.1 cgd }
1008 1.129 christos *--cp = '\0';
1009 1.129 christos return buf;
1010 1.1 cgd }
1011 1.8 mycroft
1012 1.8 mycroft /*
1013 1.8 mycroft * Perform common duties while attaching to interface list
1014 1.8 mycroft */
1015 1.8 mycroft void
1016 1.162 matt ether_ifattach(struct ifnet *ifp, const uint8_t *lla)
1017 1.8 mycroft {
1018 1.104 matt struct ethercom *ec = (struct ethercom *)ifp;
1019 1.297 yamaguch char xnamebuf[HOOKNAMSIZ];
1020 1.8 mycroft
1021 1.8 mycroft ifp->if_type = IFT_ETHER;
1022 1.94 enami ifp->if_hdrlen = ETHER_HDR_LEN;
1023 1.73 thorpej ifp->if_dlt = DLT_EN10MB;
1024 1.8 mycroft ifp->if_mtu = ETHERMTU;
1025 1.12 mycroft ifp->if_output = ether_output;
1026 1.216 ozaki ifp->_if_input = ether_input;
1027 1.54 thorpej if (ifp->if_baudrate == 0)
1028 1.54 thorpej ifp->if_baudrate = IF_Mbps(10); /* just a default */
1029 1.75 thorpej
1030 1.230 ozaki if (lla != NULL)
1031 1.230 ozaki if_set_sadl(ifp, lla, ETHER_ADDR_LEN, !ETHER_IS_LOCAL(lla));
1032 1.75 thorpej
1033 1.104 matt LIST_INIT(&ec->ec_multiaddrs);
1034 1.276 msaitoh SIMPLEQ_INIT(&ec->ec_vids);
1035 1.233 ozaki ec->ec_lock = mutex_obj_alloc(MUTEX_DEFAULT, IPL_NET);
1036 1.274 ozaki ec->ec_flags = 0;
1037 1.26 is ifp->if_broadcastaddr = etherbroadcastaddr;
1038 1.177 joerg bpf_attach(ifp, DLT_EN10MB, sizeof(struct ether_header));
1039 1.297 yamaguch snprintf(xnamebuf, sizeof(xnamebuf),
1040 1.297 yamaguch "%s-ether_ifdetachhooks", ifp->if_xname);
1041 1.297 yamaguch ec->ec_ifdetach_hooks = simplehook_create(IPL_NET, xnamebuf);
1042 1.104 matt #ifdef MBUFTRACE
1043 1.283 thorpej mowner_init_owner(&ec->ec_tx_mowner, ifp->if_xname, "tx");
1044 1.283 thorpej mowner_init_owner(&ec->ec_rx_mowner, ifp->if_xname, "rx");
1045 1.104 matt MOWNER_ATTACH(&ec->ec_tx_mowner);
1046 1.104 matt MOWNER_ATTACH(&ec->ec_rx_mowner);
1047 1.104 matt ifp->if_mowner = &ec->ec_tx_mowner;
1048 1.104 matt #endif
1049 1.52 thorpej }
1050 1.52 thorpej
1051 1.52 thorpej void
1052 1.58 matt ether_ifdetach(struct ifnet *ifp)
1053 1.52 thorpej {
1054 1.63 thorpej struct ethercom *ec = (void *) ifp;
1055 1.63 thorpej struct ether_multi *enm;
1056 1.69 thorpej
1057 1.269 ozaki IFNET_ASSERT_UNLOCKED(ifp);
1058 1.190 christos /*
1059 1.190 christos * Prevent further calls to ioctl (for example turning off
1060 1.190 christos * promiscuous mode from the bridge code), which eventually can
1061 1.190 christos * call if_init() which can cause panics because the interface
1062 1.190 christos * is in the process of being detached. Return device not configured
1063 1.190 christos * instead.
1064 1.190 christos */
1065 1.280 christos ifp->if_ioctl = __FPTRCAST(int (*)(struct ifnet *, u_long, void *),
1066 1.280 christos enxio);
1067 1.190 christos
1068 1.297 yamaguch simplehook_dohooks(ec->ec_ifdetach_hooks);
1069 1.297 yamaguch KASSERT(!simplehook_has_hooks(ec->ec_ifdetach_hooks));
1070 1.297 yamaguch simplehook_destroy(ec->ec_ifdetach_hooks);
1071 1.297 yamaguch
1072 1.177 joerg bpf_detach(ifp);
1073 1.63 thorpej
1074 1.245 msaitoh ETHER_LOCK(ec);
1075 1.276 msaitoh KASSERT(ec->ec_nvlans == 0);
1076 1.63 thorpej while ((enm = LIST_FIRST(&ec->ec_multiaddrs)) != NULL) {
1077 1.63 thorpej LIST_REMOVE(enm, enm_list);
1078 1.248 ozaki kmem_free(enm, sizeof(*enm));
1079 1.63 thorpej ec->ec_multicnt--;
1080 1.63 thorpej }
1081 1.245 msaitoh ETHER_UNLOCK(ec);
1082 1.52 thorpej
1083 1.252 maxv mutex_obj_free(ec->ec_lock);
1084 1.253 maxv ec->ec_lock = NULL;
1085 1.231 ozaki
1086 1.189 chs ifp->if_mowner = NULL;
1087 1.104 matt MOWNER_DETACH(&ec->ec_rx_mowner);
1088 1.104 matt MOWNER_DETACH(&ec->ec_tx_mowner);
1089 1.53 thorpej }
1090 1.53 thorpej
1091 1.297 yamaguch void *
1092 1.297 yamaguch ether_ifdetachhook_establish(struct ifnet *ifp,
1093 1.297 yamaguch void (*fn)(void *), void *arg)
1094 1.297 yamaguch {
1095 1.297 yamaguch struct ethercom *ec;
1096 1.297 yamaguch khook_t *hk;
1097 1.297 yamaguch
1098 1.297 yamaguch if (ifp->if_type != IFT_ETHER)
1099 1.297 yamaguch return NULL;
1100 1.297 yamaguch
1101 1.297 yamaguch ec = (struct ethercom *)ifp;
1102 1.297 yamaguch hk = simplehook_establish(ec->ec_ifdetach_hooks,
1103 1.297 yamaguch fn, arg);
1104 1.297 yamaguch
1105 1.297 yamaguch return (void *)hk;
1106 1.297 yamaguch }
1107 1.297 yamaguch
1108 1.297 yamaguch void
1109 1.297 yamaguch ether_ifdetachhook_disestablish(struct ifnet *ifp,
1110 1.297 yamaguch void *vhook, kmutex_t *lock)
1111 1.297 yamaguch {
1112 1.297 yamaguch struct ethercom *ec;
1113 1.297 yamaguch
1114 1.297 yamaguch if (vhook == NULL)
1115 1.297 yamaguch return;
1116 1.297 yamaguch
1117 1.297 yamaguch ec = (struct ethercom *)ifp;
1118 1.297 yamaguch simplehook_disestablish(ec->ec_ifdetach_hooks, vhook, lock);
1119 1.297 yamaguch }
1120 1.297 yamaguch
#if 0
/*
 * This is for reference.  We have a table-driven version
 * of the little-endian crc32 generator, which is faster
 * than the double-loop.
 */
uint32_t
ether_crc32_le(const uint8_t *buf, size_t len)
{
	uint32_t c, crc, carry;
	size_t i, j;

	crc = 0xffffffffU;	/* initial value */

	for (i = 0; i < len; i++) {
		c = buf[i];
		for (j = 0; j < 8; j++) {
			carry = ((crc & 0x01) ? 1 : 0) ^ (c & 0x01);
			crc >>= 1;
			c >>= 1;
			if (carry)
				crc = (crc ^ ETHER_CRC_POLY_LE);
		}
	}

	return (crc);
}
#else
/*
 * Little-endian CRC32 over len bytes at buf, consuming the input four
 * bits at a time through a 16-entry lookup table.
 *
 * The register starts at 0xffffffff and is returned as-is: no final
 * inversion is applied.  An empty input therefore yields 0xffffffff.
 */
uint32_t
ether_crc32_le(const uint8_t *buf, size_t len)
{
	static const uint32_t nibble_tab[16] = {
		0x00000000, 0x1db71064, 0x3b6e20c8, 0x26d930ac,
		0x76dc4190, 0x6b6b51f4, 0x4db26158, 0x5005713c,
		0xedb88320, 0xf00f9344, 0xd6d6a3e8, 0xcb61b38c,
		0x9b64c2b0, 0x86d3d2d4, 0xa00ae278, 0xbdbdf21c
	};
	uint32_t crc = 0xffffffffU;	/* initial value */

	while (len-- > 0) {
		crc ^= *buf++;
		/* low nibble, then high nibble */
		crc = (crc >> 4) ^ nibble_tab[crc & 0xf];
		crc = (crc >> 4) ^ nibble_tab[crc & 0xf];
	}

	return crc;
}
#endif
1172 1.53 thorpej
1173 1.162 matt uint32_t
1174 1.162 matt ether_crc32_be(const uint8_t *buf, size_t len)
1175 1.53 thorpej {
1176 1.162 matt uint32_t c, crc, carry;
1177 1.53 thorpej size_t i, j;
1178 1.53 thorpej
1179 1.53 thorpej crc = 0xffffffffU; /* initial value */
1180 1.53 thorpej
1181 1.53 thorpej for (i = 0; i < len; i++) {
1182 1.53 thorpej c = buf[i];
1183 1.53 thorpej for (j = 0; j < 8; j++) {
1184 1.53 thorpej carry = ((crc & 0x80000000U) ? 1 : 0) ^ (c & 0x01);
1185 1.53 thorpej crc <<= 1;
1186 1.53 thorpej c >>= 1;
1187 1.53 thorpej if (carry)
1188 1.53 thorpej crc = (crc ^ ETHER_CRC_POLY_BE) | carry;
1189 1.53 thorpej }
1190 1.53 thorpej }
1191 1.53 thorpej
1192 1.53 thorpej return (crc);
1193 1.8 mycroft }
1194 1.8 mycroft
#ifdef INET
/* Lowest and highest Ethernet multicast addresses used for IP. */
const uint8_t ether_ipmulticast_min[ETHER_ADDR_LEN] = {
	0x01, 0x00, 0x5e, 0x00, 0x00, 0x00
};
const uint8_t ether_ipmulticast_max[ETHER_ADDR_LEN] = {
	0x01, 0x00, 0x5e, 0x7f, 0xff, 0xff
};
#endif
#ifdef INET6
/* Lowest and highest Ethernet multicast addresses used for IP6. */
const uint8_t ether_ip6multicast_min[ETHER_ADDR_LEN] = {
	0x33, 0x33, 0x00, 0x00, 0x00, 0x00
};
const uint8_t ether_ip6multicast_max[ETHER_ADDR_LEN] = {
	0x33, 0x33, 0xff, 0xff, 0xff, 0xff
};
#endif
1207 1.60 enami
1208 1.3 hpeyerl /*
1209 1.138 rpaulo * ether_aton implementation, not using a static buffer.
1210 1.138 rpaulo */
1211 1.138 rpaulo int
1212 1.180 christos ether_aton_r(u_char *dest, size_t len, const char *str)
1213 1.138 rpaulo {
1214 1.250 maxv const u_char *cp = (const void *)str;
1215 1.180 christos u_char *ep;
1216 1.180 christos
1217 1.185 tsutsui #define atox(c) (((c) <= '9') ? ((c) - '0') : ((toupper(c) - 'A') + 10))
1218 1.180 christos
1219 1.180 christos if (len < ETHER_ADDR_LEN)
1220 1.180 christos return ENOSPC;
1221 1.180 christos
1222 1.180 christos ep = dest + ETHER_ADDR_LEN;
1223 1.250 maxv
1224 1.180 christos while (*cp) {
1225 1.250 maxv if (!isxdigit(*cp))
1226 1.250 maxv return EINVAL;
1227 1.252 maxv
1228 1.180 christos *dest = atox(*cp);
1229 1.180 christos cp++;
1230 1.250 maxv if (isxdigit(*cp)) {
1231 1.250 maxv *dest = (*dest << 4) | atox(*cp);
1232 1.180 christos cp++;
1233 1.250 maxv }
1234 1.252 maxv dest++;
1235 1.252 maxv
1236 1.180 christos if (dest == ep)
1237 1.252 maxv return (*cp == '\0') ? 0 : ENAMETOOLONG;
1238 1.252 maxv
1239 1.180 christos switch (*cp) {
1240 1.180 christos case ':':
1241 1.180 christos case '-':
1242 1.180 christos case '.':
1243 1.179 jakllsch cp++;
1244 1.180 christos break;
1245 1.179 jakllsch }
1246 1.250 maxv }
1247 1.180 christos return ENOBUFS;
1248 1.138 rpaulo }
1249 1.138 rpaulo
1250 1.138 rpaulo /*
1251 1.60 enami * Convert a sockaddr into an Ethernet address or range of Ethernet
1252 1.60 enami * addresses.
1253 1.3 hpeyerl */
1254 1.3 hpeyerl int
1255 1.162 matt ether_multiaddr(const struct sockaddr *sa, uint8_t addrlo[ETHER_ADDR_LEN],
1256 1.162 matt uint8_t addrhi[ETHER_ADDR_LEN])
1257 1.3 hpeyerl {
1258 1.24 christos #ifdef INET
1259 1.155 dyoung const struct sockaddr_in *sin;
1260 1.261 maxv #endif
1261 1.44 itojun #ifdef INET6
1262 1.155 dyoung const struct sockaddr_in6 *sin6;
1263 1.261 maxv #endif
1264 1.3 hpeyerl
1265 1.60 enami switch (sa->sa_family) {
1266 1.3 hpeyerl
1267 1.3 hpeyerl case AF_UNSPEC:
1268 1.146 dyoung memcpy(addrlo, sa->sa_data, ETHER_ADDR_LEN);
1269 1.146 dyoung memcpy(addrhi, addrlo, ETHER_ADDR_LEN);
1270 1.3 hpeyerl break;
1271 1.3 hpeyerl
1272 1.3 hpeyerl #ifdef INET
1273 1.3 hpeyerl case AF_INET:
1274 1.155 dyoung sin = satocsin(sa);
1275 1.3 hpeyerl if (sin->sin_addr.s_addr == INADDR_ANY) {
1276 1.3 hpeyerl /*
1277 1.60 enami * An IP address of INADDR_ANY means listen to
1278 1.60 enami * or stop listening to all of the Ethernet
1279 1.60 enami * multicast addresses used for IP.
1280 1.3 hpeyerl * (This is for the sake of IP multicast routers.)
1281 1.3 hpeyerl */
1282 1.146 dyoung memcpy(addrlo, ether_ipmulticast_min, ETHER_ADDR_LEN);
1283 1.146 dyoung memcpy(addrhi, ether_ipmulticast_max, ETHER_ADDR_LEN);
1284 1.252 maxv } else {
1285 1.3 hpeyerl ETHER_MAP_IP_MULTICAST(&sin->sin_addr, addrlo);
1286 1.146 dyoung memcpy(addrhi, addrlo, ETHER_ADDR_LEN);
1287 1.3 hpeyerl }
1288 1.3 hpeyerl break;
1289 1.3 hpeyerl #endif
1290 1.44 itojun #ifdef INET6
1291 1.44 itojun case AF_INET6:
1292 1.155 dyoung sin6 = satocsin6(sa);
1293 1.47 itojun if (IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) {
1294 1.44 itojun /*
1295 1.60 enami * An IP6 address of 0 means listen to or stop
1296 1.60 enami * listening to all of the Ethernet multicast
1297 1.60 enami * address used for IP6.
1298 1.44 itojun * (This is used for multicast routers.)
1299 1.44 itojun */
1300 1.146 dyoung memcpy(addrlo, ether_ip6multicast_min, ETHER_ADDR_LEN);
1301 1.146 dyoung memcpy(addrhi, ether_ip6multicast_max, ETHER_ADDR_LEN);
1302 1.44 itojun } else {
1303 1.44 itojun ETHER_MAP_IPV6_MULTICAST(&sin6->sin6_addr, addrlo);
1304 1.146 dyoung memcpy(addrhi, addrlo, ETHER_ADDR_LEN);
1305 1.44 itojun }
1306 1.44 itojun break;
1307 1.44 itojun #endif
1308 1.3 hpeyerl
1309 1.3 hpeyerl default:
1310 1.146 dyoung return EAFNOSUPPORT;
1311 1.60 enami }
1312 1.146 dyoung return 0;
1313 1.60 enami }
1314 1.60 enami
1315 1.60 enami /*
1316 1.60 enami * Add an Ethernet multicast address or range of addresses to the list for a
1317 1.60 enami * given interface.
1318 1.60 enami */
1319 1.60 enami int
1320 1.155 dyoung ether_addmulti(const struct sockaddr *sa, struct ethercom *ec)
1321 1.60 enami {
1322 1.231 ozaki struct ether_multi *enm, *_enm;
1323 1.60 enami u_char addrlo[ETHER_ADDR_LEN];
1324 1.60 enami u_char addrhi[ETHER_ADDR_LEN];
1325 1.237 skrll int error = 0;
1326 1.231 ozaki
1327 1.231 ozaki /* Allocate out of lock */
1328 1.248 ozaki enm = kmem_alloc(sizeof(*enm), KM_SLEEP);
1329 1.60 enami
1330 1.245 msaitoh ETHER_LOCK(ec);
1331 1.155 dyoung error = ether_multiaddr(sa, addrlo, addrhi);
1332 1.231 ozaki if (error != 0)
1333 1.231 ozaki goto out;
1334 1.3 hpeyerl
1335 1.3 hpeyerl /*
1336 1.3 hpeyerl * Verify that we have valid Ethernet multicast addresses.
1337 1.3 hpeyerl */
1338 1.186 yamt if (!ETHER_IS_MULTICAST(addrlo) || !ETHER_IS_MULTICAST(addrhi)) {
1339 1.231 ozaki error = EINVAL;
1340 1.231 ozaki goto out;
1341 1.3 hpeyerl }
1342 1.252 maxv
1343 1.3 hpeyerl /*
1344 1.3 hpeyerl * See if the address range is already in the list.
1345 1.3 hpeyerl */
1346 1.270 yamaguch _enm = ether_lookup_multi(addrlo, addrhi, ec);
1347 1.231 ozaki if (_enm != NULL) {
1348 1.3 hpeyerl /*
1349 1.3 hpeyerl * Found it; just increment the reference count.
1350 1.3 hpeyerl */
1351 1.231 ozaki ++_enm->enm_refcount;
1352 1.231 ozaki error = 0;
1353 1.231 ozaki goto out;
1354 1.3 hpeyerl }
1355 1.252 maxv
1356 1.3 hpeyerl /*
1357 1.239 ozaki * Link a new multicast record into the interface's multicast list.
1358 1.3 hpeyerl */
1359 1.252 maxv memcpy(enm->enm_addrlo, addrlo, ETHER_ADDR_LEN);
1360 1.252 maxv memcpy(enm->enm_addrhi, addrhi, ETHER_ADDR_LEN);
1361 1.3 hpeyerl enm->enm_refcount = 1;
1362 1.22 is LIST_INSERT_HEAD(&ec->ec_multiaddrs, enm, enm_list);
1363 1.22 is ec->ec_multicnt++;
1364 1.252 maxv
1365 1.3 hpeyerl /*
1366 1.3 hpeyerl * Return ENETRESET to inform the driver that the list has changed
1367 1.3 hpeyerl * and its reception filter should be adjusted accordingly.
1368 1.3 hpeyerl */
1369 1.231 ozaki error = ENETRESET;
1370 1.231 ozaki enm = NULL;
1371 1.252 maxv
1372 1.231 ozaki out:
1373 1.245 msaitoh ETHER_UNLOCK(ec);
1374 1.231 ozaki if (enm != NULL)
1375 1.248 ozaki kmem_free(enm, sizeof(*enm));
1376 1.231 ozaki return error;
1377 1.3 hpeyerl }
1378 1.3 hpeyerl
1379 1.3 hpeyerl /*
1380 1.3 hpeyerl * Delete a multicast address record.
1381 1.3 hpeyerl */
1382 1.3 hpeyerl int
1383 1.155 dyoung ether_delmulti(const struct sockaddr *sa, struct ethercom *ec)
1384 1.3 hpeyerl {
1385 1.29 mrg struct ether_multi *enm;
1386 1.60 enami u_char addrlo[ETHER_ADDR_LEN];
1387 1.60 enami u_char addrhi[ETHER_ADDR_LEN];
1388 1.237 skrll int error;
1389 1.3 hpeyerl
1390 1.245 msaitoh ETHER_LOCK(ec);
1391 1.155 dyoung error = ether_multiaddr(sa, addrlo, addrhi);
1392 1.231 ozaki if (error != 0)
1393 1.231 ozaki goto error;
1394 1.3 hpeyerl
1395 1.3 hpeyerl /*
1396 1.252 maxv * Look up the address in our list.
1397 1.3 hpeyerl */
1398 1.270 yamaguch enm = ether_lookup_multi(addrlo, addrhi, ec);
1399 1.3 hpeyerl if (enm == NULL) {
1400 1.231 ozaki error = ENXIO;
1401 1.231 ozaki goto error;
1402 1.3 hpeyerl }
1403 1.3 hpeyerl if (--enm->enm_refcount != 0) {
1404 1.3 hpeyerl /*
1405 1.3 hpeyerl * Still some claims to this record.
1406 1.3 hpeyerl */
1407 1.231 ozaki error = 0;
1408 1.231 ozaki goto error;
1409 1.3 hpeyerl }
1410 1.252 maxv
1411 1.3 hpeyerl /*
1412 1.3 hpeyerl * No remaining claims to this record; unlink and free it.
1413 1.3 hpeyerl */
1414 1.13 mycroft LIST_REMOVE(enm, enm_list);
1415 1.22 is ec->ec_multicnt--;
1416 1.245 msaitoh ETHER_UNLOCK(ec);
1417 1.252 maxv kmem_free(enm, sizeof(*enm));
1418 1.231 ozaki
1419 1.3 hpeyerl /*
1420 1.3 hpeyerl * Return ENETRESET to inform the driver that the list has changed
1421 1.3 hpeyerl * and its reception filter should be adjusted accordingly.
1422 1.3 hpeyerl */
1423 1.231 ozaki return ENETRESET;
1424 1.252 maxv
1425 1.231 ozaki error:
1426 1.245 msaitoh ETHER_UNLOCK(ec);
1427 1.231 ozaki return error;
1428 1.66 thorpej }
1429 1.66 thorpej
1430 1.170 dyoung void
1431 1.170 dyoung ether_set_ifflags_cb(struct ethercom *ec, ether_cb_t cb)
1432 1.170 dyoung {
1433 1.170 dyoung ec->ec_ifflags_cb = cb;
1434 1.170 dyoung }
1435 1.170 dyoung
1436 1.276 msaitoh void
1437 1.276 msaitoh ether_set_vlan_cb(struct ethercom *ec, ether_vlancb_t cb)
1438 1.276 msaitoh {
1439 1.276 msaitoh
1440 1.276 msaitoh ec->ec_vlan_cb = cb;
1441 1.276 msaitoh }
1442 1.276 msaitoh
1443 1.272 msaitoh static int
1444 1.272 msaitoh ether_ioctl_reinit(struct ethercom *ec)
1445 1.272 msaitoh {
1446 1.272 msaitoh struct ifnet *ifp = &ec->ec_if;
1447 1.272 msaitoh int error;
1448 1.272 msaitoh
1449 1.272 msaitoh switch (ifp->if_flags & (IFF_UP | IFF_RUNNING)) {
1450 1.272 msaitoh case IFF_RUNNING:
1451 1.272 msaitoh /*
1452 1.272 msaitoh * If interface is marked down and it is running,
1453 1.272 msaitoh * then stop and disable it.
1454 1.272 msaitoh */
1455 1.272 msaitoh (*ifp->if_stop)(ifp, 1);
1456 1.272 msaitoh break;
1457 1.272 msaitoh case IFF_UP:
1458 1.272 msaitoh /*
1459 1.272 msaitoh * If interface is marked up and it is stopped, then
1460 1.272 msaitoh * start it.
1461 1.272 msaitoh */
1462 1.272 msaitoh return (*ifp->if_init)(ifp);
1463 1.272 msaitoh case IFF_UP | IFF_RUNNING:
1464 1.272 msaitoh error = 0;
1465 1.272 msaitoh if (ec->ec_ifflags_cb != NULL) {
1466 1.272 msaitoh error = (*ec->ec_ifflags_cb)(ec);
1467 1.272 msaitoh if (error == ENETRESET) {
1468 1.272 msaitoh /*
1469 1.272 msaitoh * Reset the interface to pick up
1470 1.272 msaitoh * changes in any other flags that
1471 1.272 msaitoh * affect the hardware state.
1472 1.272 msaitoh */
1473 1.272 msaitoh return (*ifp->if_init)(ifp);
1474 1.272 msaitoh }
1475 1.272 msaitoh } else
1476 1.272 msaitoh error = (*ifp->if_init)(ifp);
1477 1.272 msaitoh return error;
1478 1.272 msaitoh case 0:
1479 1.272 msaitoh break;
1480 1.272 msaitoh }
1481 1.272 msaitoh
1482 1.272 msaitoh return 0;
1483 1.272 msaitoh }
1484 1.272 msaitoh
1485 1.66 thorpej /*
1486 1.66 thorpej * Common ioctls for Ethernet interfaces. Note, we must be
1487 1.66 thorpej * called at splnet().
1488 1.66 thorpej */
1489 1.66 thorpej int
1490 1.147 christos ether_ioctl(struct ifnet *ifp, u_long cmd, void *data)
1491 1.66 thorpej {
1492 1.272 msaitoh struct ethercom *ec = (void *)ifp;
1493 1.193 msaitoh struct eccapreq *eccr;
1494 1.66 thorpej struct ifreq *ifr = (struct ifreq *)data;
1495 1.170 dyoung struct if_laddrreq *iflr = data;
1496 1.170 dyoung const struct sockaddr_dl *sdl;
1497 1.170 dyoung static const uint8_t zero[ETHER_ADDR_LEN];
1498 1.169 dyoung int error;
1499 1.66 thorpej
1500 1.66 thorpej switch (cmd) {
1501 1.170 dyoung case SIOCINITIFADDR:
1502 1.191 matt {
1503 1.191 matt struct ifaddr *ifa = (struct ifaddr *)data;
1504 1.191 matt if (ifa->ifa_addr->sa_family != AF_LINK
1505 1.247 msaitoh && (ifp->if_flags & (IFF_UP | IFF_RUNNING)) !=
1506 1.247 msaitoh (IFF_UP | IFF_RUNNING)) {
1507 1.170 dyoung ifp->if_flags |= IFF_UP;
1508 1.170 dyoung if ((error = (*ifp->if_init)(ifp)) != 0)
1509 1.170 dyoung return error;
1510 1.170 dyoung }
1511 1.66 thorpej #ifdef INET
1512 1.191 matt if (ifa->ifa_addr->sa_family == AF_INET)
1513 1.191 matt arp_ifinit(ifp, ifa);
1514 1.252 maxv #endif
1515 1.169 dyoung return 0;
1516 1.191 matt }
1517 1.66 thorpej
1518 1.66 thorpej case SIOCSIFMTU:
1519 1.82 thorpej {
1520 1.82 thorpej int maxmtu;
1521 1.82 thorpej
1522 1.82 thorpej if (ec->ec_capabilities & ETHERCAP_JUMBO_MTU)
1523 1.82 thorpej maxmtu = ETHERMTU_JUMBO;
1524 1.82 thorpej else
1525 1.82 thorpej maxmtu = ETHERMTU;
1526 1.82 thorpej
1527 1.82 thorpej if (ifr->ifr_mtu < ETHERMIN || ifr->ifr_mtu > maxmtu)
1528 1.169 dyoung return EINVAL;
1529 1.169 dyoung else if ((error = ifioctl_common(ifp, cmd, data)) != ENETRESET)
1530 1.169 dyoung return error;
1531 1.169 dyoung else if (ifp->if_flags & IFF_UP) {
1532 1.88 thorpej /* Make sure the device notices the MTU change. */
1533 1.169 dyoung return (*ifp->if_init)(ifp);
1534 1.169 dyoung } else
1535 1.169 dyoung return 0;
1536 1.82 thorpej }
1537 1.66 thorpej
1538 1.66 thorpej case SIOCSIFFLAGS:
1539 1.170 dyoung if ((error = ifioctl_common(ifp, cmd, data)) != 0)
1540 1.170 dyoung return error;
1541 1.272 msaitoh return ether_ioctl_reinit(ec);
1542 1.274 ozaki case SIOCGIFFLAGS:
1543 1.274 ozaki error = ifioctl_common(ifp, cmd, data);
1544 1.274 ozaki if (error == 0) {
1545 1.274 ozaki /* Set IFF_ALLMULTI for backcompat */
1546 1.274 ozaki ifr->ifr_flags |= (ec->ec_flags & ETHER_F_ALLMULTI) ?
1547 1.274 ozaki IFF_ALLMULTI : 0;
1548 1.274 ozaki }
1549 1.274 ozaki return error;
1550 1.193 msaitoh case SIOCGETHERCAP:
1551 1.193 msaitoh eccr = (struct eccapreq *)data;
1552 1.193 msaitoh eccr->eccr_capabilities = ec->ec_capabilities;
1553 1.193 msaitoh eccr->eccr_capenable = ec->ec_capenable;
1554 1.193 msaitoh return 0;
1555 1.272 msaitoh case SIOCSETHERCAP:
1556 1.272 msaitoh eccr = (struct eccapreq *)data;
1557 1.272 msaitoh if ((eccr->eccr_capenable & ~ec->ec_capabilities) != 0)
1558 1.272 msaitoh return EINVAL;
1559 1.272 msaitoh if (eccr->eccr_capenable == ec->ec_capenable)
1560 1.272 msaitoh return 0;
1561 1.272 msaitoh #if 0 /* notyet */
1562 1.272 msaitoh ec->ec_capenable = (ec->ec_capenable & ETHERCAP_CANTCHANGE)
1563 1.272 msaitoh | (eccr->eccr_capenable & ~ETHERCAP_CANTCHANGE);
1564 1.272 msaitoh #else
1565 1.272 msaitoh ec->ec_capenable = eccr->eccr_capenable;
1566 1.272 msaitoh #endif
1567 1.272 msaitoh return ether_ioctl_reinit(ec);
1568 1.66 thorpej case SIOCADDMULTI:
1569 1.169 dyoung return ether_addmulti(ifreq_getaddr(cmd, ifr), ec);
1570 1.66 thorpej case SIOCDELMULTI:
1571 1.169 dyoung return ether_delmulti(ifreq_getaddr(cmd, ifr), ec);
1572 1.160 dyoung case SIOCSIFMEDIA:
1573 1.160 dyoung case SIOCGIFMEDIA:
1574 1.275 msaitoh if (ec->ec_mii != NULL)
1575 1.275 msaitoh return ifmedia_ioctl(ifp, ifr, &ec->ec_mii->mii_media,
1576 1.275 msaitoh cmd);
1577 1.275 msaitoh else if (ec->ec_ifmedia != NULL)
1578 1.275 msaitoh return ifmedia_ioctl(ifp, ifr, ec->ec_ifmedia, cmd);
1579 1.275 msaitoh else
1580 1.169 dyoung return ENOTTY;
1581 1.275 msaitoh break;
1582 1.170 dyoung case SIOCALIFADDR:
1583 1.170 dyoung sdl = satocsdl(sstocsa(&iflr->addr));
1584 1.170 dyoung if (sdl->sdl_family != AF_LINK)
1585 1.170 dyoung ;
1586 1.170 dyoung else if (ETHER_IS_MULTICAST(CLLADDR(sdl)))
1587 1.170 dyoung return EINVAL;
1588 1.170 dyoung else if (memcmp(zero, CLLADDR(sdl), sizeof(zero)) == 0)
1589 1.170 dyoung return EINVAL;
1590 1.170 dyoung /*FALLTHROUGH*/
1591 1.170 dyoung default:
1592 1.161 dyoung return ifioctl_common(ifp, cmd, data);
1593 1.66 thorpej }
1594 1.169 dyoung return 0;
1595 1.3 hpeyerl }
1596 1.200 joerg
1597 1.215 christos /*
1598 1.215 christos * Enable/disable passing VLAN packets if the parent interface supports it.
1599 1.215 christos * Return:
1600 1.215 christos * 0: Ok
1601 1.215 christos * -1: Parent interface does not support vlans
1602 1.215 christos * >0: Error
1603 1.215 christos */
1604 1.215 christos int
1605 1.215 christos ether_enable_vlan_mtu(struct ifnet *ifp)
1606 1.215 christos {
1607 1.215 christos int error;
1608 1.215 christos struct ethercom *ec = (void *)ifp;
1609 1.215 christos
1610 1.215 christos /* Parent does not support VLAN's */
1611 1.215 christos if ((ec->ec_capabilities & ETHERCAP_VLAN_MTU) == 0)
1612 1.215 christos return -1;
1613 1.215 christos
1614 1.215 christos /*
1615 1.215 christos * Parent supports the VLAN_MTU capability,
1616 1.215 christos * i.e. can Tx/Rx larger than ETHER_MAX_LEN frames;
1617 1.215 christos * enable it.
1618 1.215 christos */
1619 1.215 christos ec->ec_capenable |= ETHERCAP_VLAN_MTU;
1620 1.215 christos
1621 1.215 christos /* Interface is down, defer for later */
1622 1.215 christos if ((ifp->if_flags & IFF_UP) == 0)
1623 1.215 christos return 0;
1624 1.215 christos
1625 1.215 christos if ((error = if_flags_set(ifp, ifp->if_flags)) == 0)
1626 1.215 christos return 0;
1627 1.215 christos
1628 1.215 christos ec->ec_capenable &= ~ETHERCAP_VLAN_MTU;
1629 1.215 christos return error;
1630 1.215 christos }
1631 1.215 christos
1632 1.215 christos int
1633 1.215 christos ether_disable_vlan_mtu(struct ifnet *ifp)
1634 1.215 christos {
1635 1.215 christos int error;
1636 1.215 christos struct ethercom *ec = (void *)ifp;
1637 1.215 christos
1638 1.215 christos /* We still have VLAN's, defer for later */
1639 1.215 christos if (ec->ec_nvlans != 0)
1640 1.215 christos return 0;
1641 1.215 christos
1642 1.215 christos /* Parent does not support VLAB's, nothing to do. */
1643 1.215 christos if ((ec->ec_capenable & ETHERCAP_VLAN_MTU) == 0)
1644 1.215 christos return -1;
1645 1.215 christos
1646 1.215 christos /*
1647 1.215 christos * Disable Tx/Rx of VLAN-sized frames.
1648 1.215 christos */
1649 1.215 christos ec->ec_capenable &= ~ETHERCAP_VLAN_MTU;
1650 1.250 maxv
1651 1.215 christos /* Interface is down, defer for later */
1652 1.215 christos if ((ifp->if_flags & IFF_UP) == 0)
1653 1.215 christos return 0;
1654 1.215 christos
1655 1.215 christos if ((error = if_flags_set(ifp, ifp->if_flags)) == 0)
1656 1.215 christos return 0;
1657 1.215 christos
1658 1.215 christos ec->ec_capenable |= ETHERCAP_VLAN_MTU;
1659 1.215 christos return error;
1660 1.215 christos }
1661 1.215 christos
1662 1.200 joerg static int
1663 1.200 joerg ether_multicast_sysctl(SYSCTLFN_ARGS)
1664 1.200 joerg {
1665 1.200 joerg struct ether_multi *enm;
1666 1.200 joerg struct ifnet *ifp;
1667 1.200 joerg struct ethercom *ec;
1668 1.223 ozaki int error = 0;
1669 1.200 joerg size_t written;
1670 1.223 ozaki struct psref psref;
1671 1.237 skrll int bound;
1672 1.233 ozaki unsigned int multicnt;
1673 1.233 ozaki struct ether_multi_sysctl *addrs;
1674 1.233 ozaki int i;
1675 1.200 joerg
1676 1.200 joerg if (namelen != 1)
1677 1.200 joerg return EINVAL;
1678 1.200 joerg
1679 1.223 ozaki bound = curlwp_bind();
1680 1.223 ozaki ifp = if_get_byindex(name[0], &psref);
1681 1.223 ozaki if (ifp == NULL) {
1682 1.223 ozaki error = ENODEV;
1683 1.223 ozaki goto out;
1684 1.223 ozaki }
1685 1.200 joerg if (ifp->if_type != IFT_ETHER) {
1686 1.223 ozaki if_put(ifp, &psref);
1687 1.200 joerg *oldlenp = 0;
1688 1.223 ozaki goto out;
1689 1.200 joerg }
1690 1.200 joerg ec = (struct ethercom *)ifp;
1691 1.200 joerg
1692 1.200 joerg if (oldp == NULL) {
1693 1.223 ozaki if_put(ifp, &psref);
1694 1.233 ozaki *oldlenp = ec->ec_multicnt * sizeof(*addrs);
1695 1.223 ozaki goto out;
1696 1.200 joerg }
1697 1.200 joerg
1698 1.233 ozaki /*
1699 1.233 ozaki * ec->ec_lock is a spin mutex so we cannot call sysctl_copyout, which
1700 1.251 maxv * is sleepable, while holding it. Copy data to a local buffer first
1701 1.251 maxv * with the lock taken and then call sysctl_copyout without holding it.
1702 1.233 ozaki */
1703 1.233 ozaki retry:
1704 1.233 ozaki multicnt = ec->ec_multicnt;
1705 1.251 maxv
1706 1.251 maxv if (multicnt == 0) {
1707 1.251 maxv if_put(ifp, &psref);
1708 1.251 maxv *oldlenp = 0;
1709 1.251 maxv goto out;
1710 1.251 maxv }
1711 1.251 maxv
1712 1.252 maxv addrs = kmem_zalloc(sizeof(*addrs) * multicnt, KM_SLEEP);
1713 1.200 joerg
1714 1.245 msaitoh ETHER_LOCK(ec);
1715 1.251 maxv if (multicnt != ec->ec_multicnt) {
1716 1.251 maxv /* The number of multicast addresses has changed */
1717 1.245 msaitoh ETHER_UNLOCK(ec);
1718 1.233 ozaki kmem_free(addrs, sizeof(*addrs) * multicnt);
1719 1.233 ozaki goto retry;
1720 1.233 ozaki }
1721 1.233 ozaki
1722 1.233 ozaki i = 0;
1723 1.200 joerg LIST_FOREACH(enm, &ec->ec_multiaddrs, enm_list) {
1724 1.233 ozaki struct ether_multi_sysctl *addr = &addrs[i];
1725 1.233 ozaki addr->enm_refcount = enm->enm_refcount;
1726 1.233 ozaki memcpy(addr->enm_addrlo, enm->enm_addrlo, ETHER_ADDR_LEN);
1727 1.233 ozaki memcpy(addr->enm_addrhi, enm->enm_addrhi, ETHER_ADDR_LEN);
1728 1.233 ozaki i++;
1729 1.233 ozaki }
1730 1.245 msaitoh ETHER_UNLOCK(ec);
1731 1.233 ozaki
1732 1.233 ozaki error = 0;
1733 1.233 ozaki written = 0;
1734 1.233 ozaki for (i = 0; i < multicnt; i++) {
1735 1.233 ozaki struct ether_multi_sysctl *addr = &addrs[i];
1736 1.233 ozaki
1737 1.233 ozaki if (written + sizeof(*addr) > *oldlenp)
1738 1.200 joerg break;
1739 1.233 ozaki error = sysctl_copyout(l, addr, oldp, sizeof(*addr));
1740 1.200 joerg if (error)
1741 1.200 joerg break;
1742 1.233 ozaki written += sizeof(*addr);
1743 1.233 ozaki oldp = (char *)oldp + sizeof(*addr);
1744 1.200 joerg }
1745 1.233 ozaki kmem_free(addrs, sizeof(*addrs) * multicnt);
1746 1.233 ozaki
1747 1.223 ozaki if_put(ifp, &psref);
1748 1.200 joerg
1749 1.200 joerg *oldlenp = written;
1750 1.223 ozaki out:
1751 1.223 ozaki curlwp_bindx(bound);
1752 1.200 joerg return error;
1753 1.200 joerg }
1754 1.200 joerg
1755 1.234 ozaki static void
1756 1.234 ozaki ether_sysctl_setup(struct sysctllog **clog)
1757 1.200 joerg {
1758 1.200 joerg const struct sysctlnode *rnode = NULL;
1759 1.200 joerg
1760 1.200 joerg sysctl_createv(clog, 0, NULL, &rnode,
1761 1.200 joerg CTLFLAG_PERMANENT,
1762 1.200 joerg CTLTYPE_NODE, "ether",
1763 1.200 joerg SYSCTL_DESCR("Ethernet-specific information"),
1764 1.200 joerg NULL, 0, NULL, 0,
1765 1.200 joerg CTL_NET, CTL_CREATE, CTL_EOL);
1766 1.200 joerg
1767 1.200 joerg sysctl_createv(clog, 0, &rnode, NULL,
1768 1.200 joerg CTLFLAG_PERMANENT,
1769 1.200 joerg CTLTYPE_NODE, "multicast",
1770 1.200 joerg SYSCTL_DESCR("multicast addresses"),
1771 1.200 joerg ether_multicast_sysctl, 0, NULL, 0,
1772 1.200 joerg CTL_CREATE, CTL_EOL);
1773 1.301 knakahar
1774 1.301 knakahar sysctl_createv(clog, 0, &rnode, NULL,
1775 1.301 knakahar CTLFLAG_PERMANENT | CTLFLAG_READWRITE,
1776 1.301 knakahar CTLTYPE_STRING, "rps_hash",
1777 1.301 knakahar SYSCTL_DESCR("Interface rps hash function control"),
1778 1.301 knakahar sysctl_pktq_rps_hash_handler, 0, (void *)ðer_pktq_rps_hash_p,
1779 1.301 knakahar PKTQ_RPS_HASH_NAME_LEN,
1780 1.301 knakahar CTL_CREATE, CTL_EOL);
1781 1.200 joerg }
1782 1.203 ozaki
1783 1.203 ozaki void
1784 1.203 ozaki etherinit(void)
1785 1.203 ozaki {
1786 1.234 ozaki
1787 1.278 msaitoh #ifdef DIAGNOSTIC
1788 1.203 ozaki mutex_init(&bigpktpps_lock, MUTEX_DEFAULT, IPL_NET);
1789 1.278 msaitoh #endif
1790 1.301 knakahar ether_pktq_rps_hash_p = pktq_rps_hash_default;
1791 1.234 ozaki ether_sysctl_setup(NULL);
1792 1.203 ozaki }
1793