if_ethersubr.c revision 1.301 1 1.301 knakahar /* $NetBSD: if_ethersubr.c,v 1.301 2021/10/11 05:13:11 knakahara Exp $ */
2 1.44 itojun
3 1.44 itojun /*
4 1.44 itojun * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
5 1.44 itojun * All rights reserved.
6 1.120 perry *
7 1.44 itojun * Redistribution and use in source and binary forms, with or without
8 1.44 itojun * modification, are permitted provided that the following conditions
9 1.44 itojun * are met:
10 1.44 itojun * 1. Redistributions of source code must retain the above copyright
11 1.44 itojun * notice, this list of conditions and the following disclaimer.
12 1.44 itojun * 2. Redistributions in binary form must reproduce the above copyright
13 1.44 itojun * notice, this list of conditions and the following disclaimer in the
14 1.44 itojun * documentation and/or other materials provided with the distribution.
15 1.44 itojun * 3. Neither the name of the project nor the names of its contributors
16 1.44 itojun * may be used to endorse or promote products derived from this software
17 1.44 itojun * without specific prior written permission.
18 1.120 perry *
19 1.44 itojun * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
20 1.44 itojun * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21 1.44 itojun * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22 1.44 itojun * ARE DISCLAIMED. IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
23 1.44 itojun * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24 1.44 itojun * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25 1.44 itojun * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26 1.44 itojun * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27 1.44 itojun * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 1.44 itojun * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 1.44 itojun * SUCH DAMAGE.
30 1.44 itojun */
31 1.9 cgd
32 1.1 cgd /*
33 1.8 mycroft * Copyright (c) 1982, 1989, 1993
34 1.8 mycroft * The Regents of the University of California. All rights reserved.
35 1.1 cgd *
36 1.1 cgd * Redistribution and use in source and binary forms, with or without
37 1.1 cgd * modification, are permitted provided that the following conditions
38 1.1 cgd * are met:
39 1.1 cgd * 1. Redistributions of source code must retain the above copyright
40 1.1 cgd * notice, this list of conditions and the following disclaimer.
41 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
42 1.1 cgd * notice, this list of conditions and the following disclaimer in the
43 1.1 cgd * documentation and/or other materials provided with the distribution.
44 1.113 agc * 3. Neither the name of the University nor the names of its contributors
45 1.1 cgd * may be used to endorse or promote products derived from this software
46 1.1 cgd * without specific prior written permission.
47 1.1 cgd *
48 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
49 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
50 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
51 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
52 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
53 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
54 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
55 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
56 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
57 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
58 1.1 cgd * SUCH DAMAGE.
59 1.1 cgd *
60 1.27 fvdl * @(#)if_ethersubr.c 8.2 (Berkeley) 4/4/96
61 1.1 cgd */
62 1.90 lukem
63 1.90 lukem #include <sys/cdefs.h>
64 1.301 knakahar __KERNEL_RCSID(0, "$NetBSD: if_ethersubr.c,v 1.301 2021/10/11 05:13:11 knakahara Exp $");
65 1.1 cgd
66 1.212 pooka #ifdef _KERNEL_OPT
67 1.33 jonathan #include "opt_inet.h"
68 1.33 jonathan #include "opt_atalk.h"
69 1.112 martin #include "opt_mbuftrace.h"
70 1.182 kefren #include "opt_mpls.h"
71 1.30 matt #include "opt_gateway.h"
72 1.135 pavel #include "opt_pppoe.h"
73 1.206 ozaki #include "opt_net_mpsafe.h"
74 1.212 pooka #endif
75 1.212 pooka
76 1.59 thorpej #include "vlan.h"
77 1.81 martin #include "pppoe.h"
78 1.78 thorpej #include "bridge.h"
79 1.93 martin #include "arp.h"
80 1.121 yamt #include "agr.h"
81 1.30 matt
82 1.200 joerg #include <sys/sysctl.h>
83 1.4 mycroft #include <sys/mbuf.h>
84 1.211 ozaki #include <sys/mutex.h>
85 1.4 mycroft #include <sys/ioctl.h>
86 1.4 mycroft #include <sys/errno.h>
87 1.158 dyoung #include <sys/device.h>
88 1.284 riastrad #include <sys/entropy.h>
89 1.207 riastrad #include <sys/rndsource.h>
90 1.216 ozaki #include <sys/cpu.h>
91 1.231 ozaki #include <sys/kmem.h>
92 1.297 yamaguch #include <sys/hook.h>
93 1.8 mycroft
94 1.4 mycroft #include <net/if.h>
95 1.4 mycroft #include <net/netisr.h>
96 1.4 mycroft #include <net/route.h>
97 1.4 mycroft #include <net/if_llc.h>
98 1.4 mycroft #include <net/if_dl.h>
99 1.8 mycroft #include <net/if_types.h>
100 1.211 ozaki #include <net/pktqueue.h>
101 1.93 martin
102 1.158 dyoung #include <net/if_media.h>
103 1.158 dyoung #include <dev/mii/mii.h>
104 1.158 dyoung #include <dev/mii/miivar.h>
105 1.158 dyoung
106 1.93 martin #if NARP == 0
107 1.93 martin /*
108 1.102 jmmv * XXX there should really be a way to issue this warning from within config(8)
109 1.93 martin */
110 1.111 martin #error You have included NETATALK or a pseudo-device in your configuration that depends on the presence of ethernet interfaces, but have no such interfaces configured. Check if you really need pseudo-device bridge, pppoe, vlan or options NETATALK.
111 1.93 martin #endif
112 1.1 cgd
113 1.69 thorpej #include <net/bpf.h>
114 1.69 thorpej
115 1.22 is #include <net/if_ether.h>
116 1.59 thorpej #include <net/if_vlanvar.h>
117 1.22 is
118 1.81 martin #if NPPPOE > 0
119 1.81 martin #include <net/if_pppoe.h>
120 1.81 martin #endif
121 1.81 martin
122 1.121 yamt #if NAGR > 0
123 1.121 yamt #include <net/agr/ieee8023_slowprotocols.h> /* XXX */
124 1.121 yamt #include <net/agr/ieee8023ad.h>
125 1.121 yamt #include <net/agr/if_agrvar.h>
126 1.121 yamt #endif
127 1.121 yamt
128 1.293 yamaguch #include <net/lagg/if_laggvar.h>
129 1.293 yamaguch
130 1.78 thorpej #if NBRIDGE > 0
131 1.78 thorpej #include <net/if_bridgevar.h>
132 1.78 thorpej #endif
133 1.78 thorpej
134 1.15 phil #include <netinet/in.h>
135 1.1 cgd #ifdef INET
136 1.4 mycroft #include <netinet/in_var.h>
137 1.1 cgd #endif
138 1.22 is #include <netinet/if_inarp.h>
139 1.1 cgd
140 1.44 itojun #ifdef INET6
141 1.44 itojun #ifndef INET
142 1.44 itojun #include <netinet/in.h>
143 1.44 itojun #endif
144 1.44 itojun #include <netinet6/in6_var.h>
145 1.44 itojun #include <netinet6/nd6.h>
146 1.44 itojun #endif
147 1.44 itojun
148 1.133 liamjfoy #include "carp.h"
149 1.133 liamjfoy #if NCARP > 0
150 1.133 liamjfoy #include <netinet/ip_carp.h>
151 1.133 liamjfoy #endif
152 1.133 liamjfoy
153 1.23 christos #ifdef NETATALK
154 1.23 christos #include <netatalk/at.h>
155 1.23 christos #include <netatalk/at_var.h>
156 1.23 christos #include <netatalk/at_extern.h>
157 1.23 christos
158 1.23 christos #define llc_snap_org_code llc_un.type_snap.org_code
159 1.23 christos #define llc_snap_ether_type llc_un.type_snap.ether_type
160 1.23 christos
161 1.23 christos extern u_char at_org_code[3];
162 1.23 christos extern u_char aarp_org_code[3];
163 1.23 christos #endif /* NETATALK */
164 1.23 christos
165 1.182 kefren #ifdef MPLS
166 1.182 kefren #include <netmpls/mpls.h>
167 1.182 kefren #include <netmpls/mpls_var.h>
168 1.182 kefren #endif
169 1.182 kefren
/*
 * Compile-time checks: struct ether_addr must be exactly 6 bytes and
 * struct ether_header exactly 14 bytes.
 */
170 1.292 roy CTASSERT(sizeof(struct ether_addr) == 6);
171 1.292 roy CTASSERT(sizeof(struct ether_header) == 14);
172 1.292 roy
/*
 * DIAGNOSTIC only: state handed to ppsratecheck() by ether_input() to
 * rate-limit its "discarding oversize frame" message.  bigpktppslim is
 * passed as the limit argument; bigpktpps_lock is held around the
 * ppsratecheck() call and the printf.
 */
173 1.278 msaitoh #ifdef DIAGNOSTIC
174 1.123 matt static struct timeval bigpktppslim_last;
175 1.123 matt static int bigpktppslim = 2; /* XXX */
176 1.123 matt static int bigpktpps_count;
177 1.203 ozaki static kmutex_t bigpktpps_lock __cacheline_aligned;
178 1.278 msaitoh #endif
179 1.123 matt
/* The Ethernet broadcast address, ff:ff:ff:ff:ff:ff. */
180 1.118 yamt const uint8_t etherbroadcastaddr[ETHER_ADDR_LEN] =
181 1.118 yamt { 0xff, 0xff, 0xff, 0xff, 0xff, 0xff };
/*
 * 01:80:c2:00:00:02 -- going by the name, the multicast address used by
 * the "slow protocols"; not referenced in this part of the file.
 */
182 1.121 yamt const uint8_t ethermulticastaddr_slowprotocols[ETHER_ADDR_LEN] =
183 1.121 yamt { 0x01, 0x80, 0xc2, 0x00, 0x00, 0x02 };
/*
 * Store e in the caller's local `error' and jump to its `bad' label.
 * NOTE(review): this expands to a bare { } block, not do { } while (0),
 * so "if (c) senderr(x); else ..." would not compile.
 */
184 1.8 mycroft #define senderr(e) { error = (e); goto bad;}
185 1.1 cgd
/*
 * NOTE(review): not used in this part of the file; presumably the RPS
 * hash function used when enqueueing to a pktqueue -- confirm at the
 * point of use.
 */
186 1.301 knakahar static pktq_rps_hash_func_t ether_pktq_rps_hash_p;
187 1.301 knakahar
188 1.293 yamaguch /* if_lagg(4) support */
/*
 * Hook called by ether_input() for interfaces whose if_type is
 * IFT_IEEE8023ADLAG.  ether_input() asserts it is non-NULL before the
 * call, continues with the returned mbuf, and stops if NULL is returned.
 */
189 1.293 yamaguch struct mbuf *(*lagg_input_ethernet_p)(struct ifnet *, struct mbuf *);
190 1.293 yamaguch
191 1.261 maxv static int ether_output(struct ifnet *, struct mbuf *,
192 1.261 maxv const struct sockaddr *, const struct rtentry *);
193 1.42 thorpej
194 1.1 cgd /*
195 1.1 cgd * Ethernet output routine.
196 1.1 cgd * Encapsulate a packet of type family for the local net.
197 1.22 is * Assumes that ifp is actually pointer to ethercom structure.
198 1.1 cgd */
/*
 * ether_output(ifp0, m0, dst, rt):
 *
 *	ifp0	interface the caller is sending on
 *	m0	packet to send; must carry a packet header (M_PKTHDR)
 *	dst	destination; dst->sa_family selects how the destination
 *		Ethernet address and ether type are obtained
 *	rt	route, passed through to arpresolve()/nd6_resolve()/looutput()
 *
 *	Prepends a struct ether_header, runs the PFIL_OUT hooks and then
 *	hands the frame to bridge_output() (when ifp->if_bridge is set) or
 *	to ifq_enqueue().
 *
 *	Returns 0 or an errno value.  0 is also returned, without the
 *	frame being queued here, when arpresolve()/nd6_resolve() return
 *	EWOULDBLOCK, when aarpresolve() returns 0, when an AF_ARP packet
 *	has no target hardware address, or when the pfil hooks leave m
 *	NULL.  On the `bad' path if_oerrors is incremented and m is freed.
 */
199 1.42 thorpej static int
200 1.178 dyoung ether_output(struct ifnet * const ifp0, struct mbuf * const m0,
201 1.256 maxv const struct sockaddr * const dst, const struct rtentry *rt)
202 1.1 cgd {
203 1.256 maxv uint8_t esrc[ETHER_ADDR_LEN], edst[ETHER_ADDR_LEN];
204 1.162 matt uint16_t etype = 0;
205 1.122 christos int error = 0, hdrcmplt = 0;
206 1.29 mrg struct mbuf *m = m0;
207 1.151 dyoung struct mbuf *mcopy = NULL;
208 1.29 mrg struct ether_header *eh;
/* ifp is the interface actually transmitted on; it diverges from ifp0 for carp. */
209 1.133 liamjfoy struct ifnet *ifp = ifp0;
210 1.24 christos #ifdef INET
211 1.22 is struct arphdr *ah;
212 1.260 maxv #endif
213 1.23 christos #ifdef NETATALK
214 1.23 christos struct at_ifaddr *aa;
215 1.260 maxv #endif
216 1.1 cgd
217 1.104 matt #ifdef MBUFTRACE
218 1.116 jonathan m_claimm(m, ifp->if_mowner);
219 1.104 matt #endif
220 1.133 liamjfoy
221 1.133 liamjfoy #if NCARP > 0
222 1.133 liamjfoy if (ifp->if_type == IFT_CARP) {
223 1.133 liamjfoy struct ifaddr *ifa;
224 1.227 ozaki int s = pserialize_read_enter();
225 1.133 liamjfoy
226 1.133 liamjfoy /* loop back if this is going to the carp interface */
227 1.133 liamjfoy if (dst != NULL && ifp0->if_link_state == LINK_STATE_UP &&
228 1.227 ozaki (ifa = ifa_ifwithaddr(dst)) != NULL) {
229 1.227 ozaki if (ifa->ifa_ifp == ifp0) {
230 1.227 ozaki pserialize_read_exit(s);
231 1.227 ozaki return looutput(ifp0, m, dst, rt);
232 1.227 ozaki }
233 1.227 ozaki }
234 1.227 ozaki pserialize_read_exit(s);
235 1.133 liamjfoy
/* From here on transmit via the device recorded in if_carpdev. */
236 1.133 liamjfoy ifp = ifp->if_carpdev;
237 1.133 liamjfoy /* ac = (struct arpcom *)ifp; */
238 1.133 liamjfoy
/* The carp interface itself (ifp0) must be up and running too. */
239 1.247 msaitoh if ((ifp0->if_flags & (IFF_UP | IFF_RUNNING)) !=
240 1.247 msaitoh (IFF_UP | IFF_RUNNING))
241 1.133 liamjfoy senderr(ENETDOWN);
242 1.133 liamjfoy }
243 1.260 maxv #endif
244 1.133 liamjfoy
245 1.247 msaitoh if ((ifp->if_flags & (IFF_UP | IFF_RUNNING)) != (IFF_UP | IFF_RUNNING))
246 1.8 mycroft senderr(ENETDOWN);
247 1.72 thorpej
/*
 * Pick the destination address (edst) and ether type from the address
 * family.  NOTE(review): dst is dereferenced unconditionally here even
 * though the carp block above tests dst != NULL.
 */
248 1.1 cgd switch (dst->sa_family) {
249 1.1 cgd
250 1.1 cgd #ifdef INET
251 1.1 cgd case AF_INET:
252 1.261 maxv if (m->m_flags & M_BCAST) {
253 1.256 maxv memcpy(edst, etherbroadcastaddr, sizeof(edst));
254 1.261 maxv } else if (m->m_flags & M_MCAST) {
255 1.145 dyoung ETHER_MAP_IP_MULTICAST(&satocsin(dst)->sin_addr, edst);
256 1.261 maxv } else {
/*
 * Resolution is done against ifp0, not ifp.  EWOULDBLOCK is reported
 * to the caller as success; m is not touched here after any non-zero
 * return (presumably arpresolve() keeps or frees it -- confirm).
 */
257 1.281 kardel error = arpresolve(ifp0, rt, m, dst, edst, sizeof(edst));
258 1.260 maxv if (error)
259 1.260 maxv return (error == EWOULDBLOCK) ? 0 : error;
260 1.224 knakahar }
261 1.3 hpeyerl /* If broadcasting on a simplex interface, loopback a copy */
262 1.3 hpeyerl if ((m->m_flags & M_BCAST) && (ifp->if_flags & IFF_SIMPLEX))
263 1.266 maxv mcopy = m_copypacket(m, M_DONTWAIT);
264 1.17 mycroft etype = htons(ETHERTYPE_IP);
265 1.8 mycroft break;
266 1.22 is
267 1.22 is case AF_ARP:
268 1.22 is ah = mtod(m, struct arphdr *);
269 1.261 maxv if (m->m_flags & M_BCAST) {
270 1.256 maxv memcpy(edst, etherbroadcastaddr, sizeof(edst));
271 1.261 maxv } else {
272 1.147 christos void *tha = ar_tha(ah);
273 1.131 mrg
274 1.173 christos if (tha == NULL) {
275 1.258 maxv /* fake with ARPHRD_IEEE1394 */
276 1.236 maxv m_freem(m);
277 1.173 christos return 0;
278 1.173 christos }
279 1.146 dyoung memcpy(edst, tha, sizeof(edst));
280 1.131 mrg }
281 1.120 perry
/* The hardware type in the ARP header is always rewritten to Ethernet. */
282 1.22 is ah->ar_hrd = htons(ARPHRD_ETHER);
283 1.22 is
/* Reverse-ARP operations get ETHERTYPE_REVARP; everything else ETHERTYPE_ARP. */
284 1.107 itojun switch (ntohs(ah->ar_op)) {
285 1.22 is case ARPOP_REVREQUEST:
286 1.22 is case ARPOP_REVREPLY:
287 1.22 is etype = htons(ETHERTYPE_REVARP);
288 1.22 is break;
289 1.22 is
290 1.22 is case ARPOP_REQUEST:
291 1.22 is case ARPOP_REPLY:
292 1.22 is default:
293 1.22 is etype = htons(ETHERTYPE_ARP);
294 1.22 is }
295 1.22 is break;
296 1.1 cgd #endif
297 1.256 maxv
298 1.44 itojun #ifdef INET6
299 1.44 itojun case AF_INET6:
300 1.261 maxv if (m->m_flags & M_BCAST) {
301 1.256 maxv memcpy(edst, etherbroadcastaddr, sizeof(edst));
302 1.261 maxv } else if (m->m_flags & M_MCAST) {
303 1.238 ozaki ETHER_MAP_IPV6_MULTICAST(&satocsin6(dst)->sin6_addr,
304 1.238 ozaki edst);
305 1.238 ozaki } else {
/* Same error convention as the arpresolve() call in the AF_INET case. */
306 1.281 kardel error = nd6_resolve(ifp0, rt, m, dst, edst,
307 1.238 ozaki sizeof(edst));
308 1.261 maxv if (error)
309 1.261 maxv return (error == EWOULDBLOCK) ? 0 : error;
310 1.51 itojun }
311 1.44 itojun etype = htons(ETHERTYPE_IPV6);
312 1.44 itojun break;
313 1.44 itojun #endif
314 1.256 maxv
315 1.23 christos #ifdef NETATALK
316 1.250 maxv case AF_APPLETALK: {
317 1.227 ozaki struct ifaddr *ifa;
318 1.227 ozaki int s;
319 1.227 ozaki
/* The whole AppleTalk case runs with the kernel lock held; every exit below releases it. */
320 1.224 knakahar KERNEL_LOCK(1, NULL);
321 1.256 maxv
322 1.226 rjs if (!aarpresolve(ifp, m, (const struct sockaddr_at *)dst, edst)) {
323 1.224 knakahar KERNEL_UNLOCK_ONE(NULL);
324 1.261 maxv return 0;
325 1.23 christos }
326 1.256 maxv
327 1.23 christos /*
328 1.23 christos * ifaddr is the first thing in at_ifaddr
329 1.23 christos */
/* aa is used inside the pserialize read section entered here; each exit path leaves it. */
330 1.227 ozaki s = pserialize_read_enter();
331 1.227 ozaki ifa = at_ifawithnet((const struct sockaddr_at *)dst, ifp);
332 1.227 ozaki if (ifa == NULL) {
333 1.227 ozaki pserialize_read_exit(s);
334 1.227 ozaki KERNEL_UNLOCK_ONE(NULL);
335 1.260 maxv senderr(EADDRNOTAVAIL);
336 1.224 knakahar }
337 1.227 ozaki aa = (struct at_ifaddr *)ifa;
338 1.120 perry
339 1.23 christos /*
340 1.23 christos * In the phase 2 case, we need to prepend an mbuf for the
341 1.265 maxv * llc header.
342 1.23 christos */
343 1.23 christos if (aa->aa_flags & AFA_PHASE2) {
344 1.23 christos struct llc llc;
345 1.23 christos
346 1.43 bouyer M_PREPEND(m, sizeof(struct llc), M_DONTWAIT);
347 1.256 maxv if (m == NULL) {
348 1.260 maxv pserialize_read_exit(s);
349 1.256 maxv KERNEL_UNLOCK_ONE(NULL);
350 1.256 maxv senderr(ENOBUFS);
351 1.256 maxv }
352 1.256 maxv
/*
 * etype stays 0 on this path, so the length-based 802.2 ether type is
 * filled in after the switch.
 */
353 1.23 christos llc.llc_dsap = llc.llc_ssap = LLC_SNAP_LSAP;
354 1.23 christos llc.llc_control = LLC_UI;
355 1.146 dyoung memcpy(llc.llc_snap_org_code, at_org_code,
356 1.23 christos sizeof(llc.llc_snap_org_code));
357 1.38 kim llc.llc_snap_ether_type = htons(ETHERTYPE_ATALK);
358 1.147 christos memcpy(mtod(m, void *), &llc, sizeof(struct llc));
359 1.23 christos } else {
360 1.38 kim etype = htons(ETHERTYPE_ATALK);
361 1.23 christos }
362 1.227 ozaki pserialize_read_exit(s);
363 1.224 knakahar KERNEL_UNLOCK_ONE(NULL);
364 1.23 christos break;
365 1.250 maxv }
366 1.23 christos #endif /* NETATALK */
367 1.256 maxv
/*
 * For the next two families dst->sa_data is read as a struct
 * ether_header supplied by the caller.  pseudo_AF_HDRCMPLT additionally
 * takes the source address from it (hdrcmplt = 1).
 */
368 1.31 thorpej case pseudo_AF_HDRCMPLT:
369 1.31 thorpej hdrcmplt = 1;
370 1.146 dyoung memcpy(esrc,
371 1.146 dyoung ((const struct ether_header *)dst->sa_data)->ether_shost,
372 1.146 dyoung sizeof(esrc));
373 1.31 thorpej /* FALLTHROUGH */
374 1.31 thorpej
375 1.1 cgd case AF_UNSPEC:
376 1.250 maxv memcpy(edst,
377 1.146 dyoung ((const struct ether_header *)dst->sa_data)->ether_dhost,
378 1.146 dyoung sizeof(edst));
379 1.8 mycroft /* AF_UNSPEC doesn't swap the byte order of the ether_type. */
380 1.145 dyoung etype = ((const struct ether_header *)dst->sa_data)->ether_type;
381 1.8 mycroft break;
382 1.1 cgd
383 1.1 cgd default:
384 1.21 christos printf("%s: can't handle af%d\n", ifp->if_xname,
385 1.261 maxv dst->sa_family);
386 1.8 mycroft senderr(EAFNOSUPPORT);
387 1.1 cgd }
388 1.1 cgd
389 1.182 kefren #ifdef MPLS
/* A PACKET_TAG_MPLS tag overrides whatever ether type was chosen above; the tag is then removed. */
390 1.210 ozaki {
391 1.210 ozaki struct m_tag *mtag;
392 1.271 maxv mtag = m_tag_find(m, PACKET_TAG_MPLS);
393 1.210 ozaki if (mtag != NULL) {
394 1.210 ozaki /* Having the tag itself indicates it's MPLS */
395 1.184 dyoung etype = htons(ETHERTYPE_MPLS);
396 1.210 ozaki m_tag_delete(m, mtag);
397 1.210 ozaki }
398 1.184 dyoung }
399 1.182 kefren #endif
400 1.182 kefren
/* Deliver the simplex-broadcast copy (made in the AF_INET case) via looutput(); its result is ignored. */
401 1.1 cgd if (mcopy)
402 1.145 dyoung (void)looutput(ifp, mcopy, dst, rt);
403 1.16 mycroft
404 1.256 maxv KASSERT((m->m_flags & M_PKTHDR) != 0);
405 1.256 maxv
406 1.256 maxv /*
407 1.256 maxv * If no ether type is set, this must be a 802.2 formatted packet.
408 1.50 matt */
409 1.50 matt if (etype == 0)
410 1.50 matt etype = htons(m->m_pkthdr.len);
411 1.256 maxv
412 1.1 cgd /*
413 1.256 maxv * Add local net header. If no space in first mbuf, allocate another.
414 1.1 cgd */
415 1.256 maxv M_PREPEND(m, sizeof(struct ether_header), M_DONTWAIT);
416 1.256 maxv if (m == NULL)
417 1.8 mycroft senderr(ENOBUFS);
418 1.256 maxv
419 1.1 cgd eh = mtod(m, struct ether_header *);
420 1.96 thorpej /* Note: etype is already in network byte order. */
421 1.256 maxv memcpy(&eh->ether_type, &etype, sizeof(eh->ether_type));
422 1.250 maxv memcpy(eh->ether_dhost, edst, sizeof(edst));
/* Source address: caller-supplied for pseudo_AF_HDRCMPLT, else the link-layer address of ifp. */
423 1.261 maxv if (hdrcmplt) {
424 1.146 dyoung memcpy(eh->ether_shost, esrc, sizeof(eh->ether_shost));
425 1.261 maxv } else {
426 1.153 dyoung memcpy(eh->ether_shost, CLLADDR(ifp->if_sadl),
427 1.31 thorpej sizeof(eh->ether_shost));
428 1.261 maxv }
429 1.77 thorpej
430 1.133 liamjfoy #if NCARP > 0
/* When sending on behalf of a carp interface its link-layer address replaces the source chosen above. */
431 1.133 liamjfoy if (ifp0 != ifp && ifp0->if_type == IFT_CARP) {
432 1.153 dyoung memcpy(eh->ether_shost, CLLADDR(ifp0->if_sadl),
433 1.133 liamjfoy sizeof(eh->ether_shost));
434 1.133 liamjfoy }
435 1.256 maxv #endif
436 1.133 liamjfoy
/*
 * Outbound packet filter hooks.  A non-zero result is returned as is
 * and m is not touched again here; a NULL m with a zero result is
 * reported as success.
 */
437 1.195 rmind if ((error = pfil_run_hooks(ifp->if_pfil, &m, ifp, PFIL_OUT)) != 0)
438 1.261 maxv return error;
439 1.77 thorpej if (m == NULL)
440 1.261 maxv return 0;
441 1.77 thorpej
442 1.78 thorpej #if NBRIDGE > 0
443 1.78 thorpej /*
444 1.78 thorpej * Bridges require special output handling.
445 1.78 thorpej */
446 1.78 thorpej if (ifp->if_bridge)
447 1.256 maxv return bridge_output(ifp, m, NULL, NULL);
448 1.78 thorpej #endif
449 1.78 thorpej
450 1.133 liamjfoy #if NCARP > 0
/*
 * Output bytes are also accounted on the carp interface (ifp0).
 * NOTE(review): the Ethernet header was already prepended above, so if
 * M_PREPEND updates m_pkthdr.len this counts ETHER_HDR_LEN twice -- confirm.
 */
451 1.133 liamjfoy if (ifp != ifp0)
452 1.282 thorpej if_statadd(ifp0, if_obytes, m->m_pkthdr.len + ETHER_HDR_LEN);
453 1.256 maxv #endif
454 1.133 liamjfoy
455 1.77 thorpej #ifdef ALTQ
456 1.224 knakahar KERNEL_LOCK(1, NULL);
457 1.77 thorpej /*
458 1.77 thorpej * If ALTQ is enabled on the parent interface, do
459 1.77 thorpej * classification; the queueing discipline might not
460 1.77 thorpej * require classification, but might require the
461 1.77 thorpej * address family/header pointer in the pktattr.
462 1.77 thorpej */
463 1.77 thorpej if (ALTQ_IS_ENABLED(&ifp->if_snd))
464 1.220 knakahar altq_etherclassify(&ifp->if_snd, m);
465 1.224 knakahar KERNEL_UNLOCK_ONE(NULL);
466 1.77 thorpej #endif
467 1.221 knakahar return ifq_enqueue(ifp, m);
468 1.1 cgd
/*
 * Error exit used by senderr(): count an output error on ifp (the
 * carpdev when redirected above) and free the packet if one is still
 * held (m is NULL after a failed M_PREPEND).
 */
469 1.1 cgd bad:
470 1.288 ozaki if_statinc(ifp, if_oerrors);
471 1.1 cgd if (m)
472 1.1 cgd m_freem(m);
473 1.261 maxv return error;
474 1.1 cgd }
475 1.76 thorpej
#ifdef ALTQ
/*
 * This routine is a slight hack to allow a packet to be classified
 * if the Ethernet headers are present.  It will go away when ALTQ's
 * classification engine understands link headers.
 *
 * altq_etherclassify(ifq, m):
 *
 *	ifq	ALTQ queue whose classifier is consulted when
 *		ALTQ_NEEDS_CLASSIFY(ifq) is true
 *	m	outgoing frame, starting at the Ethernet header; must
 *		carry a packet header (M_PKTHDR)
 *
 *	On success the packet header of m gets pattr_af and pattr_hdr
 *	(pointer to the network-layer header) set, plus pattr_class when
 *	the queue needs classification.  When the headers cannot be
 *	located, pattr_class and pattr_hdr are set to NULL and pattr_af
 *	to AF_UNSPEC.  The mbuf chain itself is left unchanged on return.
 *
 * XXX: We may need to do m_pullups here.  The mbuf pointer is passed by
 * value, so the chain cannot be rearranged from in here; frames whose
 * Ethernet or protocol header is not contiguous are simply left
 * unclassified.
 */
void
altq_etherclassify(struct ifaltq *ifq, struct mbuf *m)
{
	struct ether_header *eh;
	struct mbuf *mtop = m;
	uint16_t ether_type;
	int hlen, af, hdrsize;
	void *hdr;

	KASSERT((mtop->m_flags & M_PKTHDR) != 0);

	hlen = ETHER_HDR_LEN;

	/*
	 * The Ethernet header is read directly out of the first mbuf,
	 * so it has to be entirely there.
	 */
	if (m->m_len < hlen)
		goto bad;

	eh = mtod(m, struct ether_header *);

	/* The header field is in network byte order. */
	ether_type = ntohs(eh->ether_type);

	if (ether_type < ETHERMTU) {
		/* LLC/SNAP */
		struct llc *llc = (struct llc *)(eh + 1);

		/* 8 more bytes of LLC/SNAP header precede the payload. */
		hlen += 8;

		if (m->m_len < hlen ||
		    llc->llc_dsap != LLC_SNAP_LSAP ||
		    llc->llc_ssap != LLC_SNAP_LSAP ||
		    llc->llc_control != LLC_UI) {
			/* Not SNAP. */
			goto bad;
		}

		ether_type = ntohs(llc->llc_un.type_snap.ether_type);
	}

	switch (ether_type) {
	case ETHERTYPE_IP:
		af = AF_INET;
		hdrsize = 20;		/* sizeof(struct ip) */
		break;

	case ETHERTYPE_IPV6:
		af = AF_INET6;
		hdrsize = 40;		/* sizeof(struct ip6_hdr) */
		break;

	default:
		af = AF_UNSPEC;
		hdrsize = 0;
		break;
	}

	/*
	 * Walk to the mbuf that holds the first byte after the link
	 * headers; afterwards hlen is the offset of that byte within m.
	 */
	while (m->m_len <= hlen) {
		hlen -= m->m_len;
		m = m->m_next;
		if (m == NULL)
			goto bad;
	}

	if (m->m_len < (hlen + hdrsize)) {
		/*
		 * protocol header not in a single mbuf.
		 * We can't cope with this situation right
		 * now (but it shouldn't ever happen, really, anyhow).
		 */
#ifdef DEBUG
		printf("altq_etherclassify: headers span multiple mbufs: "
		    "%d < %d\n", m->m_len, (hlen + hdrsize));
#endif
		goto bad;
	}

	/*
	 * Temporarily hide the link headers so that m starts at the
	 * network-layer header while the classifier looks at it.
	 */
	m->m_data += hlen;
	m->m_len -= hlen;

	hdr = mtod(m, void *);

	if (ALTQ_NEEDS_CLASSIFY(ifq)) {
		mtop->m_pkthdr.pattr_class =
		    (*ifq->altq_classify)(ifq->altq_clfier, m, af);
	}
	mtop->m_pkthdr.pattr_af = af;
	mtop->m_pkthdr.pattr_hdr = hdr;

	/* Undo the temporary adjustment. */
	m->m_data -= hlen;
	m->m_len += hlen;

	return;

bad:
	mtop->m_pkthdr.pattr_class = NULL;
	mtop->m_pkthdr.pattr_hdr = NULL;
	mtop->m_pkthdr.pattr_af = AF_UNSPEC;
}
#endif /* ALTQ */
577 1.1 cgd
#if defined (LLC) || defined (NETATALK)
/*
 * ether_input_llc(ifp, m, eh):
 *
 *	Input path for a frame whose Ethernet header eh is followed by
 *	an LLC header.  With NETATALK, SNAP-encapsulated AppleTalk is
 *	queued on atintrq2 and SNAP-encapsulated AARP is passed straight
 *	to aarpinput(), in both cases after the Ethernet and LLC headers
 *	have been trimmed off.  Every other frame is freed and counted
 *	in if_ierrors.
 */
static void
ether_input_llc(struct ifnet *ifp, struct mbuf *m, struct ether_header *eh)
{
	struct ifqueue *inq = NULL;
	int isr = 0;
	struct llc *l;

	/* The LLC header is read directly behind eh; it must be in m. */
	if (m->m_len < sizeof(*eh) + sizeof(struct llc))
		goto drop;

	l = (struct llc *)(eh + 1);

	switch (l->llc_dsap) {
#ifdef NETATALK
	case LLC_SNAP_LSAP:
		/* Only LLC_UI frames with a SNAP source SAP are handled. */
		if (l->llc_control != LLC_UI)
			goto drop;
		if (l->llc_ssap != LLC_SNAP_LSAP)
			goto drop;

		/* AppleTalk: strip the headers and queue for the netisr. */
		if (memcmp(&(l->llc_snap_org_code)[0], at_org_code,
		    sizeof(at_org_code)) == 0 &&
		    ntohs(l->llc_snap_ether_type) == ETHERTYPE_ATALK) {
			inq = &atintrq2;
			isr = NETISR_ATALK;
			m_adj(m, sizeof(struct ether_header) +
			    sizeof(struct llc));
			break;
		}

		/* AARP: strip the headers and process right away. */
		if (memcmp(&(l->llc_snap_org_code)[0], aarp_org_code,
		    sizeof(aarp_org_code)) == 0 &&
		    ntohs(l->llc_snap_ether_type) == ETHERTYPE_AARP) {
			m_adj(m, sizeof(struct ether_header) +
			    sizeof(struct llc));
			aarpinput(ifp, m);	/* XXX queue? */
			return;
		}

		/* Some other SNAP protocol. */
		goto drop;
#endif
	default:
		goto drop;
	}

	KASSERT(inq != NULL);
	IFQ_ENQUEUE_ISR(inq, m, isr);
	return;

drop:
	m_freem(m);
	if_statinc(ifp, if_ierrors); /* XXX should have a dedicated counter? */
	return;
}
#endif /* defined (LLC) || defined (NETATALK) */
639 1.286 ozaki
640 1.1 cgd /*
641 1.1 cgd * Process a received Ethernet packet;
642 1.42 thorpej * the packet is in the mbuf chain m with
643 1.42 thorpej * the ether header.
644 1.1 cgd */
645 1.133 liamjfoy void
646 1.58 matt ether_input(struct ifnet *ifp, struct mbuf *m)
647 1.1 cgd {
648 1.91 thorpej struct ethercom *ec = (struct ethercom *) ifp;
649 1.199 rmind pktqueue_t *pktq = NULL;
650 1.199 rmind struct ifqueue *inq = NULL;
651 1.162 matt uint16_t etype;
652 1.42 thorpej struct ether_header *eh;
653 1.187 matt size_t ehlen;
654 1.204 tls static int earlypkts;
655 1.198 msaitoh int isr = 0;
656 1.294 yamaguch #if NAGR > 0
657 1.294 yamaguch void *agrprivate;
658 1.294 yamaguch #endif
659 1.1 cgd
660 1.216 ozaki KASSERT(!cpu_intr_p());
661 1.253 maxv KASSERT((m->m_flags & M_PKTHDR) != 0);
662 1.216 ozaki
663 1.287 ozaki if ((ifp->if_flags & IFF_UP) == 0)
664 1.287 ozaki goto drop;
665 1.290 roy
666 1.291 roy #ifdef MBUFTRACE
667 1.291 roy m_claimm(m, &ec->ec_rx_mowner);
668 1.291 roy #endif
669 1.291 roy
670 1.292 roy if (__predict_false(m->m_len < sizeof(*eh))) {
671 1.290 roy if ((m = m_pullup(m, sizeof(*eh))) == NULL)
672 1.287 ozaki goto dropped;
673 1.267 maxv }
674 1.42 thorpej
675 1.42 thorpej eh = mtod(m, struct ether_header *);
676 1.63 thorpej etype = ntohs(eh->ether_type);
677 1.187 matt ehlen = sizeof(*eh);
678 1.63 thorpej
679 1.284 riastrad if (__predict_false(earlypkts < 100 ||
680 1.284 riastrad entropy_epoch() == (unsigned)-1)) {
681 1.204 tls rnd_add_data(NULL, eh, ehlen, 0);
682 1.204 tls earlypkts++;
683 1.204 tls }
684 1.204 tls
685 1.63 thorpej /*
686 1.258 maxv * Determine if the packet is within its size limits. For MPLS the
687 1.258 maxv * header length is variable, so we skip the check.
688 1.63 thorpej */
689 1.182 kefren if (etype != ETHERTYPE_MPLS && m->m_pkthdr.len >
690 1.83 thorpej ETHER_MAX_FRAME(ifp, etype, m->m_flags & M_HASFCS)) {
691 1.278 msaitoh #ifdef DIAGNOSTIC
692 1.203 ozaki mutex_enter(&bigpktpps_lock);
693 1.123 matt if (ppsratecheck(&bigpktppslim_last, &bigpktpps_count,
694 1.261 maxv bigpktppslim)) {
695 1.123 matt printf("%s: discarding oversize frame (len=%d)\n",
696 1.123 matt ifp->if_xname, m->m_pkthdr.len);
697 1.123 matt }
698 1.203 ozaki mutex_exit(&bigpktpps_lock);
699 1.278 msaitoh #endif
700 1.287 ozaki goto drop;
701 1.63 thorpej }
702 1.77 thorpej
703 1.84 thorpej if (ETHER_IS_MULTICAST(eh->ether_dhost)) {
704 1.84 thorpej /*
705 1.84 thorpej * If this is not a simplex interface, drop the packet
706 1.84 thorpej * if it came from us.
707 1.84 thorpej */
708 1.84 thorpej if ((ifp->if_flags & IFF_SIMPLEX) == 0 &&
709 1.153 dyoung memcmp(CLLADDR(ifp->if_sadl), eh->ether_shost,
710 1.84 thorpej ETHER_ADDR_LEN) == 0) {
711 1.287 ozaki goto drop;
712 1.84 thorpej }
713 1.84 thorpej
714 1.84 thorpej if (memcmp(etherbroadcastaddr,
715 1.84 thorpej eh->ether_dhost, ETHER_ADDR_LEN) == 0)
716 1.84 thorpej m->m_flags |= M_BCAST;
717 1.84 thorpej else
718 1.84 thorpej m->m_flags |= M_MCAST;
719 1.282 thorpej if_statinc(ifp, if_imcasts);
720 1.84 thorpej }
721 1.84 thorpej
722 1.79 thorpej /* If the CRC is still on the packet, trim it off. */
723 1.79 thorpej if (m->m_flags & M_HASFCS) {
724 1.79 thorpej m_adj(m, -ETHER_CRC_LEN);
725 1.79 thorpej m->m_flags &= ~M_HASFCS;
726 1.79 thorpej }
727 1.79 thorpej
728 1.282 thorpej if_statadd(ifp, if_ibytes, m->m_pkthdr.len);
729 1.78 thorpej
730 1.201 ozaki #if NCARP > 0
731 1.201 ozaki if (__predict_false(ifp->if_carp && ifp->if_type != IFT_CARP)) {
732 1.201 ozaki /*
733 1.261 maxv * Clear M_PROMISC, in case the packet comes from a
734 1.261 maxv * vlan.
735 1.201 ozaki */
736 1.137 rpaulo m->m_flags &= ~M_PROMISC;
737 1.201 ozaki if (carp_input(m, (uint8_t *)&eh->ether_shost,
738 1.201 ozaki (uint8_t *)&eh->ether_dhost, eh->ether_type) == 0)
739 1.137 rpaulo return;
740 1.201 ozaki }
741 1.253 maxv #endif
742 1.250 maxv
743 1.247 msaitoh if ((m->m_flags & (M_BCAST | M_MCAST | M_PROMISC)) == 0 &&
744 1.201 ozaki (ifp->if_flags & IFF_PROMISC) != 0 &&
745 1.201 ozaki memcmp(CLLADDR(ifp->if_sadl), eh->ether_dhost,
746 1.261 maxv ETHER_ADDR_LEN) != 0) {
747 1.201 ozaki m->m_flags |= M_PROMISC;
748 1.70 bouyer }
749 1.78 thorpej
750 1.106 bouyer if ((m->m_flags & M_PROMISC) == 0) {
751 1.195 rmind if (pfil_run_hooks(ifp->if_pfil, &m, ifp, PFIL_IN) != 0)
752 1.106 bouyer return;
753 1.106 bouyer if (m == NULL)
754 1.106 bouyer return;
755 1.78 thorpej
756 1.106 bouyer eh = mtod(m, struct ether_header *);
757 1.106 bouyer etype = ntohs(eh->ether_type);
758 1.106 bouyer }
759 1.70 bouyer
760 1.172 darran #if NAGR > 0
761 1.294 yamaguch if (ifp->if_type != IFT_IEEE8023ADLAG) {
762 1.294 yamaguch agrprivate = ifp->if_lagg;
763 1.294 yamaguch } else {
764 1.294 yamaguch agrprivate = NULL;
765 1.294 yamaguch }
766 1.294 yamaguch if (agrprivate != NULL &&
767 1.172 darran __predict_true(etype != ETHERTYPE_SLOWPROTOCOLS)) {
768 1.172 darran m->m_flags &= ~M_PROMISC;
769 1.172 darran agr_input(ifp, m);
770 1.172 darran return;
771 1.172 darran }
772 1.253 maxv #endif
773 1.172 darran
774 1.293 yamaguch /* Handle input from a lagg(4) port */
775 1.293 yamaguch if (ifp->if_type == IFT_IEEE8023ADLAG) {
776 1.293 yamaguch KASSERT(lagg_input_ethernet_p != NULL);
777 1.293 yamaguch m = (*lagg_input_ethernet_p)(ifp, m);
778 1.293 yamaguch if (m == NULL)
779 1.293 yamaguch return;
780 1.293 yamaguch }
781 1.293 yamaguch
782 1.91 thorpej /*
783 1.91 thorpej * If VLANs are configured on the interface, check to
784 1.91 thorpej * see if the device performed the decapsulation and
785 1.91 thorpej * provided us with the tag.
786 1.91 thorpej */
787 1.244 knakahar if (ec->ec_nvlans && vlan_has_tag(m)) {
788 1.70 bouyer #if NVLAN > 0
789 1.70 bouyer /*
790 1.70 bouyer * vlan_input() will either recursively call ether_input()
791 1.70 bouyer * or drop the packet.
792 1.70 bouyer */
793 1.91 thorpej vlan_input(ifp, m);
794 1.287 ozaki return;
795 1.91 thorpej #else
796 1.287 ozaki goto drop;
797 1.70 bouyer #endif
798 1.61 thorpej }
799 1.1 cgd
800 1.59 thorpej /*
801 1.59 thorpej * Handle protocols that expect to have the Ethernet header
802 1.59 thorpej * (and possibly FCS) intact.
803 1.59 thorpej */
804 1.59 thorpej switch (etype) {
805 1.187 matt case ETHERTYPE_VLAN: {
806 1.187 matt struct ether_vlan_header *evl = (void *)eh;
807 1.253 maxv
808 1.187 matt /*
809 1.187 matt * If there is a tag of 0, then the VLAN header was probably
810 1.187 matt * just being used to store the priority. Extract the ether
811 1.250 maxv * type, and if IP or IPV6, let them deal with it.
812 1.187 matt */
813 1.254 maxv if (m->m_len >= sizeof(*evl) &&
814 1.253 maxv EVL_VLANOFTAG(evl->evl_tag) == 0) {
815 1.187 matt etype = ntohs(evl->evl_proto);
816 1.187 matt ehlen = sizeof(*evl);
817 1.253 maxv if ((m->m_flags & M_PROMISC) == 0 &&
818 1.253 maxv (etype == ETHERTYPE_IP ||
819 1.253 maxv etype == ETHERTYPE_IPV6))
820 1.187 matt break;
821 1.187 matt }
822 1.253 maxv
823 1.59 thorpej #if NVLAN > 0
824 1.59 thorpej /*
825 1.59 thorpej * vlan_input() will either recursively call ether_input()
826 1.59 thorpej * or drop the packet.
827 1.59 thorpej */
828 1.287 ozaki if (ec->ec_nvlans != 0) {
829 1.63 thorpej vlan_input(ifp, m);
830 1.287 ozaki return;
831 1.287 ozaki } else
832 1.253 maxv #endif
833 1.287 ozaki goto drop;
834 1.187 matt }
835 1.253 maxv
836 1.81 martin #if NPPPOE > 0
837 1.81 martin case ETHERTYPE_PPPOEDISC:
838 1.218 ozaki pppoedisc_input(ifp, m);
839 1.218 ozaki return;
840 1.253 maxv
841 1.81 martin case ETHERTYPE_PPPOE:
842 1.218 ozaki pppoe_input(ifp, m);
843 1.81 martin return;
844 1.253 maxv #endif
845 1.253 maxv
846 1.121 yamt case ETHERTYPE_SLOWPROTOCOLS: {
847 1.121 yamt uint8_t subtype;
848 1.121 yamt
849 1.287 ozaki if (m->m_pkthdr.len < sizeof(*eh) + sizeof(subtype))
850 1.287 ozaki goto drop;
851 1.253 maxv
852 1.121 yamt m_copydata(m, sizeof(*eh), sizeof(subtype), &subtype);
853 1.121 yamt switch (subtype) {
854 1.121 yamt #if NAGR > 0
855 1.121 yamt case SLOWPROTOCOLS_SUBTYPE_LACP:
856 1.294 yamaguch if (agrprivate != NULL) {
857 1.121 yamt ieee8023ad_lacp_input(ifp, m);
858 1.121 yamt return;
859 1.121 yamt }
860 1.121 yamt break;
861 1.121 yamt
862 1.121 yamt case SLOWPROTOCOLS_SUBTYPE_MARKER:
863 1.294 yamaguch if (agrprivate != NULL) {
864 1.121 yamt ieee8023ad_marker_input(ifp, m);
865 1.121 yamt return;
866 1.121 yamt }
867 1.121 yamt break;
868 1.261 maxv #endif
869 1.253 maxv
870 1.121 yamt default:
871 1.121 yamt if (subtype == 0 || subtype > 10) {
872 1.121 yamt /* illegal value */
873 1.287 ozaki goto drop;
874 1.121 yamt }
875 1.121 yamt /* unknown subtype */
876 1.121 yamt break;
877 1.121 yamt }
878 1.121 yamt }
879 1.273 mrg /* FALLTHROUGH */
880 1.59 thorpej default:
881 1.287 ozaki if (m->m_flags & M_PROMISC)
882 1.287 ozaki goto drop;
883 1.59 thorpej }
884 1.42 thorpej
885 1.45 thorpej /* If the CRC is still on the packet, trim it off. */
886 1.79 thorpej if (m->m_flags & M_HASFCS) {
887 1.45 thorpej m_adj(m, -ETHER_CRC_LEN);
888 1.79 thorpej m->m_flags &= ~M_HASFCS;
889 1.79 thorpej }
890 1.42 thorpej
891 1.286 ozaki /* etype represents the size of the payload in this case */
892 1.286 ozaki if (etype <= ETHERMTU + sizeof(struct ether_header)) {
893 1.286 ozaki KASSERT(ehlen == sizeof(*eh));
894 1.286 ozaki #if defined (LLC) || defined (NETATALK)
895 1.286 ozaki ether_input_llc(ifp, m, eh);
896 1.286 ozaki return;
897 1.286 ozaki #else
898 1.287 ozaki goto drop;
899 1.286 ozaki #endif
900 1.286 ozaki }
901 1.139 is
902 1.286 ozaki /* Strip off the Ethernet header. */
903 1.286 ozaki m_adj(m, ehlen);
904 1.286 ozaki
905 1.286 ozaki switch (etype) {
906 1.1 cgd #ifdef INET
907 1.286 ozaki case ETHERTYPE_IP:
908 1.30 matt #ifdef GATEWAY
909 1.286 ozaki if (ipflow_fastforward(m))
910 1.286 ozaki return;
911 1.30 matt #endif
912 1.286 ozaki pktq = ip_pktq;
913 1.286 ozaki break;
914 1.1 cgd
915 1.286 ozaki case ETHERTYPE_ARP:
916 1.286 ozaki isr = NETISR_ARP;
917 1.286 ozaki inq = &arpintrq;
918 1.286 ozaki break;
919 1.7 glass
920 1.286 ozaki case ETHERTYPE_REVARP:
921 1.286 ozaki revarpinput(m); /* XXX queue? */
922 1.286 ozaki return;
923 1.1 cgd #endif
924 1.253 maxv
925 1.44 itojun #ifdef INET6
926 1.286 ozaki case ETHERTYPE_IPV6:
927 1.287 ozaki if (__predict_false(!in6_present))
928 1.287 ozaki goto drop;
929 1.250 maxv #ifdef GATEWAY
930 1.286 ozaki if (ip6flow_fastforward(&m))
931 1.286 ozaki return;
932 1.148 liamjfoy #endif
933 1.286 ozaki pktq = ip6_pktq;
934 1.286 ozaki break;
935 1.44 itojun #endif
936 1.253 maxv
937 1.23 christos #ifdef NETATALK
938 1.286 ozaki case ETHERTYPE_ATALK:
939 1.286 ozaki isr = NETISR_ATALK;
940 1.286 ozaki inq = &atintrq1;
941 1.286 ozaki break;
942 1.253 maxv
943 1.286 ozaki case ETHERTYPE_AARP:
944 1.286 ozaki aarpinput(ifp, m); /* XXX queue? */
945 1.286 ozaki return;
946 1.253 maxv #endif
947 1.253 maxv
948 1.182 kefren #ifdef MPLS
949 1.286 ozaki case ETHERTYPE_MPLS:
950 1.286 ozaki isr = NETISR_MPLS;
951 1.286 ozaki inq = &mplsintrq;
952 1.286 ozaki break;
953 1.182 kefren #endif
954 1.253 maxv
955 1.286 ozaki default:
956 1.287 ozaki goto drop;
957 1.1 cgd }
958 1.1 cgd
959 1.199 rmind if (__predict_true(pktq)) {
960 1.301 knakahar const uint32_t h = pktq_rps_hash(ðer_pktq_rps_hash_p, m);
961 1.199 rmind if (__predict_false(!pktq_enqueue(pktq, m, h))) {
962 1.199 rmind m_freem(m);
963 1.199 rmind }
964 1.199 rmind return;
965 1.199 rmind }
966 1.199 rmind
967 1.199 rmind if (__predict_false(!inq)) {
968 1.199 rmind /* Should not happen. */
969 1.287 ozaki goto drop;
970 1.199 rmind }
971 1.228 ozaki
972 1.285 ozaki IFQ_ENQUEUE_ISR(inq, m, isr);
973 1.287 ozaki return;
974 1.287 ozaki
975 1.287 ozaki drop:
976 1.287 ozaki m_freem(m);
977 1.287 ozaki dropped:
978 1.287 ozaki if_statinc(ifp, if_ierrors); /* XXX should have a dedicated counter? */
979 1.1 cgd }
980 1.1 cgd
981 1.1 cgd /*
982 1.1 cgd * Convert Ethernet address to printable (loggable) representation.
983 1.1 cgd */
984 1.1 cgd char *
985 1.58 matt ether_sprintf(const u_char *ap)
986 1.1 cgd {
987 1.129 christos static char etherbuf[3 * ETHER_ADDR_LEN];
988 1.129 christos return ether_snprintf(etherbuf, sizeof(etherbuf), ap);
989 1.129 christos }
990 1.129 christos
991 1.129 christos char *
992 1.129 christos ether_snprintf(char *buf, size_t len, const u_char *ap)
993 1.129 christos {
994 1.129 christos char *cp = buf;
995 1.129 christos size_t i;
996 1.1 cgd
997 1.129 christos for (i = 0; i < len / 3; i++) {
998 1.124 christos *cp++ = hexdigits[*ap >> 4];
999 1.124 christos *cp++ = hexdigits[*ap++ & 0xf];
1000 1.1 cgd *cp++ = ':';
1001 1.1 cgd }
1002 1.129 christos *--cp = '\0';
1003 1.129 christos return buf;
1004 1.1 cgd }
1005 1.8 mycroft
1006 1.8 mycroft /*
1007 1.8 mycroft * Perform common duties while attaching to interface list
1008 1.8 mycroft */
1009 1.8 mycroft void
1010 1.162 matt ether_ifattach(struct ifnet *ifp, const uint8_t *lla)
1011 1.8 mycroft {
1012 1.104 matt struct ethercom *ec = (struct ethercom *)ifp;
1013 1.297 yamaguch char xnamebuf[HOOKNAMSIZ];
1014 1.8 mycroft
1015 1.8 mycroft ifp->if_type = IFT_ETHER;
1016 1.94 enami ifp->if_hdrlen = ETHER_HDR_LEN;
1017 1.73 thorpej ifp->if_dlt = DLT_EN10MB;
1018 1.8 mycroft ifp->if_mtu = ETHERMTU;
1019 1.12 mycroft ifp->if_output = ether_output;
1020 1.216 ozaki ifp->_if_input = ether_input;
1021 1.54 thorpej if (ifp->if_baudrate == 0)
1022 1.54 thorpej ifp->if_baudrate = IF_Mbps(10); /* just a default */
1023 1.75 thorpej
1024 1.230 ozaki if (lla != NULL)
1025 1.230 ozaki if_set_sadl(ifp, lla, ETHER_ADDR_LEN, !ETHER_IS_LOCAL(lla));
1026 1.75 thorpej
1027 1.104 matt LIST_INIT(&ec->ec_multiaddrs);
1028 1.276 msaitoh SIMPLEQ_INIT(&ec->ec_vids);
1029 1.233 ozaki ec->ec_lock = mutex_obj_alloc(MUTEX_DEFAULT, IPL_NET);
1030 1.274 ozaki ec->ec_flags = 0;
1031 1.26 is ifp->if_broadcastaddr = etherbroadcastaddr;
1032 1.177 joerg bpf_attach(ifp, DLT_EN10MB, sizeof(struct ether_header));
1033 1.297 yamaguch snprintf(xnamebuf, sizeof(xnamebuf),
1034 1.297 yamaguch "%s-ether_ifdetachhooks", ifp->if_xname);
1035 1.297 yamaguch ec->ec_ifdetach_hooks = simplehook_create(IPL_NET, xnamebuf);
1036 1.104 matt #ifdef MBUFTRACE
1037 1.283 thorpej mowner_init_owner(&ec->ec_tx_mowner, ifp->if_xname, "tx");
1038 1.283 thorpej mowner_init_owner(&ec->ec_rx_mowner, ifp->if_xname, "rx");
1039 1.104 matt MOWNER_ATTACH(&ec->ec_tx_mowner);
1040 1.104 matt MOWNER_ATTACH(&ec->ec_rx_mowner);
1041 1.104 matt ifp->if_mowner = &ec->ec_tx_mowner;
1042 1.104 matt #endif
1043 1.52 thorpej }
1044 1.52 thorpej
1045 1.52 thorpej void
1046 1.58 matt ether_ifdetach(struct ifnet *ifp)
1047 1.52 thorpej {
1048 1.63 thorpej struct ethercom *ec = (void *) ifp;
1049 1.63 thorpej struct ether_multi *enm;
1050 1.69 thorpej
1051 1.269 ozaki IFNET_ASSERT_UNLOCKED(ifp);
1052 1.190 christos /*
1053 1.190 christos * Prevent further calls to ioctl (for example turning off
1054 1.190 christos * promiscuous mode from the bridge code), which eventually can
1055 1.190 christos * call if_init() which can cause panics because the interface
1056 1.190 christos * is in the process of being detached. Return device not configured
1057 1.190 christos * instead.
1058 1.190 christos */
1059 1.280 christos ifp->if_ioctl = __FPTRCAST(int (*)(struct ifnet *, u_long, void *),
1060 1.280 christos enxio);
1061 1.190 christos
1062 1.297 yamaguch simplehook_dohooks(ec->ec_ifdetach_hooks);
1063 1.297 yamaguch KASSERT(!simplehook_has_hooks(ec->ec_ifdetach_hooks));
1064 1.297 yamaguch simplehook_destroy(ec->ec_ifdetach_hooks);
1065 1.297 yamaguch
1066 1.177 joerg bpf_detach(ifp);
1067 1.63 thorpej
1068 1.245 msaitoh ETHER_LOCK(ec);
1069 1.276 msaitoh KASSERT(ec->ec_nvlans == 0);
1070 1.63 thorpej while ((enm = LIST_FIRST(&ec->ec_multiaddrs)) != NULL) {
1071 1.63 thorpej LIST_REMOVE(enm, enm_list);
1072 1.248 ozaki kmem_free(enm, sizeof(*enm));
1073 1.63 thorpej ec->ec_multicnt--;
1074 1.63 thorpej }
1075 1.245 msaitoh ETHER_UNLOCK(ec);
1076 1.52 thorpej
1077 1.252 maxv mutex_obj_free(ec->ec_lock);
1078 1.253 maxv ec->ec_lock = NULL;
1079 1.231 ozaki
1080 1.189 chs ifp->if_mowner = NULL;
1081 1.104 matt MOWNER_DETACH(&ec->ec_rx_mowner);
1082 1.104 matt MOWNER_DETACH(&ec->ec_tx_mowner);
1083 1.53 thorpej }
1084 1.53 thorpej
1085 1.297 yamaguch void *
1086 1.297 yamaguch ether_ifdetachhook_establish(struct ifnet *ifp,
1087 1.297 yamaguch void (*fn)(void *), void *arg)
1088 1.297 yamaguch {
1089 1.297 yamaguch struct ethercom *ec;
1090 1.297 yamaguch khook_t *hk;
1091 1.297 yamaguch
1092 1.297 yamaguch if (ifp->if_type != IFT_ETHER)
1093 1.297 yamaguch return NULL;
1094 1.297 yamaguch
1095 1.297 yamaguch ec = (struct ethercom *)ifp;
1096 1.297 yamaguch hk = simplehook_establish(ec->ec_ifdetach_hooks,
1097 1.297 yamaguch fn, arg);
1098 1.297 yamaguch
1099 1.297 yamaguch return (void *)hk;
1100 1.297 yamaguch }
1101 1.297 yamaguch
1102 1.297 yamaguch void
1103 1.297 yamaguch ether_ifdetachhook_disestablish(struct ifnet *ifp,
1104 1.297 yamaguch void *vhook, kmutex_t *lock)
1105 1.297 yamaguch {
1106 1.297 yamaguch struct ethercom *ec;
1107 1.297 yamaguch
1108 1.297 yamaguch if (vhook == NULL)
1109 1.297 yamaguch return;
1110 1.297 yamaguch
1111 1.297 yamaguch ec = (struct ethercom *)ifp;
1112 1.297 yamaguch simplehook_disestablish(ec->ec_ifdetach_hooks, vhook, lock);
1113 1.297 yamaguch }
1114 1.297 yamaguch
#if 0
/*
 * Reference implementation only (never compiled): the bit-at-a-time
 * little-endian CRC-32 generator.  The table-driven version below is
 * the one in use because it is faster than this double loop.
 */
uint32_t
ether_crc32_le(const uint8_t *buf, size_t len)
{
	uint32_t crc = 0xffffffffU;	/* initial value */
	size_t pos;

	for (pos = 0; pos < len; pos++) {
		uint32_t byte = buf[pos];
		unsigned int bit;

		for (bit = 0; bit < 8; bit++, byte >>= 1) {
			const uint32_t carry = (crc & 0x01) ^ (byte & 0x01);

			crc >>= 1;
			if (carry)
				crc ^= ETHER_CRC_POLY_LE;
		}
	}

	return crc;
}
#else
/*
 * Little-endian (reflected) CRC-32 over len bytes of buf, processed one
 * nibble at a time through a 16-entry lookup table.
 *
 * The register starts at 0xffffffff and is returned as-is, i.e. without
 * a final inversion.  With len == 0 the initial value is returned and
 * buf is not dereferenced.
 */
uint32_t
ether_crc32_le(const uint8_t *buf, size_t len)
{
	static const uint32_t crctab[] = {
		0x00000000, 0x1db71064, 0x3b6e20c8, 0x26d930ac,
		0x76dc4190, 0x6b6b51f4, 0x4db26158, 0x5005713c,
		0xedb88320, 0xf00f9344, 0xd6d6a3e8, 0xcb61b38c,
		0x9b64c2b0, 0x86d3d2d4, 0xa00ae278, 0xbdbdf21c
	};
	uint32_t crc = 0xffffffffU;	/* initial value */
	unsigned int nibble;

	while (len-- > 0) {
		crc ^= *buf++;
		/* Fold in the low nibble, then the high nibble. */
		for (nibble = 0; nibble < 2; nibble++)
			crc = (crc >> 4) ^ crctab[crc & 0xf];
	}

	return crc;
}
#endif
1166 1.53 thorpej
1167 1.162 matt uint32_t
1168 1.162 matt ether_crc32_be(const uint8_t *buf, size_t len)
1169 1.53 thorpej {
1170 1.162 matt uint32_t c, crc, carry;
1171 1.53 thorpej size_t i, j;
1172 1.53 thorpej
1173 1.53 thorpej crc = 0xffffffffU; /* initial value */
1174 1.53 thorpej
1175 1.53 thorpej for (i = 0; i < len; i++) {
1176 1.53 thorpej c = buf[i];
1177 1.53 thorpej for (j = 0; j < 8; j++) {
1178 1.53 thorpej carry = ((crc & 0x80000000U) ? 1 : 0) ^ (c & 0x01);
1179 1.53 thorpej crc <<= 1;
1180 1.53 thorpej c >>= 1;
1181 1.53 thorpej if (carry)
1182 1.53 thorpej crc = (crc ^ ETHER_CRC_POLY_BE) | carry;
1183 1.53 thorpej }
1184 1.53 thorpej }
1185 1.53 thorpej
1186 1.53 thorpej return (crc);
1187 1.8 mycroft }
1188 1.8 mycroft
#ifdef INET
/*
 * Lowest and highest Ethernet addresses of the range used for IP
 * multicast; ether_multiaddr() hands these out for INADDR_ANY.
 */
const uint8_t ether_ipmulticast_min[ETHER_ADDR_LEN] = {
	0x01, 0x00, 0x5e, 0x00, 0x00, 0x00
};
const uint8_t ether_ipmulticast_max[ETHER_ADDR_LEN] = {
	0x01, 0x00, 0x5e, 0x7f, 0xff, 0xff
};
#endif
#ifdef INET6
/*
 * Lowest and highest Ethernet addresses of the range used for IP6
 * multicast; ether_multiaddr() hands these out for the unspecified
 * address.
 */
const uint8_t ether_ip6multicast_min[ETHER_ADDR_LEN] = {
	0x33, 0x33, 0x00, 0x00, 0x00, 0x00
};
const uint8_t ether_ip6multicast_max[ETHER_ADDR_LEN] = {
	0x33, 0x33, 0xff, 0xff, 0xff, 0xff
};
#endif
1201 1.60 enami
1202 1.3 hpeyerl /*
1203 1.138 rpaulo * ether_aton implementation, not using a static buffer.
1204 1.138 rpaulo */
1205 1.138 rpaulo int
1206 1.180 christos ether_aton_r(u_char *dest, size_t len, const char *str)
1207 1.138 rpaulo {
1208 1.250 maxv const u_char *cp = (const void *)str;
1209 1.180 christos u_char *ep;
1210 1.180 christos
1211 1.185 tsutsui #define atox(c) (((c) <= '9') ? ((c) - '0') : ((toupper(c) - 'A') + 10))
1212 1.180 christos
1213 1.180 christos if (len < ETHER_ADDR_LEN)
1214 1.180 christos return ENOSPC;
1215 1.180 christos
1216 1.180 christos ep = dest + ETHER_ADDR_LEN;
1217 1.250 maxv
1218 1.180 christos while (*cp) {
1219 1.250 maxv if (!isxdigit(*cp))
1220 1.250 maxv return EINVAL;
1221 1.252 maxv
1222 1.180 christos *dest = atox(*cp);
1223 1.180 christos cp++;
1224 1.250 maxv if (isxdigit(*cp)) {
1225 1.250 maxv *dest = (*dest << 4) | atox(*cp);
1226 1.180 christos cp++;
1227 1.250 maxv }
1228 1.252 maxv dest++;
1229 1.252 maxv
1230 1.180 christos if (dest == ep)
1231 1.252 maxv return (*cp == '\0') ? 0 : ENAMETOOLONG;
1232 1.252 maxv
1233 1.180 christos switch (*cp) {
1234 1.180 christos case ':':
1235 1.180 christos case '-':
1236 1.180 christos case '.':
1237 1.179 jakllsch cp++;
1238 1.180 christos break;
1239 1.179 jakllsch }
1240 1.250 maxv }
1241 1.180 christos return ENOBUFS;
1242 1.138 rpaulo }
1243 1.138 rpaulo
1244 1.138 rpaulo /*
1245 1.60 enami * Convert a sockaddr into an Ethernet address or range of Ethernet
1246 1.60 enami * addresses.
1247 1.3 hpeyerl */
1248 1.3 hpeyerl int
1249 1.162 matt ether_multiaddr(const struct sockaddr *sa, uint8_t addrlo[ETHER_ADDR_LEN],
1250 1.162 matt uint8_t addrhi[ETHER_ADDR_LEN])
1251 1.3 hpeyerl {
1252 1.24 christos #ifdef INET
1253 1.155 dyoung const struct sockaddr_in *sin;
1254 1.261 maxv #endif
1255 1.44 itojun #ifdef INET6
1256 1.155 dyoung const struct sockaddr_in6 *sin6;
1257 1.261 maxv #endif
1258 1.3 hpeyerl
1259 1.60 enami switch (sa->sa_family) {
1260 1.3 hpeyerl
1261 1.3 hpeyerl case AF_UNSPEC:
1262 1.146 dyoung memcpy(addrlo, sa->sa_data, ETHER_ADDR_LEN);
1263 1.146 dyoung memcpy(addrhi, addrlo, ETHER_ADDR_LEN);
1264 1.3 hpeyerl break;
1265 1.3 hpeyerl
1266 1.3 hpeyerl #ifdef INET
1267 1.3 hpeyerl case AF_INET:
1268 1.155 dyoung sin = satocsin(sa);
1269 1.3 hpeyerl if (sin->sin_addr.s_addr == INADDR_ANY) {
1270 1.3 hpeyerl /*
1271 1.60 enami * An IP address of INADDR_ANY means listen to
1272 1.60 enami * or stop listening to all of the Ethernet
1273 1.60 enami * multicast addresses used for IP.
1274 1.3 hpeyerl * (This is for the sake of IP multicast routers.)
1275 1.3 hpeyerl */
1276 1.146 dyoung memcpy(addrlo, ether_ipmulticast_min, ETHER_ADDR_LEN);
1277 1.146 dyoung memcpy(addrhi, ether_ipmulticast_max, ETHER_ADDR_LEN);
1278 1.252 maxv } else {
1279 1.3 hpeyerl ETHER_MAP_IP_MULTICAST(&sin->sin_addr, addrlo);
1280 1.146 dyoung memcpy(addrhi, addrlo, ETHER_ADDR_LEN);
1281 1.3 hpeyerl }
1282 1.3 hpeyerl break;
1283 1.3 hpeyerl #endif
1284 1.44 itojun #ifdef INET6
1285 1.44 itojun case AF_INET6:
1286 1.155 dyoung sin6 = satocsin6(sa);
1287 1.47 itojun if (IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) {
1288 1.44 itojun /*
1289 1.60 enami * An IP6 address of 0 means listen to or stop
1290 1.60 enami * listening to all of the Ethernet multicast
1291 1.60 enami * address used for IP6.
1292 1.44 itojun * (This is used for multicast routers.)
1293 1.44 itojun */
1294 1.146 dyoung memcpy(addrlo, ether_ip6multicast_min, ETHER_ADDR_LEN);
1295 1.146 dyoung memcpy(addrhi, ether_ip6multicast_max, ETHER_ADDR_LEN);
1296 1.44 itojun } else {
1297 1.44 itojun ETHER_MAP_IPV6_MULTICAST(&sin6->sin6_addr, addrlo);
1298 1.146 dyoung memcpy(addrhi, addrlo, ETHER_ADDR_LEN);
1299 1.44 itojun }
1300 1.44 itojun break;
1301 1.44 itojun #endif
1302 1.3 hpeyerl
1303 1.3 hpeyerl default:
1304 1.146 dyoung return EAFNOSUPPORT;
1305 1.60 enami }
1306 1.146 dyoung return 0;
1307 1.60 enami }
1308 1.60 enami
1309 1.60 enami /*
1310 1.60 enami * Add an Ethernet multicast address or range of addresses to the list for a
1311 1.60 enami * given interface.
1312 1.60 enami */
1313 1.60 enami int
1314 1.155 dyoung ether_addmulti(const struct sockaddr *sa, struct ethercom *ec)
1315 1.60 enami {
1316 1.231 ozaki struct ether_multi *enm, *_enm;
1317 1.60 enami u_char addrlo[ETHER_ADDR_LEN];
1318 1.60 enami u_char addrhi[ETHER_ADDR_LEN];
1319 1.237 skrll int error = 0;
1320 1.231 ozaki
1321 1.231 ozaki /* Allocate out of lock */
1322 1.248 ozaki enm = kmem_alloc(sizeof(*enm), KM_SLEEP);
1323 1.60 enami
1324 1.245 msaitoh ETHER_LOCK(ec);
1325 1.155 dyoung error = ether_multiaddr(sa, addrlo, addrhi);
1326 1.231 ozaki if (error != 0)
1327 1.231 ozaki goto out;
1328 1.3 hpeyerl
1329 1.3 hpeyerl /*
1330 1.3 hpeyerl * Verify that we have valid Ethernet multicast addresses.
1331 1.3 hpeyerl */
1332 1.186 yamt if (!ETHER_IS_MULTICAST(addrlo) || !ETHER_IS_MULTICAST(addrhi)) {
1333 1.231 ozaki error = EINVAL;
1334 1.231 ozaki goto out;
1335 1.3 hpeyerl }
1336 1.252 maxv
1337 1.3 hpeyerl /*
1338 1.3 hpeyerl * See if the address range is already in the list.
1339 1.3 hpeyerl */
1340 1.270 yamaguch _enm = ether_lookup_multi(addrlo, addrhi, ec);
1341 1.231 ozaki if (_enm != NULL) {
1342 1.3 hpeyerl /*
1343 1.3 hpeyerl * Found it; just increment the reference count.
1344 1.3 hpeyerl */
1345 1.231 ozaki ++_enm->enm_refcount;
1346 1.231 ozaki error = 0;
1347 1.231 ozaki goto out;
1348 1.3 hpeyerl }
1349 1.252 maxv
1350 1.3 hpeyerl /*
1351 1.239 ozaki * Link a new multicast record into the interface's multicast list.
1352 1.3 hpeyerl */
1353 1.252 maxv memcpy(enm->enm_addrlo, addrlo, ETHER_ADDR_LEN);
1354 1.252 maxv memcpy(enm->enm_addrhi, addrhi, ETHER_ADDR_LEN);
1355 1.3 hpeyerl enm->enm_refcount = 1;
1356 1.22 is LIST_INSERT_HEAD(&ec->ec_multiaddrs, enm, enm_list);
1357 1.22 is ec->ec_multicnt++;
1358 1.252 maxv
1359 1.3 hpeyerl /*
1360 1.3 hpeyerl * Return ENETRESET to inform the driver that the list has changed
1361 1.3 hpeyerl * and its reception filter should be adjusted accordingly.
1362 1.3 hpeyerl */
1363 1.231 ozaki error = ENETRESET;
1364 1.231 ozaki enm = NULL;
1365 1.252 maxv
1366 1.231 ozaki out:
1367 1.245 msaitoh ETHER_UNLOCK(ec);
1368 1.231 ozaki if (enm != NULL)
1369 1.248 ozaki kmem_free(enm, sizeof(*enm));
1370 1.231 ozaki return error;
1371 1.3 hpeyerl }
1372 1.3 hpeyerl
1373 1.3 hpeyerl /*
1374 1.3 hpeyerl * Delete a multicast address record.
1375 1.3 hpeyerl */
1376 1.3 hpeyerl int
1377 1.155 dyoung ether_delmulti(const struct sockaddr *sa, struct ethercom *ec)
1378 1.3 hpeyerl {
1379 1.29 mrg struct ether_multi *enm;
1380 1.60 enami u_char addrlo[ETHER_ADDR_LEN];
1381 1.60 enami u_char addrhi[ETHER_ADDR_LEN];
1382 1.237 skrll int error;
1383 1.3 hpeyerl
1384 1.245 msaitoh ETHER_LOCK(ec);
1385 1.155 dyoung error = ether_multiaddr(sa, addrlo, addrhi);
1386 1.231 ozaki if (error != 0)
1387 1.231 ozaki goto error;
1388 1.3 hpeyerl
1389 1.3 hpeyerl /*
1390 1.252 maxv * Look up the address in our list.
1391 1.3 hpeyerl */
1392 1.270 yamaguch enm = ether_lookup_multi(addrlo, addrhi, ec);
1393 1.3 hpeyerl if (enm == NULL) {
1394 1.231 ozaki error = ENXIO;
1395 1.231 ozaki goto error;
1396 1.3 hpeyerl }
1397 1.3 hpeyerl if (--enm->enm_refcount != 0) {
1398 1.3 hpeyerl /*
1399 1.3 hpeyerl * Still some claims to this record.
1400 1.3 hpeyerl */
1401 1.231 ozaki error = 0;
1402 1.231 ozaki goto error;
1403 1.3 hpeyerl }
1404 1.252 maxv
1405 1.3 hpeyerl /*
1406 1.3 hpeyerl * No remaining claims to this record; unlink and free it.
1407 1.3 hpeyerl */
1408 1.13 mycroft LIST_REMOVE(enm, enm_list);
1409 1.22 is ec->ec_multicnt--;
1410 1.245 msaitoh ETHER_UNLOCK(ec);
1411 1.252 maxv kmem_free(enm, sizeof(*enm));
1412 1.231 ozaki
1413 1.3 hpeyerl /*
1414 1.3 hpeyerl * Return ENETRESET to inform the driver that the list has changed
1415 1.3 hpeyerl * and its reception filter should be adjusted accordingly.
1416 1.3 hpeyerl */
1417 1.231 ozaki return ENETRESET;
1418 1.252 maxv
1419 1.231 ozaki error:
1420 1.245 msaitoh ETHER_UNLOCK(ec);
1421 1.231 ozaki return error;
1422 1.66 thorpej }
1423 1.66 thorpej
1424 1.170 dyoung void
1425 1.170 dyoung ether_set_ifflags_cb(struct ethercom *ec, ether_cb_t cb)
1426 1.170 dyoung {
1427 1.170 dyoung ec->ec_ifflags_cb = cb;
1428 1.170 dyoung }
1429 1.170 dyoung
1430 1.276 msaitoh void
1431 1.276 msaitoh ether_set_vlan_cb(struct ethercom *ec, ether_vlancb_t cb)
1432 1.276 msaitoh {
1433 1.276 msaitoh
1434 1.276 msaitoh ec->ec_vlan_cb = cb;
1435 1.276 msaitoh }
1436 1.276 msaitoh
1437 1.272 msaitoh static int
1438 1.272 msaitoh ether_ioctl_reinit(struct ethercom *ec)
1439 1.272 msaitoh {
1440 1.272 msaitoh struct ifnet *ifp = &ec->ec_if;
1441 1.272 msaitoh int error;
1442 1.272 msaitoh
1443 1.272 msaitoh switch (ifp->if_flags & (IFF_UP | IFF_RUNNING)) {
1444 1.272 msaitoh case IFF_RUNNING:
1445 1.272 msaitoh /*
1446 1.272 msaitoh * If interface is marked down and it is running,
1447 1.272 msaitoh * then stop and disable it.
1448 1.272 msaitoh */
1449 1.272 msaitoh (*ifp->if_stop)(ifp, 1);
1450 1.272 msaitoh break;
1451 1.272 msaitoh case IFF_UP:
1452 1.272 msaitoh /*
1453 1.272 msaitoh * If interface is marked up and it is stopped, then
1454 1.272 msaitoh * start it.
1455 1.272 msaitoh */
1456 1.272 msaitoh return (*ifp->if_init)(ifp);
1457 1.272 msaitoh case IFF_UP | IFF_RUNNING:
1458 1.272 msaitoh error = 0;
1459 1.272 msaitoh if (ec->ec_ifflags_cb != NULL) {
1460 1.272 msaitoh error = (*ec->ec_ifflags_cb)(ec);
1461 1.272 msaitoh if (error == ENETRESET) {
1462 1.272 msaitoh /*
1463 1.272 msaitoh * Reset the interface to pick up
1464 1.272 msaitoh * changes in any other flags that
1465 1.272 msaitoh * affect the hardware state.
1466 1.272 msaitoh */
1467 1.272 msaitoh return (*ifp->if_init)(ifp);
1468 1.272 msaitoh }
1469 1.272 msaitoh } else
1470 1.272 msaitoh error = (*ifp->if_init)(ifp);
1471 1.272 msaitoh return error;
1472 1.272 msaitoh case 0:
1473 1.272 msaitoh break;
1474 1.272 msaitoh }
1475 1.272 msaitoh
1476 1.272 msaitoh return 0;
1477 1.272 msaitoh }
1478 1.272 msaitoh
1479 1.66 thorpej /*
1480 1.66 thorpej * Common ioctls for Ethernet interfaces. Note, we must be
1481 1.66 thorpej * called at splnet().
1482 1.66 thorpej */
1483 1.66 thorpej int
1484 1.147 christos ether_ioctl(struct ifnet *ifp, u_long cmd, void *data)
1485 1.66 thorpej {
1486 1.272 msaitoh struct ethercom *ec = (void *)ifp;
1487 1.193 msaitoh struct eccapreq *eccr;
1488 1.66 thorpej struct ifreq *ifr = (struct ifreq *)data;
1489 1.170 dyoung struct if_laddrreq *iflr = data;
1490 1.170 dyoung const struct sockaddr_dl *sdl;
1491 1.170 dyoung static const uint8_t zero[ETHER_ADDR_LEN];
1492 1.169 dyoung int error;
1493 1.66 thorpej
1494 1.66 thorpej switch (cmd) {
1495 1.170 dyoung case SIOCINITIFADDR:
1496 1.191 matt {
1497 1.191 matt struct ifaddr *ifa = (struct ifaddr *)data;
1498 1.191 matt if (ifa->ifa_addr->sa_family != AF_LINK
1499 1.247 msaitoh && (ifp->if_flags & (IFF_UP | IFF_RUNNING)) !=
1500 1.247 msaitoh (IFF_UP | IFF_RUNNING)) {
1501 1.170 dyoung ifp->if_flags |= IFF_UP;
1502 1.170 dyoung if ((error = (*ifp->if_init)(ifp)) != 0)
1503 1.170 dyoung return error;
1504 1.170 dyoung }
1505 1.66 thorpej #ifdef INET
1506 1.191 matt if (ifa->ifa_addr->sa_family == AF_INET)
1507 1.191 matt arp_ifinit(ifp, ifa);
1508 1.252 maxv #endif
1509 1.169 dyoung return 0;
1510 1.191 matt }
1511 1.66 thorpej
1512 1.66 thorpej case SIOCSIFMTU:
1513 1.82 thorpej {
1514 1.82 thorpej int maxmtu;
1515 1.82 thorpej
1516 1.82 thorpej if (ec->ec_capabilities & ETHERCAP_JUMBO_MTU)
1517 1.82 thorpej maxmtu = ETHERMTU_JUMBO;
1518 1.82 thorpej else
1519 1.82 thorpej maxmtu = ETHERMTU;
1520 1.82 thorpej
1521 1.82 thorpej if (ifr->ifr_mtu < ETHERMIN || ifr->ifr_mtu > maxmtu)
1522 1.169 dyoung return EINVAL;
1523 1.169 dyoung else if ((error = ifioctl_common(ifp, cmd, data)) != ENETRESET)
1524 1.169 dyoung return error;
1525 1.169 dyoung else if (ifp->if_flags & IFF_UP) {
1526 1.88 thorpej /* Make sure the device notices the MTU change. */
1527 1.169 dyoung return (*ifp->if_init)(ifp);
1528 1.169 dyoung } else
1529 1.169 dyoung return 0;
1530 1.82 thorpej }
1531 1.66 thorpej
1532 1.66 thorpej case SIOCSIFFLAGS:
1533 1.170 dyoung if ((error = ifioctl_common(ifp, cmd, data)) != 0)
1534 1.170 dyoung return error;
1535 1.272 msaitoh return ether_ioctl_reinit(ec);
1536 1.274 ozaki case SIOCGIFFLAGS:
1537 1.274 ozaki error = ifioctl_common(ifp, cmd, data);
1538 1.274 ozaki if (error == 0) {
1539 1.274 ozaki /* Set IFF_ALLMULTI for backcompat */
1540 1.274 ozaki ifr->ifr_flags |= (ec->ec_flags & ETHER_F_ALLMULTI) ?
1541 1.274 ozaki IFF_ALLMULTI : 0;
1542 1.274 ozaki }
1543 1.274 ozaki return error;
1544 1.193 msaitoh case SIOCGETHERCAP:
1545 1.193 msaitoh eccr = (struct eccapreq *)data;
1546 1.193 msaitoh eccr->eccr_capabilities = ec->ec_capabilities;
1547 1.193 msaitoh eccr->eccr_capenable = ec->ec_capenable;
1548 1.193 msaitoh return 0;
1549 1.272 msaitoh case SIOCSETHERCAP:
1550 1.272 msaitoh eccr = (struct eccapreq *)data;
1551 1.272 msaitoh if ((eccr->eccr_capenable & ~ec->ec_capabilities) != 0)
1552 1.272 msaitoh return EINVAL;
1553 1.272 msaitoh if (eccr->eccr_capenable == ec->ec_capenable)
1554 1.272 msaitoh return 0;
1555 1.272 msaitoh #if 0 /* notyet */
1556 1.272 msaitoh ec->ec_capenable = (ec->ec_capenable & ETHERCAP_CANTCHANGE)
1557 1.272 msaitoh | (eccr->eccr_capenable & ~ETHERCAP_CANTCHANGE);
1558 1.272 msaitoh #else
1559 1.272 msaitoh ec->ec_capenable = eccr->eccr_capenable;
1560 1.272 msaitoh #endif
1561 1.272 msaitoh return ether_ioctl_reinit(ec);
1562 1.66 thorpej case SIOCADDMULTI:
1563 1.169 dyoung return ether_addmulti(ifreq_getaddr(cmd, ifr), ec);
1564 1.66 thorpej case SIOCDELMULTI:
1565 1.169 dyoung return ether_delmulti(ifreq_getaddr(cmd, ifr), ec);
1566 1.160 dyoung case SIOCSIFMEDIA:
1567 1.160 dyoung case SIOCGIFMEDIA:
1568 1.275 msaitoh if (ec->ec_mii != NULL)
1569 1.275 msaitoh return ifmedia_ioctl(ifp, ifr, &ec->ec_mii->mii_media,
1570 1.275 msaitoh cmd);
1571 1.275 msaitoh else if (ec->ec_ifmedia != NULL)
1572 1.275 msaitoh return ifmedia_ioctl(ifp, ifr, ec->ec_ifmedia, cmd);
1573 1.275 msaitoh else
1574 1.169 dyoung return ENOTTY;
1575 1.275 msaitoh break;
1576 1.170 dyoung case SIOCALIFADDR:
1577 1.170 dyoung sdl = satocsdl(sstocsa(&iflr->addr));
1578 1.170 dyoung if (sdl->sdl_family != AF_LINK)
1579 1.170 dyoung ;
1580 1.170 dyoung else if (ETHER_IS_MULTICAST(CLLADDR(sdl)))
1581 1.170 dyoung return EINVAL;
1582 1.170 dyoung else if (memcmp(zero, CLLADDR(sdl), sizeof(zero)) == 0)
1583 1.170 dyoung return EINVAL;
1584 1.170 dyoung /*FALLTHROUGH*/
1585 1.170 dyoung default:
1586 1.161 dyoung return ifioctl_common(ifp, cmd, data);
1587 1.66 thorpej }
1588 1.169 dyoung return 0;
1589 1.3 hpeyerl }
1590 1.200 joerg
1591 1.215 christos /*
1592 1.215 christos * Enable/disable passing VLAN packets if the parent interface supports it.
1593 1.215 christos * Return:
1594 1.215 christos * 0: Ok
1595 1.215 christos * -1: Parent interface does not support vlans
1596 1.215 christos * >0: Error
1597 1.215 christos */
1598 1.215 christos int
1599 1.215 christos ether_enable_vlan_mtu(struct ifnet *ifp)
1600 1.215 christos {
1601 1.215 christos int error;
1602 1.215 christos struct ethercom *ec = (void *)ifp;
1603 1.215 christos
1604 1.215 christos /* Parent does not support VLAN's */
1605 1.215 christos if ((ec->ec_capabilities & ETHERCAP_VLAN_MTU) == 0)
1606 1.215 christos return -1;
1607 1.215 christos
1608 1.215 christos /*
1609 1.215 christos * Parent supports the VLAN_MTU capability,
1610 1.215 christos * i.e. can Tx/Rx larger than ETHER_MAX_LEN frames;
1611 1.215 christos * enable it.
1612 1.215 christos */
1613 1.215 christos ec->ec_capenable |= ETHERCAP_VLAN_MTU;
1614 1.215 christos
1615 1.215 christos /* Interface is down, defer for later */
1616 1.215 christos if ((ifp->if_flags & IFF_UP) == 0)
1617 1.215 christos return 0;
1618 1.215 christos
1619 1.215 christos if ((error = if_flags_set(ifp, ifp->if_flags)) == 0)
1620 1.215 christos return 0;
1621 1.215 christos
1622 1.215 christos ec->ec_capenable &= ~ETHERCAP_VLAN_MTU;
1623 1.215 christos return error;
1624 1.215 christos }
1625 1.215 christos
1626 1.215 christos int
1627 1.215 christos ether_disable_vlan_mtu(struct ifnet *ifp)
1628 1.215 christos {
1629 1.215 christos int error;
1630 1.215 christos struct ethercom *ec = (void *)ifp;
1631 1.215 christos
1632 1.215 christos /* We still have VLAN's, defer for later */
1633 1.215 christos if (ec->ec_nvlans != 0)
1634 1.215 christos return 0;
1635 1.215 christos
1636 1.215 christos /* Parent does not support VLAB's, nothing to do. */
1637 1.215 christos if ((ec->ec_capenable & ETHERCAP_VLAN_MTU) == 0)
1638 1.215 christos return -1;
1639 1.215 christos
1640 1.215 christos /*
1641 1.215 christos * Disable Tx/Rx of VLAN-sized frames.
1642 1.215 christos */
1643 1.215 christos ec->ec_capenable &= ~ETHERCAP_VLAN_MTU;
1644 1.250 maxv
1645 1.215 christos /* Interface is down, defer for later */
1646 1.215 christos if ((ifp->if_flags & IFF_UP) == 0)
1647 1.215 christos return 0;
1648 1.215 christos
1649 1.215 christos if ((error = if_flags_set(ifp, ifp->if_flags)) == 0)
1650 1.215 christos return 0;
1651 1.215 christos
1652 1.215 christos ec->ec_capenable |= ETHERCAP_VLAN_MTU;
1653 1.215 christos return error;
1654 1.215 christos }
1655 1.215 christos
1656 1.200 joerg static int
1657 1.200 joerg ether_multicast_sysctl(SYSCTLFN_ARGS)
1658 1.200 joerg {
1659 1.200 joerg struct ether_multi *enm;
1660 1.200 joerg struct ifnet *ifp;
1661 1.200 joerg struct ethercom *ec;
1662 1.223 ozaki int error = 0;
1663 1.200 joerg size_t written;
1664 1.223 ozaki struct psref psref;
1665 1.237 skrll int bound;
1666 1.233 ozaki unsigned int multicnt;
1667 1.233 ozaki struct ether_multi_sysctl *addrs;
1668 1.233 ozaki int i;
1669 1.200 joerg
1670 1.200 joerg if (namelen != 1)
1671 1.200 joerg return EINVAL;
1672 1.200 joerg
1673 1.223 ozaki bound = curlwp_bind();
1674 1.223 ozaki ifp = if_get_byindex(name[0], &psref);
1675 1.223 ozaki if (ifp == NULL) {
1676 1.223 ozaki error = ENODEV;
1677 1.223 ozaki goto out;
1678 1.223 ozaki }
1679 1.200 joerg if (ifp->if_type != IFT_ETHER) {
1680 1.223 ozaki if_put(ifp, &psref);
1681 1.200 joerg *oldlenp = 0;
1682 1.223 ozaki goto out;
1683 1.200 joerg }
1684 1.200 joerg ec = (struct ethercom *)ifp;
1685 1.200 joerg
1686 1.200 joerg if (oldp == NULL) {
1687 1.223 ozaki if_put(ifp, &psref);
1688 1.233 ozaki *oldlenp = ec->ec_multicnt * sizeof(*addrs);
1689 1.223 ozaki goto out;
1690 1.200 joerg }
1691 1.200 joerg
1692 1.233 ozaki /*
1693 1.233 ozaki * ec->ec_lock is a spin mutex so we cannot call sysctl_copyout, which
1694 1.251 maxv * is sleepable, while holding it. Copy data to a local buffer first
1695 1.251 maxv * with the lock taken and then call sysctl_copyout without holding it.
1696 1.233 ozaki */
1697 1.233 ozaki retry:
1698 1.233 ozaki multicnt = ec->ec_multicnt;
1699 1.251 maxv
1700 1.251 maxv if (multicnt == 0) {
1701 1.251 maxv if_put(ifp, &psref);
1702 1.251 maxv *oldlenp = 0;
1703 1.251 maxv goto out;
1704 1.251 maxv }
1705 1.251 maxv
1706 1.252 maxv addrs = kmem_zalloc(sizeof(*addrs) * multicnt, KM_SLEEP);
1707 1.200 joerg
1708 1.245 msaitoh ETHER_LOCK(ec);
1709 1.251 maxv if (multicnt != ec->ec_multicnt) {
1710 1.251 maxv /* The number of multicast addresses has changed */
1711 1.245 msaitoh ETHER_UNLOCK(ec);
1712 1.233 ozaki kmem_free(addrs, sizeof(*addrs) * multicnt);
1713 1.233 ozaki goto retry;
1714 1.233 ozaki }
1715 1.233 ozaki
1716 1.233 ozaki i = 0;
1717 1.200 joerg LIST_FOREACH(enm, &ec->ec_multiaddrs, enm_list) {
1718 1.233 ozaki struct ether_multi_sysctl *addr = &addrs[i];
1719 1.233 ozaki addr->enm_refcount = enm->enm_refcount;
1720 1.233 ozaki memcpy(addr->enm_addrlo, enm->enm_addrlo, ETHER_ADDR_LEN);
1721 1.233 ozaki memcpy(addr->enm_addrhi, enm->enm_addrhi, ETHER_ADDR_LEN);
1722 1.233 ozaki i++;
1723 1.233 ozaki }
1724 1.245 msaitoh ETHER_UNLOCK(ec);
1725 1.233 ozaki
1726 1.233 ozaki error = 0;
1727 1.233 ozaki written = 0;
1728 1.233 ozaki for (i = 0; i < multicnt; i++) {
1729 1.233 ozaki struct ether_multi_sysctl *addr = &addrs[i];
1730 1.233 ozaki
1731 1.233 ozaki if (written + sizeof(*addr) > *oldlenp)
1732 1.200 joerg break;
1733 1.233 ozaki error = sysctl_copyout(l, addr, oldp, sizeof(*addr));
1734 1.200 joerg if (error)
1735 1.200 joerg break;
1736 1.233 ozaki written += sizeof(*addr);
1737 1.233 ozaki oldp = (char *)oldp + sizeof(*addr);
1738 1.200 joerg }
1739 1.233 ozaki kmem_free(addrs, sizeof(*addrs) * multicnt);
1740 1.233 ozaki
1741 1.223 ozaki if_put(ifp, &psref);
1742 1.200 joerg
1743 1.200 joerg *oldlenp = written;
1744 1.223 ozaki out:
1745 1.223 ozaki curlwp_bindx(bound);
1746 1.200 joerg return error;
1747 1.200 joerg }
1748 1.200 joerg
1749 1.234 ozaki static void
1750 1.234 ozaki ether_sysctl_setup(struct sysctllog **clog)
1751 1.200 joerg {
1752 1.200 joerg const struct sysctlnode *rnode = NULL;
1753 1.200 joerg
1754 1.200 joerg sysctl_createv(clog, 0, NULL, &rnode,
1755 1.200 joerg CTLFLAG_PERMANENT,
1756 1.200 joerg CTLTYPE_NODE, "ether",
1757 1.200 joerg SYSCTL_DESCR("Ethernet-specific information"),
1758 1.200 joerg NULL, 0, NULL, 0,
1759 1.200 joerg CTL_NET, CTL_CREATE, CTL_EOL);
1760 1.200 joerg
1761 1.200 joerg sysctl_createv(clog, 0, &rnode, NULL,
1762 1.200 joerg CTLFLAG_PERMANENT,
1763 1.200 joerg CTLTYPE_NODE, "multicast",
1764 1.200 joerg SYSCTL_DESCR("multicast addresses"),
1765 1.200 joerg ether_multicast_sysctl, 0, NULL, 0,
1766 1.200 joerg CTL_CREATE, CTL_EOL);
1767 1.301 knakahar
1768 1.301 knakahar sysctl_createv(clog, 0, &rnode, NULL,
1769 1.301 knakahar CTLFLAG_PERMANENT | CTLFLAG_READWRITE,
1770 1.301 knakahar CTLTYPE_STRING, "rps_hash",
1771 1.301 knakahar SYSCTL_DESCR("Interface rps hash function control"),
1772 1.301 knakahar sysctl_pktq_rps_hash_handler, 0, (void *)ðer_pktq_rps_hash_p,
1773 1.301 knakahar PKTQ_RPS_HASH_NAME_LEN,
1774 1.301 knakahar CTL_CREATE, CTL_EOL);
1775 1.200 joerg }
1776 1.203 ozaki
1777 1.203 ozaki void
1778 1.203 ozaki etherinit(void)
1779 1.203 ozaki {
1780 1.234 ozaki
1781 1.278 msaitoh #ifdef DIAGNOSTIC
1782 1.203 ozaki mutex_init(&bigpktpps_lock, MUTEX_DEFAULT, IPL_NET);
1783 1.278 msaitoh #endif
1784 1.301 knakahar ether_pktq_rps_hash_p = pktq_rps_hash_default;
1785 1.234 ozaki ether_sysctl_setup(NULL);
1786 1.203 ozaki }
1787