Home | History | Annotate | Line # | Download | only in net
if_ethersubr.c revision 1.294
      1  1.294  yamaguch /*	$NetBSD: if_ethersubr.c,v 1.294 2021/09/30 03:15:25 yamaguchi Exp $	*/
      2   1.44    itojun 
      3   1.44    itojun /*
      4   1.44    itojun  * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
      5   1.44    itojun  * All rights reserved.
      6  1.120     perry  *
      7   1.44    itojun  * Redistribution and use in source and binary forms, with or without
      8   1.44    itojun  * modification, are permitted provided that the following conditions
      9   1.44    itojun  * are met:
     10   1.44    itojun  * 1. Redistributions of source code must retain the above copyright
     11   1.44    itojun  *    notice, this list of conditions and the following disclaimer.
     12   1.44    itojun  * 2. Redistributions in binary form must reproduce the above copyright
     13   1.44    itojun  *    notice, this list of conditions and the following disclaimer in the
     14   1.44    itojun  *    documentation and/or other materials provided with the distribution.
     15   1.44    itojun  * 3. Neither the name of the project nor the names of its contributors
     16   1.44    itojun  *    may be used to endorse or promote products derived from this software
     17   1.44    itojun  *    without specific prior written permission.
     18  1.120     perry  *
     19   1.44    itojun  * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
     20   1.44    itojun  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     21   1.44    itojun  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     22   1.44    itojun  * ARE DISCLAIMED.  IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
     23   1.44    itojun  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     24   1.44    itojun  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     25   1.44    itojun  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     26   1.44    itojun  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     27   1.44    itojun  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     28   1.44    itojun  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     29   1.44    itojun  * SUCH DAMAGE.
     30   1.44    itojun  */
     31    1.9       cgd 
     32    1.1       cgd /*
     33    1.8   mycroft  * Copyright (c) 1982, 1989, 1993
     34    1.8   mycroft  *	The Regents of the University of California.  All rights reserved.
     35    1.1       cgd  *
     36    1.1       cgd  * Redistribution and use in source and binary forms, with or without
     37    1.1       cgd  * modification, are permitted provided that the following conditions
     38    1.1       cgd  * are met:
     39    1.1       cgd  * 1. Redistributions of source code must retain the above copyright
     40    1.1       cgd  *    notice, this list of conditions and the following disclaimer.
     41    1.1       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     42    1.1       cgd  *    notice, this list of conditions and the following disclaimer in the
     43    1.1       cgd  *    documentation and/or other materials provided with the distribution.
     44  1.113       agc  * 3. Neither the name of the University nor the names of its contributors
     45    1.1       cgd  *    may be used to endorse or promote products derived from this software
     46    1.1       cgd  *    without specific prior written permission.
     47    1.1       cgd  *
     48    1.1       cgd  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     49    1.1       cgd  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     50    1.1       cgd  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     51    1.1       cgd  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     52    1.1       cgd  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     53    1.1       cgd  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     54    1.1       cgd  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     55    1.1       cgd  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     56    1.1       cgd  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     57    1.1       cgd  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     58    1.1       cgd  * SUCH DAMAGE.
     59    1.1       cgd  *
     60   1.27      fvdl  *	@(#)if_ethersubr.c	8.2 (Berkeley) 4/4/96
     61    1.1       cgd  */
     62   1.90     lukem 
     63   1.90     lukem #include <sys/cdefs.h>
     64  1.294  yamaguch __KERNEL_RCSID(0, "$NetBSD: if_ethersubr.c,v 1.294 2021/09/30 03:15:25 yamaguchi Exp $");
     65    1.1       cgd 
     66  1.212     pooka #ifdef _KERNEL_OPT
     67   1.33  jonathan #include "opt_inet.h"
     68   1.33  jonathan #include "opt_atalk.h"
     69  1.112    martin #include "opt_mbuftrace.h"
     70  1.182    kefren #include "opt_mpls.h"
     71   1.30      matt #include "opt_gateway.h"
     72  1.135     pavel #include "opt_pppoe.h"
     73  1.206     ozaki #include "opt_net_mpsafe.h"
     74  1.212     pooka #endif
     75  1.212     pooka 
     76   1.59   thorpej #include "vlan.h"
     77   1.81    martin #include "pppoe.h"
     78   1.78   thorpej #include "bridge.h"
     79   1.93    martin #include "arp.h"
     80  1.121      yamt #include "agr.h"
     81  1.293  yamaguch #include "lagg.h"
     82   1.30      matt 
     83  1.200     joerg #include <sys/sysctl.h>
     84    1.4   mycroft #include <sys/mbuf.h>
     85  1.211     ozaki #include <sys/mutex.h>
     86    1.4   mycroft #include <sys/ioctl.h>
     87    1.4   mycroft #include <sys/errno.h>
     88  1.158    dyoung #include <sys/device.h>
     89  1.284  riastrad #include <sys/entropy.h>
     90  1.207  riastrad #include <sys/rndsource.h>
     91  1.216     ozaki #include <sys/cpu.h>
     92  1.231     ozaki #include <sys/kmem.h>
     93    1.8   mycroft 
     94    1.4   mycroft #include <net/if.h>
     95    1.4   mycroft #include <net/netisr.h>
     96    1.4   mycroft #include <net/route.h>
     97    1.4   mycroft #include <net/if_llc.h>
     98    1.4   mycroft #include <net/if_dl.h>
     99    1.8   mycroft #include <net/if_types.h>
    100  1.211     ozaki #include <net/pktqueue.h>
    101   1.93    martin 
    102  1.158    dyoung #include <net/if_media.h>
    103  1.158    dyoung #include <dev/mii/mii.h>
    104  1.158    dyoung #include <dev/mii/miivar.h>
    105  1.158    dyoung 
    106   1.93    martin #if NARP == 0
    107   1.93    martin /*
    108  1.102      jmmv  * XXX there should really be a way to issue this warning from within config(8)
    109   1.93    martin  */
    110  1.111    martin #error You have included NETATALK or a pseudo-device in your configuration that depends on the presence of ethernet interfaces, but have no such interfaces configured. Check if you really need pseudo-device bridge, pppoe, vlan or options NETATALK.
    111   1.93    martin #endif
    112    1.1       cgd 
    113   1.69   thorpej #include <net/bpf.h>
    114   1.69   thorpej 
    115   1.22        is #include <net/if_ether.h>
    116   1.59   thorpej #include <net/if_vlanvar.h>
    117   1.22        is 
    118   1.81    martin #if NPPPOE > 0
    119   1.81    martin #include <net/if_pppoe.h>
    120   1.81    martin #endif
    121   1.81    martin 
    122  1.121      yamt #if NAGR > 0
    123  1.121      yamt #include <net/agr/ieee8023_slowprotocols.h>	/* XXX */
    124  1.121      yamt #include <net/agr/ieee8023ad.h>
    125  1.121      yamt #include <net/agr/if_agrvar.h>
    126  1.121      yamt #endif
    127  1.121      yamt 
    128  1.293  yamaguch #include <net/lagg/if_laggvar.h>
    129  1.293  yamaguch 
    130   1.78   thorpej #if NBRIDGE > 0
    131   1.78   thorpej #include <net/if_bridgevar.h>
    132   1.78   thorpej #endif
    133   1.78   thorpej 
    134   1.15      phil #include <netinet/in.h>
    135    1.1       cgd #ifdef INET
    136    1.4   mycroft #include <netinet/in_var.h>
    137    1.1       cgd #endif
    138   1.22        is #include <netinet/if_inarp.h>
    139    1.1       cgd 
    140   1.44    itojun #ifdef INET6
    141   1.44    itojun #ifndef INET
    142   1.44    itojun #include <netinet/in.h>
    143   1.44    itojun #endif
    144   1.44    itojun #include <netinet6/in6_var.h>
    145   1.44    itojun #include <netinet6/nd6.h>
    146   1.44    itojun #endif
    147   1.44    itojun 
    148  1.133  liamjfoy #include "carp.h"
    149  1.133  liamjfoy #if NCARP > 0
    150  1.133  liamjfoy #include <netinet/ip_carp.h>
    151  1.133  liamjfoy #endif
    152  1.133  liamjfoy 
    153   1.23  christos #ifdef NETATALK
    154   1.23  christos #include <netatalk/at.h>
    155   1.23  christos #include <netatalk/at_var.h>
    156   1.23  christos #include <netatalk/at_extern.h>
    157   1.23  christos 
    158   1.23  christos #define llc_snap_org_code llc_un.type_snap.org_code
    159   1.23  christos #define llc_snap_ether_type llc_un.type_snap.ether_type
    160   1.23  christos 
    161   1.23  christos extern u_char	at_org_code[3];
    162   1.23  christos extern u_char	aarp_org_code[3];
    163   1.23  christos #endif /* NETATALK */
    164   1.23  christos 
    165  1.182    kefren #ifdef MPLS
    166  1.182    kefren #include <netmpls/mpls.h>
    167  1.182    kefren #include <netmpls/mpls_var.h>
    168  1.182    kefren #endif
    169  1.182    kefren 
/*
 * Compile-time checks: an Ethernet address must be 6 bytes and an
 * Ethernet header 14 bytes.
 */
    170  1.292       roy CTASSERT(sizeof(struct ether_addr) == 6);
    171  1.292       roy CTASSERT(sizeof(struct ether_header) == 14);
    172  1.292       roy 
/*
 * DIAGNOSTIC-only packets-per-second limiter state.  Its users are not in
 * this part of the file; going by the names it rate-limits a message about
 * oversized packets -- TODO confirm.
 */
    173  1.278   msaitoh #ifdef DIAGNOSTIC
    174  1.123      matt static struct timeval bigpktppslim_last;
    175  1.123      matt static int bigpktppslim = 2;	/* XXX */
    176  1.123      matt static int bigpktpps_count;
    177  1.203     ozaki static kmutex_t bigpktpps_lock __cacheline_aligned;
    178  1.278   msaitoh #endif
    179  1.123      matt 
/* The all-ones Ethernet broadcast address, ff:ff:ff:ff:ff:ff. */
    180  1.118      yamt const uint8_t etherbroadcastaddr[ETHER_ADDR_LEN] =
    181  1.118      yamt     { 0xff, 0xff, 0xff, 0xff, 0xff, 0xff };
/* Multicast address 01:80:c2:00:00:02; per its name, the slow-protocols group. */
    182  1.121      yamt const uint8_t ethermulticastaddr_slowprotocols[ETHER_ADDR_LEN] =
    183  1.121      yamt     { 0x01, 0x80, 0xc2, 0x00, 0x00, 0x02 };
/*
 * Store e in the local variable `error' and jump to the local label `bad'.
 * Both must exist in the function that uses the macro.
 */
    184    1.8   mycroft #define senderr(e) { error = (e); goto bad;}
    185    1.1       cgd 
/*
 * Input hook taking an interface and an mbuf and returning an mbuf.  It is
 * a file-scope pointer, so it is NULL until something assigns it.
 */
    186  1.293  yamaguch /* if_lagg(4) support */
    187  1.293  yamaguch struct mbuf *(*lagg_input_ethernet_p)(struct ifnet *, struct mbuf *);
    188  1.293  yamaguch 
/* Forward declaration; the definition follows directly below. */
    189  1.261      maxv static int ether_output(struct ifnet *, struct mbuf *,
    190  1.261      maxv     const struct sockaddr *, const struct rtentry *);
    191   1.42   thorpej 
    192    1.1       cgd /*
    193    1.1       cgd  * Ethernet output routine.
    194    1.1       cgd  * Encapsulate a packet of type family for the local net.
    195   1.22        is  * Assumes that ifp is actually pointer to ethercom structure.
 *
 * ifp0	interface the caller selected.  With carp configured, if it is a
 *	carp interface (IFT_CARP) the frame is sent through
 *	ifp0->if_carpdev, using the carp interface's link-layer address as
 *	the Ethernet source.
 * m0	packet to send; it must carry a packet header (M_PKTHDR).
 * dst	destination; dst->sa_family selects how the destination address
 *	and the ethertype are obtained.
 * rt	route entry, only passed on to arpresolve(), nd6_resolve() and
 *	looutput().
 *
 * Returns 0 or an errno value.  Every exit through the `bad' label
 * increments if_oerrors and frees the mbuf if one is still held.
    196    1.1       cgd  */
    197   1.42   thorpej static int
    198  1.178    dyoung ether_output(struct ifnet * const ifp0, struct mbuf * const m0,
    199  1.256      maxv     const struct sockaddr * const dst, const struct rtentry *rt)
    200    1.1       cgd {
    201  1.256      maxv 	uint8_t esrc[ETHER_ADDR_LEN], edst[ETHER_ADDR_LEN];
    202  1.162      matt 	uint16_t etype = 0;
    203  1.122  christos 	int error = 0, hdrcmplt = 0;
    204   1.29       mrg 	struct mbuf *m = m0;
    205  1.151    dyoung 	struct mbuf *mcopy = NULL;
    206   1.29       mrg 	struct ether_header *eh;
    207  1.133  liamjfoy 	struct ifnet *ifp = ifp0;
    208   1.24  christos #ifdef INET
    209   1.22        is 	struct arphdr *ah;
    210  1.260      maxv #endif
    211   1.23  christos #ifdef NETATALK
    212   1.23  christos 	struct at_ifaddr *aa;
    213  1.260      maxv #endif
    214    1.1       cgd 
    215  1.104      matt #ifdef MBUFTRACE
    216  1.116  jonathan 	m_claimm(m, ifp->if_mowner);
    217  1.104      matt #endif
    218  1.133  liamjfoy 
    219  1.133  liamjfoy #if NCARP > 0
    220  1.133  liamjfoy 	if (ifp->if_type == IFT_CARP) {
    221  1.133  liamjfoy 		struct ifaddr *ifa;
    222  1.227     ozaki 		int s = pserialize_read_enter();
    223  1.133  liamjfoy 
    224  1.133  liamjfoy 		/* loop back if this is going to the carp interface */
    225  1.133  liamjfoy 		if (dst != NULL && ifp0->if_link_state == LINK_STATE_UP &&
    226  1.227     ozaki 		    (ifa = ifa_ifwithaddr(dst)) != NULL) {
    227  1.227     ozaki 			if (ifa->ifa_ifp == ifp0) {
    228  1.227     ozaki 				pserialize_read_exit(s);
    229  1.227     ozaki 				return looutput(ifp0, m, dst, rt);
    230  1.227     ozaki 			}
    231  1.227     ozaki 		}
    232  1.227     ozaki 		pserialize_read_exit(s);
    233  1.133  liamjfoy 
		/*
		 * From here on ifp is the device underneath carp, while
		 * ifp0 remains the carp interface itself.
		 */
    234  1.133  liamjfoy 		ifp = ifp->if_carpdev;
    235  1.133  liamjfoy 		/* ac = (struct arpcom *)ifp; */
    236  1.133  liamjfoy 
    237  1.247   msaitoh 		if ((ifp0->if_flags & (IFF_UP | IFF_RUNNING)) !=
    238  1.247   msaitoh 		    (IFF_UP | IFF_RUNNING))
    239  1.133  liamjfoy 			senderr(ENETDOWN);
    240  1.133  liamjfoy 	}
    241  1.260      maxv #endif
    242  1.133  liamjfoy 
    243  1.247   msaitoh 	if ((ifp->if_flags & (IFF_UP | IFF_RUNNING)) != (IFF_UP | IFF_RUNNING))
    244    1.8   mycroft 		senderr(ENETDOWN);
    245   1.72   thorpej 
	/* Work out the destination address (edst) and the ethertype. */
    246    1.1       cgd 	switch (dst->sa_family) {
    247    1.1       cgd 
    248    1.1       cgd #ifdef INET
    249    1.1       cgd 	case AF_INET:
    250  1.261      maxv 		if (m->m_flags & M_BCAST) {
    251  1.256      maxv 			memcpy(edst, etherbroadcastaddr, sizeof(edst));
    252  1.261      maxv 		} else if (m->m_flags & M_MCAST) {
    253  1.145    dyoung 			ETHER_MAP_IP_MULTICAST(&satocsin(dst)->sin_addr, edst);
    254  1.261      maxv 		} else {
			/*
			 * A resolver error ends the function without going
			 * through `bad'; EWOULDBLOCK is reported to the
			 * caller as success.
			 * NOTE(review): presumably arpresolve() keeps or
			 * frees m whenever it fails -- confirm.
			 */
    255  1.281    kardel 			error = arpresolve(ifp0, rt, m, dst, edst, sizeof(edst));
    256  1.260      maxv 			if (error)
    257  1.260      maxv 				return (error == EWOULDBLOCK) ? 0 : error;
    258  1.224  knakahar 		}
    259    1.3   hpeyerl 		/* If broadcasting on a simplex interface, loopback a copy */
    260    1.3   hpeyerl 		if ((m->m_flags & M_BCAST) && (ifp->if_flags & IFF_SIMPLEX))
    261  1.266      maxv 			mcopy = m_copypacket(m, M_DONTWAIT);
    262   1.17   mycroft 		etype = htons(ETHERTYPE_IP);
    263    1.8   mycroft 		break;
    264   1.22        is 
    265   1.22        is 	case AF_ARP:
    266   1.22        is 		ah = mtod(m, struct arphdr *);
    267  1.261      maxv 		if (m->m_flags & M_BCAST) {
    268  1.256      maxv 			memcpy(edst, etherbroadcastaddr, sizeof(edst));
    269  1.261      maxv 		} else {
    270  1.147  christos 			void *tha = ar_tha(ah);
    271  1.131       mrg 
    272  1.173  christos 			if (tha == NULL) {
    273  1.258      maxv 				/* fake with ARPHRD_IEEE1394 */
    274  1.236      maxv 				m_freem(m);
    275  1.173  christos 				return 0;
    276  1.173  christos 			}
    277  1.146    dyoung 			memcpy(edst, tha, sizeof(edst));
    278  1.131       mrg 		}
    279  1.120     perry 
    280   1.22        is 		ah->ar_hrd = htons(ARPHRD_ETHER);
    281   1.22        is 
		/* Reverse-ARP operations get their own ethertype. */
    282  1.107    itojun 		switch (ntohs(ah->ar_op)) {
    283   1.22        is 		case ARPOP_REVREQUEST:
    284   1.22        is 		case ARPOP_REVREPLY:
    285   1.22        is 			etype = htons(ETHERTYPE_REVARP);
    286   1.22        is 			break;
    287   1.22        is 
    288   1.22        is 		case ARPOP_REQUEST:
    289   1.22        is 		case ARPOP_REPLY:
    290   1.22        is 		default:
    291   1.22        is 			etype = htons(ETHERTYPE_ARP);
    292   1.22        is 		}
    293   1.22        is 		break;
    294    1.1       cgd #endif
    295  1.256      maxv 
    296   1.44    itojun #ifdef INET6
    297   1.44    itojun 	case AF_INET6:
    298  1.261      maxv 		if (m->m_flags & M_BCAST) {
    299  1.256      maxv 			memcpy(edst, etherbroadcastaddr, sizeof(edst));
    300  1.261      maxv 		} else if (m->m_flags & M_MCAST) {
    301  1.238     ozaki 			ETHER_MAP_IPV6_MULTICAST(&satocsin6(dst)->sin6_addr,
    302  1.238     ozaki 			    edst);
    303  1.238     ozaki 		} else {
			/* Same error convention as the AF_INET case above. */
    304  1.281    kardel 			error = nd6_resolve(ifp0, rt, m, dst, edst,
    305  1.238     ozaki 			    sizeof(edst));
    306  1.261      maxv 			if (error)
    307  1.261      maxv 				return (error == EWOULDBLOCK) ? 0 : error;
    308   1.51    itojun 		}
    309   1.44    itojun 		etype = htons(ETHERTYPE_IPV6);
    310   1.44    itojun 		break;
    311   1.44    itojun #endif
    312  1.256      maxv 
    313   1.23  christos #ifdef NETATALK
    314  1.250      maxv 	case AF_APPLETALK: {
    315  1.227     ozaki 		struct ifaddr *ifa;
    316  1.227     ozaki 		int s;
    317  1.227     ozaki 
		/*
		 * The whole case runs with the kernel lock held; every way
		 * out of it releases the lock again.
		 */
    318  1.224  knakahar 		KERNEL_LOCK(1, NULL);
    319  1.256      maxv 
    320  1.226       rjs 		if (!aarpresolve(ifp, m, (const struct sockaddr_at *)dst, edst)) {
    321  1.224  knakahar 			KERNEL_UNLOCK_ONE(NULL);
    322  1.261      maxv 			return 0;
    323   1.23  christos 		}
    324  1.256      maxv 
    325   1.23  christos 		/*
    326   1.23  christos 		 * ifaddr is the first thing in at_ifaddr
    327   1.23  christos 		 */
    328  1.227     ozaki 		s = pserialize_read_enter();
    329  1.227     ozaki 		ifa = at_ifawithnet((const struct sockaddr_at *)dst, ifp);
    330  1.227     ozaki 		if (ifa == NULL) {
    331  1.227     ozaki 			pserialize_read_exit(s);
    332  1.227     ozaki 			KERNEL_UNLOCK_ONE(NULL);
    333  1.260      maxv 			senderr(EADDRNOTAVAIL);
    334  1.224  knakahar 		}
    335  1.227     ozaki 		aa = (struct at_ifaddr *)ifa;
    336  1.120     perry 
    337   1.23  christos 		/*
    338   1.23  christos 		 * In the phase 2 case, we need to prepend an mbuf for the
    339  1.265      maxv 		 * llc header.
    340   1.23  christos 		 */
    341   1.23  christos 		if (aa->aa_flags & AFA_PHASE2) {
    342   1.23  christos 			struct llc llc;
    343   1.23  christos 
    344   1.43    bouyer 			M_PREPEND(m, sizeof(struct llc), M_DONTWAIT);
    345  1.256      maxv 			if (m == NULL) {
    346  1.260      maxv 				pserialize_read_exit(s);
    347  1.256      maxv 				KERNEL_UNLOCK_ONE(NULL);
    348  1.256      maxv 				senderr(ENOBUFS);
    349  1.256      maxv 			}
    350  1.256      maxv 
			/*
			 * etype stays 0 on this path, so the code after the
			 * switch stores the packet length in the type field.
			 */
    351   1.23  christos 			llc.llc_dsap = llc.llc_ssap = LLC_SNAP_LSAP;
    352   1.23  christos 			llc.llc_control = LLC_UI;
    353  1.146    dyoung 			memcpy(llc.llc_snap_org_code, at_org_code,
    354   1.23  christos 			    sizeof(llc.llc_snap_org_code));
    355   1.38       kim 			llc.llc_snap_ether_type = htons(ETHERTYPE_ATALK);
    356  1.147  christos 			memcpy(mtod(m, void *), &llc, sizeof(struct llc));
    357   1.23  christos 		} else {
    358   1.38       kim 			etype = htons(ETHERTYPE_ATALK);
    359   1.23  christos 		}
    360  1.227     ozaki 		pserialize_read_exit(s);
    361  1.224  knakahar 		KERNEL_UNLOCK_ONE(NULL);
    362   1.23  christos 		break;
    363  1.250      maxv 	}
    364   1.23  christos #endif /* NETATALK */
    365  1.256      maxv 
	/*
	 * The caller supplies the header: dst->sa_data is read as a struct
	 * ether_header.  HDRCMPLT additionally takes the source address
	 * from it, then shares the AF_UNSPEC code for the rest.
	 */
    366   1.31   thorpej 	case pseudo_AF_HDRCMPLT:
    367   1.31   thorpej 		hdrcmplt = 1;
    368  1.146    dyoung 		memcpy(esrc,
    369  1.146    dyoung 		    ((const struct ether_header *)dst->sa_data)->ether_shost,
    370  1.146    dyoung 		    sizeof(esrc));
    371   1.31   thorpej 		/* FALLTHROUGH */
    372   1.31   thorpej 
    373    1.1       cgd 	case AF_UNSPEC:
    374  1.250      maxv 		memcpy(edst,
    375  1.146    dyoung 		    ((const struct ether_header *)dst->sa_data)->ether_dhost,
    376  1.146    dyoung 		    sizeof(edst));
    377    1.8   mycroft 		/* AF_UNSPEC doesn't swap the byte order of the ether_type. */
    378  1.145    dyoung 		etype = ((const struct ether_header *)dst->sa_data)->ether_type;
    379    1.8   mycroft 		break;
    380    1.1       cgd 
    381    1.1       cgd 	default:
    382   1.21  christos 		printf("%s: can't handle af%d\n", ifp->if_xname,
    383  1.261      maxv 		    dst->sa_family);
    384    1.8   mycroft 		senderr(EAFNOSUPPORT);
    385    1.1       cgd 	}
    386    1.1       cgd 
    387  1.182    kefren #ifdef MPLS
    388  1.210     ozaki 	{
    389  1.210     ozaki 		struct m_tag *mtag;
    390  1.271      maxv 		mtag = m_tag_find(m, PACKET_TAG_MPLS);
    391  1.210     ozaki 		if (mtag != NULL) {
    392  1.210     ozaki 			/* Having the tag itself indicates it's MPLS */
    393  1.184    dyoung 			etype = htons(ETHERTYPE_MPLS);
    394  1.210     ozaki 			m_tag_delete(m, mtag);
    395  1.210     ozaki 		}
    396  1.184    dyoung 	}
    397  1.182    kefren #endif
    398  1.182    kefren 
	/* Hand over the copy made for a broadcast on a simplex interface. */
    399    1.1       cgd 	if (mcopy)
    400  1.145    dyoung 		(void)looutput(ifp, mcopy, dst, rt);
    401   1.16   mycroft 
    402  1.256      maxv 	KASSERT((m->m_flags & M_PKTHDR) != 0);
    403  1.256      maxv 
    404  1.256      maxv 	/*
    405  1.256      maxv 	 * If no ether type is set, this must be a 802.2 formatted packet.
    406   1.50      matt 	 */
    407   1.50      matt 	if (etype == 0)
    408   1.50      matt 		etype = htons(m->m_pkthdr.len);
    409  1.256      maxv 
    410    1.1       cgd 	/*
    411  1.256      maxv 	 * Add local net header. If no space in first mbuf, allocate another.
    412    1.1       cgd 	 */
    413  1.256      maxv 	M_PREPEND(m, sizeof(struct ether_header), M_DONTWAIT);
    414  1.256      maxv 	if (m == NULL)
    415    1.8   mycroft 		senderr(ENOBUFS);
    416  1.256      maxv 
    417    1.1       cgd 	eh = mtod(m, struct ether_header *);
    418   1.96   thorpej 	/* Note: etype is already in network byte order. */
    419  1.256      maxv 	memcpy(&eh->ether_type, &etype, sizeof(eh->ether_type));
    420  1.250      maxv 	memcpy(eh->ether_dhost, edst, sizeof(edst));
    421  1.261      maxv 	if (hdrcmplt) {
    422  1.146    dyoung 		memcpy(eh->ether_shost, esrc, sizeof(eh->ether_shost));
    423  1.261      maxv 	} else {
    424  1.153    dyoung 	 	memcpy(eh->ether_shost, CLLADDR(ifp->if_sadl),
    425   1.31   thorpej 		    sizeof(eh->ether_shost));
    426  1.261      maxv 	}
    427   1.77   thorpej 
    428  1.133  liamjfoy #if NCARP > 0
	/*
	 * A frame sent through carp carries the carp interface's address as
	 * its source; this overwrites whatever was stored just above,
	 * including a source supplied via HDRCMPLT.
	 */
    429  1.133  liamjfoy 	if (ifp0 != ifp && ifp0->if_type == IFT_CARP) {
    430  1.153    dyoung 	 	memcpy(eh->ether_shost, CLLADDR(ifp0->if_sadl),
    431  1.133  liamjfoy 		    sizeof(eh->ether_shost));
    432  1.133  liamjfoy 	}
    433  1.256      maxv #endif
    434  1.133  liamjfoy 
	/*
	 * Run the output packet-filter hooks.  They are given &m; a failure
	 * is returned as is, and a NULL m afterwards is treated as success
	 * with nothing left to send.
	 */
    435  1.195     rmind 	if ((error = pfil_run_hooks(ifp->if_pfil, &m, ifp, PFIL_OUT)) != 0)
    436  1.261      maxv 		return error;
    437   1.77   thorpej 	if (m == NULL)
    438  1.261      maxv 		return 0;
    439   1.77   thorpej 
    440   1.78   thorpej #if NBRIDGE > 0
    441   1.78   thorpej 	/*
    442   1.78   thorpej 	 * Bridges require special output handling.
    443   1.78   thorpej 	 */
    444   1.78   thorpej 	if (ifp->if_bridge)
    445  1.256      maxv 		return bridge_output(ifp, m, NULL, NULL);
    446   1.78   thorpej #endif
    447   1.78   thorpej 
    448  1.133  liamjfoy #if NCARP > 0
	/*
	 * Account the output bytes on the carp interface (ifp0).
	 * NOTE(review): m already includes the Ethernet header prepended
	 * above, so adding ETHER_HDR_LEN appears to count the header twice
	 * -- confirm.
	 */
    449  1.133  liamjfoy 	if (ifp != ifp0)
    450  1.282   thorpej 		if_statadd(ifp0, if_obytes, m->m_pkthdr.len + ETHER_HDR_LEN);
    451  1.256      maxv #endif
    452  1.133  liamjfoy 
    453   1.77   thorpej #ifdef ALTQ
    454  1.224  knakahar 	KERNEL_LOCK(1, NULL);
    455   1.77   thorpej 	/*
    456   1.77   thorpej 	 * If ALTQ is enabled on the parent interface, do
    457   1.77   thorpej 	 * classification; the queueing discipline might not
    458   1.77   thorpej 	 * require classification, but might require the
    459   1.77   thorpej 	 * address family/header pointer in the pktattr.
    460   1.77   thorpej 	 */
    461   1.77   thorpej 	if (ALTQ_IS_ENABLED(&ifp->if_snd))
    462  1.220  knakahar 		altq_etherclassify(&ifp->if_snd, m);
    463  1.224  knakahar 	KERNEL_UNLOCK_ONE(NULL);
    464   1.77   thorpej #endif
    465  1.221  knakahar 	return ifq_enqueue(ifp, m);
    466    1.1       cgd 
	/* Common error exit: count the error on ifp and release the packet. */
    467    1.1       cgd bad:
    468  1.288     ozaki 	if_statinc(ifp, if_oerrors);
    469    1.1       cgd 	if (m)
    470    1.1       cgd 		m_freem(m);
    471  1.261      maxv 	return error;
    472    1.1       cgd }
    473   1.76   thorpej 
    474   1.76   thorpej #ifdef ALTQ
    475   1.76   thorpej /*
    476   1.76   thorpej  * This routine is a slight hack to allow a packet to be classified
    477   1.76   thorpej  * if the Ethernet headers are present.  It will go away when ALTQ's
    478   1.76   thorpej  * classification engine understands link headers.
    479  1.261      maxv  *
    480  1.261      maxv  * XXX: We may need to do m_pullups here. First to ensure struct ether_header
    481  1.261      maxv  * is indeed contiguous, then to read the LLC and so on.
    482   1.76   thorpej  */
    483   1.76   thorpej void
    484  1.220  knakahar altq_etherclassify(struct ifaltq *ifq, struct mbuf *m)
    485   1.76   thorpej {
    486   1.76   thorpej 	struct ether_header *eh;
    487  1.255      maxv 	struct mbuf *mtop = m;
    488  1.162      matt 	uint16_t ether_type;
    489   1.76   thorpej 	int hlen, af, hdrsize;
    490  1.147  christos 	void *hdr;
    491   1.76   thorpej 
    492  1.255      maxv 	KASSERT((mtop->m_flags & M_PKTHDR) != 0);
    493  1.255      maxv 
    494   1.76   thorpej 	hlen = ETHER_HDR_LEN;
    495   1.76   thorpej 	eh = mtod(m, struct ether_header *);
    496   1.76   thorpej 
    497   1.76   thorpej 	ether_type = htons(eh->ether_type);
    498   1.76   thorpej 
    499   1.76   thorpej 	if (ether_type < ETHERMTU) {
    500   1.76   thorpej 		/* LLC/SNAP */
    501   1.76   thorpej 		struct llc *llc = (struct llc *)(eh + 1);
    502   1.76   thorpej 		hlen += 8;
    503   1.76   thorpej 
    504   1.76   thorpej 		if (m->m_len < hlen ||
    505   1.76   thorpej 		    llc->llc_dsap != LLC_SNAP_LSAP ||
    506   1.76   thorpej 		    llc->llc_ssap != LLC_SNAP_LSAP ||
    507   1.76   thorpej 		    llc->llc_control != LLC_UI) {
    508   1.76   thorpej 			/* Not SNAP. */
    509   1.76   thorpej 			goto bad;
    510   1.76   thorpej 		}
    511   1.76   thorpej 
    512   1.76   thorpej 		ether_type = htons(llc->llc_un.type_snap.ether_type);
    513   1.76   thorpej 	}
    514   1.76   thorpej 
    515   1.76   thorpej 	switch (ether_type) {
    516   1.76   thorpej 	case ETHERTYPE_IP:
    517   1.76   thorpej 		af = AF_INET;
    518   1.76   thorpej 		hdrsize = 20;		/* sizeof(struct ip) */
    519   1.76   thorpej 		break;
    520   1.76   thorpej 
    521   1.76   thorpej 	case ETHERTYPE_IPV6:
    522   1.76   thorpej 		af = AF_INET6;
    523   1.76   thorpej 		hdrsize = 40;		/* sizeof(struct ip6_hdr) */
    524   1.76   thorpej 		break;
    525   1.76   thorpej 
    526   1.76   thorpej 	default:
    527   1.76   thorpej 		af = AF_UNSPEC;
    528   1.76   thorpej 		hdrsize = 0;
    529   1.76   thorpej 		break;
    530   1.76   thorpej 	}
    531   1.76   thorpej 
    532   1.95    itojun 	while (m->m_len <= hlen) {
    533   1.95    itojun 		hlen -= m->m_len;
    534   1.95    itojun 		m = m->m_next;
    535  1.255      maxv 		if (m == NULL)
    536  1.255      maxv 			goto bad;
    537   1.95    itojun 	}
    538  1.255      maxv 
    539   1.76   thorpej 	if (m->m_len < (hlen + hdrsize)) {
    540   1.76   thorpej 		/*
    541   1.95    itojun 		 * protocol header not in a single mbuf.
    542   1.95    itojun 		 * We can't cope with this situation right
    543   1.76   thorpej 		 * now (but it shouldn't ever happen, really, anyhow).
    544   1.76   thorpej 		 */
    545   1.92    itojun #ifdef DEBUG
    546   1.78   thorpej 		printf("altq_etherclassify: headers span multiple mbufs: "
    547   1.78   thorpej 		    "%d < %d\n", m->m_len, (hlen + hdrsize));
    548   1.92    itojun #endif
    549   1.76   thorpej 		goto bad;
    550   1.76   thorpej 	}
    551   1.76   thorpej 
    552   1.76   thorpej 	m->m_data += hlen;
    553   1.76   thorpej 	m->m_len -= hlen;
    554   1.76   thorpej 
    555  1.147  christos 	hdr = mtod(m, void *);
    556   1.76   thorpej 
    557  1.255      maxv 	if (ALTQ_NEEDS_CLASSIFY(ifq)) {
    558  1.255      maxv 		mtop->m_pkthdr.pattr_class =
    559   1.76   thorpej 		    (*ifq->altq_classify)(ifq->altq_clfier, m, af);
    560  1.255      maxv 	}
    561  1.255      maxv 	mtop->m_pkthdr.pattr_af = af;
    562  1.255      maxv 	mtop->m_pkthdr.pattr_hdr = hdr;
    563   1.76   thorpej 
    564   1.76   thorpej 	m->m_data -= hlen;
    565   1.76   thorpej 	m->m_len += hlen;
    566   1.76   thorpej 
    567   1.76   thorpej 	return;
    568   1.76   thorpej 
    569  1.250      maxv bad:
    570  1.255      maxv 	mtop->m_pkthdr.pattr_class = NULL;
    571  1.255      maxv 	mtop->m_pkthdr.pattr_hdr = NULL;
    572  1.255      maxv 	mtop->m_pkthdr.pattr_af = AF_UNSPEC;
    573   1.76   thorpej }
    574   1.76   thorpej #endif /* ALTQ */
    575    1.1       cgd 
    576  1.286     ozaki #if defined (LLC) || defined (NETATALK)
    577  1.286     ozaki static void
    578  1.286     ozaki ether_input_llc(struct ifnet *ifp, struct mbuf *m, struct ether_header *eh)
    579  1.286     ozaki {
    580  1.286     ozaki 	struct ifqueue *inq = NULL;
    581  1.286     ozaki 	int isr = 0;
    582  1.286     ozaki 	struct llc *l;
    583  1.286     ozaki 
    584  1.286     ozaki 	if (m->m_len < sizeof(*eh) + sizeof(struct llc))
    585  1.286     ozaki 		goto drop;
    586  1.286     ozaki 
    587  1.286     ozaki 	l = (struct llc *)(eh+1);
    588  1.286     ozaki 	switch (l->llc_dsap) {
    589  1.286     ozaki #ifdef NETATALK
    590  1.286     ozaki 	case LLC_SNAP_LSAP:
    591  1.286     ozaki 		switch (l->llc_control) {
    592  1.286     ozaki 		case LLC_UI:
    593  1.286     ozaki 			if (l->llc_ssap != LLC_SNAP_LSAP)
    594  1.286     ozaki 				goto drop;
    595  1.286     ozaki 
    596  1.286     ozaki 			if (memcmp(&(l->llc_snap_org_code)[0],
    597  1.286     ozaki 			    at_org_code, sizeof(at_org_code)) == 0 &&
    598  1.286     ozaki 			    ntohs(l->llc_snap_ether_type) ==
    599  1.286     ozaki 			    ETHERTYPE_ATALK) {
    600  1.286     ozaki 				inq = &atintrq2;
    601  1.286     ozaki 				m_adj(m, sizeof(struct ether_header)
    602  1.286     ozaki 				    + sizeof(struct llc));
    603  1.286     ozaki 				isr = NETISR_ATALK;
    604  1.286     ozaki 				break;
    605  1.286     ozaki 			}
    606  1.286     ozaki 
    607  1.286     ozaki 			if (memcmp(&(l->llc_snap_org_code)[0],
    608  1.286     ozaki 			    aarp_org_code,
    609  1.286     ozaki 			    sizeof(aarp_org_code)) == 0 &&
    610  1.286     ozaki 			    ntohs(l->llc_snap_ether_type) ==
    611  1.286     ozaki 			    ETHERTYPE_AARP) {
    612  1.286     ozaki 				m_adj(m, sizeof(struct ether_header)
    613  1.286     ozaki 				    + sizeof(struct llc));
    614  1.286     ozaki 				aarpinput(ifp, m); /* XXX queue? */
    615  1.286     ozaki 				return;
    616  1.286     ozaki 			}
    617  1.286     ozaki 
    618  1.286     ozaki 		default:
    619  1.286     ozaki 			goto drop;
    620  1.286     ozaki 		}
    621  1.286     ozaki 		break;
    622  1.286     ozaki #endif
    623  1.286     ozaki 	default:
    624  1.286     ozaki 		goto drop;
    625  1.286     ozaki 	}
    626  1.286     ozaki 
    627  1.286     ozaki 	KASSERT(inq != NULL);
    628  1.286     ozaki 	IFQ_ENQUEUE_ISR(inq, m, isr);
    629  1.286     ozaki 	return;
    630  1.286     ozaki 
    631  1.286     ozaki drop:
    632  1.286     ozaki 	m_freem(m);
    633  1.287     ozaki 	if_statinc(ifp, if_ierrors); /* XXX should have a dedicated counter? */
    634  1.286     ozaki 	return;
    635  1.286     ozaki }
    636  1.286     ozaki #endif /* defined (LLC) || defined (NETATALK) */
    637  1.286     ozaki 
    638    1.1       cgd /*
    639    1.1       cgd  * Process a received Ethernet packet;
    640   1.42   thorpej  * the packet is in the mbuf chain m with
    641   1.42   thorpej  * the ether header.
 *
 * Rough order of processing, as implemented below:
 *  - drop the packet if IFF_UP is clear, then make sure the Ethernet
 *    header is contiguous in the first mbuf;
 *  - mix the header of early packets into the entropy pool;
 *  - drop oversize frames (MPLS frames are exempt from the check);
 *  - flag broadcast/multicast frames, trim the FCS, account if_ibytes;
 *  - offer the packet to carp, the pfil hooks, agr, lagg and vlan
 *    when they apply to this interface;
 *  - dispatch on the EtherType: values that are really a length go to
 *    ether_input_llc() (when built in), the rest are enqueued on a
 *    pktqueue or an ifqueue.
 *
 * Every "goto drop" frees m and increments if_ierrors; "goto dropped"
 * only increments the counter.
    642    1.1       cgd  */
    643  1.133  liamjfoy void
    644   1.58      matt ether_input(struct ifnet *ifp, struct mbuf *m)
    645    1.1       cgd {
    646   1.91   thorpej 	struct ethercom *ec = (struct ethercom *) ifp;
    647  1.199     rmind 	pktqueue_t *pktq = NULL;
    648  1.199     rmind 	struct ifqueue *inq = NULL;
    649  1.162      matt 	uint16_t etype;
    650   1.42   thorpej 	struct ether_header *eh;
    651  1.187      matt 	size_t ehlen;
    652  1.204       tls 	static int earlypkts;
    653  1.198   msaitoh 	int isr = 0;
    654  1.294  yamaguch #if NAGR > 0
    655  1.294  yamaguch 	void *agrprivate;
    656  1.294  yamaguch #endif
    657    1.1       cgd 
    658  1.216     ozaki 	KASSERT(!cpu_intr_p());
    659  1.253      maxv 	KASSERT((m->m_flags & M_PKTHDR) != 0);
    660  1.216     ozaki 
    661  1.287     ozaki 	if ((ifp->if_flags & IFF_UP) == 0)
    662  1.287     ozaki 		goto drop;
    663  1.290       roy 
    664  1.291       roy #ifdef MBUFTRACE
    665  1.291       roy 	m_claimm(m, &ec->ec_rx_mowner);
    666  1.291       roy #endif
    667  1.291       roy 
    668  1.292       roy 	if (__predict_false(m->m_len < sizeof(*eh))) {
		/* m is NULL on failure, hence "dropped" rather than "drop". */
    669  1.290       roy 		if ((m = m_pullup(m, sizeof(*eh))) == NULL)
    670  1.287     ozaki 			goto dropped;
    671  1.267      maxv 	}
    672   1.42   thorpej 
    673   1.42   thorpej 	eh = mtod(m, struct ether_header *);
    674   1.63   thorpej 	etype = ntohs(eh->ether_type);
    675  1.187      matt 	ehlen = sizeof(*eh);
    676   1.63   thorpej 
	/*
	 * Feed the header to rnd_add_data() for the first 100 packets,
	 * and for as long as entropy_epoch() still returns (unsigned)-1.
	 * earlypkts is static, so the count is shared by every caller.
	 */
    677  1.284  riastrad 	if (__predict_false(earlypkts < 100 ||
    678  1.284  riastrad 		entropy_epoch() == (unsigned)-1)) {
    679  1.204       tls 		rnd_add_data(NULL, eh, ehlen, 0);
    680  1.204       tls 		earlypkts++;
    681  1.204       tls 	}
    682  1.204       tls 
    683   1.63   thorpej 	/*
    684  1.258      maxv 	 * Determine if the packet is within its size limits. For MPLS the
    685  1.258      maxv 	 * header length is variable, so we skip the check.
    686   1.63   thorpej 	 */
    687  1.182    kefren 	if (etype != ETHERTYPE_MPLS && m->m_pkthdr.len >
    688   1.83   thorpej 	    ETHER_MAX_FRAME(ifp, etype, m->m_flags & M_HASFCS)) {
    689  1.278   msaitoh #ifdef DIAGNOSTIC
    690  1.203     ozaki 		mutex_enter(&bigpktpps_lock);
    691  1.123      matt 		if (ppsratecheck(&bigpktppslim_last, &bigpktpps_count,
    692  1.261      maxv 		    bigpktppslim)) {
    693  1.123      matt 			printf("%s: discarding oversize frame (len=%d)\n",
    694  1.123      matt 			    ifp->if_xname, m->m_pkthdr.len);
    695  1.123      matt 		}
    696  1.203     ozaki 		mutex_exit(&bigpktpps_lock);
    697  1.278   msaitoh #endif
    698  1.287     ozaki 		goto drop;
    699   1.63   thorpej 	}
    700   1.77   thorpej 
    701   1.84   thorpej 	if (ETHER_IS_MULTICAST(eh->ether_dhost)) {
    702   1.84   thorpej 		/*
    703   1.84   thorpej 		 * If this is not a simplex interface, drop the packet
    704   1.84   thorpej 		 * if it came from us.
    705   1.84   thorpej 		 */
    706   1.84   thorpej 		if ((ifp->if_flags & IFF_SIMPLEX) == 0 &&
    707  1.153    dyoung 		    memcmp(CLLADDR(ifp->if_sadl), eh->ether_shost,
    708   1.84   thorpej 		    ETHER_ADDR_LEN) == 0) {
    709  1.287     ozaki 			goto drop;
    710   1.84   thorpej 		}
    711   1.84   thorpej 
    712   1.84   thorpej 		if (memcmp(etherbroadcastaddr,
    713   1.84   thorpej 		    eh->ether_dhost, ETHER_ADDR_LEN) == 0)
    714   1.84   thorpej 			m->m_flags |= M_BCAST;
    715   1.84   thorpej 		else
    716   1.84   thorpej 			m->m_flags |= M_MCAST;
    717  1.282   thorpej 		if_statinc(ifp, if_imcasts);
    718   1.84   thorpej 	}
    719   1.84   thorpej 
    720   1.79   thorpej 	/* If the CRC is still on the packet, trim it off. */
    721   1.79   thorpej 	if (m->m_flags & M_HASFCS) {
    722   1.79   thorpej 		m_adj(m, -ETHER_CRC_LEN);
    723   1.79   thorpej 		m->m_flags &= ~M_HASFCS;
    724   1.79   thorpej 	}
    725   1.79   thorpej 
    726  1.282   thorpej 	if_statadd(ifp, if_ibytes, m->m_pkthdr.len);
    727   1.78   thorpej 
    728  1.201     ozaki #if NCARP > 0
    729  1.201     ozaki 	if (__predict_false(ifp->if_carp && ifp->if_type != IFT_CARP)) {
    730  1.201     ozaki 		/*
    731  1.261      maxv 		 * Clear M_PROMISC, in case the packet comes from a
    732  1.261      maxv 		 * vlan.
    733  1.201     ozaki 		 */
    734  1.137    rpaulo 		m->m_flags &= ~M_PROMISC;
    735  1.201     ozaki 		if (carp_input(m, (uint8_t *)&eh->ether_shost,
    736  1.201     ozaki 		    (uint8_t *)&eh->ether_dhost, eh->ether_type) == 0)
    737  1.137    rpaulo 			return;
    738  1.201     ozaki 	}
    739  1.253      maxv #endif
    740  1.250      maxv 
	/*
	 * On a promiscuous interface, mark unicast frames that are not
	 * addressed to our link-layer address with M_PROMISC.
	 */
    741  1.247   msaitoh 	if ((m->m_flags & (M_BCAST | M_MCAST | M_PROMISC)) == 0 &&
    742  1.201     ozaki 	    (ifp->if_flags & IFF_PROMISC) != 0 &&
    743  1.201     ozaki 	    memcmp(CLLADDR(ifp->if_sadl), eh->ether_dhost,
    744  1.261      maxv 	     ETHER_ADDR_LEN) != 0) {
    745  1.201     ozaki 		m->m_flags |= M_PROMISC;
    746   1.70    bouyer 	}
    747   1.78   thorpej 
    748  1.106    bouyer 	if ((m->m_flags & M_PROMISC) == 0) {
    749  1.195     rmind 		if (pfil_run_hooks(ifp->if_pfil, &m, ifp, PFIL_IN) != 0)
    750  1.106    bouyer 			return;
    751  1.106    bouyer 		if (m == NULL)
    752  1.106    bouyer 			return;
    753   1.78   thorpej 
		/*
		 * The hooks were handed &m and may have changed it, so
		 * reload the header pointer and the EtherType.
		 */
    754  1.106    bouyer 		eh = mtod(m, struct ether_header *);
    755  1.106    bouyer 		etype = ntohs(eh->ether_type);
    756  1.106    bouyer 	}
    757   1.70    bouyer 
    758  1.172    darran #if NAGR > 0
    759  1.294  yamaguch 	if (ifp->if_type != IFT_IEEE8023ADLAG) {
    760  1.294  yamaguch 		agrprivate = ifp->if_lagg;
    761  1.294  yamaguch 	} else {
    762  1.294  yamaguch 		agrprivate = NULL;
    763  1.294  yamaguch 	}
    764  1.294  yamaguch 	if (agrprivate != NULL &&
    765  1.172    darran 	    __predict_true(etype != ETHERTYPE_SLOWPROTOCOLS)) {
    766  1.172    darran 		m->m_flags &= ~M_PROMISC;
    767  1.172    darran 		agr_input(ifp, m);
    768  1.172    darran 		return;
    769  1.172    darran 	}
    770  1.253      maxv #endif
    771  1.172    darran 
    772  1.293  yamaguch 	/* Handle input from a lagg(4) port */
    773  1.293  yamaguch 	if (ifp->if_type == IFT_IEEE8023ADLAG) {
    774  1.293  yamaguch 		KASSERT(lagg_input_ethernet_p != NULL);
    775  1.293  yamaguch 		m = (*lagg_input_ethernet_p)(ifp, m);
    776  1.293  yamaguch 		if (m == NULL)
    777  1.293  yamaguch 			return;
    778  1.293  yamaguch 	}
    779  1.293  yamaguch 
    780   1.91   thorpej 	/*
    781   1.91   thorpej 	 * If VLANs are configured on the interface, check to
    782   1.91   thorpej 	 * see if the device performed the decapsulation and
    783   1.91   thorpej 	 * provided us with the tag.
    784   1.91   thorpej 	 */
    785  1.244  knakahar 	if (ec->ec_nvlans && vlan_has_tag(m)) {
    786   1.70    bouyer #if NVLAN > 0
    787   1.70    bouyer 		/*
    788   1.70    bouyer 		 * vlan_input() will either recursively call ether_input()
    789   1.70    bouyer 		 * or drop the packet.
    790   1.70    bouyer 		 */
    791   1.91   thorpej 		vlan_input(ifp, m);
    792  1.287     ozaki 		return;
    793   1.91   thorpej #else
    794  1.287     ozaki 		goto drop;
    795   1.70    bouyer #endif
    796   1.61   thorpej 	}
    797    1.1       cgd 
    798   1.59   thorpej 	/*
    799   1.59   thorpej 	 * Handle protocols that expect to have the Ethernet header
    800   1.59   thorpej 	 * (and possibly FCS) intact.
    801   1.59   thorpej 	 */
    802   1.59   thorpej 	switch (etype) {
    803  1.187      matt 	case ETHERTYPE_VLAN: {
    804  1.187      matt 		struct ether_vlan_header *evl = (void *)eh;
    805  1.253      maxv 
    806  1.187      matt 		/*
    807  1.187      matt 		 * If there is a tag of 0, then the VLAN header was probably
    808  1.187      matt 		 * just being used to store the priority.  Extract the ether
    809  1.250      maxv 		 * type, and if IP or IPV6, let them deal with it.
    810  1.187      matt 		 */
    811  1.254      maxv 		if (m->m_len >= sizeof(*evl) &&
    812  1.253      maxv 		    EVL_VLANOFTAG(evl->evl_tag) == 0) {
    813  1.187      matt 			etype = ntohs(evl->evl_proto);
    814  1.187      matt 			ehlen = sizeof(*evl);
    815  1.253      maxv 			if ((m->m_flags & M_PROMISC) == 0 &&
    816  1.253      maxv 			    (etype == ETHERTYPE_IP ||
    817  1.253      maxv 			     etype == ETHERTYPE_IPV6))
    818  1.187      matt 				break;
    819  1.187      matt 		}
    820  1.253      maxv 
    821   1.59   thorpej #if NVLAN > 0
    822   1.59   thorpej 		/*
    823   1.59   thorpej 		 * vlan_input() will either recursively call ether_input()
    824   1.59   thorpej 		 * or drop the packet.
    825   1.59   thorpej 		 */
    826  1.287     ozaki 		if (ec->ec_nvlans != 0) {
    827   1.63   thorpej 			vlan_input(ifp, m);
    828  1.287     ozaki 			return;
    829  1.287     ozaki 		} else
    830  1.253      maxv #endif
    831  1.287     ozaki 			goto drop;
    832  1.187      matt 	}
    833  1.253      maxv 
    834   1.81    martin #if NPPPOE > 0
    835   1.81    martin 	case ETHERTYPE_PPPOEDISC:
    836  1.218     ozaki 		pppoedisc_input(ifp, m);
    837  1.218     ozaki 		return;
    838  1.253      maxv 
    839   1.81    martin 	case ETHERTYPE_PPPOE:
    840  1.218     ozaki 		pppoe_input(ifp, m);
    841   1.81    martin 		return;
    842  1.253      maxv #endif
    843  1.253      maxv 
    844  1.121      yamt 	case ETHERTYPE_SLOWPROTOCOLS: {
    845  1.121      yamt 		uint8_t subtype;
    846  1.121      yamt 
    847  1.287     ozaki 		if (m->m_pkthdr.len < sizeof(*eh) + sizeof(subtype))
    848  1.287     ozaki 			goto drop;
    849  1.253      maxv 
		/* The subtype is the first byte after the Ethernet header. */
    850  1.121      yamt 		m_copydata(m, sizeof(*eh), sizeof(subtype), &subtype);
    851  1.121      yamt 		switch (subtype) {
    852  1.121      yamt #if NAGR > 0
    853  1.121      yamt 		case SLOWPROTOCOLS_SUBTYPE_LACP:
    854  1.294  yamaguch 			if (agrprivate != NULL) {
    855  1.121      yamt 				ieee8023ad_lacp_input(ifp, m);
    856  1.121      yamt 				return;
    857  1.121      yamt 			}
    858  1.121      yamt 			break;
    859  1.121      yamt 
    860  1.121      yamt 		case SLOWPROTOCOLS_SUBTYPE_MARKER:
    861  1.294  yamaguch 			if (agrprivate != NULL) {
    862  1.121      yamt 				ieee8023ad_marker_input(ifp, m);
    863  1.121      yamt 				return;
    864  1.121      yamt 			}
    865  1.121      yamt 			break;
    866  1.261      maxv #endif
    867  1.253      maxv 
    868  1.121      yamt 		default:
    869  1.121      yamt 			if (subtype == 0 || subtype > 10) {
    870  1.121      yamt 				/* illegal value */
    871  1.287     ozaki 				goto drop;
    872  1.121      yamt 			}
    873  1.121      yamt 			/* unknown subtype */
    874  1.121      yamt 			break;
    875  1.121      yamt 		}
    876  1.121      yamt 	}
    877  1.273       mrg 	/* FALLTHROUGH */
    878   1.59   thorpej 	default:
		/* Nothing above claimed the frame; drop it if it is not for us. */
    879  1.287     ozaki 		if (m->m_flags & M_PROMISC)
    880  1.287     ozaki 			goto drop;
    881   1.59   thorpej 	}
    882   1.42   thorpej 
	/*
	 * NOTE(review): M_HASFCS was already cleared by the identical trim
	 * earlier in this function, so this looks redundant unless a callee
	 * in between sets the flag again -- confirm before removing.
	 */
    883   1.45   thorpej 	/* If the CRC is still on the packet, trim it off. */
    884   1.79   thorpej 	if (m->m_flags & M_HASFCS) {
    885   1.45   thorpej 		m_adj(m, -ETHER_CRC_LEN);
    886   1.79   thorpej 		m->m_flags &= ~M_HASFCS;
    887   1.79   thorpej 	}
    888   1.42   thorpej 
    889  1.286     ozaki 	/* etype represents the size of the payload in this case */
    890  1.286     ozaki 	if (etype <= ETHERMTU + sizeof(struct ether_header)) {
    891  1.286     ozaki 		KASSERT(ehlen == sizeof(*eh));
    892  1.286     ozaki #if defined (LLC) || defined (NETATALK)
    893  1.286     ozaki 		ether_input_llc(ifp, m, eh);
    894  1.286     ozaki 		return;
    895  1.286     ozaki #else
    896  1.287     ozaki 		goto drop;
    897  1.286     ozaki #endif
    898  1.286     ozaki 	}
    899  1.139        is 
    900  1.286     ozaki 	/* Strip off the Ethernet header. */
    901  1.286     ozaki 	m_adj(m, ehlen);
    902  1.286     ozaki 
	/*
	 * Pick the destination: a case sets pktq, or sets inq together
	 * with isr, or hands the packet off directly and returns.
	 */
    903  1.286     ozaki 	switch (etype) {
    904    1.1       cgd #ifdef INET
    905  1.286     ozaki 	case ETHERTYPE_IP:
    906   1.30      matt #ifdef GATEWAY
    907  1.286     ozaki 		if (ipflow_fastforward(m))
    908  1.286     ozaki 			return;
    909   1.30      matt #endif
    910  1.286     ozaki 		pktq = ip_pktq;
    911  1.286     ozaki 		break;
    912    1.1       cgd 
    913  1.286     ozaki 	case ETHERTYPE_ARP:
    914  1.286     ozaki 		isr = NETISR_ARP;
    915  1.286     ozaki 		inq = &arpintrq;
    916  1.286     ozaki 		break;
    917    1.7     glass 
    918  1.286     ozaki 	case ETHERTYPE_REVARP:
    919  1.286     ozaki 		revarpinput(m);	/* XXX queue? */
    920  1.286     ozaki 		return;
    921    1.1       cgd #endif
    922  1.253      maxv 
    923   1.44    itojun #ifdef INET6
    924  1.286     ozaki 	case ETHERTYPE_IPV6:
    925  1.287     ozaki 		if (__predict_false(!in6_present))
    926  1.287     ozaki 			goto drop;
    927  1.250      maxv #ifdef GATEWAY
    928  1.286     ozaki 		if (ip6flow_fastforward(&m))
    929  1.286     ozaki 			return;
    930  1.148  liamjfoy #endif
    931  1.286     ozaki 		pktq = ip6_pktq;
    932  1.286     ozaki 		break;
    933   1.44    itojun #endif
    934  1.253      maxv 
    935   1.23  christos #ifdef NETATALK
    936  1.286     ozaki 	case ETHERTYPE_ATALK:
    937  1.286     ozaki 		isr = NETISR_ATALK;
    938  1.286     ozaki 		inq = &atintrq1;
    939  1.286     ozaki 		break;
    940  1.253      maxv 
    941  1.286     ozaki 	case ETHERTYPE_AARP:
    942  1.286     ozaki 		aarpinput(ifp, m); /* XXX queue? */
    943  1.286     ozaki 		return;
    944  1.253      maxv #endif
    945  1.253      maxv 
    946  1.182    kefren #ifdef MPLS
    947  1.286     ozaki 	case ETHERTYPE_MPLS:
    948  1.286     ozaki 		isr = NETISR_MPLS;
    949  1.286     ozaki 		inq = &mplsintrq;
    950  1.286     ozaki 		break;
    951  1.182    kefren #endif
    952  1.253      maxv 
    953  1.286     ozaki 	default:
    954  1.287     ozaki 		goto drop;
    955    1.1       cgd 	}
    956    1.1       cgd 
    957  1.199     rmind 	if (__predict_true(pktq)) {
    958  1.229     ozaki #ifdef NET_MPSAFE
    959  1.229     ozaki 		const u_int h = curcpu()->ci_index;
    960  1.229     ozaki #else
    961  1.199     rmind 		const uint32_t h = pktq_rps_hash(m);
    962  1.229     ozaki #endif
		/* A failed enqueue frees the packet without touching if_ierrors. */
    963  1.199     rmind 		if (__predict_false(!pktq_enqueue(pktq, m, h))) {
    964  1.199     rmind 			m_freem(m);
    965  1.199     rmind 		}
    966  1.199     rmind 		return;
    967  1.199     rmind 	}
    968  1.199     rmind 
    969  1.199     rmind 	if (__predict_false(!inq)) {
    970  1.199     rmind 		/* Should not happen. */
    971  1.287     ozaki 		goto drop;
    972  1.199     rmind 	}
    973  1.228     ozaki 
    974  1.285     ozaki 	IFQ_ENQUEUE_ISR(inq, m, isr);
    975  1.287     ozaki 	return;
    976  1.287     ozaki 
    977  1.287     ozaki drop:
    978  1.287     ozaki 	m_freem(m);
	/* Entered directly when there is no mbuf left to free (m_pullup failed). */
    979  1.287     ozaki dropped:
    980  1.287     ozaki 	if_statinc(ifp, if_ierrors); /* XXX should have a dedicated counter? */
    981    1.1       cgd }
    982    1.1       cgd 
    983    1.1       cgd /*
    984    1.1       cgd  * Convert Ethernet address to printable (loggable) representation.
    985    1.1       cgd  */
    986    1.1       cgd char *
    987   1.58      matt ether_sprintf(const u_char *ap)
    988    1.1       cgd {
    989  1.129  christos 	static char etherbuf[3 * ETHER_ADDR_LEN];
    990  1.129  christos 	return ether_snprintf(etherbuf, sizeof(etherbuf), ap);
    991  1.129  christos }
    992  1.129  christos 
    993  1.129  christos char *
    994  1.129  christos ether_snprintf(char *buf, size_t len, const u_char *ap)
    995  1.129  christos {
    996  1.129  christos 	char *cp = buf;
    997  1.129  christos 	size_t i;
    998    1.1       cgd 
    999  1.129  christos 	for (i = 0; i < len / 3; i++) {
   1000  1.124  christos 		*cp++ = hexdigits[*ap >> 4];
   1001  1.124  christos 		*cp++ = hexdigits[*ap++ & 0xf];
   1002    1.1       cgd 		*cp++ = ':';
   1003    1.1       cgd 	}
   1004  1.129  christos 	*--cp = '\0';
   1005  1.129  christos 	return buf;
   1006    1.1       cgd }
   1007    1.8   mycroft 
/*
 * Link state change callback installed by ether_ifattach().
 *
 * When vlan(4) support is compiled in and the interface has VLANs
 * configured (ec_nvlans is non-zero), pass the new state on to
 * vlan_link_state_changed().  Otherwise do nothing.
 */
static void
ether_link_state_changed(struct ifnet *ifp, int link_state)
{
#if NVLAN > 0
	struct ethercom *ec = (struct ethercom *)ifp;

	if (ec->ec_nvlans == 0)
		return;

	vlan_link_state_changed(ifp, link_state);
#endif
}
   1018  1.289       roy 
   1019    1.8   mycroft /*
   1020    1.8   mycroft  * Perform common duties while attaching to interface list
   1021    1.8   mycroft  */
   1022    1.8   mycroft void
   1023  1.162      matt ether_ifattach(struct ifnet *ifp, const uint8_t *lla)
   1024    1.8   mycroft {
   1025  1.104      matt 	struct ethercom *ec = (struct ethercom *)ifp;
   1026    1.8   mycroft 
   1027    1.8   mycroft 	ifp->if_type = IFT_ETHER;
   1028   1.94     enami 	ifp->if_hdrlen = ETHER_HDR_LEN;
   1029   1.73   thorpej 	ifp->if_dlt = DLT_EN10MB;
   1030    1.8   mycroft 	ifp->if_mtu = ETHERMTU;
   1031   1.12   mycroft 	ifp->if_output = ether_output;
   1032  1.216     ozaki 	ifp->_if_input = ether_input;
   1033  1.289       roy 	ifp->if_link_state_changed = ether_link_state_changed;
   1034   1.54   thorpej 	if (ifp->if_baudrate == 0)
   1035   1.54   thorpej 		ifp->if_baudrate = IF_Mbps(10);		/* just a default */
   1036   1.75   thorpej 
   1037  1.230     ozaki 	if (lla != NULL)
   1038  1.230     ozaki 		if_set_sadl(ifp, lla, ETHER_ADDR_LEN, !ETHER_IS_LOCAL(lla));
   1039   1.75   thorpej 
   1040  1.104      matt 	LIST_INIT(&ec->ec_multiaddrs);
   1041  1.276   msaitoh 	SIMPLEQ_INIT(&ec->ec_vids);
   1042  1.233     ozaki 	ec->ec_lock = mutex_obj_alloc(MUTEX_DEFAULT, IPL_NET);
   1043  1.274     ozaki 	ec->ec_flags = 0;
   1044   1.26        is 	ifp->if_broadcastaddr = etherbroadcastaddr;
   1045  1.177     joerg 	bpf_attach(ifp, DLT_EN10MB, sizeof(struct ether_header));
   1046  1.104      matt #ifdef MBUFTRACE
   1047  1.283   thorpej 	mowner_init_owner(&ec->ec_tx_mowner, ifp->if_xname, "tx");
   1048  1.283   thorpej 	mowner_init_owner(&ec->ec_rx_mowner, ifp->if_xname, "rx");
   1049  1.104      matt 	MOWNER_ATTACH(&ec->ec_tx_mowner);
   1050  1.104      matt 	MOWNER_ATTACH(&ec->ec_rx_mowner);
   1051  1.104      matt 	ifp->if_mowner = &ec->ec_tx_mowner;
   1052  1.104      matt #endif
   1053   1.52   thorpej }
   1054   1.52   thorpej 
   1055   1.52   thorpej void
   1056   1.58      matt ether_ifdetach(struct ifnet *ifp)
   1057   1.52   thorpej {
   1058   1.63   thorpej 	struct ethercom *ec = (void *) ifp;
   1059   1.63   thorpej 	struct ether_multi *enm;
   1060   1.69   thorpej 
   1061  1.269     ozaki 	IFNET_ASSERT_UNLOCKED(ifp);
   1062  1.190  christos 	/*
   1063  1.190  christos 	 * Prevent further calls to ioctl (for example turning off
   1064  1.190  christos 	 * promiscuous mode from the bridge code), which eventually can
   1065  1.190  christos 	 * call if_init() which can cause panics because the interface
   1066  1.190  christos 	 * is in the process of being detached. Return device not configured
   1067  1.190  christos 	 * instead.
   1068  1.190  christos 	 */
   1069  1.280  christos 	ifp->if_ioctl = __FPTRCAST(int (*)(struct ifnet *, u_long, void *),
   1070  1.280  christos 	    enxio);
   1071  1.190  christos 
   1072  1.115    dyoung #if NBRIDGE > 0
   1073  1.115    dyoung 	if (ifp->if_bridge)
   1074  1.115    dyoung 		bridge_ifdetach(ifp);
   1075  1.115    dyoung #endif
   1076  1.177     joerg 	bpf_detach(ifp);
   1077   1.64   thorpej #if NVLAN > 0
   1078   1.64   thorpej 	if (ec->ec_nvlans)
   1079   1.64   thorpej 		vlan_ifdetach(ifp);
   1080   1.64   thorpej #endif
   1081   1.63   thorpej 
   1082  1.293  yamaguch #if NLAGG > 0
   1083  1.293  yamaguch 	if (ifp->if_lagg)
   1084  1.293  yamaguch 		lagg_ifdetach(ifp);
   1085  1.293  yamaguch #endif
   1086  1.293  yamaguch 
   1087  1.245   msaitoh 	ETHER_LOCK(ec);
   1088  1.276   msaitoh 	KASSERT(ec->ec_nvlans == 0);
   1089   1.63   thorpej 	while ((enm = LIST_FIRST(&ec->ec_multiaddrs)) != NULL) {
   1090   1.63   thorpej 		LIST_REMOVE(enm, enm_list);
   1091  1.248     ozaki 		kmem_free(enm, sizeof(*enm));
   1092   1.63   thorpej 		ec->ec_multicnt--;
   1093   1.63   thorpej 	}
   1094  1.245   msaitoh 	ETHER_UNLOCK(ec);
   1095   1.52   thorpej 
   1096  1.252      maxv 	mutex_obj_free(ec->ec_lock);
   1097  1.253      maxv 	ec->ec_lock = NULL;
   1098  1.231     ozaki 
   1099  1.189       chs 	ifp->if_mowner = NULL;
   1100  1.104      matt 	MOWNER_DETACH(&ec->ec_rx_mowner);
   1101  1.104      matt 	MOWNER_DETACH(&ec->ec_tx_mowner);
   1102   1.53   thorpej }
   1103   1.53   thorpej 
#if 0
/*
 * Reference implementation, kept for documentation only: the bit-at-a-time
 * form of the little-endian CRC32 generator.  The table-driven version
 * below is what actually gets built; it avoids the inner per-bit loop.
 */
uint32_t
ether_crc32_le(const uint8_t *buf, size_t len)
{
	uint32_t crc = 0xffffffffU;	/* initial value */
	size_t pos;

	for (pos = 0; pos < len; pos++) {
		uint32_t octet = buf[pos];
		int bit;

		for (bit = 0; bit < 8; bit++) {
			const uint32_t feedback = (crc ^ octet) & 0x01;

			crc >>= 1;
			octet >>= 1;
			if (feedback != 0)
				crc ^= ETHER_CRC_POLY_LE;
		}
	}

	return crc;
}
#else
/*
 * Little-endian (reflected) CRC32 over len bytes at buf.
 *
 * The register starts at 0xffffffff and the result is returned as is,
 * without a final inversion.  Each input byte is folded in with two
 * lookups in a 16-entry table, one per 4-bit half.
 */
uint32_t
ether_crc32_le(const uint8_t *buf, size_t len)
{
	static const uint32_t nibbletab[] = {
		0x00000000, 0x1db71064, 0x3b6e20c8, 0x26d930ac,
		0x76dc4190, 0x6b6b51f4, 0x4db26158, 0x5005713c,
		0xedb88320, 0xf00f9344, 0xd6d6a3e8, 0xcb61b38c,
		0x9b64c2b0, 0x86d3d2d4, 0xa00ae278, 0xbdbdf21c
	};
	uint32_t crc = 0xffffffffU;	/* initial value */
	const uint8_t *p = buf;
	size_t left;
	int half;

	for (left = len; left > 0; left--) {
		crc ^= *p++;
		/* Low nibble first, then the high nibble. */
		for (half = 0; half < 2; half++)
			crc = nibbletab[crc & 0xf] ^ (crc >> 4);
	}

	return crc;
}
#endif
   1155   1.53   thorpej 
   1156  1.162      matt uint32_t
   1157  1.162      matt ether_crc32_be(const uint8_t *buf, size_t len)
   1158   1.53   thorpej {
   1159  1.162      matt 	uint32_t c, crc, carry;
   1160   1.53   thorpej 	size_t i, j;
   1161   1.53   thorpej 
   1162   1.53   thorpej 	crc = 0xffffffffU;	/* initial value */
   1163   1.53   thorpej 
   1164   1.53   thorpej 	for (i = 0; i < len; i++) {
   1165   1.53   thorpej 		c = buf[i];
   1166   1.53   thorpej 		for (j = 0; j < 8; j++) {
   1167   1.53   thorpej 			carry = ((crc & 0x80000000U) ? 1 : 0) ^ (c & 0x01);
   1168   1.53   thorpej 			crc <<= 1;
   1169   1.53   thorpej 			c >>= 1;
   1170   1.53   thorpej 			if (carry)
   1171   1.53   thorpej 				crc = (crc ^ ETHER_CRC_POLY_BE) | carry;
   1172   1.53   thorpej 		}
   1173   1.53   thorpej 	}
   1174   1.53   thorpej 
   1175   1.53   thorpej 	return (crc);
   1176    1.8   mycroft }
   1177    1.8   mycroft 
#ifdef INET
/* First and last Ethernet address of the range used for IP multicast. */
const uint8_t ether_ipmulticast_min[ETHER_ADDR_LEN] = {
	0x01, 0x00, 0x5e, 0x00, 0x00, 0x00
};
const uint8_t ether_ipmulticast_max[ETHER_ADDR_LEN] = {
	0x01, 0x00, 0x5e, 0x7f, 0xff, 0xff
};
#endif
#ifdef INET6
/* First and last Ethernet address of the range used for IP6 multicast. */
const uint8_t ether_ip6multicast_min[ETHER_ADDR_LEN] = {
	0x33, 0x33, 0x00, 0x00, 0x00, 0x00
};
const uint8_t ether_ip6multicast_max[ETHER_ADDR_LEN] = {
	0x33, 0x33, 0xff, 0xff, 0xff, 0xff
};
#endif
   1190   1.60     enami 
   1191    1.3   hpeyerl /*
   1192  1.138    rpaulo  * ether_aton implementation, not using a static buffer.
   1193  1.138    rpaulo  */
   1194  1.138    rpaulo int
   1195  1.180  christos ether_aton_r(u_char *dest, size_t len, const char *str)
   1196  1.138    rpaulo {
   1197  1.250      maxv 	const u_char *cp = (const void *)str;
   1198  1.180  christos 	u_char *ep;
   1199  1.180  christos 
   1200  1.185   tsutsui #define atox(c)	(((c) <= '9') ? ((c) - '0') : ((toupper(c) - 'A') + 10))
   1201  1.180  christos 
   1202  1.180  christos 	if (len < ETHER_ADDR_LEN)
   1203  1.180  christos 		return ENOSPC;
   1204  1.180  christos 
   1205  1.180  christos 	ep = dest + ETHER_ADDR_LEN;
   1206  1.250      maxv 
   1207  1.180  christos 	while (*cp) {
   1208  1.250      maxv 		if (!isxdigit(*cp))
   1209  1.250      maxv 			return EINVAL;
   1210  1.252      maxv 
   1211  1.180  christos 		*dest = atox(*cp);
   1212  1.180  christos 		cp++;
   1213  1.250      maxv 		if (isxdigit(*cp)) {
   1214  1.250      maxv 			*dest = (*dest << 4) | atox(*cp);
   1215  1.180  christos 			cp++;
   1216  1.250      maxv 		}
   1217  1.252      maxv 		dest++;
   1218  1.252      maxv 
   1219  1.180  christos 		if (dest == ep)
   1220  1.252      maxv 			return (*cp == '\0') ? 0 : ENAMETOOLONG;
   1221  1.252      maxv 
   1222  1.180  christos 		switch (*cp) {
   1223  1.180  christos 		case ':':
   1224  1.180  christos 		case '-':
   1225  1.180  christos 		case '.':
   1226  1.179  jakllsch 			cp++;
   1227  1.180  christos 			break;
   1228  1.179  jakllsch 		}
   1229  1.250      maxv 	}
   1230  1.180  christos 	return ENOBUFS;
   1231  1.138    rpaulo }
   1232  1.138    rpaulo 
   1233  1.138    rpaulo /*
   1234   1.60     enami  * Convert a sockaddr into an Ethernet address or range of Ethernet
   1235   1.60     enami  * addresses.
   1236    1.3   hpeyerl  */
   1237    1.3   hpeyerl int
   1238  1.162      matt ether_multiaddr(const struct sockaddr *sa, uint8_t addrlo[ETHER_ADDR_LEN],
   1239  1.162      matt     uint8_t addrhi[ETHER_ADDR_LEN])
   1240    1.3   hpeyerl {
   1241   1.24  christos #ifdef INET
   1242  1.155    dyoung 	const struct sockaddr_in *sin;
   1243  1.261      maxv #endif
   1244   1.44    itojun #ifdef INET6
   1245  1.155    dyoung 	const struct sockaddr_in6 *sin6;
   1246  1.261      maxv #endif
   1247    1.3   hpeyerl 
   1248   1.60     enami 	switch (sa->sa_family) {
   1249    1.3   hpeyerl 
   1250    1.3   hpeyerl 	case AF_UNSPEC:
   1251  1.146    dyoung 		memcpy(addrlo, sa->sa_data, ETHER_ADDR_LEN);
   1252  1.146    dyoung 		memcpy(addrhi, addrlo, ETHER_ADDR_LEN);
   1253    1.3   hpeyerl 		break;
   1254    1.3   hpeyerl 
   1255    1.3   hpeyerl #ifdef INET
   1256    1.3   hpeyerl 	case AF_INET:
   1257  1.155    dyoung 		sin = satocsin(sa);
   1258    1.3   hpeyerl 		if (sin->sin_addr.s_addr == INADDR_ANY) {
   1259    1.3   hpeyerl 			/*
   1260   1.60     enami 			 * An IP address of INADDR_ANY means listen to
   1261   1.60     enami 			 * or stop listening to all of the Ethernet
   1262   1.60     enami 			 * multicast addresses used for IP.
   1263    1.3   hpeyerl 			 * (This is for the sake of IP multicast routers.)
   1264    1.3   hpeyerl 			 */
   1265  1.146    dyoung 			memcpy(addrlo, ether_ipmulticast_min, ETHER_ADDR_LEN);
   1266  1.146    dyoung 			memcpy(addrhi, ether_ipmulticast_max, ETHER_ADDR_LEN);
   1267  1.252      maxv 		} else {
   1268    1.3   hpeyerl 			ETHER_MAP_IP_MULTICAST(&sin->sin_addr, addrlo);
   1269  1.146    dyoung 			memcpy(addrhi, addrlo, ETHER_ADDR_LEN);
   1270    1.3   hpeyerl 		}
   1271    1.3   hpeyerl 		break;
   1272    1.3   hpeyerl #endif
   1273   1.44    itojun #ifdef INET6
   1274   1.44    itojun 	case AF_INET6:
   1275  1.155    dyoung 		sin6 = satocsin6(sa);
   1276   1.47    itojun 		if (IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) {
   1277   1.44    itojun 			/*
   1278   1.60     enami 			 * An IP6 address of 0 means listen to or stop
   1279   1.60     enami 			 * listening to all of the Ethernet multicast
   1280   1.60     enami 			 * address used for IP6.
   1281   1.44    itojun 			 * (This is used for multicast routers.)
   1282   1.44    itojun 			 */
   1283  1.146    dyoung 			memcpy(addrlo, ether_ip6multicast_min, ETHER_ADDR_LEN);
   1284  1.146    dyoung 			memcpy(addrhi, ether_ip6multicast_max, ETHER_ADDR_LEN);
   1285   1.44    itojun 		} else {
   1286   1.44    itojun 			ETHER_MAP_IPV6_MULTICAST(&sin6->sin6_addr, addrlo);
   1287  1.146    dyoung 			memcpy(addrhi, addrlo, ETHER_ADDR_LEN);
   1288   1.44    itojun 		}
   1289   1.44    itojun 		break;
   1290   1.44    itojun #endif
   1291    1.3   hpeyerl 
   1292    1.3   hpeyerl 	default:
   1293  1.146    dyoung 		return EAFNOSUPPORT;
   1294   1.60     enami 	}
   1295  1.146    dyoung 	return 0;
   1296   1.60     enami }
   1297   1.60     enami 
   1298   1.60     enami /*
   1299   1.60     enami  * Add an Ethernet multicast address or range of addresses to the list for a
   1300   1.60     enami  * given interface.
   1301   1.60     enami  */
   1302   1.60     enami int
   1303  1.155    dyoung ether_addmulti(const struct sockaddr *sa, struct ethercom *ec)
   1304   1.60     enami {
   1305  1.231     ozaki 	struct ether_multi *enm, *_enm;
   1306   1.60     enami 	u_char addrlo[ETHER_ADDR_LEN];
   1307   1.60     enami 	u_char addrhi[ETHER_ADDR_LEN];
   1308  1.237     skrll 	int error = 0;
   1309  1.231     ozaki 
   1310  1.231     ozaki 	/* Allocate out of lock */
   1311  1.248     ozaki 	enm = kmem_alloc(sizeof(*enm), KM_SLEEP);
   1312   1.60     enami 
   1313  1.245   msaitoh 	ETHER_LOCK(ec);
   1314  1.155    dyoung 	error = ether_multiaddr(sa, addrlo, addrhi);
   1315  1.231     ozaki 	if (error != 0)
   1316  1.231     ozaki 		goto out;
   1317    1.3   hpeyerl 
   1318    1.3   hpeyerl 	/*
   1319    1.3   hpeyerl 	 * Verify that we have valid Ethernet multicast addresses.
   1320    1.3   hpeyerl 	 */
   1321  1.186      yamt 	if (!ETHER_IS_MULTICAST(addrlo) || !ETHER_IS_MULTICAST(addrhi)) {
   1322  1.231     ozaki 		error = EINVAL;
   1323  1.231     ozaki 		goto out;
   1324    1.3   hpeyerl 	}
   1325  1.252      maxv 
   1326    1.3   hpeyerl 	/*
   1327    1.3   hpeyerl 	 * See if the address range is already in the list.
   1328    1.3   hpeyerl 	 */
   1329  1.270  yamaguch 	_enm = ether_lookup_multi(addrlo, addrhi, ec);
   1330  1.231     ozaki 	if (_enm != NULL) {
   1331    1.3   hpeyerl 		/*
   1332    1.3   hpeyerl 		 * Found it; just increment the reference count.
   1333    1.3   hpeyerl 		 */
   1334  1.231     ozaki 		++_enm->enm_refcount;
   1335  1.231     ozaki 		error = 0;
   1336  1.231     ozaki 		goto out;
   1337    1.3   hpeyerl 	}
   1338  1.252      maxv 
   1339    1.3   hpeyerl 	/*
   1340  1.239     ozaki 	 * Link a new multicast record into the interface's multicast list.
   1341    1.3   hpeyerl 	 */
   1342  1.252      maxv 	memcpy(enm->enm_addrlo, addrlo, ETHER_ADDR_LEN);
   1343  1.252      maxv 	memcpy(enm->enm_addrhi, addrhi, ETHER_ADDR_LEN);
   1344    1.3   hpeyerl 	enm->enm_refcount = 1;
   1345   1.22        is 	LIST_INSERT_HEAD(&ec->ec_multiaddrs, enm, enm_list);
   1346   1.22        is 	ec->ec_multicnt++;
   1347  1.252      maxv 
   1348    1.3   hpeyerl 	/*
   1349    1.3   hpeyerl 	 * Return ENETRESET to inform the driver that the list has changed
   1350    1.3   hpeyerl 	 * and its reception filter should be adjusted accordingly.
   1351    1.3   hpeyerl 	 */
   1352  1.231     ozaki 	error = ENETRESET;
   1353  1.231     ozaki 	enm = NULL;
   1354  1.252      maxv 
   1355  1.231     ozaki out:
   1356  1.245   msaitoh 	ETHER_UNLOCK(ec);
   1357  1.231     ozaki 	if (enm != NULL)
   1358  1.248     ozaki 		kmem_free(enm, sizeof(*enm));
   1359  1.231     ozaki 	return error;
   1360    1.3   hpeyerl }
   1361    1.3   hpeyerl 
   1362    1.3   hpeyerl /*
   1363    1.3   hpeyerl  * Delete a multicast address record.
   1364    1.3   hpeyerl  */
   1365    1.3   hpeyerl int
   1366  1.155    dyoung ether_delmulti(const struct sockaddr *sa, struct ethercom *ec)
   1367    1.3   hpeyerl {
   1368   1.29       mrg 	struct ether_multi *enm;
   1369   1.60     enami 	u_char addrlo[ETHER_ADDR_LEN];
   1370   1.60     enami 	u_char addrhi[ETHER_ADDR_LEN];
   1371  1.237     skrll 	int error;
   1372    1.3   hpeyerl 
   1373  1.245   msaitoh 	ETHER_LOCK(ec);
   1374  1.155    dyoung 	error = ether_multiaddr(sa, addrlo, addrhi);
   1375  1.231     ozaki 	if (error != 0)
   1376  1.231     ozaki 		goto error;
   1377    1.3   hpeyerl 
   1378    1.3   hpeyerl 	/*
   1379  1.252      maxv 	 * Look up the address in our list.
   1380    1.3   hpeyerl 	 */
   1381  1.270  yamaguch 	enm = ether_lookup_multi(addrlo, addrhi, ec);
   1382    1.3   hpeyerl 	if (enm == NULL) {
   1383  1.231     ozaki 		error = ENXIO;
   1384  1.231     ozaki 		goto error;
   1385    1.3   hpeyerl 	}
   1386    1.3   hpeyerl 	if (--enm->enm_refcount != 0) {
   1387    1.3   hpeyerl 		/*
   1388    1.3   hpeyerl 		 * Still some claims to this record.
   1389    1.3   hpeyerl 		 */
   1390  1.231     ozaki 		error = 0;
   1391  1.231     ozaki 		goto error;
   1392    1.3   hpeyerl 	}
   1393  1.252      maxv 
   1394    1.3   hpeyerl 	/*
   1395    1.3   hpeyerl 	 * No remaining claims to this record; unlink and free it.
   1396    1.3   hpeyerl 	 */
   1397   1.13   mycroft 	LIST_REMOVE(enm, enm_list);
   1398   1.22        is 	ec->ec_multicnt--;
   1399  1.245   msaitoh 	ETHER_UNLOCK(ec);
   1400  1.252      maxv 	kmem_free(enm, sizeof(*enm));
   1401  1.231     ozaki 
   1402    1.3   hpeyerl 	/*
   1403    1.3   hpeyerl 	 * Return ENETRESET to inform the driver that the list has changed
   1404    1.3   hpeyerl 	 * and its reception filter should be adjusted accordingly.
   1405    1.3   hpeyerl 	 */
   1406  1.231     ozaki 	return ENETRESET;
   1407  1.252      maxv 
   1408  1.231     ozaki error:
   1409  1.245   msaitoh 	ETHER_UNLOCK(ec);
   1410  1.231     ozaki 	return error;
   1411   1.66   thorpej }
   1412   1.66   thorpej 
   1413  1.170    dyoung void
   1414  1.170    dyoung ether_set_ifflags_cb(struct ethercom *ec, ether_cb_t cb)
   1415  1.170    dyoung {
   1416  1.170    dyoung 	ec->ec_ifflags_cb = cb;
   1417  1.170    dyoung }
   1418  1.170    dyoung 
   1419  1.276   msaitoh void
   1420  1.276   msaitoh ether_set_vlan_cb(struct ethercom *ec, ether_vlancb_t cb)
   1421  1.276   msaitoh {
   1422  1.276   msaitoh 
   1423  1.276   msaitoh 	ec->ec_vlan_cb = cb;
   1424  1.276   msaitoh }
   1425  1.276   msaitoh 
   1426  1.272   msaitoh static int
   1427  1.272   msaitoh ether_ioctl_reinit(struct ethercom *ec)
   1428  1.272   msaitoh {
   1429  1.272   msaitoh 	struct ifnet *ifp = &ec->ec_if;
   1430  1.272   msaitoh 	int error;
   1431  1.272   msaitoh 
   1432  1.272   msaitoh 	switch (ifp->if_flags & (IFF_UP | IFF_RUNNING)) {
   1433  1.272   msaitoh 	case IFF_RUNNING:
   1434  1.272   msaitoh 		/*
   1435  1.272   msaitoh 		 * If interface is marked down and it is running,
   1436  1.272   msaitoh 		 * then stop and disable it.
   1437  1.272   msaitoh 		 */
   1438  1.272   msaitoh 		(*ifp->if_stop)(ifp, 1);
   1439  1.272   msaitoh 		break;
   1440  1.272   msaitoh 	case IFF_UP:
   1441  1.272   msaitoh 		/*
   1442  1.272   msaitoh 		 * If interface is marked up and it is stopped, then
   1443  1.272   msaitoh 		 * start it.
   1444  1.272   msaitoh 		 */
   1445  1.272   msaitoh 		return (*ifp->if_init)(ifp);
   1446  1.272   msaitoh 	case IFF_UP | IFF_RUNNING:
   1447  1.272   msaitoh 		error = 0;
   1448  1.272   msaitoh 		if (ec->ec_ifflags_cb != NULL) {
   1449  1.272   msaitoh 			error = (*ec->ec_ifflags_cb)(ec);
   1450  1.272   msaitoh 			if (error == ENETRESET) {
   1451  1.272   msaitoh 				/*
   1452  1.272   msaitoh 				 * Reset the interface to pick up
   1453  1.272   msaitoh 				 * changes in any other flags that
   1454  1.272   msaitoh 				 * affect the hardware state.
   1455  1.272   msaitoh 				 */
   1456  1.272   msaitoh 				return (*ifp->if_init)(ifp);
   1457  1.272   msaitoh 			}
   1458  1.272   msaitoh 		} else
   1459  1.272   msaitoh 			error = (*ifp->if_init)(ifp);
   1460  1.272   msaitoh 		return error;
   1461  1.272   msaitoh 	case 0:
   1462  1.272   msaitoh 		break;
   1463  1.272   msaitoh 	}
   1464  1.272   msaitoh 
   1465  1.272   msaitoh 	return 0;
   1466  1.272   msaitoh }
   1467  1.272   msaitoh 
   1468   1.66   thorpej /*
   1469   1.66   thorpej  * Common ioctls for Ethernet interfaces.  Note, we must be
   1470   1.66   thorpej  * called at splnet().
   1471   1.66   thorpej  */
   1472   1.66   thorpej int
   1473  1.147  christos ether_ioctl(struct ifnet *ifp, u_long cmd, void *data)
   1474   1.66   thorpej {
   1475  1.272   msaitoh 	struct ethercom *ec = (void *)ifp;
   1476  1.193   msaitoh 	struct eccapreq *eccr;
   1477   1.66   thorpej 	struct ifreq *ifr = (struct ifreq *)data;
   1478  1.170    dyoung 	struct if_laddrreq *iflr = data;
   1479  1.170    dyoung 	const struct sockaddr_dl *sdl;
   1480  1.170    dyoung 	static const uint8_t zero[ETHER_ADDR_LEN];
   1481  1.169    dyoung 	int error;
   1482   1.66   thorpej 
   1483   1.66   thorpej 	switch (cmd) {
   1484  1.170    dyoung 	case SIOCINITIFADDR:
   1485  1.191      matt 	    {
   1486  1.191      matt 		struct ifaddr *ifa = (struct ifaddr *)data;
   1487  1.191      matt 		if (ifa->ifa_addr->sa_family != AF_LINK
   1488  1.247   msaitoh 		    && (ifp->if_flags & (IFF_UP | IFF_RUNNING)) !=
   1489  1.247   msaitoh 		       (IFF_UP | IFF_RUNNING)) {
   1490  1.170    dyoung 			ifp->if_flags |= IFF_UP;
   1491  1.170    dyoung 			if ((error = (*ifp->if_init)(ifp)) != 0)
   1492  1.170    dyoung 				return error;
   1493  1.170    dyoung 		}
   1494   1.66   thorpej #ifdef INET
   1495  1.191      matt 		if (ifa->ifa_addr->sa_family == AF_INET)
   1496  1.191      matt 			arp_ifinit(ifp, ifa);
   1497  1.252      maxv #endif
   1498  1.169    dyoung 		return 0;
   1499  1.191      matt 	    }
   1500   1.66   thorpej 
   1501   1.66   thorpej 	case SIOCSIFMTU:
   1502   1.82   thorpej 	    {
   1503   1.82   thorpej 		int maxmtu;
   1504   1.82   thorpej 
   1505   1.82   thorpej 		if (ec->ec_capabilities & ETHERCAP_JUMBO_MTU)
   1506   1.82   thorpej 			maxmtu = ETHERMTU_JUMBO;
   1507   1.82   thorpej 		else
   1508   1.82   thorpej 			maxmtu = ETHERMTU;
   1509   1.82   thorpej 
   1510   1.82   thorpej 		if (ifr->ifr_mtu < ETHERMIN || ifr->ifr_mtu > maxmtu)
   1511  1.169    dyoung 			return EINVAL;
   1512  1.169    dyoung 		else if ((error = ifioctl_common(ifp, cmd, data)) != ENETRESET)
   1513  1.169    dyoung 			return error;
   1514  1.169    dyoung 		else if (ifp->if_flags & IFF_UP) {
   1515   1.88   thorpej 			/* Make sure the device notices the MTU change. */
   1516  1.169    dyoung 			return (*ifp->if_init)(ifp);
   1517  1.169    dyoung 		} else
   1518  1.169    dyoung 			return 0;
   1519   1.82   thorpej 	    }
   1520   1.66   thorpej 
   1521   1.66   thorpej 	case SIOCSIFFLAGS:
   1522  1.170    dyoung 		if ((error = ifioctl_common(ifp, cmd, data)) != 0)
   1523  1.170    dyoung 			return error;
   1524  1.272   msaitoh 		return ether_ioctl_reinit(ec);
   1525  1.274     ozaki 	case SIOCGIFFLAGS:
   1526  1.274     ozaki 		error = ifioctl_common(ifp, cmd, data);
   1527  1.274     ozaki 		if (error == 0) {
   1528  1.274     ozaki 			/* Set IFF_ALLMULTI for backcompat */
   1529  1.274     ozaki 			ifr->ifr_flags |= (ec->ec_flags & ETHER_F_ALLMULTI) ?
   1530  1.274     ozaki 			    IFF_ALLMULTI : 0;
   1531  1.274     ozaki 		}
   1532  1.274     ozaki 		return error;
   1533  1.193   msaitoh 	case SIOCGETHERCAP:
   1534  1.193   msaitoh 		eccr = (struct eccapreq *)data;
   1535  1.193   msaitoh 		eccr->eccr_capabilities = ec->ec_capabilities;
   1536  1.193   msaitoh 		eccr->eccr_capenable = ec->ec_capenable;
   1537  1.193   msaitoh 		return 0;
   1538  1.272   msaitoh 	case SIOCSETHERCAP:
   1539  1.272   msaitoh 		eccr = (struct eccapreq *)data;
   1540  1.272   msaitoh 		if ((eccr->eccr_capenable & ~ec->ec_capabilities) != 0)
   1541  1.272   msaitoh 			return EINVAL;
   1542  1.272   msaitoh 		if (eccr->eccr_capenable == ec->ec_capenable)
   1543  1.272   msaitoh 			return 0;
   1544  1.272   msaitoh #if 0 /* notyet */
   1545  1.272   msaitoh 		ec->ec_capenable = (ec->ec_capenable & ETHERCAP_CANTCHANGE)
   1546  1.272   msaitoh 		    | (eccr->eccr_capenable & ~ETHERCAP_CANTCHANGE);
   1547  1.272   msaitoh #else
   1548  1.272   msaitoh 		ec->ec_capenable = eccr->eccr_capenable;
   1549  1.272   msaitoh #endif
   1550  1.272   msaitoh 		return ether_ioctl_reinit(ec);
   1551   1.66   thorpej 	case SIOCADDMULTI:
   1552  1.169    dyoung 		return ether_addmulti(ifreq_getaddr(cmd, ifr), ec);
   1553   1.66   thorpej 	case SIOCDELMULTI:
   1554  1.169    dyoung 		return ether_delmulti(ifreq_getaddr(cmd, ifr), ec);
   1555  1.160    dyoung 	case SIOCSIFMEDIA:
   1556  1.160    dyoung 	case SIOCGIFMEDIA:
   1557  1.275   msaitoh 		if (ec->ec_mii != NULL)
   1558  1.275   msaitoh 			return ifmedia_ioctl(ifp, ifr, &ec->ec_mii->mii_media,
   1559  1.275   msaitoh 			    cmd);
   1560  1.275   msaitoh 		else if (ec->ec_ifmedia != NULL)
   1561  1.275   msaitoh 			return ifmedia_ioctl(ifp, ifr, ec->ec_ifmedia, cmd);
   1562  1.275   msaitoh 		else
   1563  1.169    dyoung 			return ENOTTY;
   1564  1.275   msaitoh 		break;
   1565  1.170    dyoung 	case SIOCALIFADDR:
   1566  1.170    dyoung 		sdl = satocsdl(sstocsa(&iflr->addr));
   1567  1.170    dyoung 		if (sdl->sdl_family != AF_LINK)
   1568  1.170    dyoung 			;
   1569  1.170    dyoung 		else if (ETHER_IS_MULTICAST(CLLADDR(sdl)))
   1570  1.170    dyoung 			return EINVAL;
   1571  1.170    dyoung 		else if (memcmp(zero, CLLADDR(sdl), sizeof(zero)) == 0)
   1572  1.170    dyoung 			return EINVAL;
   1573  1.170    dyoung 		/*FALLTHROUGH*/
   1574  1.170    dyoung 	default:
   1575  1.161    dyoung 		return ifioctl_common(ifp, cmd, data);
   1576   1.66   thorpej 	}
   1577  1.169    dyoung 	return 0;
   1578    1.3   hpeyerl }
   1579  1.200     joerg 
   1580  1.215  christos /*
   1581  1.215  christos  * Enable/disable passing VLAN packets if the parent interface supports it.
   1582  1.215  christos  * Return:
   1583  1.215  christos  * 	 0: Ok
   1584  1.215  christos  *	-1: Parent interface does not support vlans
   1585  1.215  christos  *	>0: Error
   1586  1.215  christos  */
   1587  1.215  christos int
   1588  1.215  christos ether_enable_vlan_mtu(struct ifnet *ifp)
   1589  1.215  christos {
   1590  1.215  christos 	int error;
   1591  1.215  christos 	struct ethercom *ec = (void *)ifp;
   1592  1.215  christos 
   1593  1.215  christos 	/* Parent does not support VLAN's */
   1594  1.215  christos 	if ((ec->ec_capabilities & ETHERCAP_VLAN_MTU) == 0)
   1595  1.215  christos 		return -1;
   1596  1.215  christos 
   1597  1.215  christos 	/*
   1598  1.215  christos 	 * Parent supports the VLAN_MTU capability,
   1599  1.215  christos 	 * i.e. can Tx/Rx larger than ETHER_MAX_LEN frames;
   1600  1.215  christos 	 * enable it.
   1601  1.215  christos 	 */
   1602  1.215  christos 	ec->ec_capenable |= ETHERCAP_VLAN_MTU;
   1603  1.215  christos 
   1604  1.215  christos 	/* Interface is down, defer for later */
   1605  1.215  christos 	if ((ifp->if_flags & IFF_UP) == 0)
   1606  1.215  christos 		return 0;
   1607  1.215  christos 
   1608  1.215  christos 	if ((error = if_flags_set(ifp, ifp->if_flags)) == 0)
   1609  1.215  christos 		return 0;
   1610  1.215  christos 
   1611  1.215  christos 	ec->ec_capenable &= ~ETHERCAP_VLAN_MTU;
   1612  1.215  christos 	return error;
   1613  1.215  christos }
   1614  1.215  christos 
   1615  1.215  christos int
   1616  1.215  christos ether_disable_vlan_mtu(struct ifnet *ifp)
   1617  1.215  christos {
   1618  1.215  christos 	int error;
   1619  1.215  christos 	struct ethercom *ec = (void *)ifp;
   1620  1.215  christos 
   1621  1.215  christos 	/* We still have VLAN's, defer for later */
   1622  1.215  christos 	if (ec->ec_nvlans != 0)
   1623  1.215  christos 		return 0;
   1624  1.215  christos 
   1625  1.215  christos 	/* Parent does not support VLAB's, nothing to do. */
   1626  1.215  christos 	if ((ec->ec_capenable & ETHERCAP_VLAN_MTU) == 0)
   1627  1.215  christos 		return -1;
   1628  1.215  christos 
   1629  1.215  christos 	/*
   1630  1.215  christos 	 * Disable Tx/Rx of VLAN-sized frames.
   1631  1.215  christos 	 */
   1632  1.215  christos 	ec->ec_capenable &= ~ETHERCAP_VLAN_MTU;
   1633  1.250      maxv 
   1634  1.215  christos 	/* Interface is down, defer for later */
   1635  1.215  christos 	if ((ifp->if_flags & IFF_UP) == 0)
   1636  1.215  christos 		return 0;
   1637  1.215  christos 
   1638  1.215  christos 	if ((error = if_flags_set(ifp, ifp->if_flags)) == 0)
   1639  1.215  christos 		return 0;
   1640  1.215  christos 
   1641  1.215  christos 	ec->ec_capenable |= ETHERCAP_VLAN_MTU;
   1642  1.215  christos 	return error;
   1643  1.215  christos }
   1644  1.215  christos 
   1645  1.200     joerg static int
   1646  1.200     joerg ether_multicast_sysctl(SYSCTLFN_ARGS)
   1647  1.200     joerg {
   1648  1.200     joerg 	struct ether_multi *enm;
   1649  1.200     joerg 	struct ifnet *ifp;
   1650  1.200     joerg 	struct ethercom *ec;
   1651  1.223     ozaki 	int error = 0;
   1652  1.200     joerg 	size_t written;
   1653  1.223     ozaki 	struct psref psref;
   1654  1.237     skrll 	int bound;
   1655  1.233     ozaki 	unsigned int multicnt;
   1656  1.233     ozaki 	struct ether_multi_sysctl *addrs;
   1657  1.233     ozaki 	int i;
   1658  1.200     joerg 
   1659  1.200     joerg 	if (namelen != 1)
   1660  1.200     joerg 		return EINVAL;
   1661  1.200     joerg 
   1662  1.223     ozaki 	bound = curlwp_bind();
   1663  1.223     ozaki 	ifp = if_get_byindex(name[0], &psref);
   1664  1.223     ozaki 	if (ifp == NULL) {
   1665  1.223     ozaki 		error = ENODEV;
   1666  1.223     ozaki 		goto out;
   1667  1.223     ozaki 	}
   1668  1.200     joerg 	if (ifp->if_type != IFT_ETHER) {
   1669  1.223     ozaki 		if_put(ifp, &psref);
   1670  1.200     joerg 		*oldlenp = 0;
   1671  1.223     ozaki 		goto out;
   1672  1.200     joerg 	}
   1673  1.200     joerg 	ec = (struct ethercom *)ifp;
   1674  1.200     joerg 
   1675  1.200     joerg 	if (oldp == NULL) {
   1676  1.223     ozaki 		if_put(ifp, &psref);
   1677  1.233     ozaki 		*oldlenp = ec->ec_multicnt * sizeof(*addrs);
   1678  1.223     ozaki 		goto out;
   1679  1.200     joerg 	}
   1680  1.200     joerg 
   1681  1.233     ozaki 	/*
   1682  1.233     ozaki 	 * ec->ec_lock is a spin mutex so we cannot call sysctl_copyout, which
   1683  1.251      maxv 	 * is sleepable, while holding it. Copy data to a local buffer first
   1684  1.251      maxv 	 * with the lock taken and then call sysctl_copyout without holding it.
   1685  1.233     ozaki 	 */
   1686  1.233     ozaki retry:
   1687  1.233     ozaki 	multicnt = ec->ec_multicnt;
   1688  1.251      maxv 
   1689  1.251      maxv 	if (multicnt == 0) {
   1690  1.251      maxv 		if_put(ifp, &psref);
   1691  1.251      maxv 		*oldlenp = 0;
   1692  1.251      maxv 		goto out;
   1693  1.251      maxv 	}
   1694  1.251      maxv 
   1695  1.252      maxv 	addrs = kmem_zalloc(sizeof(*addrs) * multicnt, KM_SLEEP);
   1696  1.200     joerg 
   1697  1.245   msaitoh 	ETHER_LOCK(ec);
   1698  1.251      maxv 	if (multicnt != ec->ec_multicnt) {
   1699  1.251      maxv 		/* The number of multicast addresses has changed */
   1700  1.245   msaitoh 		ETHER_UNLOCK(ec);
   1701  1.233     ozaki 		kmem_free(addrs, sizeof(*addrs) * multicnt);
   1702  1.233     ozaki 		goto retry;
   1703  1.233     ozaki 	}
   1704  1.233     ozaki 
   1705  1.233     ozaki 	i = 0;
   1706  1.200     joerg 	LIST_FOREACH(enm, &ec->ec_multiaddrs, enm_list) {
   1707  1.233     ozaki 		struct ether_multi_sysctl *addr = &addrs[i];
   1708  1.233     ozaki 		addr->enm_refcount = enm->enm_refcount;
   1709  1.233     ozaki 		memcpy(addr->enm_addrlo, enm->enm_addrlo, ETHER_ADDR_LEN);
   1710  1.233     ozaki 		memcpy(addr->enm_addrhi, enm->enm_addrhi, ETHER_ADDR_LEN);
   1711  1.233     ozaki 		i++;
   1712  1.233     ozaki 	}
   1713  1.245   msaitoh 	ETHER_UNLOCK(ec);
   1714  1.233     ozaki 
   1715  1.233     ozaki 	error = 0;
   1716  1.233     ozaki 	written = 0;
   1717  1.233     ozaki 	for (i = 0; i < multicnt; i++) {
   1718  1.233     ozaki 		struct ether_multi_sysctl *addr = &addrs[i];
   1719  1.233     ozaki 
   1720  1.233     ozaki 		if (written + sizeof(*addr) > *oldlenp)
   1721  1.200     joerg 			break;
   1722  1.233     ozaki 		error = sysctl_copyout(l, addr, oldp, sizeof(*addr));
   1723  1.200     joerg 		if (error)
   1724  1.200     joerg 			break;
   1725  1.233     ozaki 		written += sizeof(*addr);
   1726  1.233     ozaki 		oldp = (char *)oldp + sizeof(*addr);
   1727  1.200     joerg 	}
   1728  1.233     ozaki 	kmem_free(addrs, sizeof(*addrs) * multicnt);
   1729  1.233     ozaki 
   1730  1.223     ozaki 	if_put(ifp, &psref);
   1731  1.200     joerg 
   1732  1.200     joerg 	*oldlenp = written;
   1733  1.223     ozaki out:
   1734  1.223     ozaki 	curlwp_bindx(bound);
   1735  1.200     joerg 	return error;
   1736  1.200     joerg }
   1737  1.200     joerg 
   1738  1.234     ozaki static void
   1739  1.234     ozaki ether_sysctl_setup(struct sysctllog **clog)
   1740  1.200     joerg {
   1741  1.200     joerg 	const struct sysctlnode *rnode = NULL;
   1742  1.200     joerg 
   1743  1.200     joerg 	sysctl_createv(clog, 0, NULL, &rnode,
   1744  1.200     joerg 		       CTLFLAG_PERMANENT,
   1745  1.200     joerg 		       CTLTYPE_NODE, "ether",
   1746  1.200     joerg 		       SYSCTL_DESCR("Ethernet-specific information"),
   1747  1.200     joerg 		       NULL, 0, NULL, 0,
   1748  1.200     joerg 		       CTL_NET, CTL_CREATE, CTL_EOL);
   1749  1.200     joerg 
   1750  1.200     joerg 	sysctl_createv(clog, 0, &rnode, NULL,
   1751  1.200     joerg 		       CTLFLAG_PERMANENT,
   1752  1.200     joerg 		       CTLTYPE_NODE, "multicast",
   1753  1.200     joerg 		       SYSCTL_DESCR("multicast addresses"),
   1754  1.200     joerg 		       ether_multicast_sysctl, 0, NULL, 0,
   1755  1.200     joerg 		       CTL_CREATE, CTL_EOL);
   1756  1.200     joerg }
   1757  1.203     ozaki 
   1758  1.203     ozaki void
   1759  1.203     ozaki etherinit(void)
   1760  1.203     ozaki {
   1761  1.234     ozaki 
   1762  1.278   msaitoh #ifdef DIAGNOSTIC
   1763  1.203     ozaki 	mutex_init(&bigpktpps_lock, MUTEX_DEFAULT, IPL_NET);
   1764  1.278   msaitoh #endif
   1765  1.234     ozaki 	ether_sysctl_setup(NULL);
   1766  1.203     ozaki }
   1767