Home | History | Annotate | Line # | Download | only in net
if_ethersubr.c revision 1.250
      1  1.250      maxv /*	$NetBSD: if_ethersubr.c,v 1.250 2017/12/09 10:51:30 maxv Exp $	*/
      2   1.44    itojun 
      3   1.44    itojun /*
      4   1.44    itojun  * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
      5   1.44    itojun  * All rights reserved.
      6  1.120     perry  *
      7   1.44    itojun  * Redistribution and use in source and binary forms, with or without
      8   1.44    itojun  * modification, are permitted provided that the following conditions
      9   1.44    itojun  * are met:
     10   1.44    itojun  * 1. Redistributions of source code must retain the above copyright
     11   1.44    itojun  *    notice, this list of conditions and the following disclaimer.
     12   1.44    itojun  * 2. Redistributions in binary form must reproduce the above copyright
     13   1.44    itojun  *    notice, this list of conditions and the following disclaimer in the
     14   1.44    itojun  *    documentation and/or other materials provided with the distribution.
     15   1.44    itojun  * 3. Neither the name of the project nor the names of its contributors
     16   1.44    itojun  *    may be used to endorse or promote products derived from this software
     17   1.44    itojun  *    without specific prior written permission.
     18  1.120     perry  *
     19   1.44    itojun  * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
     20   1.44    itojun  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     21   1.44    itojun  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     22   1.44    itojun  * ARE DISCLAIMED.  IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
     23   1.44    itojun  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     24   1.44    itojun  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     25   1.44    itojun  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     26   1.44    itojun  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     27   1.44    itojun  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     28   1.44    itojun  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     29   1.44    itojun  * SUCH DAMAGE.
     30   1.44    itojun  */
     31    1.9       cgd 
     32    1.1       cgd /*
     33    1.8   mycroft  * Copyright (c) 1982, 1989, 1993
     34    1.8   mycroft  *	The Regents of the University of California.  All rights reserved.
     35    1.1       cgd  *
     36    1.1       cgd  * Redistribution and use in source and binary forms, with or without
     37    1.1       cgd  * modification, are permitted provided that the following conditions
     38    1.1       cgd  * are met:
     39    1.1       cgd  * 1. Redistributions of source code must retain the above copyright
     40    1.1       cgd  *    notice, this list of conditions and the following disclaimer.
     41    1.1       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     42    1.1       cgd  *    notice, this list of conditions and the following disclaimer in the
     43    1.1       cgd  *    documentation and/or other materials provided with the distribution.
     44  1.113       agc  * 3. Neither the name of the University nor the names of its contributors
     45    1.1       cgd  *    may be used to endorse or promote products derived from this software
     46    1.1       cgd  *    without specific prior written permission.
     47    1.1       cgd  *
     48    1.1       cgd  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     49    1.1       cgd  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     50    1.1       cgd  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     51    1.1       cgd  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     52    1.1       cgd  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     53    1.1       cgd  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     54    1.1       cgd  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     55    1.1       cgd  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     56    1.1       cgd  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     57    1.1       cgd  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     58    1.1       cgd  * SUCH DAMAGE.
     59    1.1       cgd  *
     60   1.27      fvdl  *	@(#)if_ethersubr.c	8.2 (Berkeley) 4/4/96
     61    1.1       cgd  */
     62   1.90     lukem 
     63   1.90     lukem #include <sys/cdefs.h>
     64  1.250      maxv __KERNEL_RCSID(0, "$NetBSD: if_ethersubr.c,v 1.250 2017/12/09 10:51:30 maxv Exp $");
     65    1.1       cgd 
     66  1.212     pooka #ifdef _KERNEL_OPT
     67   1.33  jonathan #include "opt_inet.h"
     68   1.33  jonathan #include "opt_atalk.h"
     69  1.112    martin #include "opt_mbuftrace.h"
     70  1.182    kefren #include "opt_mpls.h"
     71   1.30      matt #include "opt_gateway.h"
     72  1.135     pavel #include "opt_pppoe.h"
     73  1.206     ozaki #include "opt_net_mpsafe.h"
     74  1.212     pooka #endif
     75  1.212     pooka 
     76   1.59   thorpej #include "vlan.h"
     77   1.81    martin #include "pppoe.h"
     78   1.78   thorpej #include "bridge.h"
     79   1.93    martin #include "arp.h"
     80  1.121      yamt #include "agr.h"
     81   1.30      matt 
     82  1.200     joerg #include <sys/sysctl.h>
     83    1.4   mycroft #include <sys/mbuf.h>
     84  1.211     ozaki #include <sys/mutex.h>
     85    1.4   mycroft #include <sys/ioctl.h>
     86    1.4   mycroft #include <sys/errno.h>
     87  1.158    dyoung #include <sys/device.h>
     88  1.204       tls #include <sys/rnd.h>
     89  1.207  riastrad #include <sys/rndsource.h>
     90  1.216     ozaki #include <sys/cpu.h>
     91  1.231     ozaki #include <sys/kmem.h>
     92    1.8   mycroft 
     93    1.4   mycroft #include <net/if.h>
     94    1.4   mycroft #include <net/netisr.h>
     95    1.4   mycroft #include <net/route.h>
     96    1.4   mycroft #include <net/if_llc.h>
     97    1.4   mycroft #include <net/if_dl.h>
     98    1.8   mycroft #include <net/if_types.h>
     99  1.211     ozaki #include <net/pktqueue.h>
    100   1.93    martin 
    101  1.158    dyoung #include <net/if_media.h>
    102  1.158    dyoung #include <dev/mii/mii.h>
    103  1.158    dyoung #include <dev/mii/miivar.h>
    104  1.158    dyoung 
    105   1.93    martin #if NARP == 0
    106   1.93    martin /*
    107  1.102      jmmv  * XXX there should really be a way to issue this warning from within config(8)
    108   1.93    martin  */
    109  1.111    martin #error You have included NETATALK or a pseudo-device in your configuration that depends on the presence of ethernet interfaces, but have no such interfaces configured. Check if you really need pseudo-device bridge, pppoe, vlan or options NETATALK.
    110   1.93    martin #endif
    111    1.1       cgd 
    112   1.69   thorpej #include <net/bpf.h>
    113   1.69   thorpej 
    114   1.22        is #include <net/if_ether.h>
    115   1.59   thorpej #include <net/if_vlanvar.h>
    116   1.22        is 
    117   1.81    martin #if NPPPOE > 0
    118   1.81    martin #include <net/if_pppoe.h>
    119   1.81    martin #endif
    120   1.81    martin 
    121  1.121      yamt #if NAGR > 0
    122  1.121      yamt #include <net/agr/ieee8023_slowprotocols.h>	/* XXX */
    123  1.121      yamt #include <net/agr/ieee8023ad.h>
    124  1.121      yamt #include <net/agr/if_agrvar.h>
    125  1.121      yamt #endif
    126  1.121      yamt 
    127   1.78   thorpej #if NBRIDGE > 0
    128   1.78   thorpej #include <net/if_bridgevar.h>
    129   1.78   thorpej #endif
    130   1.78   thorpej 
    131   1.15      phil #include <netinet/in.h>
    132    1.1       cgd #ifdef INET
    133    1.4   mycroft #include <netinet/in_var.h>
    134    1.1       cgd #endif
    135   1.22        is #include <netinet/if_inarp.h>
    136    1.1       cgd 
    137   1.44    itojun #ifdef INET6
    138   1.44    itojun #ifndef INET
    139   1.44    itojun #include <netinet/in.h>
    140   1.44    itojun #endif
    141   1.44    itojun #include <netinet6/in6_var.h>
    142   1.44    itojun #include <netinet6/nd6.h>
    143   1.44    itojun #endif
    144   1.44    itojun 
    145    1.1       cgd 
    146  1.133  liamjfoy #include "carp.h"
    147  1.133  liamjfoy #if NCARP > 0
    148  1.133  liamjfoy #include <netinet/ip_carp.h>
    149  1.133  liamjfoy #endif
    150  1.133  liamjfoy 
    151   1.23  christos #ifdef NETATALK
    152   1.23  christos #include <netatalk/at.h>
    153   1.23  christos #include <netatalk/at_var.h>
    154   1.23  christos #include <netatalk/at_extern.h>
    155   1.23  christos 
    156   1.23  christos #define llc_snap_org_code llc_un.type_snap.org_code
    157   1.23  christos #define llc_snap_ether_type llc_un.type_snap.ether_type
    158   1.23  christos 
    159   1.23  christos extern u_char	at_org_code[3];
    160   1.23  christos extern u_char	aarp_org_code[3];
    161   1.23  christos #endif /* NETATALK */
    162   1.23  christos 
    163  1.182    kefren #ifdef MPLS
    164  1.182    kefren #include <netmpls/mpls.h>
    165  1.182    kefren #include <netmpls/mpls_var.h>
    166  1.182    kefren #endif
    167  1.182    kefren 
    168  1.123      matt static struct timeval bigpktppslim_last;
    169  1.123      matt static int bigpktppslim = 2;	/* XXX */
    170  1.123      matt static int bigpktpps_count;
    171  1.203     ozaki static kmutex_t bigpktpps_lock __cacheline_aligned;
    172  1.123      matt 
    173  1.123      matt 
    174  1.118      yamt const uint8_t etherbroadcastaddr[ETHER_ADDR_LEN] =
    175  1.118      yamt     { 0xff, 0xff, 0xff, 0xff, 0xff, 0xff };
    176  1.121      yamt const uint8_t ethermulticastaddr_slowprotocols[ETHER_ADDR_LEN] =
    177  1.121      yamt     { 0x01, 0x80, 0xc2, 0x00, 0x00, 0x02 };
    178    1.8   mycroft #define senderr(e) { error = (e); goto bad;}
    179    1.1       cgd 
    180  1.128   thorpej static	int ether_output(struct ifnet *, struct mbuf *,
    181  1.222     ozaki 	    const struct sockaddr *, const struct rtentry *);
    182   1.42   thorpej 
    183    1.1       cgd /*
    184    1.1       cgd  * Ethernet output routine.
    185    1.1       cgd  * Encapsulate a packet of type family for the local net.
    186   1.22        is  * Assumes that ifp is actually pointer to ethercom structure.
    187    1.1       cgd  */
    188   1.42   thorpej static int
    189  1.178    dyoung ether_output(struct ifnet * const ifp0, struct mbuf * const m0,
    190  1.178    dyoung 	const struct sockaddr * const dst,
    191  1.222     ozaki 	const struct rtentry *rt)
    192    1.1       cgd {
    193  1.162      matt 	uint16_t etype = 0;
    194  1.122  christos 	int error = 0, hdrcmplt = 0;
    195  1.250      maxv 	uint8_t esrc[6], edst[6];
    196   1.29       mrg 	struct mbuf *m = m0;
    197  1.151    dyoung 	struct mbuf *mcopy = NULL;
    198   1.29       mrg 	struct ether_header *eh;
    199  1.133  liamjfoy 	struct ifnet *ifp = ifp0;
    200   1.24  christos #ifdef INET
    201   1.22        is 	struct arphdr *ah;
    202   1.24  christos #endif /* INET */
    203   1.23  christos #ifdef NETATALK
    204   1.23  christos 	struct at_ifaddr *aa;
    205   1.23  christos #endif /* NETATALK */
    206    1.1       cgd 
    207  1.104      matt #ifdef MBUFTRACE
    208  1.116  jonathan 	m_claimm(m, ifp->if_mowner);
    209  1.104      matt #endif
    210  1.133  liamjfoy 
    211  1.133  liamjfoy #if NCARP > 0
    212  1.133  liamjfoy 	if (ifp->if_type == IFT_CARP) {
    213  1.133  liamjfoy 		struct ifaddr *ifa;
    214  1.227     ozaki 		int s = pserialize_read_enter();
    215  1.133  liamjfoy 
    216  1.133  liamjfoy 		/* loop back if this is going to the carp interface */
    217  1.133  liamjfoy 		if (dst != NULL && ifp0->if_link_state == LINK_STATE_UP &&
    218  1.227     ozaki 		    (ifa = ifa_ifwithaddr(dst)) != NULL) {
    219  1.227     ozaki 			if (ifa->ifa_ifp == ifp0) {
    220  1.227     ozaki 				pserialize_read_exit(s);
    221  1.227     ozaki 				return looutput(ifp0, m, dst, rt);
    222  1.227     ozaki 			}
    223  1.227     ozaki 		}
    224  1.227     ozaki 		pserialize_read_exit(s);
    225  1.133  liamjfoy 
    226  1.133  liamjfoy 		ifp = ifp->if_carpdev;
    227  1.133  liamjfoy 		/* ac = (struct arpcom *)ifp; */
    228  1.133  liamjfoy 
    229  1.247   msaitoh 		if ((ifp0->if_flags & (IFF_UP | IFF_RUNNING)) !=
    230  1.247   msaitoh 		    (IFF_UP | IFF_RUNNING))
    231  1.133  liamjfoy 			senderr(ENETDOWN);
    232  1.133  liamjfoy 	}
    233  1.133  liamjfoy #endif /* NCARP > 0 */
    234  1.133  liamjfoy 
    235  1.247   msaitoh 	if ((ifp->if_flags & (IFF_UP | IFF_RUNNING)) != (IFF_UP | IFF_RUNNING))
    236    1.8   mycroft 		senderr(ENETDOWN);
    237   1.72   thorpej 
    238    1.1       cgd 	switch (dst->sa_family) {
    239    1.1       cgd 
    240    1.1       cgd #ifdef INET
    241    1.1       cgd 	case AF_INET:
    242   1.22        is 		if (m->m_flags & M_BCAST)
    243  1.174     isaki 			(void)memcpy(edst, etherbroadcastaddr, sizeof(edst));
    244  1.145    dyoung 		else if (m->m_flags & M_MCAST)
    245  1.145    dyoung 			ETHER_MAP_IP_MULTICAST(&satocsin(dst)->sin_addr, edst);
    246  1.217  christos 		else if ((error = arpresolve(ifp, rt, m, dst, edst,
    247  1.224  knakahar 		    sizeof(edst))) != 0) {
    248  1.214       roy 			return error == EWOULDBLOCK ? 0 : error;
    249  1.224  knakahar 		}
    250    1.3   hpeyerl 		/* If broadcasting on a simplex interface, loopback a copy */
    251    1.3   hpeyerl 		if ((m->m_flags & M_BCAST) && (ifp->if_flags & IFF_SIMPLEX))
    252    1.1       cgd 			mcopy = m_copy(m, 0, (int)M_COPYALL);
    253   1.17   mycroft 		etype = htons(ETHERTYPE_IP);
    254    1.8   mycroft 		break;
    255   1.22        is 
    256   1.22        is 	case AF_ARP:
    257   1.22        is 		ah = mtod(m, struct arphdr *);
    258   1.22        is 		if (m->m_flags & M_BCAST)
    259  1.174     isaki 			(void)memcpy(edst, etherbroadcastaddr, sizeof(edst));
    260  1.131       mrg 		else {
    261  1.147  christos 			void *tha = ar_tha(ah);
    262  1.131       mrg 
    263  1.173  christos 			if (tha == NULL) {
    264  1.173  christos 				/* fake with ARPHDR_IEEE1394 */
    265  1.236      maxv 				m_freem(m);
    266  1.173  christos 				return 0;
    267  1.173  christos 			}
    268  1.146    dyoung 			memcpy(edst, tha, sizeof(edst));
    269  1.131       mrg 		}
    270  1.120     perry 
    271   1.22        is 		ah->ar_hrd = htons(ARPHRD_ETHER);
    272   1.22        is 
    273  1.107    itojun 		switch (ntohs(ah->ar_op)) {
    274   1.22        is 		case ARPOP_REVREQUEST:
    275   1.22        is 		case ARPOP_REVREPLY:
    276   1.22        is 			etype = htons(ETHERTYPE_REVARP);
    277   1.22        is 			break;
    278   1.22        is 
    279   1.22        is 		case ARPOP_REQUEST:
    280   1.22        is 		case ARPOP_REPLY:
    281   1.22        is 		default:
    282   1.22        is 			etype = htons(ETHERTYPE_ARP);
    283   1.22        is 		}
    284   1.22        is 
    285   1.22        is 		break;
    286    1.1       cgd #endif
    287   1.44    itojun #ifdef INET6
    288   1.44    itojun 	case AF_INET6:
    289  1.238     ozaki 		if (m->m_flags & M_BCAST)
    290  1.238     ozaki 			(void)memcpy(edst, etherbroadcastaddr, sizeof(edst));
    291  1.238     ozaki 		else if (m->m_flags & M_MCAST) {
    292  1.238     ozaki 			ETHER_MAP_IPV6_MULTICAST(&satocsin6(dst)->sin6_addr,
    293  1.238     ozaki 			    edst);
    294  1.238     ozaki 		} else {
    295  1.238     ozaki 			error = nd6_resolve(ifp, rt, m, dst, edst,
    296  1.238     ozaki 			    sizeof(edst));
    297  1.238     ozaki 			if (error != 0)
    298  1.238     ozaki 				return error == EWOULDBLOCK ? 0 : error;
    299   1.51    itojun 		}
    300   1.44    itojun 		etype = htons(ETHERTYPE_IPV6);
    301   1.44    itojun 		break;
    302   1.44    itojun #endif
    303   1.23  christos #ifdef NETATALK
    304  1.250      maxv 	case AF_APPLETALK: {
    305  1.227     ozaki 		struct ifaddr *ifa;
    306  1.227     ozaki 		int s;
    307  1.227     ozaki 
    308  1.224  knakahar 		KERNEL_LOCK(1, NULL);
    309  1.226       rjs 		if (!aarpresolve(ifp, m, (const struct sockaddr_at *)dst, edst)) {
    310   1.23  christos #ifdef NETATALKDEBUG
    311   1.23  christos 			printf("aarpresolv failed\n");
    312   1.23  christos #endif /* NETATALKDEBUG */
    313  1.224  knakahar 			KERNEL_UNLOCK_ONE(NULL);
    314   1.23  christos 			return (0);
    315   1.23  christos 		}
    316   1.23  christos 		/*
    317   1.23  christos 		 * ifaddr is the first thing in at_ifaddr
    318   1.23  christos 		 */
    319  1.227     ozaki 		s = pserialize_read_enter();
    320  1.227     ozaki 		ifa = at_ifawithnet((const struct sockaddr_at *)dst, ifp);
    321  1.227     ozaki 		if (ifa == NULL) {
    322  1.227     ozaki 			pserialize_read_exit(s);
    323  1.227     ozaki 			KERNEL_UNLOCK_ONE(NULL);
    324  1.227     ozaki 			goto bad;
    325  1.224  knakahar 		}
    326  1.227     ozaki 		aa = (struct at_ifaddr *)ifa;
    327  1.120     perry 
    328   1.23  christos 		/*
    329   1.23  christos 		 * In the phase 2 case, we need to prepend an mbuf for the
    330   1.23  christos 		 * llc header.  Since we must preserve the value of m,
    331   1.23  christos 		 * which is passed to us by value, we m_copy() the first
    332   1.23  christos 		 * mbuf, and use it for our llc header.
    333   1.23  christos 		 */
    334   1.23  christos 		if (aa->aa_flags & AFA_PHASE2) {
    335   1.23  christos 			struct llc llc;
    336   1.23  christos 
    337   1.43    bouyer 			M_PREPEND(m, sizeof(struct llc), M_DONTWAIT);
    338   1.23  christos 			llc.llc_dsap = llc.llc_ssap = LLC_SNAP_LSAP;
    339   1.23  christos 			llc.llc_control = LLC_UI;
    340  1.146    dyoung 			memcpy(llc.llc_snap_org_code, at_org_code,
    341   1.23  christos 			    sizeof(llc.llc_snap_org_code));
    342   1.38       kim 			llc.llc_snap_ether_type = htons(ETHERTYPE_ATALK);
    343  1.147  christos 			memcpy(mtod(m, void *), &llc, sizeof(struct llc));
    344   1.23  christos 		} else {
    345   1.38       kim 			etype = htons(ETHERTYPE_ATALK);
    346   1.23  christos 		}
    347  1.227     ozaki 		pserialize_read_exit(s);
    348  1.224  knakahar 		KERNEL_UNLOCK_ONE(NULL);
    349   1.23  christos 		break;
    350  1.250      maxv 	}
    351   1.23  christos #endif /* NETATALK */
    352   1.31   thorpej 	case pseudo_AF_HDRCMPLT:
    353   1.31   thorpej 		hdrcmplt = 1;
    354  1.146    dyoung 		memcpy(esrc,
    355  1.146    dyoung 		    ((const struct ether_header *)dst->sa_data)->ether_shost,
    356  1.146    dyoung 		    sizeof(esrc));
    357   1.31   thorpej 		/* FALLTHROUGH */
    358   1.31   thorpej 
    359    1.1       cgd 	case AF_UNSPEC:
    360  1.250      maxv 		memcpy(edst,
    361  1.146    dyoung 		    ((const struct ether_header *)dst->sa_data)->ether_dhost,
    362  1.146    dyoung 		    sizeof(edst));
    363    1.8   mycroft 		/* AF_UNSPEC doesn't swap the byte order of the ether_type. */
    364  1.145    dyoung 		etype = ((const struct ether_header *)dst->sa_data)->ether_type;
    365    1.8   mycroft 		break;
    366    1.1       cgd 
    367    1.1       cgd 	default:
    368   1.21  christos 		printf("%s: can't handle af%d\n", ifp->if_xname,
    369    1.1       cgd 			dst->sa_family);
    370    1.8   mycroft 		senderr(EAFNOSUPPORT);
    371    1.1       cgd 	}
    372    1.1       cgd 
    373  1.182    kefren #ifdef MPLS
    374  1.224  knakahar 	KERNEL_LOCK(1, NULL);
    375  1.210     ozaki 	{
    376  1.210     ozaki 		struct m_tag *mtag;
    377  1.210     ozaki 		mtag = m_tag_find(m, PACKET_TAG_MPLS, NULL);
    378  1.210     ozaki 		if (mtag != NULL) {
    379  1.210     ozaki 			/* Having the tag itself indicates it's MPLS */
    380  1.184    dyoung 			etype = htons(ETHERTYPE_MPLS);
    381  1.210     ozaki 			m_tag_delete(m, mtag);
    382  1.210     ozaki 		}
    383  1.184    dyoung 	}
    384  1.224  knakahar 	KERNEL_UNLOCK_ONE(NULL);
    385  1.182    kefren #endif
    386  1.182    kefren 
    387    1.1       cgd 	if (mcopy)
    388  1.145    dyoung 		(void)looutput(ifp, mcopy, dst, rt);
    389   1.16   mycroft 
    390   1.50      matt 	/* If no ether type is set, this must be a 802.2 formatted packet.
    391   1.50      matt 	 */
    392   1.50      matt 	if (etype == 0)
    393   1.50      matt 		etype = htons(m->m_pkthdr.len);
    394    1.1       cgd 	/*
    395    1.1       cgd 	 * Add local net header.  If no space in first mbuf,
    396    1.1       cgd 	 * allocate another.
    397    1.1       cgd 	 */
    398    1.1       cgd 	M_PREPEND(m, sizeof (struct ether_header), M_DONTWAIT);
    399    1.8   mycroft 	if (m == 0)
    400    1.8   mycroft 		senderr(ENOBUFS);
    401    1.1       cgd 	eh = mtod(m, struct ether_header *);
    402   1.96   thorpej 	/* Note: etype is already in network byte order. */
    403  1.143    cbiere 	(void)memcpy(&eh->ether_type, &etype, sizeof(eh->ether_type));
    404  1.250      maxv 	memcpy(eh->ether_dhost, edst, sizeof(edst));
    405   1.31   thorpej 	if (hdrcmplt)
    406  1.146    dyoung 		memcpy(eh->ether_shost, esrc, sizeof(eh->ether_shost));
    407   1.31   thorpej 	else
    408  1.153    dyoung 	 	memcpy(eh->ether_shost, CLLADDR(ifp->if_sadl),
    409   1.31   thorpej 		    sizeof(eh->ether_shost));
    410   1.77   thorpej 
    411  1.133  liamjfoy #if NCARP > 0
    412  1.133  liamjfoy 	if (ifp0 != ifp && ifp0->if_type == IFT_CARP) {
    413  1.153    dyoung 	 	memcpy(eh->ether_shost, CLLADDR(ifp0->if_sadl),
    414  1.133  liamjfoy 		    sizeof(eh->ether_shost));
    415  1.133  liamjfoy 	}
    416  1.133  liamjfoy #endif /* NCARP > 0 */
    417  1.133  liamjfoy 
    418  1.195     rmind 	if ((error = pfil_run_hooks(ifp->if_pfil, &m, ifp, PFIL_OUT)) != 0)
    419   1.77   thorpej 		return (error);
    420   1.77   thorpej 	if (m == NULL)
    421   1.77   thorpej 		return (0);
    422   1.77   thorpej 
    423   1.78   thorpej #if NBRIDGE > 0
    424   1.78   thorpej 	/*
    425   1.78   thorpej 	 * Bridges require special output handling.
    426   1.78   thorpej 	 */
    427   1.78   thorpej 	if (ifp->if_bridge)
    428   1.78   thorpej 		return (bridge_output(ifp, m, NULL, NULL));
    429   1.78   thorpej #endif
    430   1.78   thorpej 
    431  1.133  liamjfoy #if NCARP > 0
    432  1.133  liamjfoy 	if (ifp != ifp0)
    433  1.133  liamjfoy 		ifp0->if_obytes += m->m_pkthdr.len + ETHER_HDR_LEN;
    434  1.133  liamjfoy #endif /* NCARP > 0 */
    435  1.133  liamjfoy 
    436   1.77   thorpej #ifdef ALTQ
    437  1.224  knakahar 	KERNEL_LOCK(1, NULL);
    438   1.77   thorpej 	/*
    439   1.77   thorpej 	 * If ALTQ is enabled on the parent interface, do
    440   1.77   thorpej 	 * classification; the queueing discipline might not
    441   1.77   thorpej 	 * require classification, but might require the
    442   1.77   thorpej 	 * address family/header pointer in the pktattr.
    443   1.77   thorpej 	 */
    444   1.77   thorpej 	if (ALTQ_IS_ENABLED(&ifp->if_snd))
    445  1.220  knakahar 		altq_etherclassify(&ifp->if_snd, m);
    446  1.224  knakahar 	KERNEL_UNLOCK_ONE(NULL);
    447   1.77   thorpej #endif
    448  1.221  knakahar 	return ifq_enqueue(ifp, m);
    449    1.1       cgd 
    450    1.1       cgd bad:
    451    1.1       cgd 	if (m)
    452    1.1       cgd 		m_freem(m);
    453    1.1       cgd 	return (error);
    454    1.1       cgd }
    455   1.76   thorpej 
    456   1.76   thorpej #ifdef ALTQ
    457   1.76   thorpej /*
    458   1.76   thorpej  * This routine is a slight hack to allow a packet to be classified
    459   1.76   thorpej  * if the Ethernet headers are present.  It will go away when ALTQ's
    460   1.76   thorpej  * classification engine understands link headers.
    461   1.76   thorpej  */
    462   1.76   thorpej void
    463  1.220  knakahar altq_etherclassify(struct ifaltq *ifq, struct mbuf *m)
    464   1.76   thorpej {
    465   1.76   thorpej 	struct ether_header *eh;
    466  1.162      matt 	uint16_t ether_type;
    467   1.76   thorpej 	int hlen, af, hdrsize;
    468  1.147  christos 	void *hdr;
    469   1.76   thorpej 
    470   1.76   thorpej 	hlen = ETHER_HDR_LEN;
    471   1.76   thorpej 	eh = mtod(m, struct ether_header *);
    472   1.76   thorpej 
    473   1.76   thorpej 	ether_type = htons(eh->ether_type);
    474   1.76   thorpej 
    475   1.76   thorpej 	if (ether_type < ETHERMTU) {
    476   1.76   thorpej 		/* LLC/SNAP */
    477   1.76   thorpej 		struct llc *llc = (struct llc *)(eh + 1);
    478   1.76   thorpej 		hlen += 8;
    479   1.76   thorpej 
    480   1.76   thorpej 		if (m->m_len < hlen ||
    481   1.76   thorpej 		    llc->llc_dsap != LLC_SNAP_LSAP ||
    482   1.76   thorpej 		    llc->llc_ssap != LLC_SNAP_LSAP ||
    483   1.76   thorpej 		    llc->llc_control != LLC_UI) {
    484   1.76   thorpej 			/* Not SNAP. */
    485   1.76   thorpej 			goto bad;
    486   1.76   thorpej 		}
    487   1.76   thorpej 
    488   1.76   thorpej 		ether_type = htons(llc->llc_un.type_snap.ether_type);
    489   1.76   thorpej 	}
    490   1.76   thorpej 
    491   1.76   thorpej 	switch (ether_type) {
    492   1.76   thorpej 	case ETHERTYPE_IP:
    493   1.76   thorpej 		af = AF_INET;
    494   1.76   thorpej 		hdrsize = 20;		/* sizeof(struct ip) */
    495   1.76   thorpej 		break;
    496   1.76   thorpej 
    497   1.76   thorpej 	case ETHERTYPE_IPV6:
    498   1.76   thorpej 		af = AF_INET6;
    499   1.76   thorpej 		hdrsize = 40;		/* sizeof(struct ip6_hdr) */
    500   1.76   thorpej 		break;
    501   1.76   thorpej 
    502   1.76   thorpej 	default:
    503   1.76   thorpej 		af = AF_UNSPEC;
    504   1.76   thorpej 		hdrsize = 0;
    505   1.76   thorpej 		break;
    506   1.76   thorpej 	}
    507   1.76   thorpej 
    508   1.95    itojun 	while (m->m_len <= hlen) {
    509   1.95    itojun 		hlen -= m->m_len;
    510   1.95    itojun 		m = m->m_next;
    511   1.95    itojun 	}
    512   1.76   thorpej 	if (m->m_len < (hlen + hdrsize)) {
    513   1.76   thorpej 		/*
    514   1.95    itojun 		 * protocol header not in a single mbuf.
    515   1.95    itojun 		 * We can't cope with this situation right
    516   1.76   thorpej 		 * now (but it shouldn't ever happen, really, anyhow).
    517   1.76   thorpej 		 */
    518   1.92    itojun #ifdef DEBUG
    519   1.78   thorpej 		printf("altq_etherclassify: headers span multiple mbufs: "
    520   1.78   thorpej 		    "%d < %d\n", m->m_len, (hlen + hdrsize));
    521   1.92    itojun #endif
    522   1.76   thorpej 		goto bad;
    523   1.76   thorpej 	}
    524   1.76   thorpej 
    525   1.76   thorpej 	m->m_data += hlen;
    526   1.76   thorpej 	m->m_len -= hlen;
    527   1.76   thorpej 
    528  1.147  christos 	hdr = mtod(m, void *);
    529   1.76   thorpej 
    530   1.76   thorpej 	if (ALTQ_NEEDS_CLASSIFY(ifq))
    531  1.219  knakahar 		m->m_pkthdr.pattr_class =
    532   1.76   thorpej 		    (*ifq->altq_classify)(ifq->altq_clfier, m, af);
    533  1.219  knakahar 	m->m_pkthdr.pattr_af = af;
    534  1.219  knakahar 	m->m_pkthdr.pattr_hdr = hdr;
    535   1.76   thorpej 
    536   1.76   thorpej 	m->m_data -= hlen;
    537   1.76   thorpej 	m->m_len += hlen;
    538   1.76   thorpej 
    539   1.76   thorpej 	return;
    540   1.76   thorpej 
    541  1.250      maxv bad:
    542  1.219  knakahar 	m->m_pkthdr.pattr_class = NULL;
    543  1.219  knakahar 	m->m_pkthdr.pattr_hdr = NULL;
    544  1.219  knakahar 	m->m_pkthdr.pattr_af = AF_UNSPEC;
    545   1.76   thorpej }
    546   1.76   thorpej #endif /* ALTQ */
    547    1.1       cgd 
    548    1.1       cgd /*
    549    1.1       cgd  * Process a received Ethernet packet;
    550   1.42   thorpej  * the packet is in the mbuf chain m with
    551   1.42   thorpej  * the ether header.
    552    1.1       cgd  */
    553  1.133  liamjfoy void
    554   1.58      matt ether_input(struct ifnet *ifp, struct mbuf *m)
    555    1.1       cgd {
    556   1.91   thorpej 	struct ethercom *ec = (struct ethercom *) ifp;
    557  1.199     rmind 	pktqueue_t *pktq = NULL;
    558  1.199     rmind 	struct ifqueue *inq = NULL;
    559  1.162      matt 	uint16_t etype;
    560   1.42   thorpej 	struct ether_header *eh;
    561  1.187      matt 	size_t ehlen;
    562  1.204       tls 	static int earlypkts;
    563  1.198   msaitoh 	int isr = 0;
    564  1.194     joerg #if defined (LLC) || defined(NETATALK)
    565   1.29       mrg 	struct llc *l;
    566   1.18  christos #endif
    567    1.1       cgd 
    568  1.216     ozaki 	KASSERT(!cpu_intr_p());
    569  1.216     ozaki 
    570    1.8   mycroft 	if ((ifp->if_flags & IFF_UP) == 0) {
    571    1.8   mycroft 		m_freem(m);
    572    1.8   mycroft 		return;
    573    1.8   mycroft 	}
    574   1.42   thorpej 
    575  1.104      matt #ifdef MBUFTRACE
    576  1.116  jonathan 	m_claimm(m, &ec->ec_rx_mowner);
    577  1.104      matt #endif
    578   1.42   thorpej 	eh = mtod(m, struct ether_header *);
    579   1.63   thorpej 	etype = ntohs(eh->ether_type);
    580  1.187      matt 	ehlen = sizeof(*eh);
    581   1.63   thorpej 
    582  1.250      maxv 	if (__predict_false(earlypkts < 100 || !rnd_initial_entropy)) {
    583  1.204       tls 		rnd_add_data(NULL, eh, ehlen, 0);
    584  1.204       tls 		earlypkts++;
    585  1.204       tls 	}
    586  1.204       tls 
    587   1.63   thorpej 	/*
    588   1.63   thorpej 	 * Determine if the packet is within its size limits.
    589   1.63   thorpej 	 */
    590  1.182    kefren 	if (etype != ETHERTYPE_MPLS && m->m_pkthdr.len >
    591   1.83   thorpej 	    ETHER_MAX_FRAME(ifp, etype, m->m_flags & M_HASFCS)) {
    592  1.203     ozaki 		mutex_enter(&bigpktpps_lock);
    593  1.123      matt 		if (ppsratecheck(&bigpktppslim_last, &bigpktpps_count,
    594  1.123      matt 			    bigpktppslim)) {
    595  1.123      matt 			printf("%s: discarding oversize frame (len=%d)\n",
    596  1.123      matt 			    ifp->if_xname, m->m_pkthdr.len);
    597  1.123      matt 		}
    598  1.203     ozaki 		mutex_exit(&bigpktpps_lock);
    599   1.63   thorpej 		m_freem(m);
    600   1.63   thorpej 		return;
    601   1.63   thorpej 	}
    602   1.77   thorpej 
    603   1.84   thorpej 	if (ETHER_IS_MULTICAST(eh->ether_dhost)) {
    604   1.84   thorpej 		/*
    605   1.84   thorpej 		 * If this is not a simplex interface, drop the packet
    606   1.84   thorpej 		 * if it came from us.
    607   1.84   thorpej 		 */
    608   1.84   thorpej 		if ((ifp->if_flags & IFF_SIMPLEX) == 0 &&
    609  1.153    dyoung 		    memcmp(CLLADDR(ifp->if_sadl), eh->ether_shost,
    610   1.84   thorpej 		    ETHER_ADDR_LEN) == 0) {
    611   1.84   thorpej 			m_freem(m);
    612   1.84   thorpej 			return;
    613   1.84   thorpej 		}
    614   1.84   thorpej 
    615   1.84   thorpej 		if (memcmp(etherbroadcastaddr,
    616   1.84   thorpej 		    eh->ether_dhost, ETHER_ADDR_LEN) == 0)
    617   1.84   thorpej 			m->m_flags |= M_BCAST;
    618   1.84   thorpej 		else
    619   1.84   thorpej 			m->m_flags |= M_MCAST;
    620   1.84   thorpej 		ifp->if_imcasts++;
    621   1.84   thorpej 	}
    622   1.84   thorpej 
    623   1.79   thorpej 	/* If the CRC is still on the packet, trim it off. */
    624   1.79   thorpej 	if (m->m_flags & M_HASFCS) {
    625   1.79   thorpej 		m_adj(m, -ETHER_CRC_LEN);
    626   1.79   thorpej 		m->m_flags &= ~M_HASFCS;
    627   1.79   thorpej 	}
    628   1.79   thorpej 
    629   1.42   thorpej 	ifp->if_ibytes += m->m_pkthdr.len;
    630   1.78   thorpej 
    631  1.201     ozaki #if NCARP > 0
    632  1.201     ozaki 	if (__predict_false(ifp->if_carp && ifp->if_type != IFT_CARP)) {
    633  1.201     ozaki 		/*
    634  1.201     ozaki 		 * clear M_PROMISC, in case the packets comes from a
    635  1.201     ozaki 		 * vlan
    636  1.201     ozaki 		 */
    637  1.137    rpaulo 		m->m_flags &= ~M_PROMISC;
    638  1.201     ozaki 		if (carp_input(m, (uint8_t *)&eh->ether_shost,
    639  1.201     ozaki 		    (uint8_t *)&eh->ether_dhost, eh->ether_type) == 0)
    640  1.137    rpaulo 			return;
    641  1.201     ozaki 	}
    642  1.133  liamjfoy #endif /* NCARP > 0 */
    643  1.250      maxv 
    644  1.247   msaitoh 	if ((m->m_flags & (M_BCAST | M_MCAST | M_PROMISC)) == 0 &&
    645  1.201     ozaki 	    (ifp->if_flags & IFF_PROMISC) != 0 &&
    646  1.201     ozaki 	    memcmp(CLLADDR(ifp->if_sadl), eh->ether_dhost,
    647  1.201     ozaki 		   ETHER_ADDR_LEN) != 0) {
    648  1.201     ozaki 		m->m_flags |= M_PROMISC;
    649   1.70    bouyer 	}
    650   1.78   thorpej 
    651  1.106    bouyer 	if ((m->m_flags & M_PROMISC) == 0) {
    652  1.195     rmind 		if (pfil_run_hooks(ifp->if_pfil, &m, ifp, PFIL_IN) != 0)
    653  1.106    bouyer 			return;
    654  1.106    bouyer 		if (m == NULL)
    655  1.106    bouyer 			return;
    656   1.78   thorpej 
    657  1.106    bouyer 		eh = mtod(m, struct ether_header *);
    658  1.106    bouyer 		etype = ntohs(eh->ether_type);
    659  1.187      matt 		ehlen = sizeof(*eh);
    660  1.106    bouyer 	}
    661   1.70    bouyer 
    662  1.172    darran #if NAGR > 0
    663  1.172    darran 	if (ifp->if_agrprivate &&
    664  1.172    darran 	    __predict_true(etype != ETHERTYPE_SLOWPROTOCOLS)) {
    665  1.172    darran 		m->m_flags &= ~M_PROMISC;
    666  1.172    darran 		agr_input(ifp, m);
    667  1.172    darran 		return;
    668  1.172    darran 	}
    669  1.172    darran #endif /* NAGR > 0 */
    670  1.172    darran 
    671   1.91   thorpej 	/*
    672   1.91   thorpej 	 * If VLANs are configured on the interface, check to
    673   1.91   thorpej 	 * see if the device performed the decapsulation and
    674   1.91   thorpej 	 * provided us with the tag.
    675   1.91   thorpej 	 */
    676  1.244  knakahar 	if (ec->ec_nvlans && vlan_has_tag(m)) {
    677   1.70    bouyer #if NVLAN > 0
    678   1.70    bouyer 		/*
    679   1.70    bouyer 		 * vlan_input() will either recursively call ether_input()
    680   1.70    bouyer 		 * or drop the packet.
    681   1.70    bouyer 		 */
    682   1.91   thorpej 		vlan_input(ifp, m);
    683   1.91   thorpej #else
    684   1.91   thorpej 		m_freem(m);
    685   1.70    bouyer #endif
    686   1.61   thorpej 		return;
    687   1.61   thorpej 	}
    688    1.1       cgd 
    689   1.59   thorpej 	/*
    690   1.59   thorpej 	 * Handle protocols that expect to have the Ethernet header
    691   1.59   thorpej 	 * (and possibly FCS) intact.
    692   1.59   thorpej 	 */
    693   1.59   thorpej 	switch (etype) {
    694  1.187      matt 	case ETHERTYPE_VLAN: {
    695  1.187      matt 		struct ether_vlan_header *evl = (void *)eh;
    696  1.187      matt 		/*
    697  1.187      matt 		 * If there is a tag of 0, then the VLAN header was probably
    698  1.187      matt 		 * just being used to store the priority.  Extract the ether
    699  1.250      maxv 		 * type, and if IP or IPV6, let them deal with it.
    700  1.187      matt 		 */
    701  1.187      matt 		if (m->m_len <= sizeof(*evl)
    702  1.187      matt 		    && EVL_VLANOFTAG(evl->evl_tag) == 0) {
    703  1.187      matt 			etype = ntohs(evl->evl_proto);
    704  1.187      matt 			ehlen = sizeof(*evl);
    705  1.187      matt 			if ((m->m_flags & M_PROMISC) == 0
    706  1.187      matt 			    && (etype == ETHERTYPE_IP
    707  1.187      matt 				|| etype == ETHERTYPE_IPV6))
    708  1.187      matt 				break;
    709  1.187      matt 		}
    710   1.59   thorpej #if NVLAN > 0
    711   1.59   thorpej 		/*
    712   1.59   thorpej 		 * vlan_input() will either recursively call ether_input()
    713   1.59   thorpej 		 * or drop the packet.
    714   1.59   thorpej 		 */
    715   1.63   thorpej 		if (((struct ethercom *)ifp)->ec_nvlans != 0)
    716   1.63   thorpej 			vlan_input(ifp, m);
    717   1.65     enami 		else
    718  1.187      matt #endif /* NVLAN > 0 */
    719   1.65     enami 			m_freem(m);
    720   1.59   thorpej 		return;
    721  1.187      matt 	}
    722   1.81    martin #if NPPPOE > 0
    723   1.81    martin 	case ETHERTYPE_PPPOEDISC:
    724  1.218     ozaki 		pppoedisc_input(ifp, m);
    725  1.218     ozaki 		return;
    726   1.81    martin 	case ETHERTYPE_PPPOE:
    727  1.218     ozaki 		pppoe_input(ifp, m);
    728   1.81    martin 		return;
    729   1.81    martin #endif /* NPPPOE > 0 */
    730  1.121      yamt 	case ETHERTYPE_SLOWPROTOCOLS: {
    731  1.121      yamt 		uint8_t subtype;
    732  1.121      yamt 
    733  1.121      yamt #if defined(DIAGNOSTIC)
    734  1.121      yamt 		if (m->m_pkthdr.len < sizeof(*eh) + sizeof(subtype)) {
    735  1.121      yamt 			panic("ether_input: too short slow protocol packet");
    736  1.121      yamt 		}
    737  1.121      yamt #endif
    738  1.121      yamt 		m_copydata(m, sizeof(*eh), sizeof(subtype), &subtype);
    739  1.121      yamt 		switch (subtype) {
    740  1.121      yamt #if NAGR > 0
    741  1.121      yamt 		case SLOWPROTOCOLS_SUBTYPE_LACP:
    742  1.121      yamt 			if (ifp->if_agrprivate) {
    743  1.121      yamt 				ieee8023ad_lacp_input(ifp, m);
    744  1.121      yamt 				return;
    745  1.121      yamt 			}
    746  1.121      yamt 			break;
    747  1.121      yamt 
    748  1.121      yamt 		case SLOWPROTOCOLS_SUBTYPE_MARKER:
    749  1.121      yamt 			if (ifp->if_agrprivate) {
    750  1.121      yamt 				ieee8023ad_marker_input(ifp, m);
    751  1.121      yamt 				return;
    752  1.121      yamt 			}
    753  1.121      yamt 			break;
    754  1.121      yamt #endif /* NAGR > 0 */
    755  1.121      yamt 		default:
    756  1.121      yamt 			if (subtype == 0 || subtype > 10) {
    757  1.121      yamt 				/* illegal value */
    758  1.121      yamt 				m_freem(m);
    759  1.121      yamt 				return;
    760  1.121      yamt 			}
    761  1.121      yamt 			/* unknown subtype */
    762  1.121      yamt 			break;
    763  1.121      yamt 		}
    764  1.121      yamt 		/* FALLTHROUGH */
    765  1.121      yamt 	}
    766   1.59   thorpej 	default:
    767  1.106    bouyer 		if (m->m_flags & M_PROMISC) {
    768  1.106    bouyer 			m_freem(m);
    769  1.106    bouyer 			return;
    770  1.106    bouyer 		}
    771   1.59   thorpej 	}
    772   1.42   thorpej 
    773   1.45   thorpej 	/* If the CRC is still on the packet, trim it off. */
    774   1.79   thorpej 	if (m->m_flags & M_HASFCS) {
    775   1.45   thorpej 		m_adj(m, -ETHER_CRC_LEN);
    776   1.79   thorpej 		m->m_flags &= ~M_HASFCS;
    777   1.79   thorpej 	}
    778   1.42   thorpej 
    779  1.139        is 	if (etype > ETHERMTU + sizeof (struct ether_header)) {
    780  1.139        is 		/* Strip off the Ethernet header. */
    781  1.187      matt 		m_adj(m, ehlen);
    782  1.139        is 
    783  1.139        is 		switch (etype) {
    784    1.1       cgd #ifdef INET
    785  1.139        is 		case ETHERTYPE_IP:
    786   1.30      matt #ifdef GATEWAY
    787  1.139        is 			if (ipflow_fastforward(m))
    788  1.139        is 				return;
    789   1.30      matt #endif
    790  1.199     rmind 			pktq = ip_pktq;
    791  1.139        is 			break;
    792    1.1       cgd 
    793  1.139        is 		case ETHERTYPE_ARP:
    794  1.198   msaitoh 			isr = NETISR_ARP;
    795  1.139        is 			inq = &arpintrq;
    796  1.139        is 			break;
    797    1.7     glass 
    798  1.139        is 		case ETHERTYPE_REVARP:
    799  1.139        is 			revarpinput(m);	/* XXX queue? */
    800  1.139        is 			return;
    801    1.1       cgd #endif
    802   1.44    itojun #ifdef INET6
    803  1.139        is 		case ETHERTYPE_IPV6:
    804  1.196     pooka 			if (__predict_false(!in6_present)) {
    805  1.196     pooka 				m_freem(m);
    806  1.196     pooka 				return;
    807  1.196     pooka 			}
    808  1.250      maxv #ifdef GATEWAY
    809  1.192  christos 			if (ip6flow_fastforward(&m))
    810  1.148  liamjfoy 				return;
    811  1.148  liamjfoy #endif
    812  1.199     rmind 			pktq = ip6_pktq;
    813  1.139        is 			break;
    814   1.44    itojun #endif
    815   1.23  christos #ifdef NETATALK
    816  1.174     isaki 		case ETHERTYPE_ATALK:
    817  1.198   msaitoh 			isr = NETISR_ATALK;
    818  1.174     isaki 			inq = &atintrq1;
    819  1.174     isaki 			break;
    820  1.174     isaki 		case ETHERTYPE_AARP:
    821  1.139        is 			/* probably this should be done with a NETISR as well */
    822  1.175   mbalmer 			aarpinput(ifp, m); /* XXX */
    823  1.174     isaki 			return;
    824   1.23  christos #endif /* NETATALK */
    825  1.182    kefren #ifdef MPLS
    826  1.182    kefren 		case ETHERTYPE_MPLS:
    827  1.198   msaitoh 			isr = NETISR_MPLS;
    828  1.182    kefren 			inq = &mplsintrq;
    829  1.182    kefren 			break;
    830  1.182    kefren #endif
    831  1.139        is 		default:
    832  1.139        is 			m_freem(m);
    833  1.139        is 			return;
    834  1.139        is 		}
    835  1.139        is 	} else {
    836  1.194     joerg #if defined (LLC) || defined (NETATALK)
    837  1.249      maxv 		if (m->m_len < ehlen + sizeof(struct llc)) {
    838  1.249      maxv 			goto dropanyway;
    839  1.249      maxv 		}
    840  1.139        is 		l = (struct llc *)(eh+1);
    841    1.8   mycroft 		switch (l->llc_dsap) {
    842   1.23  christos #ifdef NETATALK
    843   1.23  christos 		case LLC_SNAP_LSAP:
    844   1.23  christos 			switch (l->llc_control) {
    845   1.23  christos 			case LLC_UI:
    846   1.23  christos 				if (l->llc_ssap != LLC_SNAP_LSAP) {
    847   1.23  christos 					goto dropanyway;
    848   1.23  christos 				}
    849  1.120     perry 
    850  1.166    dyoung 				if (memcmp(&(l->llc_snap_org_code)[0],
    851   1.23  christos 				    at_org_code, sizeof(at_org_code)) == 0 &&
    852   1.23  christos 				    ntohs(l->llc_snap_ether_type) ==
    853   1.38       kim 				    ETHERTYPE_ATALK) {
    854   1.23  christos 					inq = &atintrq2;
    855  1.139        is 					m_adj(m, sizeof(struct ether_header)
    856  1.139        is 					    + sizeof(struct llc));
    857  1.198   msaitoh 					isr = NETISR_ATALK;
    858   1.23  christos 					break;
    859   1.23  christos 				}
    860   1.23  christos 
    861  1.166    dyoung 				if (memcmp(&(l->llc_snap_org_code)[0],
    862   1.23  christos 				    aarp_org_code,
    863   1.23  christos 				    sizeof(aarp_org_code)) == 0 &&
    864   1.23  christos 				    ntohs(l->llc_snap_ether_type) ==
    865   1.23  christos 				    ETHERTYPE_AARP) {
    866  1.139        is 					m_adj( m, sizeof(struct ether_header)
    867  1.139        is 					    + sizeof(struct llc));
    868   1.23  christos 					aarpinput(ifp, m); /* XXX */
    869   1.23  christos 				    return;
    870   1.23  christos 				}
    871  1.120     perry 
    872   1.23  christos 			default:
    873   1.23  christos 				goto dropanyway;
    874   1.23  christos 			}
    875   1.23  christos 			break;
    876  1.249      maxv #endif
    877    1.1       cgd 		dropanyway:
    878    1.1       cgd 		default:
    879    1.8   mycroft 			m_freem(m);
    880    1.8   mycroft 			return;
    881    1.8   mycroft 		}
    882  1.250      maxv #else /* LLC || NETATALK */
    883  1.139        is 		m_freem(m);
    884  1.139        is 		return;
    885  1.250      maxv #endif /* LLC || NETATALK */
    886    1.1       cgd 	}
    887    1.1       cgd 
    888  1.199     rmind 	if (__predict_true(pktq)) {
    889  1.229     ozaki #ifdef NET_MPSAFE
    890  1.229     ozaki 		const u_int h = curcpu()->ci_index;
    891  1.229     ozaki #else
    892  1.199     rmind 		const uint32_t h = pktq_rps_hash(m);
    893  1.229     ozaki #endif
    894  1.199     rmind 		if (__predict_false(!pktq_enqueue(pktq, m, h))) {
    895  1.199     rmind 			m_freem(m);
    896  1.199     rmind 		}
    897  1.199     rmind 		return;
    898  1.199     rmind 	}
    899  1.199     rmind 
    900  1.199     rmind 	if (__predict_false(!inq)) {
    901  1.199     rmind 		/* Should not happen. */
    902  1.199     rmind 		m_freem(m);
    903  1.199     rmind 		return;
    904  1.199     rmind 	}
    905  1.228     ozaki 
    906  1.228     ozaki 	IFQ_LOCK(inq);
    907    1.1       cgd 	if (IF_QFULL(inq)) {
    908    1.1       cgd 		IF_DROP(inq);
    909  1.228     ozaki 		IFQ_UNLOCK(inq);
    910    1.1       cgd 		m_freem(m);
    911  1.198   msaitoh 	} else {
    912    1.1       cgd 		IF_ENQUEUE(inq, m);
    913  1.228     ozaki 		IFQ_UNLOCK(inq);
    914  1.198   msaitoh 		schednetisr(isr);
    915  1.198   msaitoh 	}
    916    1.1       cgd }
    917    1.1       cgd 
    918    1.1       cgd /*
    919    1.1       cgd  * Convert Ethernet address to printable (loggable) representation.
    920    1.1       cgd  */
    921    1.1       cgd char *
    922   1.58      matt ether_sprintf(const u_char *ap)
    923    1.1       cgd {
    924  1.129  christos 	static char etherbuf[3 * ETHER_ADDR_LEN];
    925  1.129  christos 	return ether_snprintf(etherbuf, sizeof(etherbuf), ap);
    926  1.129  christos }
    927  1.129  christos 
    928  1.129  christos char *
    929  1.129  christos ether_snprintf(char *buf, size_t len, const u_char *ap)
    930  1.129  christos {
    931  1.129  christos 	char *cp = buf;
    932  1.129  christos 	size_t i;
    933    1.1       cgd 
    934  1.129  christos 	for (i = 0; i < len / 3; i++) {
    935  1.124  christos 		*cp++ = hexdigits[*ap >> 4];
    936  1.124  christos 		*cp++ = hexdigits[*ap++ & 0xf];
    937    1.1       cgd 		*cp++ = ':';
    938    1.1       cgd 	}
    939  1.129  christos 	*--cp = '\0';
    940  1.129  christos 	return buf;
    941    1.1       cgd }
    942    1.8   mycroft 
    943    1.8   mycroft /*
    944    1.8   mycroft  * Perform common duties while attaching to interface list
    945    1.8   mycroft  */
    946    1.8   mycroft void
    947  1.162      matt ether_ifattach(struct ifnet *ifp, const uint8_t *lla)
    948    1.8   mycroft {
    949  1.104      matt 	struct ethercom *ec = (struct ethercom *)ifp;
    950    1.8   mycroft 
    951    1.8   mycroft 	ifp->if_type = IFT_ETHER;
    952   1.94     enami 	ifp->if_hdrlen = ETHER_HDR_LEN;
    953   1.73   thorpej 	ifp->if_dlt = DLT_EN10MB;
    954    1.8   mycroft 	ifp->if_mtu = ETHERMTU;
    955   1.12   mycroft 	ifp->if_output = ether_output;
    956  1.216     ozaki 	ifp->_if_input = ether_input;
    957   1.54   thorpej 	if (ifp->if_baudrate == 0)
    958   1.54   thorpej 		ifp->if_baudrate = IF_Mbps(10);		/* just a default */
    959   1.75   thorpej 
    960  1.230     ozaki 	if (lla != NULL)
    961  1.230     ozaki 		if_set_sadl(ifp, lla, ETHER_ADDR_LEN, !ETHER_IS_LOCAL(lla));
    962   1.75   thorpej 
    963  1.104      matt 	LIST_INIT(&ec->ec_multiaddrs);
    964  1.233     ozaki 	ec->ec_lock = mutex_obj_alloc(MUTEX_DEFAULT, IPL_NET);
    965   1.26        is 	ifp->if_broadcastaddr = etherbroadcastaddr;
    966  1.177     joerg 	bpf_attach(ifp, DLT_EN10MB, sizeof(struct ether_header));
    967  1.104      matt #ifdef MBUFTRACE
    968  1.108    itojun 	strlcpy(ec->ec_tx_mowner.mo_name, ifp->if_xname,
    969  1.108    itojun 	    sizeof(ec->ec_tx_mowner.mo_name));
    970  1.108    itojun 	strlcpy(ec->ec_tx_mowner.mo_descr, "tx",
    971  1.108    itojun 	    sizeof(ec->ec_tx_mowner.mo_descr));
    972  1.108    itojun 	strlcpy(ec->ec_rx_mowner.mo_name, ifp->if_xname,
    973  1.108    itojun 	    sizeof(ec->ec_rx_mowner.mo_name));
    974  1.108    itojun 	strlcpy(ec->ec_rx_mowner.mo_descr, "rx",
    975  1.108    itojun 	    sizeof(ec->ec_rx_mowner.mo_descr));
    976  1.104      matt 	MOWNER_ATTACH(&ec->ec_tx_mowner);
    977  1.104      matt 	MOWNER_ATTACH(&ec->ec_rx_mowner);
    978  1.104      matt 	ifp->if_mowner = &ec->ec_tx_mowner;
    979  1.104      matt #endif
    980   1.52   thorpej }
    981   1.52   thorpej 
    982   1.52   thorpej void
    983   1.58      matt ether_ifdetach(struct ifnet *ifp)
    984   1.52   thorpej {
    985   1.63   thorpej 	struct ethercom *ec = (void *) ifp;
    986   1.63   thorpej 	struct ether_multi *enm;
    987   1.69   thorpej 
    988  1.190  christos 	/*
    989  1.190  christos 	 * Prevent further calls to ioctl (for example turning off
    990  1.190  christos 	 * promiscuous mode from the bridge code), which eventually can
    991  1.190  christos 	 * call if_init() which can cause panics because the interface
    992  1.190  christos 	 * is in the process of being detached. Return device not configured
    993  1.190  christos 	 * instead.
    994  1.190  christos 	 */
    995  1.190  christos 	ifp->if_ioctl = (int (*)(struct ifnet *, u_long, void *))enxio;
    996  1.190  christos 
    997  1.115    dyoung #if NBRIDGE > 0
    998  1.115    dyoung 	if (ifp->if_bridge)
    999  1.115    dyoung 		bridge_ifdetach(ifp);
   1000  1.115    dyoung #endif
   1001  1.115    dyoung 
   1002  1.177     joerg 	bpf_detach(ifp);
   1003   1.64   thorpej 
   1004   1.64   thorpej #if NVLAN > 0
   1005   1.64   thorpej 	if (ec->ec_nvlans)
   1006   1.64   thorpej 		vlan_ifdetach(ifp);
   1007   1.64   thorpej #endif
   1008   1.63   thorpej 
   1009  1.245   msaitoh 	ETHER_LOCK(ec);
   1010   1.63   thorpej 	while ((enm = LIST_FIRST(&ec->ec_multiaddrs)) != NULL) {
   1011   1.63   thorpej 		LIST_REMOVE(enm, enm_list);
   1012  1.248     ozaki 		kmem_free(enm, sizeof(*enm));
   1013   1.63   thorpej 		ec->ec_multicnt--;
   1014   1.63   thorpej 	}
   1015  1.245   msaitoh 	ETHER_UNLOCK(ec);
   1016   1.52   thorpej 
   1017  1.231     ozaki 	mutex_destroy(ec->ec_lock);
   1018  1.231     ozaki 
   1019  1.189       chs 	ifp->if_mowner = NULL;
   1020  1.104      matt 	MOWNER_DETACH(&ec->ec_rx_mowner);
   1021  1.104      matt 	MOWNER_DETACH(&ec->ec_tx_mowner);
   1022   1.53   thorpej }
   1023   1.53   thorpej 
#if 0
/*
 * Reference implementation, kept for documentation only: the
 * bit-at-a-time form of the little-endian CRC-32 generator.  The
 * table-driven version below computes the same value and is faster
 * than this double loop.
 */
uint32_t
ether_crc32_le(const uint8_t *buf, size_t len)
{
	uint32_t crc = 0xffffffffU;	/* initial value */
	uint32_t data;
	int bit;

	for (; len != 0; len--, buf++) {
		data = *buf;
		for (bit = 0; bit < 8; bit++, data >>= 1) {
			/* Low CRC bit XOR next (LSB-first) data bit. */
			const uint32_t carry = (crc ^ data) & 0x01;

			crc >>= 1;
			if (carry)
				crc ^= ETHER_CRC_POLY_LE;
		}
	}

	return crc;
}
#else
/*
 * Little-endian (right-shifting) CRC-32 over len bytes at buf, computed
 * four bits at a time from a 16-entry lookup table.
 *
 * The register starts at 0xffffffff and the result is returned as-is,
 * without a final inversion.  An empty input therefore yields
 * 0xffffffff.
 */
uint32_t
ether_crc32_le(const uint8_t *buf, size_t len)
{
	static const uint32_t nibble_tab[16] = {
		0x00000000, 0x1db71064, 0x3b6e20c8, 0x26d930ac,
		0x76dc4190, 0x6b6b51f4, 0x4db26158, 0x5005713c,
		0xedb88320, 0xf00f9344, 0xd6d6a3e8, 0xcb61b38c,
		0x9b64c2b0, 0x86d3d2d4, 0xa00ae278, 0xbdbdf21c
	};
	uint32_t crc = 0xffffffffU;	/* initial value */

	for (; len != 0; len--, buf++) {
		crc ^= *buf;
		/* Consume the low nibble, then the high nibble. */
		crc = (crc >> 4) ^ nibble_tab[crc & 0xf];
		crc = (crc >> 4) ^ nibble_tab[crc & 0xf];
	}

	return crc;
}
#endif
   1075   1.53   thorpej 
   1076  1.162      matt uint32_t
   1077  1.162      matt ether_crc32_be(const uint8_t *buf, size_t len)
   1078   1.53   thorpej {
   1079  1.162      matt 	uint32_t c, crc, carry;
   1080   1.53   thorpej 	size_t i, j;
   1081   1.53   thorpej 
   1082   1.53   thorpej 	crc = 0xffffffffU;	/* initial value */
   1083   1.53   thorpej 
   1084   1.53   thorpej 	for (i = 0; i < len; i++) {
   1085   1.53   thorpej 		c = buf[i];
   1086   1.53   thorpej 		for (j = 0; j < 8; j++) {
   1087   1.53   thorpej 			carry = ((crc & 0x80000000U) ? 1 : 0) ^ (c & 0x01);
   1088   1.53   thorpej 			crc <<= 1;
   1089   1.53   thorpej 			c >>= 1;
   1090   1.53   thorpej 			if (carry)
   1091   1.53   thorpej 				crc = (crc ^ ETHER_CRC_POLY_BE) | carry;
   1092   1.53   thorpej 		}
   1093   1.53   thorpej 	}
   1094   1.53   thorpej 
   1095   1.53   thorpej 	return (crc);
   1096    1.8   mycroft }
   1097    1.8   mycroft 
#ifdef INET
/*
 * Lowest and highest Ethernet addresses of the IPv4 multicast block
 * (01:00:5e:00:00:00 - 01:00:5e:7f:ff:ff).  ether_multiaddr() returns
 * this range when asked about INADDR_ANY.
 */
const uint8_t ether_ipmulticast_min[ETHER_ADDR_LEN] = {
	0x01, 0x00, 0x5e, 0x00, 0x00, 0x00
};
const uint8_t ether_ipmulticast_max[ETHER_ADDR_LEN] = {
	0x01, 0x00, 0x5e, 0x7f, 0xff, 0xff
};
#endif
#ifdef INET6
/*
 * Lowest and highest Ethernet addresses of the IPv6 multicast block
 * (33:33:00:00:00:00 - 33:33:ff:ff:ff:ff).  ether_multiaddr() returns
 * this range when asked about the unspecified IPv6 address.
 */
const uint8_t ether_ip6multicast_min[ETHER_ADDR_LEN] = {
	0x33, 0x33, 0x00, 0x00, 0x00, 0x00
};
const uint8_t ether_ip6multicast_max[ETHER_ADDR_LEN] = {
	0x33, 0x33, 0xff, 0xff, 0xff, 0xff
};
#endif
   1110   1.60     enami 
   1111    1.3   hpeyerl /*
   1112  1.138    rpaulo  * ether_aton implementation, not using a static buffer.
   1113  1.138    rpaulo  */
   1114  1.138    rpaulo int
   1115  1.180  christos ether_aton_r(u_char *dest, size_t len, const char *str)
   1116  1.138    rpaulo {
   1117  1.250      maxv 	const u_char *cp = (const void *)str;
   1118  1.180  christos 	u_char *ep;
   1119  1.180  christos 
   1120  1.185   tsutsui #define atox(c)	(((c) <= '9') ? ((c) - '0') : ((toupper(c) - 'A') + 10))
   1121  1.180  christos 
   1122  1.180  christos 	if (len < ETHER_ADDR_LEN)
   1123  1.180  christos 		return ENOSPC;
   1124  1.180  christos 
   1125  1.180  christos 	ep = dest + ETHER_ADDR_LEN;
   1126  1.250      maxv 
   1127  1.180  christos 	while (*cp) {
   1128  1.250      maxv 		if (!isxdigit(*cp))
   1129  1.250      maxv 			return EINVAL;
   1130  1.180  christos 		*dest = atox(*cp);
   1131  1.180  christos 		cp++;
   1132  1.250      maxv 		if (isxdigit(*cp)) {
   1133  1.250      maxv 			*dest = (*dest << 4) | atox(*cp);
   1134  1.180  christos 			dest++;
   1135  1.180  christos 			cp++;
   1136  1.250      maxv 		} else {
   1137  1.181  christos 			dest++;
   1138  1.250      maxv 		}
   1139  1.180  christos 		if (dest == ep)
   1140  1.180  christos 			return *cp == '\0' ? 0 : ENAMETOOLONG;
   1141  1.180  christos 		switch (*cp) {
   1142  1.180  christos 		case ':':
   1143  1.180  christos 		case '-':
   1144  1.180  christos 		case '.':
   1145  1.179  jakllsch 			cp++;
   1146  1.180  christos 			break;
   1147  1.179  jakllsch 		}
   1148  1.250      maxv 	}
   1149  1.180  christos 	return ENOBUFS;
   1150  1.138    rpaulo }
   1151  1.138    rpaulo 
   1152  1.138    rpaulo /*
   1153   1.60     enami  * Convert a sockaddr into an Ethernet address or range of Ethernet
   1154   1.60     enami  * addresses.
   1155    1.3   hpeyerl  */
   1156    1.3   hpeyerl int
   1157  1.162      matt ether_multiaddr(const struct sockaddr *sa, uint8_t addrlo[ETHER_ADDR_LEN],
   1158  1.162      matt     uint8_t addrhi[ETHER_ADDR_LEN])
   1159    1.3   hpeyerl {
   1160   1.24  christos #ifdef INET
   1161  1.155    dyoung 	const struct sockaddr_in *sin;
   1162   1.24  christos #endif /* INET */
   1163   1.44    itojun #ifdef INET6
   1164  1.155    dyoung 	const struct sockaddr_in6 *sin6;
   1165   1.44    itojun #endif /* INET6 */
   1166    1.3   hpeyerl 
   1167   1.60     enami 	switch (sa->sa_family) {
   1168    1.3   hpeyerl 
   1169    1.3   hpeyerl 	case AF_UNSPEC:
   1170  1.146    dyoung 		memcpy(addrlo, sa->sa_data, ETHER_ADDR_LEN);
   1171  1.146    dyoung 		memcpy(addrhi, addrlo, ETHER_ADDR_LEN);
   1172    1.3   hpeyerl 		break;
   1173    1.3   hpeyerl 
   1174    1.3   hpeyerl #ifdef INET
   1175    1.3   hpeyerl 	case AF_INET:
   1176  1.155    dyoung 		sin = satocsin(sa);
   1177    1.3   hpeyerl 		if (sin->sin_addr.s_addr == INADDR_ANY) {
   1178    1.3   hpeyerl 			/*
   1179   1.60     enami 			 * An IP address of INADDR_ANY means listen to
   1180   1.60     enami 			 * or stop listening to all of the Ethernet
   1181   1.60     enami 			 * multicast addresses used for IP.
   1182    1.3   hpeyerl 			 * (This is for the sake of IP multicast routers.)
   1183    1.3   hpeyerl 			 */
   1184  1.146    dyoung 			memcpy(addrlo, ether_ipmulticast_min, ETHER_ADDR_LEN);
   1185  1.146    dyoung 			memcpy(addrhi, ether_ipmulticast_max, ETHER_ADDR_LEN);
   1186    1.3   hpeyerl 		}
   1187    1.3   hpeyerl 		else {
   1188    1.3   hpeyerl 			ETHER_MAP_IP_MULTICAST(&sin->sin_addr, addrlo);
   1189  1.146    dyoung 			memcpy(addrhi, addrlo, ETHER_ADDR_LEN);
   1190    1.3   hpeyerl 		}
   1191    1.3   hpeyerl 		break;
   1192    1.3   hpeyerl #endif
   1193   1.44    itojun #ifdef INET6
   1194   1.44    itojun 	case AF_INET6:
   1195  1.155    dyoung 		sin6 = satocsin6(sa);
   1196   1.47    itojun 		if (IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) {
   1197   1.44    itojun 			/*
   1198   1.60     enami 			 * An IP6 address of 0 means listen to or stop
   1199   1.60     enami 			 * listening to all of the Ethernet multicast
   1200   1.60     enami 			 * address used for IP6.
   1201   1.44    itojun 			 * (This is used for multicast routers.)
   1202   1.44    itojun 			 */
   1203  1.146    dyoung 			memcpy(addrlo, ether_ip6multicast_min, ETHER_ADDR_LEN);
   1204  1.146    dyoung 			memcpy(addrhi, ether_ip6multicast_max, ETHER_ADDR_LEN);
   1205   1.44    itojun 		} else {
   1206   1.44    itojun 			ETHER_MAP_IPV6_MULTICAST(&sin6->sin6_addr, addrlo);
   1207  1.146    dyoung 			memcpy(addrhi, addrlo, ETHER_ADDR_LEN);
   1208   1.44    itojun 		}
   1209   1.44    itojun 		break;
   1210   1.44    itojun #endif
   1211    1.3   hpeyerl 
   1212    1.3   hpeyerl 	default:
   1213  1.146    dyoung 		return EAFNOSUPPORT;
   1214   1.60     enami 	}
   1215  1.146    dyoung 	return 0;
   1216   1.60     enami }
   1217   1.60     enami 
   1218   1.60     enami /*
   1219   1.60     enami  * Add an Ethernet multicast address or range of addresses to the list for a
   1220   1.60     enami  * given interface.
   1221   1.60     enami  */
   1222   1.60     enami int
   1223  1.155    dyoung ether_addmulti(const struct sockaddr *sa, struct ethercom *ec)
   1224   1.60     enami {
   1225  1.231     ozaki 	struct ether_multi *enm, *_enm;
   1226   1.60     enami 	u_char addrlo[ETHER_ADDR_LEN];
   1227   1.60     enami 	u_char addrhi[ETHER_ADDR_LEN];
   1228  1.237     skrll 	int error = 0;
   1229  1.231     ozaki 
   1230  1.231     ozaki 	/* Allocate out of lock */
   1231  1.248     ozaki 	enm = kmem_alloc(sizeof(*enm), KM_SLEEP);
   1232  1.231     ozaki 	if (enm == NULL)
   1233  1.231     ozaki 		return ENOBUFS;
   1234   1.60     enami 
   1235  1.245   msaitoh 	ETHER_LOCK(ec);
   1236  1.155    dyoung 	error = ether_multiaddr(sa, addrlo, addrhi);
   1237  1.231     ozaki 	if (error != 0)
   1238  1.231     ozaki 		goto out;
   1239    1.3   hpeyerl 
   1240    1.3   hpeyerl 	/*
   1241    1.3   hpeyerl 	 * Verify that we have valid Ethernet multicast addresses.
   1242    1.3   hpeyerl 	 */
   1243  1.186      yamt 	if (!ETHER_IS_MULTICAST(addrlo) || !ETHER_IS_MULTICAST(addrhi)) {
   1244  1.231     ozaki 		error = EINVAL;
   1245  1.231     ozaki 		goto out;
   1246    1.3   hpeyerl 	}
   1247    1.3   hpeyerl 	/*
   1248    1.3   hpeyerl 	 * See if the address range is already in the list.
   1249    1.3   hpeyerl 	 */
   1250  1.231     ozaki 	ETHER_LOOKUP_MULTI(addrlo, addrhi, ec, _enm);
   1251  1.231     ozaki 	if (_enm != NULL) {
   1252    1.3   hpeyerl 		/*
   1253    1.3   hpeyerl 		 * Found it; just increment the reference count.
   1254    1.3   hpeyerl 		 */
   1255  1.231     ozaki 		++_enm->enm_refcount;
   1256  1.231     ozaki 		error = 0;
   1257  1.231     ozaki 		goto out;
   1258    1.3   hpeyerl 	}
   1259    1.3   hpeyerl 	/*
   1260  1.239     ozaki 	 * Link a new multicast record into the interface's multicast list.
   1261    1.3   hpeyerl 	 */
   1262  1.146    dyoung 	memcpy(enm->enm_addrlo, addrlo, 6);
   1263  1.146    dyoung 	memcpy(enm->enm_addrhi, addrhi, 6);
   1264    1.3   hpeyerl 	enm->enm_refcount = 1;
   1265   1.22        is 	LIST_INSERT_HEAD(&ec->ec_multiaddrs, enm, enm_list);
   1266   1.22        is 	ec->ec_multicnt++;
   1267    1.3   hpeyerl 	/*
   1268    1.3   hpeyerl 	 * Return ENETRESET to inform the driver that the list has changed
   1269    1.3   hpeyerl 	 * and its reception filter should be adjusted accordingly.
   1270    1.3   hpeyerl 	 */
   1271  1.231     ozaki 	error = ENETRESET;
   1272  1.231     ozaki 	enm = NULL;
   1273  1.231     ozaki out:
   1274  1.245   msaitoh 	ETHER_UNLOCK(ec);
   1275  1.231     ozaki 	if (enm != NULL)
   1276  1.248     ozaki 		kmem_free(enm, sizeof(*enm));
   1277  1.231     ozaki 	return error;
   1278    1.3   hpeyerl }
   1279    1.3   hpeyerl 
   1280    1.3   hpeyerl /*
   1281    1.3   hpeyerl  * Delete a multicast address record.
   1282    1.3   hpeyerl  */
   1283    1.3   hpeyerl int
   1284  1.155    dyoung ether_delmulti(const struct sockaddr *sa, struct ethercom *ec)
   1285    1.3   hpeyerl {
   1286   1.29       mrg 	struct ether_multi *enm;
   1287   1.60     enami 	u_char addrlo[ETHER_ADDR_LEN];
   1288   1.60     enami 	u_char addrhi[ETHER_ADDR_LEN];
   1289  1.237     skrll 	int error;
   1290    1.3   hpeyerl 
   1291  1.245   msaitoh 	ETHER_LOCK(ec);
   1292  1.155    dyoung 	error = ether_multiaddr(sa, addrlo, addrhi);
   1293  1.231     ozaki 	if (error != 0)
   1294  1.231     ozaki 		goto error;
   1295    1.3   hpeyerl 
   1296    1.3   hpeyerl 	/*
   1297   1.66   thorpej 	 * Look ur the address in our list.
   1298    1.3   hpeyerl 	 */
   1299   1.22        is 	ETHER_LOOKUP_MULTI(addrlo, addrhi, ec, enm);
   1300    1.3   hpeyerl 	if (enm == NULL) {
   1301  1.231     ozaki 		error = ENXIO;
   1302  1.231     ozaki 		goto error;
   1303    1.3   hpeyerl 	}
   1304    1.3   hpeyerl 	if (--enm->enm_refcount != 0) {
   1305    1.3   hpeyerl 		/*
   1306    1.3   hpeyerl 		 * Still some claims to this record.
   1307    1.3   hpeyerl 		 */
   1308  1.231     ozaki 		error = 0;
   1309  1.231     ozaki 		goto error;
   1310    1.3   hpeyerl 	}
   1311    1.3   hpeyerl 	/*
   1312    1.3   hpeyerl 	 * No remaining claims to this record; unlink and free it.
   1313    1.3   hpeyerl 	 */
   1314   1.13   mycroft 	LIST_REMOVE(enm, enm_list);
   1315   1.22        is 	ec->ec_multicnt--;
   1316  1.245   msaitoh 	ETHER_UNLOCK(ec);
   1317  1.231     ozaki 
   1318  1.248     ozaki 	kmem_free(enm, sizeof(*enm));
   1319    1.3   hpeyerl 	/*
   1320    1.3   hpeyerl 	 * Return ENETRESET to inform the driver that the list has changed
   1321    1.3   hpeyerl 	 * and its reception filter should be adjusted accordingly.
   1322    1.3   hpeyerl 	 */
   1323  1.231     ozaki 	return ENETRESET;
   1324  1.231     ozaki error:
   1325  1.245   msaitoh 	ETHER_UNLOCK(ec);
   1326  1.231     ozaki 	return error;
   1327   1.66   thorpej }
   1328   1.66   thorpej 
   1329  1.170    dyoung void
   1330  1.170    dyoung ether_set_ifflags_cb(struct ethercom *ec, ether_cb_t cb)
   1331  1.170    dyoung {
   1332  1.170    dyoung 	ec->ec_ifflags_cb = cb;
   1333  1.170    dyoung }
   1334  1.170    dyoung 
   1335   1.66   thorpej /*
   1336   1.66   thorpej  * Common ioctls for Ethernet interfaces.  Note, we must be
   1337   1.66   thorpej  * called at splnet().
   1338   1.66   thorpej  */
   1339   1.66   thorpej int
   1340  1.147  christos ether_ioctl(struct ifnet *ifp, u_long cmd, void *data)
   1341   1.66   thorpej {
   1342   1.66   thorpej 	struct ethercom *ec = (void *) ifp;
   1343  1.193   msaitoh 	struct eccapreq *eccr;
   1344   1.66   thorpej 	struct ifreq *ifr = (struct ifreq *)data;
   1345  1.170    dyoung 	struct if_laddrreq *iflr = data;
   1346  1.170    dyoung 	const struct sockaddr_dl *sdl;
   1347  1.170    dyoung 	static const uint8_t zero[ETHER_ADDR_LEN];
   1348  1.169    dyoung 	int error;
   1349   1.66   thorpej 
   1350   1.66   thorpej 	switch (cmd) {
   1351  1.170    dyoung 	case SIOCINITIFADDR:
   1352  1.191      matt 	    {
   1353  1.191      matt 		struct ifaddr *ifa = (struct ifaddr *)data;
   1354  1.191      matt 		if (ifa->ifa_addr->sa_family != AF_LINK
   1355  1.247   msaitoh 		    && (ifp->if_flags & (IFF_UP | IFF_RUNNING)) !=
   1356  1.247   msaitoh 		       (IFF_UP | IFF_RUNNING)) {
   1357  1.170    dyoung 			ifp->if_flags |= IFF_UP;
   1358  1.170    dyoung 			if ((error = (*ifp->if_init)(ifp)) != 0)
   1359  1.170    dyoung 				return error;
   1360  1.170    dyoung 		}
   1361   1.66   thorpej #ifdef INET
   1362  1.191      matt 		if (ifa->ifa_addr->sa_family == AF_INET)
   1363  1.191      matt 			arp_ifinit(ifp, ifa);
   1364   1.66   thorpej #endif /* INET */
   1365  1.169    dyoung 		return 0;
   1366  1.191      matt 	    }
   1367   1.66   thorpej 
   1368   1.66   thorpej 	case SIOCSIFMTU:
   1369   1.82   thorpej 	    {
   1370   1.82   thorpej 		int maxmtu;
   1371   1.82   thorpej 
   1372   1.82   thorpej 		if (ec->ec_capabilities & ETHERCAP_JUMBO_MTU)
   1373   1.82   thorpej 			maxmtu = ETHERMTU_JUMBO;
   1374   1.82   thorpej 		else
   1375   1.82   thorpej 			maxmtu = ETHERMTU;
   1376   1.82   thorpej 
   1377   1.82   thorpej 		if (ifr->ifr_mtu < ETHERMIN || ifr->ifr_mtu > maxmtu)
   1378  1.169    dyoung 			return EINVAL;
   1379  1.169    dyoung 		else if ((error = ifioctl_common(ifp, cmd, data)) != ENETRESET)
   1380  1.169    dyoung 			return error;
   1381  1.169    dyoung 		else if (ifp->if_flags & IFF_UP) {
   1382   1.88   thorpej 			/* Make sure the device notices the MTU change. */
   1383  1.169    dyoung 			return (*ifp->if_init)(ifp);
   1384  1.169    dyoung 		} else
   1385  1.169    dyoung 			return 0;
   1386   1.82   thorpej 	    }
   1387   1.66   thorpej 
   1388   1.66   thorpej 	case SIOCSIFFLAGS:
   1389  1.170    dyoung 		if ((error = ifioctl_common(ifp, cmd, data)) != 0)
   1390  1.170    dyoung 			return error;
   1391  1.247   msaitoh 		switch (ifp->if_flags & (IFF_UP | IFF_RUNNING)) {
   1392  1.169    dyoung 		case IFF_RUNNING:
   1393   1.66   thorpej 			/*
   1394   1.66   thorpej 			 * If interface is marked down and it is running,
   1395   1.66   thorpej 			 * then stop and disable it.
   1396   1.66   thorpej 			 */
   1397   1.66   thorpej 			(*ifp->if_stop)(ifp, 1);
   1398  1.169    dyoung 			break;
   1399  1.169    dyoung 		case IFF_UP:
   1400   1.66   thorpej 			/*
   1401   1.66   thorpej 			 * If interface is marked up and it is stopped, then
   1402   1.66   thorpej 			 * start it.
   1403   1.66   thorpej 			 */
   1404  1.169    dyoung 			return (*ifp->if_init)(ifp);
   1405  1.247   msaitoh 		case IFF_UP | IFF_RUNNING:
   1406  1.170    dyoung 			error = 0;
   1407  1.247   msaitoh 			if (ec->ec_ifflags_cb != NULL) {
   1408  1.247   msaitoh 				error = (*ec->ec_ifflags_cb)(ec);
   1409  1.247   msaitoh 				if (error == ENETRESET) {
   1410  1.247   msaitoh 					/*
   1411  1.247   msaitoh 					 * Reset the interface to pick up
   1412  1.247   msaitoh 					 * changes in any other flags that
   1413  1.247   msaitoh 					 * affect the hardware state.
   1414  1.247   msaitoh 					 */
   1415  1.247   msaitoh 					return (*ifp->if_init)(ifp);
   1416  1.247   msaitoh 				}
   1417  1.247   msaitoh 			} else
   1418  1.247   msaitoh 				error = (*ifp->if_init)(ifp);
   1419  1.247   msaitoh 			return error;
   1420  1.169    dyoung 		case 0:
   1421  1.169    dyoung 			break;
   1422   1.66   thorpej 		}
   1423  1.169    dyoung 		return 0;
   1424  1.193   msaitoh 	case SIOCGETHERCAP:
   1425  1.193   msaitoh 		eccr = (struct eccapreq *)data;
   1426  1.193   msaitoh 		eccr->eccr_capabilities = ec->ec_capabilities;
   1427  1.193   msaitoh 		eccr->eccr_capenable = ec->ec_capenable;
   1428  1.193   msaitoh 		return 0;
   1429   1.66   thorpej 	case SIOCADDMULTI:
   1430  1.169    dyoung 		return ether_addmulti(ifreq_getaddr(cmd, ifr), ec);
   1431   1.66   thorpej 	case SIOCDELMULTI:
   1432  1.169    dyoung 		return ether_delmulti(ifreq_getaddr(cmd, ifr), ec);
   1433  1.160    dyoung 	case SIOCSIFMEDIA:
   1434  1.160    dyoung 	case SIOCGIFMEDIA:
   1435  1.160    dyoung 		if (ec->ec_mii == NULL)
   1436  1.169    dyoung 			return ENOTTY;
   1437  1.169    dyoung 		return ifmedia_ioctl(ifp, ifr, &ec->ec_mii->mii_media, cmd);
   1438  1.170    dyoung 	case SIOCALIFADDR:
   1439  1.170    dyoung 		sdl = satocsdl(sstocsa(&iflr->addr));
   1440  1.170    dyoung 		if (sdl->sdl_family != AF_LINK)
   1441  1.170    dyoung 			;
   1442  1.170    dyoung 		else if (ETHER_IS_MULTICAST(CLLADDR(sdl)))
   1443  1.170    dyoung 			return EINVAL;
   1444  1.170    dyoung 		else if (memcmp(zero, CLLADDR(sdl), sizeof(zero)) == 0)
   1445  1.170    dyoung 			return EINVAL;
   1446  1.170    dyoung 		/*FALLTHROUGH*/
   1447  1.170    dyoung 	default:
   1448  1.161    dyoung 		return ifioctl_common(ifp, cmd, data);
   1449   1.66   thorpej 	}
   1450  1.169    dyoung 	return 0;
   1451    1.3   hpeyerl }
   1452  1.200     joerg 
   1453  1.215  christos /*
   1454  1.215  christos  * Enable/disable passing VLAN packets if the parent interface supports it.
   1455  1.215  christos  * Return:
   1456  1.215  christos  * 	 0: Ok
   1457  1.215  christos  *	-1: Parent interface does not support vlans
   1458  1.215  christos  *	>0: Error
   1459  1.215  christos  */
   1460  1.215  christos int
   1461  1.215  christos ether_enable_vlan_mtu(struct ifnet *ifp)
   1462  1.215  christos {
   1463  1.215  christos 	int error;
   1464  1.215  christos 	struct ethercom *ec = (void *)ifp;
   1465  1.215  christos 
   1466  1.215  christos 	/* Parent does not support VLAN's */
   1467  1.215  christos 	if ((ec->ec_capabilities & ETHERCAP_VLAN_MTU) == 0)
   1468  1.215  christos 		return -1;
   1469  1.215  christos 
   1470  1.215  christos 	/*
   1471  1.215  christos 	 * Parent supports the VLAN_MTU capability,
   1472  1.215  christos 	 * i.e. can Tx/Rx larger than ETHER_MAX_LEN frames;
   1473  1.215  christos 	 * enable it.
   1474  1.215  christos 	 */
   1475  1.215  christos 	ec->ec_capenable |= ETHERCAP_VLAN_MTU;
   1476  1.215  christos 
   1477  1.215  christos 	/* Interface is down, defer for later */
   1478  1.215  christos 	if ((ifp->if_flags & IFF_UP) == 0)
   1479  1.215  christos 		return 0;
   1480  1.215  christos 
   1481  1.215  christos 	if ((error = if_flags_set(ifp, ifp->if_flags)) == 0)
   1482  1.215  christos 		return 0;
   1483  1.215  christos 
   1484  1.215  christos 	ec->ec_capenable &= ~ETHERCAP_VLAN_MTU;
   1485  1.215  christos 	return error;
   1486  1.215  christos }
   1487  1.215  christos 
   1488  1.215  christos int
   1489  1.215  christos ether_disable_vlan_mtu(struct ifnet *ifp)
   1490  1.215  christos {
   1491  1.215  christos 	int error;
   1492  1.215  christos 	struct ethercom *ec = (void *)ifp;
   1493  1.215  christos 
   1494  1.215  christos 	/* We still have VLAN's, defer for later */
   1495  1.215  christos 	if (ec->ec_nvlans != 0)
   1496  1.215  christos 		return 0;
   1497  1.215  christos 
   1498  1.215  christos 	/* Parent does not support VLAB's, nothing to do. */
   1499  1.215  christos 	if ((ec->ec_capenable & ETHERCAP_VLAN_MTU) == 0)
   1500  1.215  christos 		return -1;
   1501  1.215  christos 
   1502  1.215  christos 	/*
   1503  1.215  christos 	 * Disable Tx/Rx of VLAN-sized frames.
   1504  1.215  christos 	 */
   1505  1.215  christos 	ec->ec_capenable &= ~ETHERCAP_VLAN_MTU;
   1506  1.250      maxv 
   1507  1.215  christos 	/* Interface is down, defer for later */
   1508  1.215  christos 	if ((ifp->if_flags & IFF_UP) == 0)
   1509  1.215  christos 		return 0;
   1510  1.215  christos 
   1511  1.215  christos 	if ((error = if_flags_set(ifp, ifp->if_flags)) == 0)
   1512  1.215  christos 		return 0;
   1513  1.215  christos 
   1514  1.215  christos 	ec->ec_capenable |= ETHERCAP_VLAN_MTU;
   1515  1.215  christos 	return error;
   1516  1.215  christos }
   1517  1.215  christos 
   1518  1.200     joerg static int
   1519  1.200     joerg ether_multicast_sysctl(SYSCTLFN_ARGS)
   1520  1.200     joerg {
   1521  1.200     joerg 	struct ether_multi *enm;
   1522  1.200     joerg 	struct ifnet *ifp;
   1523  1.200     joerg 	struct ethercom *ec;
   1524  1.223     ozaki 	int error = 0;
   1525  1.200     joerg 	size_t written;
   1526  1.223     ozaki 	struct psref psref;
   1527  1.237     skrll 	int bound;
   1528  1.233     ozaki 	unsigned int multicnt;
   1529  1.233     ozaki 	struct ether_multi_sysctl *addrs;
   1530  1.233     ozaki 	int i;
   1531  1.200     joerg 
   1532  1.200     joerg 	if (namelen != 1)
   1533  1.200     joerg 		return EINVAL;
   1534  1.200     joerg 
   1535  1.223     ozaki 	bound = curlwp_bind();
   1536  1.223     ozaki 	ifp = if_get_byindex(name[0], &psref);
   1537  1.223     ozaki 	if (ifp == NULL) {
   1538  1.223     ozaki 		error = ENODEV;
   1539  1.223     ozaki 		goto out;
   1540  1.223     ozaki 	}
   1541  1.200     joerg 	if (ifp->if_type != IFT_ETHER) {
   1542  1.223     ozaki 		if_put(ifp, &psref);
   1543  1.200     joerg 		*oldlenp = 0;
   1544  1.223     ozaki 		goto out;
   1545  1.200     joerg 	}
   1546  1.200     joerg 	ec = (struct ethercom *)ifp;
   1547  1.200     joerg 
   1548  1.200     joerg 	if (oldp == NULL) {
   1549  1.223     ozaki 		if_put(ifp, &psref);
   1550  1.233     ozaki 		*oldlenp = ec->ec_multicnt * sizeof(*addrs);
   1551  1.223     ozaki 		goto out;
   1552  1.200     joerg 	}
   1553  1.200     joerg 
   1554  1.233     ozaki 	/*
   1555  1.233     ozaki 	 * ec->ec_lock is a spin mutex so we cannot call sysctl_copyout, which
   1556  1.233     ozaki 	 * is sleepable, with holding it. Copy data to a local buffer first
   1557  1.233     ozaki 	 * with holding it and then call sysctl_copyout without holding it.
   1558  1.233     ozaki 	 */
   1559  1.233     ozaki retry:
   1560  1.233     ozaki 	multicnt = ec->ec_multicnt;
   1561  1.233     ozaki 	addrs = kmem_alloc(sizeof(*addrs) * multicnt, KM_SLEEP);
   1562  1.200     joerg 
   1563  1.245   msaitoh 	ETHER_LOCK(ec);
   1564  1.233     ozaki 	if (multicnt < ec->ec_multicnt) {
   1565  1.233     ozaki 		/* The number of multicast addresses have increased */
   1566  1.245   msaitoh 		ETHER_UNLOCK(ec);
   1567  1.233     ozaki 		kmem_free(addrs, sizeof(*addrs) * multicnt);
   1568  1.233     ozaki 		goto retry;
   1569  1.233     ozaki 	}
   1570  1.233     ozaki 
   1571  1.233     ozaki 	i = 0;
   1572  1.200     joerg 	LIST_FOREACH(enm, &ec->ec_multiaddrs, enm_list) {
   1573  1.233     ozaki 		struct ether_multi_sysctl *addr = &addrs[i];
   1574  1.233     ozaki 		addr->enm_refcount = enm->enm_refcount;
   1575  1.233     ozaki 		memcpy(addr->enm_addrlo, enm->enm_addrlo, ETHER_ADDR_LEN);
   1576  1.233     ozaki 		memcpy(addr->enm_addrhi, enm->enm_addrhi, ETHER_ADDR_LEN);
   1577  1.233     ozaki 		i++;
   1578  1.233     ozaki 	}
   1579  1.245   msaitoh 	ETHER_UNLOCK(ec);
   1580  1.233     ozaki 
   1581  1.233     ozaki 	error = 0;
   1582  1.233     ozaki 	written = 0;
   1583  1.233     ozaki 	for (i = 0; i < multicnt; i++) {
   1584  1.233     ozaki 		struct ether_multi_sysctl *addr = &addrs[i];
   1585  1.233     ozaki 
   1586  1.233     ozaki 		if (written + sizeof(*addr) > *oldlenp)
   1587  1.200     joerg 			break;
   1588  1.233     ozaki 		error = sysctl_copyout(l, addr, oldp, sizeof(*addr));
   1589  1.200     joerg 		if (error)
   1590  1.200     joerg 			break;
   1591  1.233     ozaki 		written += sizeof(*addr);
   1592  1.233     ozaki 		oldp = (char *)oldp + sizeof(*addr);
   1593  1.200     joerg 	}
   1594  1.233     ozaki 	kmem_free(addrs, sizeof(*addrs) * multicnt);
   1595  1.233     ozaki 
   1596  1.223     ozaki 	if_put(ifp, &psref);
   1597  1.200     joerg 
   1598  1.200     joerg 	*oldlenp = written;
   1599  1.223     ozaki out:
   1600  1.223     ozaki 	curlwp_bindx(bound);
   1601  1.200     joerg 	return error;
   1602  1.200     joerg }
   1603  1.200     joerg 
   1604  1.234     ozaki static void
   1605  1.234     ozaki ether_sysctl_setup(struct sysctllog **clog)
   1606  1.200     joerg {
   1607  1.200     joerg 	const struct sysctlnode *rnode = NULL;
   1608  1.200     joerg 
   1609  1.200     joerg 	sysctl_createv(clog, 0, NULL, &rnode,
   1610  1.200     joerg 		       CTLFLAG_PERMANENT,
   1611  1.200     joerg 		       CTLTYPE_NODE, "ether",
   1612  1.200     joerg 		       SYSCTL_DESCR("Ethernet-specific information"),
   1613  1.200     joerg 		       NULL, 0, NULL, 0,
   1614  1.200     joerg 		       CTL_NET, CTL_CREATE, CTL_EOL);
   1615  1.200     joerg 
   1616  1.200     joerg 	sysctl_createv(clog, 0, &rnode, NULL,
   1617  1.200     joerg 		       CTLFLAG_PERMANENT,
   1618  1.200     joerg 		       CTLTYPE_NODE, "multicast",
   1619  1.200     joerg 		       SYSCTL_DESCR("multicast addresses"),
   1620  1.200     joerg 		       ether_multicast_sysctl, 0, NULL, 0,
   1621  1.200     joerg 		       CTL_CREATE, CTL_EOL);
   1622  1.200     joerg }
   1623  1.203     ozaki 
   1624  1.203     ozaki void
   1625  1.203     ozaki etherinit(void)
   1626  1.203     ozaki {
   1627  1.234     ozaki 
   1628  1.203     ozaki 	mutex_init(&bigpktpps_lock, MUTEX_DEFAULT, IPL_NET);
   1629  1.234     ozaki 	ether_sysctl_setup(NULL);
   1630  1.203     ozaki }
   1631