Home | History | Annotate | Line # | Download | only in net
bpf.c revision 1.61.4.1
      1  1.61.4.1   thorpej /*	$NetBSD: bpf.c,v 1.61.4.1 2001/09/07 04:45:41 thorpej Exp $	*/
      2      1.13       cgd 
      3      1.12   mycroft /*
      4      1.12   mycroft  * Copyright (c) 1990, 1991, 1993
      5      1.12   mycroft  *	The Regents of the University of California.  All rights reserved.
      6       1.1       cgd  *
      7       1.1       cgd  * This code is derived from the Stanford/CMU enet packet filter,
      8       1.1       cgd  * (net/enet.c) distributed as part of 4.3BSD, and code contributed
      9      1.36  christos  * to Berkeley by Steven McCanne and Van Jacobson both of Lawrence
     10       1.2       cgd  * Berkeley Laboratory.
     11       1.1       cgd  *
     12       1.1       cgd  * Redistribution and use in source and binary forms, with or without
     13       1.1       cgd  * modification, are permitted provided that the following conditions
     14       1.1       cgd  * are met:
     15       1.1       cgd  * 1. Redistributions of source code must retain the above copyright
     16       1.1       cgd  *    notice, this list of conditions and the following disclaimer.
     17       1.1       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     18       1.1       cgd  *    notice, this list of conditions and the following disclaimer in the
     19       1.1       cgd  *    documentation and/or other materials provided with the distribution.
     20       1.1       cgd  * 3. All advertising materials mentioning features or use of this software
     21       1.1       cgd  *    must display the following acknowledgement:
     22       1.1       cgd  *	This product includes software developed by the University of
     23       1.1       cgd  *	California, Berkeley and its contributors.
     24       1.1       cgd  * 4. Neither the name of the University nor the names of its contributors
     25       1.1       cgd  *    may be used to endorse or promote products derived from this software
     26       1.1       cgd  *    without specific prior written permission.
     27       1.1       cgd  *
     28       1.1       cgd  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     29       1.1       cgd  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     30       1.1       cgd  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     31       1.1       cgd  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     32       1.1       cgd  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     33       1.1       cgd  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     34       1.1       cgd  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     35       1.1       cgd  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     36       1.1       cgd  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     37       1.1       cgd  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     38       1.1       cgd  * SUCH DAMAGE.
     39       1.1       cgd  *
     40      1.39      fvdl  *	@(#)bpf.c	8.4 (Berkeley) 1/9/95
     41      1.36  christos  * static char rcsid[] =
     42      1.36  christos  * "Header: bpf.c,v 1.67 96/09/26 22:00:52 leres Exp ";
     43       1.1       cgd  */
     44       1.1       cgd 
     45       1.1       cgd #include "bpfilter.h"
     46       1.1       cgd 
     47       1.1       cgd #include <sys/param.h>
     48       1.1       cgd #include <sys/systm.h>
     49       1.1       cgd #include <sys/mbuf.h>
     50       1.1       cgd #include <sys/buf.h>
     51      1.12   mycroft #include <sys/time.h>
     52       1.1       cgd #include <sys/proc.h>
     53       1.1       cgd #include <sys/user.h>
     54       1.1       cgd #include <sys/ioctl.h>
     55      1.11   deraadt #include <sys/map.h>
     56      1.25  christos #include <sys/conf.h>
     57      1.51     enami #include <sys/vnode.h>
     58      1.11   deraadt 
     59  1.61.4.1   thorpej #include <miscfs/specfs/specdev.h>
     60  1.61.4.1   thorpej 
     61       1.1       cgd #include <sys/file.h>
     62       1.1       cgd #include <sys/tty.h>
     63       1.1       cgd #include <sys/uio.h>
     64      1.11   deraadt 
     65       1.1       cgd #include <sys/protosw.h>
     66       1.1       cgd #include <sys/socket.h>
     67      1.30   mycroft #include <sys/errno.h>
     68      1.30   mycroft #include <sys/kernel.h>
     69      1.30   mycroft #include <sys/poll.h>
     70      1.30   mycroft 
     71      1.11   deraadt #include <net/if.h>
     72       1.8   mycroft 
     73       1.1       cgd #include <net/bpf.h>
     74       1.1       cgd #include <net/bpfdesc.h>
     75       1.1       cgd 
     76      1.35    scottr #include <net/if_arc.h>
     77      1.34        is #include <net/if_ether.h>
     78      1.34        is 
     79      1.12   mycroft #include <netinet/in.h>
     80      1.34        is #include <netinet/if_inarp.h>
     81      1.11   deraadt 
     82      1.55  jonathan #ifndef BPF_BUFSIZE
     83      1.55  jonathan # define BPF_BUFSIZE 8192		/* 4096 too small for FDDI frames */
     84      1.55  jonathan #endif
     85       1.1       cgd 
     86      1.12   mycroft #define PRINET  26			/* interruptible */
     87       1.2       cgd 
     88       1.1       cgd /*
     89       1.1       cgd  * The default read buffer size is patchable.
     90       1.1       cgd  */
     91       1.2       cgd int bpf_bufsize = BPF_BUFSIZE;
     92       1.1       cgd 
     93       1.1       cgd /*
     94       1.1       cgd  *  bpf_iflist is the list of interfaces; each corresponds to an ifnet
     95       1.1       cgd  *  bpf_dtab holds the descriptors, indexed by minor device #
     96       1.1       cgd  */
     97      1.12   mycroft struct bpf_if	*bpf_iflist;
     98       1.2       cgd struct bpf_d	bpf_dtab[NBPFILTER];
     99       1.1       cgd 
    100      1.12   mycroft static int	bpf_allocbufs __P((struct bpf_d *));
    101      1.12   mycroft static void	bpf_freed __P((struct bpf_d *));
    102      1.12   mycroft static void	bpf_ifname __P((struct ifnet *, struct ifreq *));
    103      1.43     perry static void	*bpf_mcpy __P((void *, const void *, size_t));
    104      1.36  christos static int	bpf_movein __P((struct uio *, int, int,
    105      1.24  christos 			        struct mbuf **, struct sockaddr *));
    106      1.24  christos static void	bpf_attachd __P((struct bpf_d *, struct bpf_if *));
    107      1.24  christos static void	bpf_detachd __P((struct bpf_d *));
    108      1.12   mycroft static int	bpf_setif __P((struct bpf_d *, struct ifreq *));
    109      1.15       cgd static __inline void
    110      1.12   mycroft 		bpf_wakeup __P((struct bpf_d *));
    111      1.36  christos static void	catchpacket __P((struct bpf_d *, u_char *, u_int, u_int,
    112      1.43     perry 				 void *(*)(void *, const void *, size_t)));
    113      1.12   mycroft static void	reset_d __P((struct bpf_d *));
    114      1.12   mycroft 
    115      1.12   mycroft static int
    116      1.36  christos bpf_movein(uio, linktype, mtu, mp, sockp)
    117      1.53  augustss 	struct uio *uio;
    118      1.20   mycroft 	int linktype;
    119      1.36  christos 	int mtu;
    120      1.53  augustss 	struct mbuf **mp;
    121      1.53  augustss 	struct sockaddr *sockp;
    122      1.12   mycroft {
    123      1.12   mycroft 	struct mbuf *m;
    124      1.12   mycroft 	int error;
    125      1.12   mycroft 	int len;
    126      1.12   mycroft 	int hlen;
    127      1.36  christos 	int align;
    128      1.12   mycroft 
    129      1.12   mycroft 	/*
    130      1.12   mycroft 	 * Build a sockaddr based on the data link layer type.
    131      1.12   mycroft 	 * We do this at this level because the ethernet header
    132      1.12   mycroft 	 * is copied directly into the data field of the sockaddr.
    133      1.12   mycroft 	 * In the case of SLIP, there is no header and the packet
    134      1.12   mycroft 	 * is forwarded as is.
    135      1.12   mycroft 	 * Also, we are careful to leave room at the front of the mbuf
    136      1.12   mycroft 	 * for the link level header.
    137      1.12   mycroft 	 */
    138      1.12   mycroft 	switch (linktype) {
    139      1.12   mycroft 
    140      1.12   mycroft 	case DLT_SLIP:
    141      1.12   mycroft 		sockp->sa_family = AF_INET;
    142      1.12   mycroft 		hlen = 0;
    143      1.36  christos 		align = 0;
    144      1.12   mycroft 		break;
    145      1.12   mycroft 
    146      1.12   mycroft 	case DLT_PPP:
    147      1.12   mycroft 		sockp->sa_family = AF_UNSPEC;
    148      1.12   mycroft 		hlen = 0;
    149      1.36  christos 		align = 0;
    150      1.12   mycroft 		break;
    151      1.12   mycroft 
    152      1.12   mycroft 	case DLT_EN10MB:
    153      1.12   mycroft 		sockp->sa_family = AF_UNSPEC;
    154      1.12   mycroft 		/* XXX Would MAXLINKHDR be better? */
    155      1.36  christos  		/* 6(dst)+6(src)+2(type) */
    156      1.12   mycroft 		hlen = sizeof(struct ether_header);
    157      1.36  christos 		align = 2;
    158      1.17     glass 		break;
    159      1.17     glass 
    160      1.17     glass 	case DLT_ARCNET:
    161      1.17     glass 		sockp->sa_family = AF_UNSPEC;
    162      1.17     glass 		hlen = ARC_HDRLEN;
    163      1.36  christos 		align = 5;
    164      1.12   mycroft 		break;
    165      1.12   mycroft 
    166      1.12   mycroft 	case DLT_FDDI:
    167      1.56      matt 		sockp->sa_family = AF_LINK;
    168      1.56      matt 		/* XXX 4(FORMAC)+6(dst)+6(src) */
    169      1.56      matt 		hlen = 16;
    170      1.36  christos 		align = 0;
    171      1.12   mycroft 		break;
    172      1.12   mycroft 
    173      1.12   mycroft 	case DLT_NULL:
    174      1.12   mycroft 		sockp->sa_family = AF_UNSPEC;
    175      1.12   mycroft 		hlen = 0;
    176      1.36  christos 		align = 0;
    177      1.12   mycroft 		break;
    178      1.12   mycroft 
    179      1.12   mycroft 	default:
    180      1.12   mycroft 		return (EIO);
    181      1.12   mycroft 	}
    182      1.12   mycroft 
    183      1.12   mycroft 	len = uio->uio_resid;
    184      1.36  christos 	/*
    185      1.36  christos 	 * If there aren't enough bytes for a link level header or the
    186      1.36  christos 	 * packet length exceeds the interface mtu, return an error.
    187      1.36  christos 	 */
    188      1.36  christos 	if (len < hlen || len - hlen > mtu)
    189      1.36  christos 		return (EMSGSIZE);
    190      1.36  christos 
    191      1.36  christos 	/*
    192      1.36  christos 	 * XXX Avoid complicated buffer chaining ---
    193      1.36  christos 	 * bail if it won't fit in a single mbuf.
    194      1.36  christos 	 * (Take into account possible alignment bytes)
    195      1.36  christos 	 */
    196      1.36  christos 	if ((unsigned)len > MCLBYTES - align)
    197      1.12   mycroft 		return (EIO);
    198      1.12   mycroft 
    199      1.20   mycroft 	MGETHDR(m, M_WAIT, MT_DATA);
    200      1.36  christos 	if (m == 0)
    201      1.36  christos 		return (ENOBUFS);
    202      1.20   mycroft 	m->m_pkthdr.rcvif = 0;
    203      1.20   mycroft 	m->m_pkthdr.len = len - hlen;
    204      1.36  christos 	if (len > MHLEN - align) {
    205      1.12   mycroft 		MCLGET(m, M_WAIT);
    206      1.12   mycroft 		if ((m->m_flags & M_EXT) == 0) {
    207      1.12   mycroft 			error = ENOBUFS;
    208      1.12   mycroft 			goto bad;
    209      1.12   mycroft 		}
    210      1.12   mycroft 	}
    211      1.36  christos 
    212      1.36  christos 	/* Insure the data is properly aligned */
    213      1.36  christos 	if (align > 0) {
    214      1.36  christos 		m->m_data += align;
    215      1.36  christos 		m->m_len -= align;
    216      1.36  christos 	}
    217      1.36  christos 
    218      1.54       chs 	error = uiomove(mtod(m, caddr_t), len, uio);
    219      1.36  christos 	if (error)
    220      1.36  christos 		goto bad;
    221      1.12   mycroft 	if (hlen != 0) {
    222      1.41     perry 		memcpy(sockp->sa_data, mtod(m, caddr_t), hlen);
    223      1.12   mycroft 		m->m_data += hlen; /* XXX */
    224      1.36  christos 		len -= hlen;
    225      1.12   mycroft 	}
    226      1.36  christos 	m->m_len = len;
    227      1.36  christos 	*mp = m;
    228      1.38   mycroft 	return (0);
    229      1.38   mycroft 
    230      1.38   mycroft bad:
    231      1.12   mycroft 	m_freem(m);
    232      1.12   mycroft 	return (error);
    233      1.12   mycroft }
    234       1.1       cgd 
    235       1.1       cgd /*
    236       1.2       cgd  * Attach file to the bpf interface, i.e. make d listen on bp.
    237      1.61   thorpej  * Must be called at splnet.
    238       1.1       cgd  */
    239       1.1       cgd static void
    240       1.1       cgd bpf_attachd(d, bp)
    241       1.1       cgd 	struct bpf_d *d;
    242       1.1       cgd 	struct bpf_if *bp;
    243       1.1       cgd {
    244       1.2       cgd 	/*
    245       1.2       cgd 	 * Point d at bp, and add d to the interface's list of listeners.
    246       1.2       cgd 	 * Finally, point the driver's bpf cookie at the interface so
    247       1.2       cgd 	 * it will divert packets to bpf.
    248       1.2       cgd 	 */
    249       1.1       cgd 	d->bd_bif = bp;
    250       1.1       cgd 	d->bd_next = bp->bif_dlist;
    251       1.1       cgd 	bp->bif_dlist = d;
    252       1.1       cgd 
    253       1.1       cgd 	*bp->bif_driverp = bp;
    254       1.1       cgd }
    255       1.1       cgd 
    256       1.2       cgd /*
    257       1.2       cgd  * Detach a file from its interface.
    258       1.2       cgd  */
    259       1.1       cgd static void
    260       1.1       cgd bpf_detachd(d)
    261       1.1       cgd 	struct bpf_d *d;
    262       1.1       cgd {
    263       1.1       cgd 	struct bpf_d **p;
    264       1.1       cgd 	struct bpf_if *bp;
    265       1.1       cgd 
    266       1.1       cgd 	bp = d->bd_bif;
    267       1.1       cgd 	/*
    268       1.1       cgd 	 * Check if this descriptor had requested promiscuous mode.
    269       1.1       cgd 	 * If so, turn it off.
    270       1.1       cgd 	 */
    271       1.1       cgd 	if (d->bd_promisc) {
    272      1.18   mycroft 		int error;
    273      1.18   mycroft 
    274       1.1       cgd 		d->bd_promisc = 0;
    275      1.36  christos 		/*
    276      1.36  christos 		 * Take device out of promiscuous mode.  Since we were
    277      1.36  christos 		 * able to enter promiscuous mode, we should be able
    278      1.36  christos 		 * to turn it off.  But we can get an error if
    279      1.36  christos 		 * the interface was configured down, so only panic
    280      1.36  christos 		 * if we don't get an unexpected error.
    281      1.36  christos 		 */
    282      1.36  christos   		error = ifpromisc(bp->bif_ifp, 0);
    283      1.18   mycroft 		if (error && error != EINVAL)
    284       1.2       cgd 			panic("bpf: ifpromisc failed");
    285       1.1       cgd 	}
    286       1.2       cgd 	/* Remove d from the interface's descriptor list. */
    287       1.1       cgd 	p = &bp->bif_dlist;
    288       1.1       cgd 	while (*p != d) {
    289       1.1       cgd 		p = &(*p)->bd_next;
    290       1.1       cgd 		if (*p == 0)
    291       1.1       cgd 			panic("bpf_detachd: descriptor not in list");
    292       1.1       cgd 	}
    293       1.1       cgd 	*p = (*p)->bd_next;
    294       1.1       cgd 	if (bp->bif_dlist == 0)
    295       1.1       cgd 		/*
    296       1.1       cgd 		 * Let the driver know that there are no more listeners.
    297       1.1       cgd 		 */
    298       1.1       cgd 		*d->bd_bif->bif_driverp = 0;
    299       1.1       cgd 	d->bd_bif = 0;
    300       1.1       cgd }
    301       1.1       cgd 
    302       1.1       cgd 
/*
 * Free/used marking for descriptors.
 * A free descriptor has bd_next pointing back at the descriptor itself;
 * a descriptor in use has bd_next cleared (it is later reused as the
 * listener-list link).  Comparing against the descriptor's own address
 * is probably cheaper than a constant, since that address should be in
 * a register anyway.
 */
#define D_ISFREE(d) ((d)->bd_next == (d))
#define D_MARKFREE(d) ((d)->bd_next = (d))
#define D_MARKUSED(d) ((d)->bd_next = 0)
    311       1.1       cgd 
    312       1.1       cgd /*
    313      1.46    bouyer  * bpfilterattach() is called at boot time.
    314      1.46    bouyer  */
    315      1.46    bouyer /* ARGSUSED */
    316      1.46    bouyer void
    317      1.46    bouyer bpfilterattach(n)
    318      1.46    bouyer 	int n;
    319      1.46    bouyer {
    320      1.46    bouyer 	int i;
    321      1.46    bouyer 	/*
    322      1.46    bouyer 	 * Mark all the descriptors free.
    323      1.46    bouyer 	 */
    324      1.46    bouyer 	for (i = 0; i < NBPFILTER; ++i)
    325      1.46    bouyer 		D_MARKFREE(&bpf_dtab[i]);
    326      1.46    bouyer 
    327      1.46    bouyer }
    328      1.46    bouyer 
    329      1.46    bouyer /*
    330       1.2       cgd  * Open ethernet device.  Returns ENXIO for illegal minor device number,
    331       1.2       cgd  * EBUSY if file is open by another process.
    332       1.1       cgd  */
    333       1.1       cgd /* ARGSUSED */
    334       1.1       cgd int
    335  1.61.4.1   thorpej bpfopen(devvp, flag, mode, p)
    336  1.61.4.1   thorpej 	struct vnode *devvp;
    337       1.1       cgd 	int flag;
    338      1.24  christos 	int mode;
    339      1.24  christos 	struct proc *p;
    340       1.1       cgd {
    341      1.53  augustss 	struct bpf_d *d;
    342      1.12   mycroft 
    343  1.61.4.1   thorpej 	if (minor(devvp->v_rdev) >= NBPFILTER)
    344       1.1       cgd 		return (ENXIO);
    345       1.1       cgd 	/*
    346       1.1       cgd 	 * Each minor can be opened by only one process.  If the requested
    347       1.1       cgd 	 * minor is in use, return EBUSY.
    348       1.1       cgd 	 */
    349  1.61.4.1   thorpej 	d = &bpf_dtab[minor(devvp->v_rdev)];
    350       1.2       cgd 	if (!D_ISFREE(d))
    351       1.1       cgd 		return (EBUSY);
    352       1.2       cgd 
    353       1.2       cgd 	/* Mark "free" and do most initialization. */
    354      1.41     perry 	memset((char *)d, 0, sizeof(*d));
    355       1.2       cgd 	d->bd_bufsize = bpf_bufsize;
    356       1.1       cgd 
    357  1.61.4.1   thorpej 	devvp->v_devcookie = d;
    358  1.61.4.1   thorpej 
    359       1.1       cgd 	return (0);
    360       1.1       cgd }
    361       1.1       cgd 
    362       1.1       cgd /*
    363       1.1       cgd  * Close the descriptor by detaching it from its interface,
    364       1.1       cgd  * deallocating its buffers, and marking it free.
    365       1.1       cgd  */
    366       1.1       cgd /* ARGSUSED */
    367       1.2       cgd int
    368  1.61.4.1   thorpej bpfclose(devvp, flag, mode, p)
    369  1.61.4.1   thorpej 	struct vnode *devvp;
    370       1.1       cgd 	int flag;
    371      1.24  christos 	int mode;
    372      1.24  christos 	struct proc *p;
    373       1.1       cgd {
    374  1.61.4.1   thorpej 	struct bpf_d *d = devvp->v_devcookie;
    375      1.53  augustss 	int s;
    376       1.1       cgd 
    377      1.61   thorpej 	s = splnet();
    378       1.1       cgd 	if (d->bd_bif)
    379       1.1       cgd 		bpf_detachd(d);
    380       1.1       cgd 	splx(s);
    381       1.2       cgd 	bpf_freed(d);
    382       1.2       cgd 
    383       1.2       cgd 	return (0);
    384       1.2       cgd }
    385       1.2       cgd 
/*
 * Rotate the packet buffers in descriptor d.  Move the store buffer
 * into the hold slot, and the free buffer into the store slot.
 * Zero the length of the new store buffer.
 *
 * The statements are wrapped in do { } while (0) so the macro expands
 * to exactly one statement and stays correct as the body of an unbraced
 * if/else.  Call it with a trailing semicolon: ROTATE_BUFFERS(d);
 */
#define ROTATE_BUFFERS(d) \
	do { \
		(d)->bd_hbuf = (d)->bd_sbuf; \
		(d)->bd_hlen = (d)->bd_slen; \
		(d)->bd_sbuf = (d)->bd_fbuf; \
		(d)->bd_slen = 0; \
		(d)->bd_fbuf = 0; \
	} while (0)
    397       1.1       cgd /*
    398       1.1       cgd  *  bpfread - read next chunk of packets from buffers
    399       1.1       cgd  */
    400       1.1       cgd int
    401  1.61.4.1   thorpej bpfread(devvp, uio, ioflag)
    402  1.61.4.1   thorpej 	struct vnode *devvp;
    403      1.53  augustss 	struct uio *uio;
    404      1.24  christos 	int ioflag;
    405       1.1       cgd {
    406  1.61.4.1   thorpej 	struct bpf_d *d = devvp->v_devcookie;
    407       1.1       cgd 	int error;
    408       1.1       cgd 	int s;
    409       1.1       cgd 
    410       1.1       cgd 	/*
    411      1.12   mycroft 	 * Restrict application to use a buffer the same size as
    412       1.1       cgd 	 * as kernel buffers.
    413       1.1       cgd 	 */
    414       1.1       cgd 	if (uio->uio_resid != d->bd_bufsize)
    415       1.1       cgd 		return (EINVAL);
    416       1.1       cgd 
    417      1.61   thorpej 	s = splnet();
    418       1.1       cgd 	/*
    419       1.2       cgd 	 * If the hold buffer is empty, then do a timed sleep, which
    420       1.2       cgd 	 * ends when the timeout expires or when enough packets
    421       1.2       cgd 	 * have arrived to fill the store buffer.
    422       1.1       cgd 	 */
    423       1.1       cgd 	while (d->bd_hbuf == 0) {
    424      1.36  christos 		if (d->bd_immediate) {
    425      1.36  christos 			if (d->bd_slen == 0) {
    426      1.36  christos 				splx(s);
    427      1.36  christos 				return (EWOULDBLOCK);
    428      1.36  christos 			}
    429       1.1       cgd 			/*
    430       1.1       cgd 			 * A packet(s) either arrived since the previous
    431       1.1       cgd 			 * read or arrived while we were asleep.
    432       1.1       cgd 			 * Rotate the buffers and return what's here.
    433       1.1       cgd 			 */
    434       1.1       cgd 			ROTATE_BUFFERS(d);
    435       1.1       cgd 			break;
    436       1.1       cgd 		}
    437      1.23   thorpej 		if (d->bd_rtout != -1)
    438      1.54       chs 			error = tsleep((caddr_t)d, PRINET|PCATCH, "bpf",
    439      1.23   thorpej 					  d->bd_rtout);
    440      1.60   thorpej 		else {
    441      1.60   thorpej 			if (d->bd_rtout == -1) {
    442      1.60   thorpej 				/* User requested non-blocking I/O */
    443      1.60   thorpej 				error = EWOULDBLOCK;
    444      1.60   thorpej 			} else
    445      1.60   thorpej 				error = 0;
    446      1.60   thorpej 		}
    447      1.12   mycroft 		if (error == EINTR || error == ERESTART) {
    448      1.12   mycroft 			splx(s);
    449      1.12   mycroft 			return (error);
    450      1.12   mycroft 		}
    451      1.12   mycroft 		if (error == EWOULDBLOCK) {
    452      1.12   mycroft 			/*
    453      1.12   mycroft 			 * On a timeout, return what's in the buffer,
    454      1.12   mycroft 			 * which may be nothing.  If there is something
    455      1.12   mycroft 			 * in the store buffer, we can rotate the buffers.
    456      1.12   mycroft 			 */
    457      1.12   mycroft 			if (d->bd_hbuf)
    458       1.1       cgd 				/*
    459      1.12   mycroft 				 * We filled up the buffer in between
    460      1.12   mycroft 				 * getting the timeout and arriving
    461      1.12   mycroft 				 * here, so we don't need to rotate.
    462       1.1       cgd 				 */
    463       1.1       cgd 				break;
    464      1.12   mycroft 
    465      1.12   mycroft 			if (d->bd_slen == 0) {
    466      1.12   mycroft 				splx(s);
    467      1.12   mycroft 				return (0);
    468       1.1       cgd 			}
    469      1.12   mycroft 			ROTATE_BUFFERS(d);
    470      1.12   mycroft 			break;
    471       1.1       cgd 		}
    472      1.36  christos 		if (error != 0)
    473      1.36  christos 			goto done;
    474       1.1       cgd 	}
    475       1.1       cgd 	/*
    476       1.1       cgd 	 * At this point, we know we have something in the hold slot.
    477       1.1       cgd 	 */
    478       1.1       cgd 	splx(s);
    479      1.12   mycroft 
    480      1.12   mycroft 	/*
    481       1.1       cgd 	 * Move data from hold buffer into user space.
    482       1.1       cgd 	 * We know the entire buffer is transferred since
    483       1.1       cgd 	 * we checked above that the read buffer is bpf_bufsize bytes.
    484       1.1       cgd 	 */
    485      1.54       chs 	error = uiomove(d->bd_hbuf, d->bd_hlen, uio);
    486       1.1       cgd 
    487      1.61   thorpej 	s = splnet();
    488       1.1       cgd 	d->bd_fbuf = d->bd_hbuf;
    489       1.1       cgd 	d->bd_hbuf = 0;
    490       1.2       cgd 	d->bd_hlen = 0;
    491      1.36  christos done:
    492       1.1       cgd 	splx(s);
    493       1.1       cgd 	return (error);
    494       1.1       cgd }
    495       1.1       cgd 
    496       1.1       cgd 
    497       1.1       cgd /*
    498      1.12   mycroft  * If there are processes sleeping on this descriptor, wake them up.
    499       1.1       cgd  */
    500      1.15       cgd static __inline void
    501       1.1       cgd bpf_wakeup(d)
    502      1.53  augustss 	struct bpf_d *d;
    503       1.1       cgd {
    504      1.23   thorpej 	struct proc *p;
    505      1.23   thorpej 
    506       1.1       cgd 	wakeup((caddr_t)d);
    507      1.44   thorpej 	if (d->bd_async) {
    508      1.23   thorpej 		if (d->bd_pgid > 0)
    509      1.37  christos 			gsignal (d->bd_pgid, SIGIO);
    510      1.57     jhawk 		else if (d->bd_pgid && (p = pfind (-d->bd_pgid)) != NULL)
    511      1.37  christos 			psignal (p, SIGIO);
    512      1.44   thorpej 	}
    513      1.23   thorpej 
    514       1.2       cgd 	selwakeup(&d->bd_sel);
    515       1.2       cgd 	/* XXX */
    516       1.2       cgd 	d->bd_sel.si_pid = 0;
    517       1.1       cgd }
    518       1.1       cgd 
    519       1.1       cgd int
    520  1.61.4.1   thorpej bpfwrite(devvp, uio, ioflag)
    521  1.61.4.1   thorpej 	struct vnode *devvp;
    522       1.1       cgd 	struct uio *uio;
    523      1.24  christos 	int ioflag;
    524       1.1       cgd {
    525  1.61.4.1   thorpej 	struct bpf_d *d = devvp->v_devcookie;
    526      1.12   mycroft 	struct ifnet *ifp;
    527      1.12   mycroft 	struct mbuf *m;
    528      1.12   mycroft 	int error, s;
    529      1.56      matt 	static struct sockaddr_storage dst;
    530       1.1       cgd 
    531      1.12   mycroft 	if (d->bd_bif == 0)
    532       1.1       cgd 		return (ENXIO);
    533       1.1       cgd 
    534      1.12   mycroft 	ifp = d->bd_bif->bif_ifp;
    535      1.11   deraadt 
    536      1.12   mycroft 	if (uio->uio_resid == 0)
    537      1.12   mycroft 		return (0);
    538      1.11   deraadt 
    539      1.56      matt 	error = bpf_movein(uio, (int)d->bd_bif->bif_dlt, ifp->if_mtu, &m,
    540      1.56      matt 		(struct sockaddr *) &dst);
    541      1.12   mycroft 	if (error)
    542      1.12   mycroft 		return (error);
    543      1.11   deraadt 
    544      1.20   mycroft 	if (m->m_pkthdr.len > ifp->if_mtu)
    545       1.1       cgd 		return (EMSGSIZE);
    546       1.1       cgd 
    547      1.40   thorpej 	if (d->bd_hdrcmplt)
    548      1.56      matt 		dst.ss_family = pseudo_AF_HDRCMPLT;
    549      1.40   thorpej 
    550      1.21   mycroft 	s = splsoftnet();
    551      1.56      matt 	error = (*ifp->if_output)(ifp, m, (struct sockaddr *) &dst, NULL);
    552       1.1       cgd 	splx(s);
    553       1.1       cgd 	/*
    554      1.12   mycroft 	 * The driver frees the mbuf.
    555       1.1       cgd 	 */
    556       1.1       cgd 	return (error);
    557       1.1       cgd }
    558       1.1       cgd 
    559       1.1       cgd /*
    560       1.2       cgd  * Reset a descriptor by flushing its packet buffer and clearing the
    561      1.61   thorpej  * receive and drop counts.  Should be called at splnet.
    562       1.1       cgd  */
    563       1.1       cgd static void
    564       1.1       cgd reset_d(d)
    565       1.1       cgd 	struct bpf_d *d;
    566       1.1       cgd {
    567       1.1       cgd 	if (d->bd_hbuf) {
    568       1.1       cgd 		/* Free the hold buffer. */
    569       1.1       cgd 		d->bd_fbuf = d->bd_hbuf;
    570       1.1       cgd 		d->bd_hbuf = 0;
    571       1.1       cgd 	}
    572       1.1       cgd 	d->bd_slen = 0;
    573       1.2       cgd 	d->bd_hlen = 0;
    574       1.1       cgd 	d->bd_rcount = 0;
    575       1.1       cgd 	d->bd_dcount = 0;
    576       1.1       cgd }
    577       1.1       cgd 
    578      1.36  christos #ifdef BPF_KERN_FILTER
    579      1.36  christos extern struct bpf_insn *bpf_tcp_filter;
    580      1.36  christos extern struct bpf_insn *bpf_udp_filter;
    581      1.36  christos #endif
    582      1.36  christos 
    583       1.1       cgd /*
    584       1.1       cgd  *  FIONREAD		Check for read packet available.
    585       1.1       cgd  *  BIOCGBLEN		Get buffer len [for read()].
    586       1.1       cgd  *  BIOCSETF		Set ethernet read filter.
    587       1.1       cgd  *  BIOCFLUSH		Flush read packet buffer.
    588       1.1       cgd  *  BIOCPROMISC		Put interface into promiscuous mode.
    589       1.1       cgd  *  BIOCGDLT		Get link layer type.
    590       1.1       cgd  *  BIOCGETIF		Get interface name.
    591       1.1       cgd  *  BIOCSETIF		Set interface.
    592       1.1       cgd  *  BIOCSRTIMEOUT	Set read timeout.
    593       1.1       cgd  *  BIOCGRTIMEOUT	Get read timeout.
    594       1.1       cgd  *  BIOCGSTATS		Get packet stats.
    595       1.1       cgd  *  BIOCIMMEDIATE	Set immediate mode.
    596       1.2       cgd  *  BIOCVERSION		Get filter language version.
    597      1.40   thorpej  *  BIOGHDRCMPLT	Get "header already complete" flag.
    598      1.40   thorpej  *  BIOSHDRCMPLT	Set "header already complete" flag.
    599       1.1       cgd  */
    600       1.1       cgd /* ARGSUSED */
    601       1.1       cgd int
    602  1.61.4.1   thorpej bpfioctl(devvp, cmd, addr, flag, p)
    603  1.61.4.1   thorpej 	struct vnode *devvp;
    604      1.16       cgd 	u_long cmd;
    605       1.1       cgd 	caddr_t addr;
    606       1.1       cgd 	int flag;
    607      1.24  christos 	struct proc *p;
    608       1.1       cgd {
    609  1.61.4.1   thorpej 	struct bpf_d *d = devvp->v_devcookie;
    610       1.1       cgd 	int s, error = 0;
    611      1.36  christos #ifdef BPF_KERN_FILTER
    612      1.53  augustss 	struct bpf_insn **p;
    613      1.36  christos #endif
    614       1.1       cgd 
    615       1.1       cgd 	switch (cmd) {
    616       1.1       cgd 
    617       1.1       cgd 	default:
    618       1.1       cgd 		error = EINVAL;
    619       1.1       cgd 		break;
    620       1.1       cgd 
    621       1.1       cgd 	/*
    622       1.1       cgd 	 * Check for read packet available.
    623       1.1       cgd 	 */
    624       1.1       cgd 	case FIONREAD:
    625       1.1       cgd 		{
    626       1.1       cgd 			int n;
    627      1.12   mycroft 
    628      1.61   thorpej 			s = splnet();
    629       1.1       cgd 			n = d->bd_slen;
    630      1.12   mycroft 			if (d->bd_hbuf)
    631       1.1       cgd 				n += d->bd_hlen;
    632       1.1       cgd 			splx(s);
    633       1.1       cgd 
    634       1.1       cgd 			*(int *)addr = n;
    635       1.1       cgd 			break;
    636       1.1       cgd 		}
    637       1.1       cgd 
    638       1.1       cgd 	/*
    639       1.2       cgd 	 * Get buffer len [for read()].
    640       1.1       cgd 	 */
    641       1.2       cgd 	case BIOCGBLEN:
    642       1.2       cgd 		*(u_int *)addr = d->bd_bufsize;
    643       1.1       cgd 		break;
    644       1.2       cgd 
    645       1.1       cgd 	/*
    646       1.2       cgd 	 * Set buffer length.
    647       1.1       cgd 	 */
    648       1.2       cgd 	case BIOCSBLEN:
    649       1.2       cgd 		if (d->bd_bif != 0)
    650       1.2       cgd 			error = EINVAL;
    651       1.2       cgd 		else {
    652      1.53  augustss 			u_int size = *(u_int *)addr;
    653       1.2       cgd 
    654       1.2       cgd 			if (size > BPF_MAXBUFSIZE)
    655       1.2       cgd 				*(u_int *)addr = size = BPF_MAXBUFSIZE;
    656       1.2       cgd 			else if (size < BPF_MINBUFSIZE)
    657       1.2       cgd 				*(u_int *)addr = size = BPF_MINBUFSIZE;
    658       1.2       cgd 			d->bd_bufsize = size;
    659       1.2       cgd 		}
    660       1.1       cgd 		break;
    661       1.1       cgd 
    662       1.1       cgd 	/*
    663       1.2       cgd 	 * Set link layer read filter.
    664       1.1       cgd 	 */
    665      1.12   mycroft 	case BIOCSETF:
    666       1.1       cgd 		error = bpf_setf(d, (struct bpf_program *)addr);
    667       1.1       cgd 		break;
    668       1.1       cgd 
    669      1.36  christos #ifdef BPF_KERN_FILTER
    670      1.36  christos 	/*
    671      1.36  christos 	 * Set TCP or UDP reject filter.
    672      1.36  christos 	 */
    673      1.36  christos 	case BIOCSTCPF:
    674      1.36  christos 	case BIOCSUDPF:
    675      1.36  christos 		if (!suser()) {
    676      1.36  christos 			error = EPERM;
    677      1.36  christos 			break;
    678      1.36  christos 		}
    679      1.36  christos 
    680      1.36  christos 		/* Validate and store filter */
    681      1.36  christos 		error = bpf_setf(d, (struct bpf_program *)addr);
    682      1.36  christos 
    683      1.36  christos 		/* Free possible old filter */
    684      1.36  christos 		if (cmd == BIOCSTCPF)
    685      1.36  christos 			p = &bpf_tcp_filter;
    686      1.36  christos 		else
    687      1.36  christos 			p = &bpf_udp_filter;
    688      1.36  christos 		if (*p != NULL)
    689      1.36  christos 			free((caddr_t)*p, M_DEVBUF);
    690      1.36  christos 
    691      1.36  christos 		/* Steal new filter (noop if error) */
    692      1.61   thorpej 		s = splnet();
    693      1.36  christos 		*p = d->bd_filter;
    694      1.36  christos 		d->bd_filter = NULL;
    695      1.36  christos 		splx(s);
    696      1.36  christos 		break;
    697      1.36  christos #endif
    698      1.36  christos 
    699       1.1       cgd 	/*
    700       1.1       cgd 	 * Flush read packet buffer.
    701       1.1       cgd 	 */
    702       1.1       cgd 	case BIOCFLUSH:
    703      1.61   thorpej 		s = splnet();
    704       1.1       cgd 		reset_d(d);
    705       1.1       cgd 		splx(s);
    706       1.1       cgd 		break;
    707       1.1       cgd 
    708       1.1       cgd 	/*
    709       1.1       cgd 	 * Put interface into promiscuous mode.
    710       1.1       cgd 	 */
    711       1.1       cgd 	case BIOCPROMISC:
    712       1.1       cgd 		if (d->bd_bif == 0) {
    713       1.1       cgd 			/*
    714       1.1       cgd 			 * No interface attached yet.
    715       1.1       cgd 			 */
    716       1.1       cgd 			error = EINVAL;
    717       1.1       cgd 			break;
    718       1.1       cgd 		}
    719      1.61   thorpej 		s = splnet();
    720       1.1       cgd 		if (d->bd_promisc == 0) {
    721       1.1       cgd 			error = ifpromisc(d->bd_bif->bif_ifp, 1);
    722       1.2       cgd 			if (error == 0)
    723       1.2       cgd 				d->bd_promisc = 1;
    724       1.1       cgd 		}
    725       1.1       cgd 		splx(s);
    726       1.1       cgd 		break;
    727       1.1       cgd 
    728       1.1       cgd 	/*
    729       1.1       cgd 	 * Get device parameters.
    730       1.1       cgd 	 */
    731       1.1       cgd 	case BIOCGDLT:
    732       1.1       cgd 		if (d->bd_bif == 0)
    733       1.1       cgd 			error = EINVAL;
    734       1.1       cgd 		else
    735       1.1       cgd 			*(u_int *)addr = d->bd_bif->bif_dlt;
    736       1.1       cgd 		break;
    737       1.1       cgd 
    738       1.1       cgd 	/*
    739       1.1       cgd 	 * Set interface name.
    740       1.1       cgd 	 */
    741       1.1       cgd 	case BIOCGETIF:
    742       1.1       cgd 		if (d->bd_bif == 0)
    743       1.1       cgd 			error = EINVAL;
    744       1.1       cgd 		else
    745       1.1       cgd 			bpf_ifname(d->bd_bif->bif_ifp, (struct ifreq *)addr);
    746       1.1       cgd 		break;
    747       1.1       cgd 
    748       1.1       cgd 	/*
    749       1.1       cgd 	 * Set interface.
    750       1.1       cgd 	 */
    751       1.1       cgd 	case BIOCSETIF:
    752       1.1       cgd 		error = bpf_setif(d, (struct ifreq *)addr);
    753       1.1       cgd 		break;
    754       1.1       cgd 
    755       1.1       cgd 	/*
    756       1.1       cgd 	 * Set read timeout.
    757       1.1       cgd 	 */
    758      1.12   mycroft 	case BIOCSRTIMEOUT:
    759       1.1       cgd 		{
    760       1.1       cgd 			struct timeval *tv = (struct timeval *)addr;
    761       1.1       cgd 
    762      1.19       cgd 			/* Compute number of ticks. */
    763      1.19       cgd 			d->bd_rtout = tv->tv_sec * hz + tv->tv_usec / tick;
    764      1.33   thorpej 			if ((d->bd_rtout == 0) && (tv->tv_usec != 0))
    765      1.33   thorpej 				d->bd_rtout = 1;
    766       1.1       cgd 			break;
    767       1.1       cgd 		}
    768       1.1       cgd 
    769       1.1       cgd 	/*
    770       1.1       cgd 	 * Get read timeout.
    771       1.1       cgd 	 */
    772      1.12   mycroft 	case BIOCGRTIMEOUT:
    773       1.1       cgd 		{
    774       1.1       cgd 			struct timeval *tv = (struct timeval *)addr;
    775       1.1       cgd 
    776      1.19       cgd 			tv->tv_sec = d->bd_rtout / hz;
    777      1.19       cgd 			tv->tv_usec = (d->bd_rtout % hz) * tick;
    778       1.1       cgd 			break;
    779       1.1       cgd 		}
    780       1.1       cgd 
    781       1.1       cgd 	/*
    782       1.1       cgd 	 * Get packet stats.
    783       1.1       cgd 	 */
    784       1.1       cgd 	case BIOCGSTATS:
    785       1.1       cgd 		{
    786       1.1       cgd 			struct bpf_stat *bs = (struct bpf_stat *)addr;
    787       1.1       cgd 
    788       1.1       cgd 			bs->bs_recv = d->bd_rcount;
    789       1.1       cgd 			bs->bs_drop = d->bd_dcount;
    790       1.1       cgd 			break;
    791       1.1       cgd 		}
    792       1.1       cgd 
    793       1.1       cgd 	/*
    794       1.1       cgd 	 * Set immediate mode.
    795       1.1       cgd 	 */
    796       1.1       cgd 	case BIOCIMMEDIATE:
    797       1.1       cgd 		d->bd_immediate = *(u_int *)addr;
    798       1.1       cgd 		break;
    799       1.2       cgd 
    800       1.2       cgd 	case BIOCVERSION:
    801       1.2       cgd 		{
    802       1.2       cgd 			struct bpf_version *bv = (struct bpf_version *)addr;
    803       1.2       cgd 
    804       1.2       cgd 			bv->bv_major = BPF_MAJOR_VERSION;
    805       1.2       cgd 			bv->bv_minor = BPF_MINOR_VERSION;
    806       1.2       cgd 			break;
    807      1.12   mycroft 		}
    808      1.23   thorpej 
    809      1.40   thorpej 	case BIOCGHDRCMPLT:	/* get "header already complete" flag */
    810      1.40   thorpej 		*(u_int *)addr = d->bd_hdrcmplt;
    811      1.40   thorpej 		break;
    812      1.40   thorpej 
    813      1.40   thorpej 	case BIOCSHDRCMPLT:	/* set "header already complete" flag */
    814      1.40   thorpej 		d->bd_hdrcmplt = *(u_int *)addr ? 1 : 0;
    815      1.40   thorpej 		break;
    816      1.23   thorpej 
    817      1.23   thorpej 	case FIONBIO:		/* Non-blocking I/O */
    818      1.23   thorpej 		if (*(int *)addr)
    819      1.23   thorpej 			d->bd_rtout = -1;
    820      1.23   thorpej 		else
    821      1.23   thorpej 			d->bd_rtout = 0;
    822      1.23   thorpej 		break;
    823      1.23   thorpej 
    824      1.23   thorpej 	case FIOASYNC:		/* Send signal on receive packets */
    825      1.23   thorpej 		d->bd_async = *(int *)addr;
    826      1.23   thorpej 		break;
    827      1.23   thorpej 
    828      1.23   thorpej 	/*
    829      1.23   thorpej 	 * N.B.  ioctl (FIOSETOWN) and fcntl (F_SETOWN) both end up doing
    830      1.23   thorpej 	 * the equivalent of a TIOCSPGRP and hence end up here.  *However*
    831      1.23   thorpej 	 * TIOCSPGRP's arg is a process group if it's positive and a process
    832      1.23   thorpej 	 * id if it's negative.  This is exactly the opposite of what the
    833      1.23   thorpej 	 * other two functions want!  Therefore there is code in ioctl and
    834      1.23   thorpej 	 * fcntl to negate the arg before calling here.
    835      1.23   thorpej 	 */
    836      1.23   thorpej 	case TIOCSPGRP:		/* Process or group to send signals to */
    837      1.23   thorpej 		d->bd_pgid = *(int *)addr;
    838      1.23   thorpej 		break;
    839      1.23   thorpej 
    840      1.23   thorpej 	case TIOCGPGRP:
    841      1.23   thorpej 		*(int *)addr = d->bd_pgid;
    842      1.23   thorpej 		break;
    843       1.1       cgd 	}
    844       1.1       cgd 	return (error);
    845       1.1       cgd }
    846       1.1       cgd 
    847      1.12   mycroft /*
    848       1.2       cgd  * Set d's packet filter program to fp.  If this file already has a filter,
    849       1.1       cgd  * free it and replace it.  Returns EINVAL for bogus requests.
    850       1.1       cgd  */
    851       1.1       cgd int
    852       1.1       cgd bpf_setf(d, fp)
    853       1.1       cgd 	struct bpf_d *d;
    854       1.1       cgd 	struct bpf_program *fp;
    855       1.1       cgd {
    856       1.1       cgd 	struct bpf_insn *fcode, *old;
    857       1.1       cgd 	u_int flen, size;
    858       1.1       cgd 	int s;
    859       1.1       cgd 
    860       1.1       cgd 	old = d->bd_filter;
    861       1.1       cgd 	if (fp->bf_insns == 0) {
    862       1.1       cgd 		if (fp->bf_len != 0)
    863       1.1       cgd 			return (EINVAL);
    864      1.61   thorpej 		s = splnet();
    865       1.1       cgd 		d->bd_filter = 0;
    866       1.1       cgd 		reset_d(d);
    867       1.1       cgd 		splx(s);
    868       1.1       cgd 		if (old != 0)
    869       1.1       cgd 			free((caddr_t)old, M_DEVBUF);
    870       1.1       cgd 		return (0);
    871       1.1       cgd 	}
    872       1.1       cgd 	flen = fp->bf_len;
    873       1.1       cgd 	if (flen > BPF_MAXINSNS)
    874       1.1       cgd 		return (EINVAL);
    875       1.1       cgd 
    876       1.1       cgd 	size = flen * sizeof(*fp->bf_insns);
    877       1.1       cgd 	fcode = (struct bpf_insn *)malloc(size, M_DEVBUF, M_WAITOK);
    878       1.2       cgd 	if (copyin((caddr_t)fp->bf_insns, (caddr_t)fcode, size) == 0 &&
    879       1.2       cgd 	    bpf_validate(fcode, (int)flen)) {
    880      1.61   thorpej 		s = splnet();
    881       1.1       cgd 		d->bd_filter = fcode;
    882       1.1       cgd 		reset_d(d);
    883       1.1       cgd 		splx(s);
    884       1.1       cgd 		if (old != 0)
    885       1.1       cgd 			free((caddr_t)old, M_DEVBUF);
    886       1.1       cgd 
    887       1.1       cgd 		return (0);
    888       1.1       cgd 	}
    889       1.1       cgd 	free((caddr_t)fcode, M_DEVBUF);
    890       1.1       cgd 	return (EINVAL);
    891       1.1       cgd }
    892       1.1       cgd 
    893       1.1       cgd /*
    894       1.2       cgd  * Detach a file from its current interface (if attached at all) and attach
    895       1.2       cgd  * to the interface indicated by the name stored in ifr.
    896       1.2       cgd  * Return an errno or 0.
    897       1.1       cgd  */
    898       1.1       cgd static int
    899       1.1       cgd bpf_setif(d, ifr)
    900       1.1       cgd 	struct bpf_d *d;
    901       1.1       cgd 	struct ifreq *ifr;
    902       1.1       cgd {
    903       1.1       cgd 	struct bpf_if *bp;
    904       1.1       cgd 	char *cp;
    905      1.26   thorpej 	int unit_seen, i, s, error;
    906       1.1       cgd 
    907       1.1       cgd 	/*
    908      1.26   thorpej 	 * Make sure the provided name has a unit number, and default
    909      1.26   thorpej 	 * it to '0' if not specified.
    910      1.26   thorpej 	 * XXX This is ugly ... do this differently?
    911       1.1       cgd 	 */
    912      1.26   thorpej 	unit_seen = 0;
    913       1.1       cgd 	cp = ifr->ifr_name;
    914      1.26   thorpej 	cp[sizeof(ifr->ifr_name) - 1] = '\0';	/* sanity */
    915      1.26   thorpej 	while (*cp++)
    916      1.26   thorpej 		if (*cp >= '0' && *cp <= '9')
    917      1.26   thorpej 			unit_seen = 1;
    918      1.26   thorpej 	if (!unit_seen) {
    919      1.26   thorpej 		/* Make sure to leave room for the '\0'. */
    920      1.26   thorpej 		for (i = 0; i < (IFNAMSIZ - 1); ++i) {
    921      1.26   thorpej 			if ((ifr->ifr_name[i] >= 'a' &&
    922      1.26   thorpej 			     ifr->ifr_name[i] <= 'z') ||
    923      1.26   thorpej 			    (ifr->ifr_name[i] >= 'A' &&
    924      1.26   thorpej 			     ifr->ifr_name[i] <= 'Z'))
    925      1.26   thorpej 				continue;
    926      1.26   thorpej 			ifr->ifr_name[i] = '0';
    927       1.1       cgd 		}
    928       1.1       cgd 	}
    929      1.26   thorpej 
    930       1.1       cgd 	/*
    931       1.1       cgd 	 * Look through attached interfaces for the named one.
    932       1.1       cgd 	 */
    933       1.1       cgd 	for (bp = bpf_iflist; bp != 0; bp = bp->bif_next) {
    934       1.1       cgd 		struct ifnet *ifp = bp->bif_ifp;
    935       1.1       cgd 
    936      1.26   thorpej 		if (ifp == 0 ||
    937      1.26   thorpej 		    strcmp(ifp->if_xname, ifr->ifr_name) != 0)
    938       1.1       cgd 			continue;
    939       1.1       cgd 		/*
    940       1.2       cgd 		 * We found the requested interface.
    941       1.1       cgd 		 * If it's not up, return an error.
    942       1.2       cgd 		 * Allocate the packet buffers if we need to.
    943       1.2       cgd 		 * If we're already attached to requested interface,
    944       1.2       cgd 		 * just flush the buffer.
    945       1.1       cgd 		 */
    946       1.1       cgd 		if ((ifp->if_flags & IFF_UP) == 0)
    947       1.1       cgd 			return (ENETDOWN);
    948       1.2       cgd 
    949       1.2       cgd 		if (d->bd_sbuf == 0) {
    950       1.2       cgd 			error = bpf_allocbufs(d);
    951       1.2       cgd 			if (error != 0)
    952       1.2       cgd 				return (error);
    953       1.2       cgd 		}
    954      1.61   thorpej 		s = splnet();
    955       1.1       cgd 		if (bp != d->bd_bif) {
    956       1.1       cgd 			if (d->bd_bif)
    957      1.12   mycroft 				/*
    958       1.1       cgd 				 * Detach if attached to something else.
    959       1.1       cgd 				 */
    960       1.1       cgd 				bpf_detachd(d);
    961       1.1       cgd 
    962       1.1       cgd 			bpf_attachd(d, bp);
    963       1.1       cgd 		}
    964       1.1       cgd 		reset_d(d);
    965       1.1       cgd 		splx(s);
    966       1.1       cgd 		return (0);
    967       1.1       cgd 	}
    968       1.1       cgd 	/* Not found. */
    969       1.1       cgd 	return (ENXIO);
    970       1.1       cgd }
    971       1.1       cgd 
    972       1.1       cgd /*
    973      1.26   thorpej  * Copy the interface name to the ifreq.
    974       1.1       cgd  */
    975       1.1       cgd static void
    976       1.1       cgd bpf_ifname(ifp, ifr)
    977       1.1       cgd 	struct ifnet *ifp;
    978       1.1       cgd 	struct ifreq *ifr;
    979       1.1       cgd {
    980       1.1       cgd 
    981      1.41     perry 	memcpy(ifr->ifr_name, ifp->if_xname, IFNAMSIZ);
    982       1.1       cgd }
    983       1.1       cgd 
    984       1.1       cgd /*
    985      1.36  christos  * Support for poll() system call
    986       1.1       cgd  *
    987       1.2       cgd  * Return true iff the specific operation will not block indefinitely.
    988       1.2       cgd  * Otherwise, return false but make a note that a selwakeup() must be done.
    989       1.1       cgd  */
    990       1.1       cgd int
    991  1.61.4.1   thorpej bpfpoll(devvp, events, p)
    992  1.61.4.1   thorpej 	struct vnode *devvp;
    993      1.30   mycroft 	int events;
    994       1.1       cgd 	struct proc *p;
    995       1.1       cgd {
    996  1.61.4.1   thorpej 	struct bpf_d *d = devvp->v_devcookie;
    997      1.30   mycroft 	int revents = 0;
    998      1.61   thorpej 	int s = splnet();
    999      1.12   mycroft 
   1000       1.1       cgd 	/*
   1001       1.1       cgd 	 * An imitation of the FIONREAD ioctl code.
   1002       1.1       cgd 	 */
   1003      1.44   thorpej 	if (events & (POLLIN | POLLRDNORM)) {
   1004      1.30   mycroft 		if (d->bd_hlen != 0 || (d->bd_immediate && d->bd_slen != 0))
   1005      1.30   mycroft 			revents |= events & (POLLIN | POLLRDNORM);
   1006      1.30   mycroft 		else
   1007      1.30   mycroft 			selrecord(p, &d->bd_sel);
   1008      1.44   thorpej 	}
   1009      1.12   mycroft 
   1010      1.12   mycroft 	splx(s);
   1011      1.30   mycroft 	return (revents);
   1012       1.1       cgd }
   1013       1.1       cgd 
   1014       1.1       cgd /*
   1015       1.2       cgd  * Incoming linkage from device drivers.  Process the packet pkt, of length
   1016       1.2       cgd  * pktlen, which is stored in a contiguous buffer.  The packet is parsed
   1017       1.2       cgd  * by each process' filter, and if accepted, stashed into the corresponding
   1018       1.2       cgd  * buffer.
   1019       1.1       cgd  */
   1020       1.1       cgd void
   1021       1.1       cgd bpf_tap(arg, pkt, pktlen)
   1022       1.1       cgd 	caddr_t arg;
   1023      1.53  augustss 	u_char *pkt;
   1024      1.53  augustss 	u_int pktlen;
   1025       1.1       cgd {
   1026       1.1       cgd 	struct bpf_if *bp;
   1027      1.53  augustss 	struct bpf_d *d;
   1028      1.53  augustss 	u_int slen;
   1029       1.1       cgd 	/*
   1030       1.1       cgd 	 * Note that the ipl does not have to be raised at this point.
   1031       1.1       cgd 	 * The only problem that could arise here is that if two different
   1032       1.1       cgd 	 * interfaces shared any data.  This is not the case.
   1033       1.1       cgd 	 */
   1034       1.1       cgd 	bp = (struct bpf_if *)arg;
   1035       1.1       cgd 	for (d = bp->bif_dlist; d != 0; d = d->bd_next) {
   1036       1.1       cgd 		++d->bd_rcount;
   1037       1.1       cgd 		slen = bpf_filter(d->bd_filter, pkt, pktlen, pktlen);
   1038       1.1       cgd 		if (slen != 0)
   1039      1.41     perry 			catchpacket(d, pkt, pktlen, slen, memcpy);
   1040       1.1       cgd 	}
   1041       1.1       cgd }
   1042       1.1       cgd 
   1043       1.1       cgd /*
   1044       1.1       cgd  * Copy data from an mbuf chain into a buffer.  This code is derived
   1045       1.1       cgd  * from m_copydata in sys/uipc_mbuf.c.
   1046       1.1       cgd  */
   1047      1.43     perry static void *
   1048      1.41     perry bpf_mcpy(dst_arg, src_arg, len)
   1049      1.41     perry 	void *dst_arg;
   1050      1.12   mycroft 	const void *src_arg;
   1051      1.53  augustss 	size_t len;
   1052      1.12   mycroft {
   1053      1.53  augustss 	const struct mbuf *m;
   1054      1.53  augustss 	u_int count;
   1055       1.1       cgd 	u_char *dst;
   1056       1.1       cgd 
   1057      1.12   mycroft 	m = src_arg;
   1058      1.12   mycroft 	dst = dst_arg;
   1059       1.1       cgd 	while (len > 0) {
   1060       1.1       cgd 		if (m == 0)
   1061      1.41     perry 			panic("bpf_mcpy");
   1062      1.12   mycroft 		count = min(m->m_len, len);
   1063      1.41     perry 		memcpy((caddr_t)dst, mtod(m, caddr_t), count);
   1064       1.1       cgd 		m = m->m_next;
   1065       1.1       cgd 		dst += count;
   1066       1.1       cgd 		len -= count;
   1067       1.1       cgd 	}
   1068      1.43     perry 	return(dst_arg);
   1069       1.1       cgd }
   1070       1.1       cgd 
   1071       1.1       cgd /*
   1072       1.2       cgd  * Incoming linkage from device drivers, when packet is in an mbuf chain.
   1073       1.1       cgd  */
   1074       1.1       cgd void
   1075       1.1       cgd bpf_mtap(arg, m)
   1076       1.1       cgd 	caddr_t arg;
   1077       1.1       cgd 	struct mbuf *m;
   1078       1.1       cgd {
   1079       1.1       cgd 	struct bpf_if *bp = (struct bpf_if *)arg;
   1080       1.1       cgd 	struct bpf_d *d;
   1081      1.36  christos 	u_int pktlen, slen;
   1082       1.1       cgd 	struct mbuf *m0;
   1083       1.1       cgd 
   1084       1.1       cgd 	pktlen = 0;
   1085       1.2       cgd 	for (m0 = m; m0 != 0; m0 = m0->m_next)
   1086       1.1       cgd 		pktlen += m0->m_len;
   1087       1.1       cgd 
   1088       1.1       cgd 	for (d = bp->bif_dlist; d != 0; d = d->bd_next) {
   1089       1.1       cgd 		++d->bd_rcount;
   1090       1.1       cgd 		slen = bpf_filter(d->bd_filter, (u_char *)m, pktlen, 0);
   1091       1.1       cgd 		if (slen != 0)
   1092      1.41     perry 			catchpacket(d, (u_char *)m, pktlen, slen, bpf_mcpy);
   1093       1.1       cgd 	}
   1094       1.1       cgd }
   1095       1.1       cgd 
   1096       1.1       cgd /*
   1097       1.1       cgd  * Move the packet data from interface memory (pkt) into the
   1098       1.1       cgd  * store buffer.  Return 1 if it's time to wakeup a listener (buffer full),
   1099       1.2       cgd  * otherwise 0.  "copy" is the routine called to do the actual data
   1100      1.41     perry  * transfer.  memcpy is passed in to copy contiguous chunks, while
   1101      1.41     perry  * bpf_mcpy is passed in to copy mbuf chains.  In the latter case,
   1102       1.2       cgd  * pkt is really an mbuf.
   1103       1.1       cgd  */
   1104       1.1       cgd static void
   1105       1.1       cgd catchpacket(d, pkt, pktlen, snaplen, cpfn)
   1106      1.53  augustss 	struct bpf_d *d;
   1107      1.53  augustss 	u_char *pkt;
   1108      1.53  augustss 	u_int pktlen, snaplen;
   1109      1.53  augustss 	void *(*cpfn) __P((void *, const void *, size_t));
   1110      1.53  augustss {
   1111      1.53  augustss 	struct bpf_hdr *hp;
   1112      1.53  augustss 	int totlen, curlen;
   1113      1.53  augustss 	int hdrlen = d->bd_bif->bif_hdrlen;
   1114       1.1       cgd 	/*
   1115       1.1       cgd 	 * Figure out how many bytes to move.  If the packet is
   1116       1.1       cgd 	 * greater or equal to the snapshot length, transfer that
   1117       1.1       cgd 	 * much.  Otherwise, transfer the whole packet (unless
   1118       1.1       cgd 	 * we hit the buffer size limit).
   1119       1.1       cgd 	 */
   1120      1.12   mycroft 	totlen = hdrlen + min(snaplen, pktlen);
   1121       1.1       cgd 	if (totlen > d->bd_bufsize)
   1122       1.1       cgd 		totlen = d->bd_bufsize;
   1123       1.1       cgd 
   1124       1.1       cgd 	/*
   1125       1.1       cgd 	 * Round up the end of the previous packet to the next longword.
   1126       1.1       cgd 	 */
   1127       1.1       cgd 	curlen = BPF_WORDALIGN(d->bd_slen);
   1128       1.1       cgd 	if (curlen + totlen > d->bd_bufsize) {
   1129       1.1       cgd 		/*
   1130       1.1       cgd 		 * This packet will overflow the storage buffer.
   1131       1.1       cgd 		 * Rotate the buffers if we can, then wakeup any
   1132       1.1       cgd 		 * pending reads.
   1133       1.1       cgd 		 */
   1134       1.1       cgd 		if (d->bd_fbuf == 0) {
   1135      1.12   mycroft 			/*
   1136      1.12   mycroft 			 * We haven't completed the previous read yet,
   1137       1.1       cgd 			 * so drop the packet.
   1138       1.1       cgd 			 */
   1139       1.1       cgd 			++d->bd_dcount;
   1140       1.1       cgd 			return;
   1141       1.1       cgd 		}
   1142       1.1       cgd 		ROTATE_BUFFERS(d);
   1143       1.1       cgd 		bpf_wakeup(d);
   1144       1.1       cgd 		curlen = 0;
   1145       1.1       cgd 	}
   1146      1.12   mycroft 	else if (d->bd_immediate)
   1147       1.1       cgd 		/*
   1148       1.1       cgd 		 * Immediate mode is set.  A packet arrived so any
   1149       1.1       cgd 		 * reads should be woken up.
   1150       1.1       cgd 		 */
   1151       1.1       cgd 		bpf_wakeup(d);
   1152       1.1       cgd 
   1153       1.1       cgd 	/*
   1154       1.1       cgd 	 * Append the bpf header.
   1155       1.1       cgd 	 */
   1156       1.1       cgd 	hp = (struct bpf_hdr *)(d->bd_sbuf + curlen);
   1157       1.2       cgd 	microtime(&hp->bh_tstamp);
   1158       1.1       cgd 	hp->bh_datalen = pktlen;
   1159       1.1       cgd 	hp->bh_hdrlen = hdrlen;
   1160       1.1       cgd 	/*
   1161       1.1       cgd 	 * Copy the packet data into the store buffer and update its length.
   1162       1.1       cgd 	 */
   1163      1.41     perry 	(*cpfn)((u_char *)hp + hdrlen, pkt, (hp->bh_caplen = totlen - hdrlen));
   1164       1.1       cgd 	d->bd_slen = curlen + totlen;
   1165       1.1       cgd }
   1166       1.1       cgd 
   1167      1.12   mycroft /*
   1168       1.1       cgd  * Initialize all nonzero fields of a descriptor.
   1169       1.1       cgd  */
   1170       1.1       cgd static int
   1171       1.2       cgd bpf_allocbufs(d)
   1172      1.53  augustss 	struct bpf_d *d;
   1173       1.1       cgd {
   1174      1.50     enami 
   1175       1.1       cgd 	d->bd_fbuf = (caddr_t)malloc(d->bd_bufsize, M_DEVBUF, M_WAITOK);
   1176       1.1       cgd 	d->bd_sbuf = (caddr_t)malloc(d->bd_bufsize, M_DEVBUF, M_WAITOK);
   1177       1.1       cgd 	d->bd_slen = 0;
   1178       1.1       cgd 	d->bd_hlen = 0;
   1179       1.1       cgd 	return (0);
   1180       1.1       cgd }
   1181       1.1       cgd 
   1182       1.1       cgd /*
   1183       1.2       cgd  * Free buffers currently in use by a descriptor.
   1184       1.2       cgd  * Called on close.
   1185       1.2       cgd  */
   1186       1.2       cgd static void
   1187       1.2       cgd bpf_freed(d)
   1188      1.53  augustss 	struct bpf_d *d;
   1189       1.2       cgd {
   1190       1.2       cgd 	/*
   1191       1.2       cgd 	 * We don't need to lock out interrupts since this descriptor has
   1192       1.2       cgd 	 * been detached from its interface and it yet hasn't been marked
   1193       1.2       cgd 	 * free.
   1194       1.2       cgd 	 */
   1195       1.2       cgd 	if (d->bd_sbuf != 0) {
   1196       1.2       cgd 		free(d->bd_sbuf, M_DEVBUF);
   1197       1.2       cgd 		if (d->bd_hbuf != 0)
   1198       1.2       cgd 			free(d->bd_hbuf, M_DEVBUF);
   1199       1.2       cgd 		if (d->bd_fbuf != 0)
   1200       1.2       cgd 			free(d->bd_fbuf, M_DEVBUF);
   1201       1.2       cgd 	}
   1202       1.2       cgd 	if (d->bd_filter)
   1203       1.2       cgd 		free((caddr_t)d->bd_filter, M_DEVBUF);
   1204       1.2       cgd 
   1205       1.2       cgd 	D_MARKFREE(d);
   1206       1.2       cgd }
   1207       1.2       cgd 
   1208       1.2       cgd /*
   1209      1.60   thorpej  * Attach an interface to bpf.  dlt is the link layer type; hdrlen is the
   1210      1.60   thorpej  * fixed size of the link header (variable length headers not yet supported).
   1211       1.1       cgd  */
   1212       1.1       cgd void
   1213      1.59   thorpej bpfattach(ifp, dlt, hdrlen)
   1214       1.1       cgd 	struct ifnet *ifp;
   1215       1.1       cgd 	u_int dlt, hdrlen;
   1216       1.1       cgd {
   1217       1.1       cgd 	struct bpf_if *bp;
   1218       1.1       cgd 	bp = (struct bpf_if *)malloc(sizeof(*bp), M_DEVBUF, M_DONTWAIT);
   1219      1.12   mycroft 	if (bp == 0)
   1220      1.12   mycroft 		panic("bpfattach");
   1221      1.12   mycroft 
   1222       1.1       cgd 	bp->bif_dlist = 0;
   1223      1.59   thorpej 	bp->bif_driverp = (struct bpf_if **)&ifp->if_bpf;
   1224       1.1       cgd 	bp->bif_ifp = ifp;
   1225       1.1       cgd 	bp->bif_dlt = dlt;
   1226       1.1       cgd 
   1227       1.1       cgd 	bp->bif_next = bpf_iflist;
   1228       1.1       cgd 	bpf_iflist = bp;
   1229       1.1       cgd 
   1230       1.1       cgd 	*bp->bif_driverp = 0;
   1231       1.1       cgd 
   1232       1.1       cgd 	/*
   1233       1.1       cgd 	 * Compute the length of the bpf header.  This is not necessarily
   1234      1.12   mycroft 	 * equal to SIZEOF_BPF_HDR because we want to insert spacing such
   1235      1.12   mycroft 	 * that the network layer header begins on a longword boundary (for
   1236       1.1       cgd 	 * performance reasons and to alleviate alignment restrictions).
   1237       1.1       cgd 	 */
   1238       1.1       cgd 	bp->bif_hdrlen = BPF_WORDALIGN(hdrlen + SIZEOF_BPF_HDR) - hdrlen;
   1239       1.1       cgd 
   1240      1.11   deraadt #if 0
   1241      1.32  christos 	printf("bpf: %s attached\n", ifp->if_xname);
   1242      1.11   deraadt #endif
   1243      1.48   thorpej }
   1244      1.48   thorpej 
   1245      1.48   thorpej /*
   1246      1.48   thorpej  * Remove an interface from bpf.
   1247      1.48   thorpej  */
   1248      1.48   thorpej void
   1249      1.48   thorpej bpfdetach(ifp)
   1250      1.48   thorpej 	struct ifnet *ifp;
   1251      1.48   thorpej {
   1252      1.48   thorpej 	struct bpf_if *bp, **pbp;
   1253      1.51     enami 	struct bpf_d *d;
   1254      1.51     enami 	int i, s, cmaj;
   1255      1.51     enami 
   1256      1.51     enami 	/* locate the major number */
   1257      1.51     enami 	for (cmaj = 0; cmaj <= nchrdev; cmaj++)
   1258      1.51     enami 		if (cdevsw[cmaj].d_open == bpfopen)
   1259      1.51     enami 			break;
   1260      1.51     enami 
   1261      1.52     soren 	/* Nuke the vnodes for any open instances */
   1262      1.51     enami 	for (i = 0; i < NBPFILTER; ++i) {
   1263      1.51     enami 		d = &bpf_dtab[i];
   1264      1.51     enami 		if (!D_ISFREE(d) && d->bd_bif != NULL &&
   1265      1.51     enami 		    d->bd_bif->bif_ifp == ifp) {
   1266      1.51     enami 			/*
   1267      1.51     enami 			 * Detach the descriptor from an interface now.
   1268      1.51     enami 			 * It will be free'ed later by close routine.
   1269      1.51     enami 			 */
   1270      1.61   thorpej 			s = splnet();
   1271      1.51     enami 			d->bd_promisc = 0;	/* we can't touch device. */
   1272      1.51     enami 			bpf_detachd(d);
   1273      1.51     enami 			splx(s);
   1274      1.51     enami 			vdevgone(cmaj, i, i, VCHR);
   1275      1.51     enami 		}
   1276      1.51     enami 	}
   1277      1.48   thorpej 
   1278      1.48   thorpej 	for (bp = bpf_iflist, pbp = &bpf_iflist;
   1279      1.48   thorpej 	     bp != NULL; pbp = &bp->bif_next, bp = bp->bif_next) {
   1280      1.48   thorpej 		if (bp->bif_ifp == ifp) {
   1281      1.48   thorpej 			*pbp = bp->bif_next;
   1282      1.48   thorpej 			free(bp, M_DEVBUF);
   1283      1.48   thorpej 			break;
   1284      1.48   thorpej 		}
   1285      1.48   thorpej 	}
   1286      1.47   thorpej }
   1287      1.47   thorpej 
   1288      1.47   thorpej /*
   1289      1.47   thorpej  * Change the data link type of a BPF instance.
   1290      1.47   thorpej  */
   1291      1.47   thorpej void
   1292      1.59   thorpej bpf_change_type(ifp, dlt, hdrlen)
   1293      1.59   thorpej 	struct ifnet *ifp;
   1294      1.47   thorpej 	u_int dlt, hdrlen;
   1295      1.47   thorpej {
   1296      1.47   thorpej 	struct bpf_if *bp;
   1297      1.47   thorpej 
   1298      1.47   thorpej 	for (bp = bpf_iflist; bp != NULL; bp = bp->bif_next) {
   1299      1.59   thorpej 		if (bp->bif_driverp == (struct bpf_if **)&ifp->if_bpf)
   1300      1.47   thorpej 			break;
   1301      1.47   thorpej 	}
   1302      1.47   thorpej 	if (bp == NULL)
   1303      1.47   thorpej 		panic("bpf_change_type");
   1304      1.47   thorpej 
   1305      1.47   thorpej 	bp->bif_dlt = dlt;
   1306      1.47   thorpej 
   1307      1.47   thorpej 	/*
   1308      1.47   thorpej 	 * Compute the length of the bpf header.  This is not necessarily
   1309      1.47   thorpej 	 * equal to SIZEOF_BPF_HDR because we want to insert spacing such
   1310      1.47   thorpej 	 * that the network layer header begins on a longword boundary (for
   1311      1.47   thorpej 	 * performance reasons and to alleviate alignment restrictions).
   1312      1.47   thorpej 	 */
   1313      1.47   thorpej 	bp->bif_hdrlen = BPF_WORDALIGN(hdrlen + SIZEOF_BPF_HDR) - hdrlen;
   1314       1.1       cgd }
   1315