Home | History | Annotate | Line # | Download | only in altq
altq_subr.c revision 1.16
      1  1.16     peter /*	$NetBSD: altq_subr.c,v 1.16 2006/10/12 19:59:08 peter Exp $	*/
      2  1.16     peter /*	$KAME: altq_subr.c,v 1.24 2005/04/13 03:44:25 suz Exp $	*/
      3   1.1   thorpej 
      4   1.1   thorpej /*
      5  1.16     peter  * Copyright (C) 1997-2003
      6   1.1   thorpej  *	Sony Computer Science Laboratories Inc.  All rights reserved.
      7   1.1   thorpej  *
      8   1.1   thorpej  * Redistribution and use in source and binary forms, with or without
      9   1.1   thorpej  * modification, are permitted provided that the following conditions
     10   1.1   thorpej  * are met:
     11   1.1   thorpej  * 1. Redistributions of source code must retain the above copyright
     12   1.1   thorpej  *    notice, this list of conditions and the following disclaimer.
     13   1.1   thorpej  * 2. Redistributions in binary form must reproduce the above copyright
     14   1.1   thorpej  *    notice, this list of conditions and the following disclaimer in the
     15   1.1   thorpej  *    documentation and/or other materials provided with the distribution.
     16   1.1   thorpej  *
     17   1.1   thorpej  * THIS SOFTWARE IS PROVIDED BY SONY CSL AND CONTRIBUTORS ``AS IS'' AND
     18   1.1   thorpej  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     19   1.1   thorpej  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     20   1.1   thorpej  * ARE DISCLAIMED.  IN NO EVENT SHALL SONY CSL OR CONTRIBUTORS BE LIABLE
     21   1.1   thorpej  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     22   1.1   thorpej  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     23   1.1   thorpej  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     24   1.1   thorpej  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     25   1.1   thorpej  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     26   1.1   thorpej  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     27   1.1   thorpej  * SUCH DAMAGE.
     28   1.1   thorpej  */
     29   1.7     lukem 
     30   1.7     lukem #include <sys/cdefs.h>
     31  1.16     peter __KERNEL_RCSID(0, "$NetBSD: altq_subr.c,v 1.16 2006/10/12 19:59:08 peter Exp $");
     32   1.1   thorpej 
     33  1.16     peter #ifdef _KERNEL_OPT
     34   1.1   thorpej #include "opt_altq.h"
     35   1.1   thorpej #include "opt_inet.h"
     36   1.1   thorpej #endif
     37   1.1   thorpej 
     38   1.1   thorpej #include <sys/param.h>
     39   1.1   thorpej #include <sys/malloc.h>
     40   1.1   thorpej #include <sys/mbuf.h>
     41   1.1   thorpej #include <sys/systm.h>
     42   1.1   thorpej #include <sys/proc.h>
     43   1.1   thorpej #include <sys/socket.h>
     44   1.1   thorpej #include <sys/socketvar.h>
     45   1.1   thorpej #include <sys/kernel.h>
     46   1.1   thorpej #include <sys/errno.h>
     47   1.1   thorpej #include <sys/syslog.h>
     48   1.1   thorpej #include <sys/sysctl.h>
     49   1.1   thorpej #include <sys/queue.h>
     50   1.1   thorpej 
     51   1.1   thorpej #include <net/if.h>
     52   1.1   thorpej #include <net/if_dl.h>
     53   1.1   thorpej #include <net/if_types.h>
     54   1.1   thorpej 
     55   1.1   thorpej #include <netinet/in.h>
     56   1.1   thorpej #include <netinet/in_systm.h>
     57   1.1   thorpej #include <netinet/ip.h>
     58   1.1   thorpej #ifdef INET6
     59   1.1   thorpej #include <netinet/ip6.h>
     60   1.1   thorpej #endif
     61   1.1   thorpej #include <netinet/tcp.h>
     62   1.1   thorpej #include <netinet/udp.h>
     63   1.1   thorpej 
     64  1.16     peter #include <net/pfvar.h>
     65   1.1   thorpej #include <altq/altq.h>
     66  1.16     peter #ifdef ALTQ3_COMPAT
     67   1.1   thorpej #include <altq/altq_conf.h>
     68  1.16     peter #endif
     69   1.1   thorpej 
     70   1.8    itojun /* machine dependent clock related includes */
     71   1.1   thorpej #ifdef __FreeBSD__
     72   1.1   thorpej #include "opt_cpu.h"	/* for FreeBSD-2.2.8 to get i586_ctr_freq */
     73   1.1   thorpej #include <machine/clock.h>
     74   1.1   thorpej #endif
     75   1.8    itojun #if defined(__i386__)
     76  1.16     peter #include <machine/cpufunc.h>		/* for pentium tsc */
     77   1.8    itojun #include <machine/specialreg.h>		/* for CPUID_TSC */
     78   1.8    itojun #ifdef __FreeBSD__
     79   1.8    itojun #include <machine/md_var.h>		/* for cpu_feature */
     80   1.8    itojun #elif defined(__NetBSD__) || defined(__OpenBSD__)
     81   1.8    itojun #include <machine/cpu.h>		/* for cpu_feature */
     82   1.8    itojun #endif
     83   1.8    itojun #endif /* __i386__ */
     84   1.1   thorpej 
     85   1.1   thorpej /*
     86   1.1   thorpej  * internal function prototypes
     87   1.1   thorpej  */
     88  1.16     peter static void	tbr_timeout(void *);
     89  1.16     peter int (*altq_input)(struct mbuf *, int) = NULL;
     90  1.16     peter static int tbr_timer = 0;	/* token bucket regulator timer */
     91  1.16     peter static struct callout tbr_callout = CALLOUT_INITIALIZER;
     92  1.16     peter 
     93  1.16     peter int pfaltq_running;	/* keep track of running state */
     94  1.16     peter 
     95  1.16     peter #ifdef ALTQ3_CLFIER_COMPAT
     96  1.16     peter static int 	extract_ports4(struct mbuf *, struct ip *, struct flowinfo_in *);
     97   1.1   thorpej #ifdef INET6
     98  1.16     peter static int 	extract_ports6(struct mbuf *, struct ip6_hdr *,
     99  1.16     peter 			       struct flowinfo_in6 *);
    100   1.1   thorpej #endif
    101  1.16     peter static int	apply_filter4(u_int32_t, struct flow_filter *,
    102  1.16     peter 			      struct flowinfo_in *);
    103  1.16     peter static int	apply_ppfilter4(u_int32_t, struct flow_filter *,
    104  1.16     peter 				struct flowinfo_in *);
    105   1.1   thorpej #ifdef INET6
    106  1.16     peter static int	apply_filter6(u_int32_t, struct flow_filter6 *,
    107  1.16     peter 			      struct flowinfo_in6 *);
    108   1.1   thorpej #endif
    109  1.16     peter static int	apply_tosfilter4(u_int32_t, struct flow_filter *,
    110  1.16     peter 				 struct flowinfo_in *);
    111  1.16     peter static u_long	get_filt_handle(struct acc_classifier *, int);
    112  1.16     peter static struct acc_filter *filth_to_filtp(struct acc_classifier *, u_long);
    113  1.16     peter static u_int32_t filt2fibmask(struct flow_filter *);
    114  1.16     peter 
    115  1.16     peter static void 	ip4f_cache(struct ip *, struct flowinfo_in *);
    116  1.16     peter static int 	ip4f_lookup(struct ip *, struct flowinfo_in *);
    117  1.16     peter static int 	ip4f_init(void);
    118  1.16     peter static struct ip4_frag	*ip4f_alloc(void);
    119  1.16     peter static void 	ip4f_free(struct ip4_frag *);
    120  1.16     peter #endif /* ALTQ3_CLFIER_COMPAT */
    121   1.1   thorpej 
    122   1.1   thorpej /*
    123   1.1   thorpej  * alternate queueing support routines
    124   1.1   thorpej  */
    125   1.1   thorpej 
    126  1.16     peter /* look up the queue state by the interface name and the queueing type. */
    127   1.1   thorpej void *
    128  1.16     peter altq_lookup(char *name, int type)
    129   1.1   thorpej {
    130   1.1   thorpej 	struct ifnet *ifp;
    131   1.1   thorpej 
    132   1.1   thorpej 	if ((ifp = ifunit(name)) != NULL) {
    133   1.1   thorpej 		if (type != ALTQT_NONE && ifp->if_snd.altq_type == type)
    134   1.1   thorpej 			return (ifp->if_snd.altq_disc);
    135   1.1   thorpej 	}
    136   1.1   thorpej 
    137   1.1   thorpej 	return NULL;
    138   1.1   thorpej }
    139   1.1   thorpej 
    140   1.1   thorpej int
    141  1.16     peter altq_attach(struct ifaltq *ifq, int type, void *discipline,
    142  1.16     peter     int (*enqueue)(struct ifaltq *, struct mbuf *, struct altq_pktattr *),
    143  1.16     peter     struct mbuf *(*dequeue)(struct ifaltq *, int),
    144  1.16     peter     int (*request)(struct ifaltq *, int, void *),
    145  1.16     peter     void *clfier, void *(*classify)(void *, struct mbuf *, int))
    146   1.1   thorpej {
    147   1.1   thorpej 	if (!ALTQ_IS_READY(ifq))
    148   1.1   thorpej 		return ENXIO;
    149  1.16     peter 
    150  1.16     peter #ifdef ALTQ3_COMPAT
    151  1.16     peter 	/*
    152  1.16     peter 	 * pfaltq can override the existing discipline, but altq3 cannot.
    153  1.16     peter 	 * check these if clfier is not NULL (which implies altq3).
    154  1.16     peter 	 */
    155  1.16     peter 	if (clfier != NULL) {
    156  1.16     peter 		if (ALTQ_IS_ENABLED(ifq))
    157  1.16     peter 			return EBUSY;
    158  1.16     peter 		if (ALTQ_IS_ATTACHED(ifq))
    159  1.16     peter 			return EEXIST;
    160  1.16     peter 	}
    161  1.16     peter #endif
    162   1.1   thorpej 	ifq->altq_type     = type;
    163   1.1   thorpej 	ifq->altq_disc     = discipline;
    164   1.1   thorpej 	ifq->altq_enqueue  = enqueue;
    165   1.1   thorpej 	ifq->altq_dequeue  = dequeue;
    166   1.1   thorpej 	ifq->altq_request  = request;
    167   1.1   thorpej 	ifq->altq_clfier   = clfier;
    168   1.1   thorpej 	ifq->altq_classify = classify;
    169  1.16     peter 	ifq->altq_flags &= (ALTQF_CANTCHANGE|ALTQF_ENABLED);
    170  1.16     peter #ifdef ALTQ3_COMPAT
    171   1.1   thorpej #ifdef ALTQ_KLD
    172   1.1   thorpej 	altq_module_incref(type);
    173   1.1   thorpej #endif
    174  1.16     peter #endif
    175   1.1   thorpej 	return 0;
    176   1.1   thorpej }
    177   1.1   thorpej 
    178   1.1   thorpej int
    179  1.16     peter altq_detach(struct ifaltq *ifq)
    180   1.1   thorpej {
    181   1.1   thorpej 	if (!ALTQ_IS_READY(ifq))
    182   1.1   thorpej 		return ENXIO;
    183   1.1   thorpej 	if (ALTQ_IS_ENABLED(ifq))
    184   1.1   thorpej 		return EBUSY;
    185   1.1   thorpej 	if (!ALTQ_IS_ATTACHED(ifq))
    186   1.1   thorpej 		return (0);
    187  1.16     peter #ifdef ALTQ3_COMPAT
    188   1.1   thorpej #ifdef ALTQ_KLD
    189   1.1   thorpej 	altq_module_declref(ifq->altq_type);
    190   1.1   thorpej #endif
    191  1.16     peter #endif
    192  1.16     peter 
    193   1.1   thorpej 	ifq->altq_type     = ALTQT_NONE;
    194   1.1   thorpej 	ifq->altq_disc     = NULL;
    195   1.1   thorpej 	ifq->altq_enqueue  = NULL;
    196   1.1   thorpej 	ifq->altq_dequeue  = NULL;
    197   1.1   thorpej 	ifq->altq_request  = NULL;
    198   1.1   thorpej 	ifq->altq_clfier   = NULL;
    199   1.1   thorpej 	ifq->altq_classify = NULL;
    200   1.1   thorpej 	ifq->altq_flags &= ALTQF_CANTCHANGE;
    201   1.1   thorpej 	return 0;
    202   1.1   thorpej }
    203   1.1   thorpej 
    204   1.1   thorpej int
    205  1.16     peter altq_enable(struct ifaltq *ifq)
    206   1.1   thorpej {
    207   1.1   thorpej 	int s;
    208  1.12     perry 
    209   1.1   thorpej 	if (!ALTQ_IS_READY(ifq))
    210   1.1   thorpej 		return ENXIO;
    211   1.1   thorpej 	if (ALTQ_IS_ENABLED(ifq))
    212   1.1   thorpej 		return 0;
    213   1.1   thorpej 
    214   1.5   thorpej 	s = splnet();
    215   1.1   thorpej 	IFQ_PURGE(ifq);
    216   1.1   thorpej 	ASSERT(ifq->ifq_len == 0);
    217   1.1   thorpej 	ifq->altq_flags |= ALTQF_ENABLED;
    218   1.1   thorpej 	if (ifq->altq_clfier != NULL)
    219   1.1   thorpej 		ifq->altq_flags |= ALTQF_CLASSIFY;
    220   1.1   thorpej 	splx(s);
    221   1.1   thorpej 
    222   1.1   thorpej 	return 0;
    223   1.1   thorpej }
    224   1.1   thorpej 
    225   1.1   thorpej int
    226  1.16     peter altq_disable(struct ifaltq *ifq)
    227   1.1   thorpej {
    228   1.1   thorpej 	int s;
    229  1.12     perry 
    230   1.1   thorpej 	if (!ALTQ_IS_ENABLED(ifq))
    231   1.1   thorpej 		return 0;
    232   1.1   thorpej 
    233   1.5   thorpej 	s = splnet();
    234   1.1   thorpej 	IFQ_PURGE(ifq);
    235   1.1   thorpej 	ASSERT(ifq->ifq_len == 0);
    236   1.1   thorpej 	ifq->altq_flags &= ~(ALTQF_ENABLED|ALTQF_CLASSIFY);
    237   1.1   thorpej 	splx(s);
    238   1.1   thorpej 	return 0;
    239   1.1   thorpej }
    240   1.1   thorpej 
    241  1.16     peter #ifdef ALTQ_DEBUG
    242   1.1   thorpej void
    243  1.16     peter altq_assert(const char *file, int line, const char *failedexpr)
    244   1.1   thorpej {
    245   1.1   thorpej 	(void)printf("altq assertion \"%s\" failed: file \"%s\", line %d\n",
    246   1.1   thorpej 		     failedexpr, file, line);
    247   1.1   thorpej 	panic("altq assertion");
    248   1.1   thorpej 	/* NOTREACHED */
    249   1.1   thorpej }
    250  1.16     peter #endif
    251   1.1   thorpej 
    252   1.1   thorpej /*
    253   1.1   thorpej  * internal representation of token bucket parameters
    254  1.16     peter  *	rate:	byte_per_unittime << 32
    255   1.1   thorpej  *		(((bits_per_sec) / 8) << 32) / machclk_freq
    256   1.1   thorpej  *	depth:	byte << 32
    257   1.1   thorpej  *
    258   1.1   thorpej  */
    259   1.1   thorpej #define	TBR_SHIFT	32
    260   1.1   thorpej #define	TBR_SCALE(x)	((int64_t)(x) << TBR_SHIFT)
    261   1.1   thorpej #define	TBR_UNSCALE(x)	((x) >> TBR_SHIFT)
    262   1.1   thorpej 
    263   1.1   thorpej struct mbuf *
    264  1.16     peter tbr_dequeue(struct ifaltq *ifq, int op)
    265   1.1   thorpej {
    266   1.1   thorpej 	struct tb_regulator *tbr;
    267   1.1   thorpej 	struct mbuf *m;
    268   1.1   thorpej 	int64_t interval;
    269   1.1   thorpej 	u_int64_t now;
    270   1.1   thorpej 
    271   1.1   thorpej 	tbr = ifq->altq_tbr;
    272   1.1   thorpej 	if (op == ALTDQ_REMOVE && tbr->tbr_lastop == ALTDQ_POLL) {
    273   1.1   thorpej 		/* if this is a remove after poll, bypass tbr check */
    274   1.1   thorpej 	} else {
    275   1.1   thorpej 		/* update token only when it is negative */
    276   1.1   thorpej 		if (tbr->tbr_token <= 0) {
    277   1.1   thorpej 			now = read_machclk();
    278   1.1   thorpej 			interval = now - tbr->tbr_last;
    279   1.1   thorpej 			if (interval >= tbr->tbr_filluptime)
    280   1.1   thorpej 				tbr->tbr_token = tbr->tbr_depth;
    281   1.1   thorpej 			else {
    282   1.1   thorpej 				tbr->tbr_token += interval * tbr->tbr_rate;
    283   1.1   thorpej 				if (tbr->tbr_token > tbr->tbr_depth)
    284   1.1   thorpej 					tbr->tbr_token = tbr->tbr_depth;
    285   1.1   thorpej 			}
    286   1.1   thorpej 			tbr->tbr_last = now;
    287   1.1   thorpej 		}
    288   1.1   thorpej 		/* if token is still negative, don't allow dequeue */
    289   1.1   thorpej 		if (tbr->tbr_token <= 0)
    290   1.1   thorpej 			return (NULL);
    291   1.1   thorpej 	}
    292   1.1   thorpej 
    293   1.1   thorpej 	if (ALTQ_IS_ENABLED(ifq))
    294   1.1   thorpej 		m = (*ifq->altq_dequeue)(ifq, op);
    295   1.1   thorpej 	else {
    296   1.1   thorpej 		if (op == ALTDQ_POLL)
    297   1.1   thorpej 			IF_POLL(ifq, m);
    298   1.1   thorpej 		else
    299   1.1   thorpej 			IF_DEQUEUE(ifq, m);
    300   1.1   thorpej 	}
    301   1.1   thorpej 
    302   1.1   thorpej 	if (m != NULL && op == ALTDQ_REMOVE)
    303   1.1   thorpej 		tbr->tbr_token -= TBR_SCALE(m_pktlen(m));
    304   1.1   thorpej 	tbr->tbr_lastop = op;
    305   1.1   thorpej 	return (m);
    306   1.1   thorpej }
    307   1.1   thorpej 
    308   1.1   thorpej /*
    309   1.1   thorpej  * set a token bucket regulator.
    310   1.1   thorpej  * if the specified rate is zero, the token bucket regulator is deleted.
    311   1.1   thorpej  */
    312   1.1   thorpej int
    313  1.16     peter tbr_set(struct ifaltq *ifq, struct tb_profile *profile)
    314   1.1   thorpej {
    315   1.1   thorpej 	struct tb_regulator *tbr, *otbr;
    316   1.1   thorpej 
    317   1.1   thorpej 	if (machclk_freq == 0)
    318   1.1   thorpej 		init_machclk();
    319   1.1   thorpej 	if (machclk_freq == 0) {
    320  1.11       wiz 		printf("tbr_set: no CPU clock available!\n");
    321   1.1   thorpej 		return (ENXIO);
    322   1.1   thorpej 	}
    323  1.12     perry 
    324   1.1   thorpej 	if (profile->rate == 0) {
    325   1.1   thorpej 		/* delete this tbr */
    326   1.1   thorpej 		if ((tbr = ifq->altq_tbr) == NULL)
    327   1.1   thorpej 			return (ENOENT);
    328   1.1   thorpej 		ifq->altq_tbr = NULL;
    329  1.14  christos 		free(tbr, M_DEVBUF);
    330   1.1   thorpej 		return (0);
    331   1.1   thorpej 	}
    332   1.1   thorpej 
    333  1.14  christos 	tbr = malloc(sizeof(struct tb_regulator), M_DEVBUF, M_WAITOK|M_ZERO);
    334   1.1   thorpej 	if (tbr == NULL)
    335   1.1   thorpej 		return (ENOMEM);
    336   1.1   thorpej 
    337   1.1   thorpej 	tbr->tbr_rate = TBR_SCALE(profile->rate / 8) / machclk_freq;
    338   1.1   thorpej 	tbr->tbr_depth = TBR_SCALE(profile->depth);
    339   1.1   thorpej 	if (tbr->tbr_rate > 0)
    340   1.1   thorpej 		tbr->tbr_filluptime = tbr->tbr_depth / tbr->tbr_rate;
    341   1.1   thorpej 	else
    342   1.1   thorpej 		tbr->tbr_filluptime = 0xffffffffffffffffLL;
    343   1.1   thorpej 	tbr->tbr_token = tbr->tbr_depth;
    344   1.1   thorpej 	tbr->tbr_last = read_machclk();
    345   1.1   thorpej 	tbr->tbr_lastop = ALTDQ_REMOVE;
    346   1.1   thorpej 
    347   1.1   thorpej 	otbr = ifq->altq_tbr;
    348   1.1   thorpej 	ifq->altq_tbr = tbr;	/* set the new tbr */
    349   1.1   thorpej 
    350   1.1   thorpej 	if (otbr != NULL)
    351  1.14  christos 		free(otbr, M_DEVBUF);
    352   1.1   thorpej 	else {
    353   1.1   thorpej 		if (tbr_timer == 0) {
    354   1.1   thorpej 			CALLOUT_RESET(&tbr_callout, 1, tbr_timeout, (void *)0);
    355   1.1   thorpej 			tbr_timer = 1;
    356   1.1   thorpej 		}
    357   1.1   thorpej 	}
    358   1.1   thorpej 	return (0);
    359   1.1   thorpej }
    360   1.1   thorpej 
    361   1.1   thorpej /*
    362   1.1   thorpej  * tbr_timeout goes through the interface list, and kicks the drivers
    363   1.1   thorpej  * if necessary.
    364   1.1   thorpej  */
    365   1.1   thorpej static void
    366  1.15  christos tbr_timeout(void *arg __unused)
    367   1.1   thorpej {
    368   1.1   thorpej 	struct ifnet *ifp;
    369   1.1   thorpej 	int active, s;
    370   1.1   thorpej 
    371   1.1   thorpej 	active = 0;
    372   1.5   thorpej 	s = splnet();
    373  1.16     peter 	for (ifp = TAILQ_FIRST(&ifnet); ifp; ifp = TAILQ_NEXT(ifp, if_list)) {
    374   1.1   thorpej 		if (!TBR_IS_ENABLED(&ifp->if_snd))
    375   1.1   thorpej 			continue;
    376   1.1   thorpej 		active++;
    377   1.1   thorpej 		if (!IFQ_IS_EMPTY(&ifp->if_snd) && ifp->if_start != NULL)
    378   1.1   thorpej 			(*ifp->if_start)(ifp);
    379  1.16     peter 	}
    380  1.16     peter 	splx(s);
    381  1.16     peter 	if (active > 0)
    382  1.16     peter 		CALLOUT_RESET(&tbr_callout, 1, tbr_timeout, (void *)0);
    383  1.16     peter 	else
    384  1.16     peter 		tbr_timer = 0;	/* don't need tbr_timer anymore */
    385  1.16     peter #if defined(__alpha__) && !defined(ALTQ_NOPCC)
    386  1.16     peter 	{
    387  1.16     peter 		/*
    388  1.16     peter 		 * XXX read out the machine dependent clock once a second
    389  1.16     peter 		 * to detect counter wrap-around.
    390  1.16     peter 		 */
    391  1.16     peter 		static u_int cnt;
    392  1.16     peter 
    393  1.16     peter 		if (++cnt >= hz) {
    394  1.16     peter 			(void)read_machclk();
    395  1.16     peter 			cnt = 0;
    396  1.16     peter 		}
    397  1.16     peter 	}
    398  1.16     peter #endif /* __alpha__ && !ALTQ_NOPCC */
    399  1.16     peter }
    400  1.16     peter 
    401  1.16     peter /*
    402  1.16     peter  * get token bucket regulator profile
    403  1.16     peter  */
    404  1.16     peter int
    405  1.16     peter tbr_get(struct ifaltq *ifq, struct tb_profile *profile)
    406  1.16     peter {
    407  1.16     peter 	struct tb_regulator *tbr;
    408  1.16     peter 
    409  1.16     peter 	if ((tbr = ifq->altq_tbr) == NULL) {
    410  1.16     peter 		profile->rate = 0;
    411  1.16     peter 		profile->depth = 0;
    412  1.16     peter 	} else {
    413  1.16     peter 		profile->rate =
    414  1.16     peter 		    (u_int)TBR_UNSCALE(tbr->tbr_rate * 8 * machclk_freq);
    415  1.16     peter 		profile->depth = (u_int)TBR_UNSCALE(tbr->tbr_depth);
    416  1.16     peter 	}
    417  1.16     peter 	return (0);
    418  1.16     peter }
    419  1.16     peter 
    420  1.16     peter /*
    421  1.16     peter  * attach a discipline to the interface.  if one already exists, it is
    422  1.16     peter  * overridden.
    423  1.16     peter  */
    424  1.16     peter int
    425  1.16     peter altq_pfattach(struct pf_altq *a)
    426  1.16     peter {
    427  1.16     peter 	struct ifnet *ifp;
    428  1.16     peter 	struct tb_profile tb;
    429  1.16     peter 	int s, error = 0;
    430  1.16     peter 
    431  1.16     peter 	switch (a->scheduler) {
    432  1.16     peter 	case ALTQT_NONE:
    433  1.16     peter 		break;
    434  1.16     peter #ifdef ALTQ_CBQ
    435  1.16     peter 	case ALTQT_CBQ:
    436  1.16     peter 		error = cbq_pfattach(a);
    437  1.16     peter 		break;
    438  1.16     peter #endif
    439  1.16     peter #ifdef ALTQ_PRIQ
    440  1.16     peter 	case ALTQT_PRIQ:
    441  1.16     peter 		error = priq_pfattach(a);
    442  1.16     peter 		break;
    443  1.16     peter #endif
    444  1.16     peter #ifdef ALTQ_HFSC
    445  1.16     peter 	case ALTQT_HFSC:
    446  1.16     peter 		error = hfsc_pfattach(a);
    447  1.16     peter 		break;
    448  1.16     peter #endif
    449  1.16     peter 	default:
    450  1.16     peter 		error = ENXIO;
    451  1.16     peter 	}
    452  1.16     peter 
    453  1.16     peter 	ifp = ifunit(a->ifname);
    454  1.16     peter 
    455  1.16     peter 	/* if the state is running, enable altq */
    456  1.16     peter 	if (error == 0 && pfaltq_running &&
    457  1.16     peter 	    ifp != NULL && ifp->if_snd.altq_type != ALTQT_NONE &&
    458  1.16     peter 	    !ALTQ_IS_ENABLED(&ifp->if_snd))
    459  1.16     peter 			error = altq_enable(&ifp->if_snd);
    460  1.16     peter 
    461  1.16     peter 	/* if altq is already enabled, reset set tokenbucket regulator */
    462  1.16     peter 	if (error == 0 && ifp != NULL && ALTQ_IS_ENABLED(&ifp->if_snd)) {
    463  1.16     peter 		tb.rate = a->ifbandwidth;
    464  1.16     peter 		tb.depth = a->tbrsize;
    465  1.16     peter 		s = splnet();
    466  1.16     peter 		error = tbr_set(&ifp->if_snd, &tb);
    467  1.16     peter 		splx(s);
    468  1.16     peter 	}
    469  1.16     peter 
    470  1.16     peter 	return (error);
    471  1.16     peter }
    472  1.16     peter 
    473  1.16     peter /*
    474  1.16     peter  * detach a discipline from the interface.
    475  1.16     peter  * it is possible that the discipline was already overridden by another
    476  1.16     peter  * discipline.
    477  1.16     peter  */
    478  1.16     peter int
    479  1.16     peter altq_pfdetach(struct pf_altq *a)
    480  1.16     peter {
    481  1.16     peter 	struct ifnet *ifp;
    482  1.16     peter 	int s, error = 0;
    483  1.16     peter 
    484  1.16     peter 	if ((ifp = ifunit(a->ifname)) == NULL)
    485  1.16     peter 		return (EINVAL);
    486  1.16     peter 
    487  1.16     peter 	/* if this discipline is no longer referenced, just return */
    488  1.16     peter 	if (a->altq_disc == NULL || a->altq_disc != ifp->if_snd.altq_disc)
    489  1.16     peter 		return (0);
    490  1.16     peter 
    491  1.16     peter 	s = splnet();
    492  1.16     peter 	if (ALTQ_IS_ENABLED(&ifp->if_snd))
    493  1.16     peter 		error = altq_disable(&ifp->if_snd);
    494  1.16     peter 	if (error == 0)
    495  1.16     peter 		error = altq_detach(&ifp->if_snd);
    496  1.16     peter 	splx(s);
    497  1.16     peter 
    498  1.16     peter 	return (error);
    499  1.16     peter }
    500  1.16     peter 
    501  1.16     peter /*
    502  1.16     peter  * add a discipline or a queue
    503  1.16     peter  */
    504  1.16     peter int
    505  1.16     peter altq_add(struct pf_altq *a)
    506  1.16     peter {
    507  1.16     peter 	int error = 0;
    508  1.16     peter 
    509  1.16     peter 	if (a->qname[0] != 0)
    510  1.16     peter 		return (altq_add_queue(a));
    511  1.16     peter 
    512  1.16     peter 	if (machclk_freq == 0)
    513  1.16     peter 		init_machclk();
    514  1.16     peter 	if (machclk_freq == 0)
    515  1.16     peter 		panic("altq_add: no CPU clock");
    516  1.16     peter 
    517  1.16     peter 	switch (a->scheduler) {
    518  1.16     peter #ifdef ALTQ_CBQ
    519  1.16     peter 	case ALTQT_CBQ:
    520  1.16     peter 		error = cbq_add_altq(a);
    521  1.16     peter 		break;
    522  1.16     peter #endif
    523  1.16     peter #ifdef ALTQ_PRIQ
    524  1.16     peter 	case ALTQT_PRIQ:
    525  1.16     peter 		error = priq_add_altq(a);
    526  1.16     peter 		break;
    527  1.16     peter #endif
    528  1.16     peter #ifdef ALTQ_HFSC
    529  1.16     peter 	case ALTQT_HFSC:
    530  1.16     peter 		error = hfsc_add_altq(a);
    531  1.16     peter 		break;
    532  1.16     peter #endif
    533  1.16     peter 	default:
    534  1.16     peter 		error = ENXIO;
    535  1.16     peter 	}
    536  1.16     peter 
    537  1.16     peter 	return (error);
    538  1.16     peter }
    539  1.16     peter 
    540  1.16     peter /*
    541  1.16     peter  * remove a discipline or a queue
    542  1.16     peter  */
    543  1.16     peter int
    544  1.16     peter altq_remove(struct pf_altq *a)
    545  1.16     peter {
    546  1.16     peter 	int error = 0;
    547  1.16     peter 
    548  1.16     peter 	if (a->qname[0] != 0)
    549  1.16     peter 		return (altq_remove_queue(a));
    550  1.16     peter 
    551  1.16     peter 	switch (a->scheduler) {
    552  1.16     peter #ifdef ALTQ_CBQ
    553  1.16     peter 	case ALTQT_CBQ:
    554  1.16     peter 		error = cbq_remove_altq(a);
    555  1.16     peter 		break;
    556  1.16     peter #endif
    557  1.16     peter #ifdef ALTQ_PRIQ
    558  1.16     peter 	case ALTQT_PRIQ:
    559  1.16     peter 		error = priq_remove_altq(a);
    560  1.16     peter 		break;
    561  1.16     peter #endif
    562  1.16     peter #ifdef ALTQ_HFSC
    563  1.16     peter 	case ALTQT_HFSC:
    564  1.16     peter 		error = hfsc_remove_altq(a);
    565  1.16     peter 		break;
    566  1.16     peter #endif
    567  1.16     peter 	default:
    568  1.16     peter 		error = ENXIO;
    569  1.16     peter 	}
    570  1.16     peter 
    571  1.16     peter 	return (error);
    572  1.16     peter }
    573  1.16     peter 
    574  1.16     peter /*
    575  1.16     peter  * add a queue to the discipline
    576  1.16     peter  */
    577  1.16     peter int
    578  1.16     peter altq_add_queue(struct pf_altq *a)
    579  1.16     peter {
    580  1.16     peter 	int error = 0;
    581  1.16     peter 
    582  1.16     peter 	switch (a->scheduler) {
    583  1.16     peter #ifdef ALTQ_CBQ
    584  1.16     peter 	case ALTQT_CBQ:
    585  1.16     peter 		error = cbq_add_queue(a);
    586  1.16     peter 		break;
    587  1.16     peter #endif
    588  1.16     peter #ifdef ALTQ_PRIQ
    589  1.16     peter 	case ALTQT_PRIQ:
    590  1.16     peter 		error = priq_add_queue(a);
    591  1.16     peter 		break;
    592  1.16     peter #endif
    593  1.16     peter #ifdef ALTQ_HFSC
    594  1.16     peter 	case ALTQT_HFSC:
    595  1.16     peter 		error = hfsc_add_queue(a);
    596  1.16     peter 		break;
    597  1.16     peter #endif
    598  1.16     peter 	default:
    599  1.16     peter 		error = ENXIO;
    600  1.16     peter 	}
    601  1.16     peter 
    602  1.16     peter 	return (error);
    603  1.16     peter }
    604  1.16     peter 
    605  1.16     peter /*
    606  1.16     peter  * remove a queue from the discipline
    607  1.16     peter  */
    608  1.16     peter int
    609  1.16     peter altq_remove_queue(struct pf_altq *a)
    610  1.16     peter {
    611  1.16     peter 	int error = 0;
    612  1.16     peter 
    613  1.16     peter 	switch (a->scheduler) {
    614  1.16     peter #ifdef ALTQ_CBQ
    615  1.16     peter 	case ALTQT_CBQ:
    616  1.16     peter 		error = cbq_remove_queue(a);
    617  1.16     peter 		break;
    618  1.16     peter #endif
    619  1.16     peter #ifdef ALTQ_PRIQ
    620  1.16     peter 	case ALTQT_PRIQ:
    621  1.16     peter 		error = priq_remove_queue(a);
    622  1.16     peter 		break;
    623  1.16     peter #endif
    624  1.16     peter #ifdef ALTQ_HFSC
    625  1.16     peter 	case ALTQT_HFSC:
    626  1.16     peter 		error = hfsc_remove_queue(a);
    627  1.16     peter 		break;
    628  1.16     peter #endif
    629  1.16     peter 	default:
    630  1.16     peter 		error = ENXIO;
    631  1.16     peter 	}
    632  1.16     peter 
    633  1.16     peter 	return (error);
    634  1.16     peter }
    635  1.16     peter 
    636  1.16     peter /*
    637  1.16     peter  * get queue statistics
    638  1.16     peter  */
    639  1.16     peter int
    640  1.16     peter altq_getqstats(struct pf_altq *a, void *ubuf, int *nbytes)
    641  1.16     peter {
    642  1.16     peter 	int error = 0;
    643  1.16     peter 
    644  1.16     peter 	switch (a->scheduler) {
    645  1.16     peter #ifdef ALTQ_CBQ
    646  1.16     peter 	case ALTQT_CBQ:
    647  1.16     peter 		error = cbq_getqstats(a, ubuf, nbytes);
    648  1.16     peter 		break;
    649  1.16     peter #endif
    650  1.16     peter #ifdef ALTQ_PRIQ
    651  1.16     peter 	case ALTQT_PRIQ:
    652  1.16     peter 		error = priq_getqstats(a, ubuf, nbytes);
    653  1.16     peter 		break;
    654  1.16     peter #endif
    655  1.16     peter #ifdef ALTQ_HFSC
    656  1.16     peter 	case ALTQT_HFSC:
    657  1.16     peter 		error = hfsc_getqstats(a, ubuf, nbytes);
    658  1.16     peter 		break;
    659  1.16     peter #endif
    660  1.16     peter 	default:
    661  1.16     peter 		error = ENXIO;
    662  1.16     peter 	}
    663  1.16     peter 
    664  1.16     peter 	return (error);
    665  1.16     peter }
    666  1.16     peter 
    667  1.16     peter /*
    668  1.16     peter  * read and write diffserv field in IPv4 or IPv6 header
    669  1.16     peter  */
    670  1.16     peter u_int8_t
    671  1.16     peter read_dsfield(struct mbuf *m, struct altq_pktattr *pktattr)
    672  1.16     peter {
    673  1.16     peter 	struct mbuf *m0;
    674  1.16     peter 	u_int8_t ds_field = 0;
    675  1.16     peter 
    676  1.16     peter 	if (pktattr == NULL ||
    677  1.16     peter 	    (pktattr->pattr_af != AF_INET && pktattr->pattr_af != AF_INET6))
    678  1.16     peter 		return ((u_int8_t)0);
    679  1.16     peter 
    680  1.16     peter 	/* verify that pattr_hdr is within the mbuf data */
    681  1.16     peter 	for (m0 = m; m0 != NULL; m0 = m0->m_next)
    682  1.16     peter 		if ((pktattr->pattr_hdr >= m0->m_data) &&
    683  1.16     peter 		    (pktattr->pattr_hdr < m0->m_data + m0->m_len))
    684  1.16     peter 			break;
    685  1.16     peter 	if (m0 == NULL) {
    686  1.16     peter 		/* ick, pattr_hdr is stale */
    687  1.16     peter 		pktattr->pattr_af = AF_UNSPEC;
    688  1.16     peter #ifdef ALTQ_DEBUG
    689  1.16     peter 		printf("read_dsfield: can't locate header!\n");
    690  1.16     peter #endif
    691  1.16     peter 		return ((u_int8_t)0);
    692  1.16     peter 	}
    693  1.16     peter 
    694  1.16     peter 	if (pktattr->pattr_af == AF_INET) {
    695  1.16     peter 		struct ip *ip = (struct ip *)pktattr->pattr_hdr;
    696  1.16     peter 
    697  1.16     peter 		if (ip->ip_v != 4)
    698  1.16     peter 			return ((u_int8_t)0);	/* version mismatch! */
    699  1.16     peter 		ds_field = ip->ip_tos;
    700  1.16     peter 	}
    701  1.16     peter #ifdef INET6
    702  1.16     peter 	else if (pktattr->pattr_af == AF_INET6) {
    703  1.16     peter 		struct ip6_hdr *ip6 = (struct ip6_hdr *)pktattr->pattr_hdr;
    704  1.16     peter 		u_int32_t flowlabel;
    705  1.16     peter 
    706  1.16     peter 		flowlabel = ntohl(ip6->ip6_flow);
    707  1.16     peter 		if ((flowlabel >> 28) != 6)
    708  1.16     peter 			return ((u_int8_t)0);	/* version mismatch! */
    709  1.16     peter 		ds_field = (flowlabel >> 20) & 0xff;
    710  1.16     peter 	}
    711  1.16     peter #endif
    712  1.16     peter 	return (ds_field);
    713  1.16     peter }
    714  1.16     peter 
    715  1.16     peter void
    716  1.16     peter write_dsfield(struct mbuf *m, struct altq_pktattr *pktattr, u_int8_t dsfield)
    717  1.16     peter {
    718  1.16     peter 	struct mbuf *m0;
    719  1.16     peter 
    720  1.16     peter 	if (pktattr == NULL ||
    721  1.16     peter 	    (pktattr->pattr_af != AF_INET && pktattr->pattr_af != AF_INET6))
    722  1.16     peter 		return;
    723  1.16     peter 
    724  1.16     peter 	/* verify that pattr_hdr is within the mbuf data */
    725  1.16     peter 	for (m0 = m; m0 != NULL; m0 = m0->m_next)
    726  1.16     peter 		if ((pktattr->pattr_hdr >= m0->m_data) &&
    727  1.16     peter 		    (pktattr->pattr_hdr < m0->m_data + m0->m_len))
    728  1.16     peter 			break;
    729  1.16     peter 	if (m0 == NULL) {
    730  1.16     peter 		/* ick, pattr_hdr is stale */
    731  1.16     peter 		pktattr->pattr_af = AF_UNSPEC;
    732  1.16     peter #ifdef ALTQ_DEBUG
    733  1.16     peter 		printf("write_dsfield: can't locate header!\n");
    734  1.16     peter #endif
    735  1.16     peter 		return;
    736  1.16     peter 	}
    737  1.16     peter 
    738  1.16     peter 	if (pktattr->pattr_af == AF_INET) {
    739  1.16     peter 		struct ip *ip = (struct ip *)pktattr->pattr_hdr;
    740  1.16     peter 		u_int8_t old;
    741  1.16     peter 		int32_t sum;
    742  1.16     peter 
    743  1.16     peter 		if (ip->ip_v != 4)
    744  1.16     peter 			return;		/* version mismatch! */
    745  1.16     peter 		old = ip->ip_tos;
    746  1.16     peter 		dsfield |= old & 3;	/* leave CU bits */
    747  1.16     peter 		if (old == dsfield)
    748  1.16     peter 			return;
    749  1.16     peter 		ip->ip_tos = dsfield;
    750  1.16     peter 		/*
    751  1.16     peter 		 * update checksum (from RFC1624)
    752  1.16     peter 		 *	   HC' = ~(~HC + ~m + m')
    753  1.16     peter 		 */
    754  1.16     peter 		sum = ~ntohs(ip->ip_sum) & 0xffff;
    755  1.16     peter 		sum += 0xff00 + (~old & 0xff) + dsfield;
    756  1.16     peter 		sum = (sum >> 16) + (sum & 0xffff);
    757  1.16     peter 		sum += (sum >> 16);  /* add carry */
    758  1.16     peter 
    759  1.16     peter 		ip->ip_sum = htons(~sum & 0xffff);
    760  1.16     peter 	}
    761  1.16     peter #ifdef INET6
    762  1.16     peter 	else if (pktattr->pattr_af == AF_INET6) {
    763  1.16     peter 		struct ip6_hdr *ip6 = (struct ip6_hdr *)pktattr->pattr_hdr;
    764  1.16     peter 		u_int32_t flowlabel;
    765  1.16     peter 
    766  1.16     peter 		flowlabel = ntohl(ip6->ip6_flow);
    767  1.16     peter 		if ((flowlabel >> 28) != 6)
    768  1.16     peter 			return;		/* version mismatch! */
    769  1.16     peter 		flowlabel = (flowlabel & 0xf03fffff) | (dsfield << 20);
    770  1.16     peter 		ip6->ip6_flow = htonl(flowlabel);
    771  1.16     peter 	}
    772  1.16     peter #endif
    773  1.16     peter 	return;
    774  1.16     peter }
    775  1.16     peter 
    776  1.16     peter 
    777  1.16     peter /*
    778  1.16     peter  * high resolution clock support taking advantage of a machine dependent
    779  1.16     peter  * high resolution time counter (e.g., timestamp counter of intel pentium).
    780  1.16     peter  * we assume
    781  1.16     peter  *  - 64-bit-long monotonically-increasing counter
    782  1.16     peter  *  - frequency range is 100M-4GHz (CPU speed)
    783  1.16     peter  */
    784  1.16     peter /* if pcc is not available or disabled, emulate 256MHz using microtime() */
    785  1.16     peter #define	MACHCLK_SHIFT	8
    786  1.16     peter 
    787  1.16     peter int machclk_usepcc;
    788  1.16     peter u_int32_t machclk_freq = 0;
    789  1.16     peter u_int32_t machclk_per_tick = 0;
    790  1.16     peter 
    791  1.16     peter #ifdef __alpha__
    792  1.16     peter #ifdef __FreeBSD__
    793  1.16     peter extern u_int32_t cycles_per_sec;	/* alpha cpu clock frequency */
    794  1.16     peter #elif defined(__NetBSD__) || defined(__OpenBSD__)
    795  1.16     peter extern u_int64_t cycles_per_usec;	/* alpha cpu clock frequency */
    796  1.16     peter #endif
    797  1.16     peter #endif /* __alpha__ */
    798  1.16     peter 
    799  1.16     peter void
    800  1.16     peter init_machclk(void)
    801  1.16     peter {
    802  1.16     peter 	machclk_usepcc = 1;
    803  1.16     peter 
    804  1.16     peter #if (!defined(__i386__) && !defined(__alpha__)) || defined(ALTQ_NOPCC)
    805  1.16     peter 	machclk_usepcc = 0;
    806  1.16     peter #endif
    807  1.16     peter #if defined(__FreeBSD__) && defined(SMP)
    808  1.16     peter 	machclk_usepcc = 0;
    809  1.16     peter #endif
    810  1.16     peter #if defined(__NetBSD__) && defined(MULTIPROCESSOR)
    811  1.16     peter 	machclk_usepcc = 0;
    812  1.16     peter #endif
    813  1.16     peter #ifdef __i386__
    814  1.16     peter 	/* check if TSC is available */
    815  1.16     peter 	if (machclk_usepcc == 1 && (cpu_feature & CPUID_TSC) == 0)
    816  1.16     peter 		machclk_usepcc = 0;
    817  1.16     peter #endif
    818  1.16     peter 
    819  1.16     peter 	if (machclk_usepcc == 0) {
    820  1.16     peter 		/* emulate 256MHz using microtime() */
    821  1.16     peter 		machclk_freq = 1000000 << MACHCLK_SHIFT;
    822  1.16     peter 		machclk_per_tick = machclk_freq / hz;
    823  1.16     peter #ifdef ALTQ_DEBUG
    824  1.16     peter 		printf("altq: emulate %uHz CPU clock\n", machclk_freq);
    825  1.16     peter #endif
    826  1.16     peter 		return;
    827  1.16     peter 	}
    828  1.16     peter 
    829  1.16     peter 	/*
    830  1.16     peter 	 * if the clock frequency (of Pentium TSC or Alpha PCC) is
    831  1.16     peter 	 * accessible, just use it.
    832  1.16     peter 	 */
    833  1.16     peter #ifdef __i386__
    834  1.16     peter #ifdef __FreeBSD__
    835  1.16     peter #if (__FreeBSD_version > 300000)
    836  1.16     peter 	machclk_freq = tsc_freq;
    837  1.16     peter #else
    838  1.16     peter 	machclk_freq = i586_ctr_freq;
    839  1.16     peter #endif
    840  1.16     peter #elif defined(__NetBSD__)
    841  1.16     peter 	machclk_freq = (u_int32_t)curcpu()->ci_tsc_freq;
    842  1.16     peter #elif defined(__OpenBSD__) && (defined(I586_CPU) || defined(I686_CPU))
    843  1.16     peter 	machclk_freq = pentium_mhz * 1000000;
    844  1.16     peter #endif
    845  1.16     peter #elif defined(__alpha__)
    846  1.16     peter #ifdef __FreeBSD__
    847  1.16     peter 	machclk_freq = cycles_per_sec;
    848  1.16     peter #elif defined(__NetBSD__) || defined(__OpenBSD__)
    849  1.16     peter 	machclk_freq = (u_int32_t)(cycles_per_usec * 1000000);
    850  1.16     peter #endif
    851  1.16     peter #endif /* __alpha__ */
    852  1.16     peter 
    853  1.16     peter 	/*
    854  1.16     peter 	 * if we don't know the clock frequency, measure it.
    855  1.16     peter 	 */
    856  1.16     peter 	if (machclk_freq == 0) {
    857  1.16     peter 		static int	wait;
    858  1.16     peter 		struct timeval	tv_start, tv_end;
    859  1.16     peter 		u_int64_t	start, end, diff;
    860  1.16     peter 		int		timo;
    861  1.16     peter 
    862  1.16     peter 		microtime(&tv_start);
    863  1.16     peter 		start = read_machclk();
    864  1.16     peter 		timo = hz;	/* 1 sec */
    865  1.16     peter 		(void)tsleep(&wait, PWAIT | PCATCH, "init_machclk", timo);
    866  1.16     peter 		microtime(&tv_end);
    867  1.16     peter 		end = read_machclk();
    868  1.16     peter 		diff = (u_int64_t)(tv_end.tv_sec - tv_start.tv_sec) * 1000000
    869  1.16     peter 		    + tv_end.tv_usec - tv_start.tv_usec;
    870  1.16     peter 		if (diff != 0)
    871  1.16     peter 			machclk_freq = (u_int)((end - start) * 1000000 / diff);
    872  1.16     peter 	}
    873  1.16     peter 
    874  1.16     peter 	machclk_per_tick = machclk_freq / hz;
    875  1.16     peter 
    876  1.16     peter #ifdef ALTQ_DEBUG
    877  1.16     peter 	printf("altq: CPU clock: %uHz\n", machclk_freq);
    878  1.16     peter #endif
    879  1.16     peter }
    880   1.1   thorpej 
    881  1.16     peter #if defined(__OpenBSD__) && defined(__i386__)
    882  1.16     peter static inline u_int64_t
    883  1.16     peter rdtsc(void)
    884  1.16     peter {
    885  1.16     peter 	u_int64_t rv;
    886  1.16     peter 	__asm __volatile(".byte 0x0f, 0x31" : "=A" (rv));
    887  1.16     peter 	return (rv);
    888   1.1   thorpej }
    889  1.16     peter #endif /* __OpenBSD__ && __i386__ */
    890   1.1   thorpej 
    891  1.16     peter u_int64_t
    892  1.16     peter read_machclk(void)
    893   1.1   thorpej {
    894  1.16     peter 	u_int64_t val;
    895  1.16     peter 
    896  1.16     peter 	if (machclk_usepcc) {
    897  1.16     peter #if defined(__i386__)
    898  1.16     peter 		val = rdtsc();
    899  1.16     peter #elif defined(__alpha__)
    900  1.16     peter 		static u_int32_t last_pcc, upper;
    901  1.16     peter 		u_int32_t pcc;
    902   1.1   thorpej 
    903  1.16     peter 		/*
    904  1.16     peter 		 * for alpha, make a 64bit counter value out of the 32bit
    905  1.16     peter 		 * alpha processor cycle counter.
    906  1.16     peter 		 * read_machclk must be called within a half of its
    907  1.16     peter 		 * wrap-around cycle (about 5 sec for 400MHz cpu) to properly
    908  1.16     peter 		 * detect a counter wrap-around.
    909  1.16     peter 		 * tbr_timeout calls read_machclk once a second.
    910  1.16     peter 		 */
    911  1.16     peter 		pcc = (u_int32_t)alpha_rpcc();
    912  1.16     peter 		if (pcc <= last_pcc)
    913  1.16     peter 			upper++;
    914  1.16     peter 		last_pcc = pcc;
    915  1.16     peter 		val = ((u_int64_t)upper << 32) + pcc;
    916  1.16     peter #else
    917  1.16     peter 		panic("read_machclk");
    918  1.16     peter #endif
    919   1.1   thorpej 	} else {
    920  1.16     peter 		struct timeval tv;
    921  1.16     peter 
    922  1.16     peter 		microtime(&tv);
    923  1.16     peter 		val = (((u_int64_t)(tv.tv_sec - boottime.tv_sec) * 1000000
    924  1.16     peter 		    + tv.tv_usec) << MACHCLK_SHIFT);
    925   1.1   thorpej 	}
    926  1.16     peter 	return (val);
    927   1.1   thorpej }
    928   1.1   thorpej 
    929  1.16     peter #ifdef ALTQ3_CLFIER_COMPAT
    930   1.1   thorpej 
    931   1.1   thorpej #ifndef IPPROTO_ESP
    932   1.1   thorpej #define	IPPROTO_ESP	50		/* encapsulating security payload */
    933   1.1   thorpej #endif
    934   1.1   thorpej #ifndef IPPROTO_AH
    935   1.1   thorpej #define	IPPROTO_AH	51		/* authentication header */
    936   1.1   thorpej #endif
    937   1.1   thorpej 
    938  1.12     perry /*
    939   1.1   thorpej  * extract flow information from a given packet.
    940   1.1   thorpej  * filt_mask shows flowinfo fields required.
    941   1.1   thorpej  * we assume the ip header is in one mbuf, and addresses and ports are
    942   1.1   thorpej  * in network byte order.
    943   1.1   thorpej  */
    944  1.12     perry int
    945  1.16     peter altq_extractflow(struct mbuf *m, int af, struct flowinfo *flow,
    946  1.16     peter     u_int32_t filt_bmask)
    947   1.1   thorpej {
    948   1.1   thorpej 
    949   1.1   thorpej 	switch (af) {
    950   1.1   thorpej 	case PF_INET: {
    951   1.1   thorpej 		struct flowinfo_in *fin;
    952   1.1   thorpej 		struct ip *ip;
    953   1.1   thorpej 
    954   1.1   thorpej 		ip = mtod(m, struct ip *);
    955   1.1   thorpej 
    956   1.1   thorpej 		if (ip->ip_v != 4)
    957   1.1   thorpej 			break;
    958   1.8    itojun 
    959   1.1   thorpej 		fin = (struct flowinfo_in *)flow;
    960   1.1   thorpej 		fin->fi_len = sizeof(struct flowinfo_in);
    961   1.1   thorpej 		fin->fi_family = AF_INET;
    962   1.1   thorpej 
    963   1.1   thorpej 		fin->fi_proto = ip->ip_p;
    964   1.1   thorpej 		fin->fi_tos = ip->ip_tos;
    965   1.1   thorpej 
    966   1.1   thorpej 		fin->fi_src.s_addr = ip->ip_src.s_addr;
    967   1.1   thorpej 		fin->fi_dst.s_addr = ip->ip_dst.s_addr;
    968   1.8    itojun 
    969   1.1   thorpej 		if (filt_bmask & FIMB4_PORTS)
    970   1.1   thorpej 			/* if port info is required, extract port numbers */
    971   1.1   thorpej 			extract_ports4(m, ip, fin);
    972   1.1   thorpej 		else {
    973   1.1   thorpej 			fin->fi_sport = 0;
    974   1.1   thorpej 			fin->fi_dport = 0;
    975   1.1   thorpej 			fin->fi_gpi = 0;
    976   1.1   thorpej 		}
    977   1.1   thorpej 		return (1);
    978   1.1   thorpej 	}
    979   1.8    itojun 
    980   1.1   thorpej #ifdef INET6
    981   1.1   thorpej 	case PF_INET6: {
    982   1.1   thorpej 		struct flowinfo_in6 *fin6;
    983   1.1   thorpej 		struct ip6_hdr *ip6;
    984   1.1   thorpej 
    985   1.1   thorpej 		ip6 = mtod(m, struct ip6_hdr *);
    986   1.1   thorpej 		/* should we check the ip version? */
    987   1.8    itojun 
    988   1.1   thorpej 		fin6 = (struct flowinfo_in6 *)flow;
    989   1.1   thorpej 		fin6->fi6_len = sizeof(struct flowinfo_in6);
    990   1.1   thorpej 		fin6->fi6_family = AF_INET6;
    991   1.1   thorpej 
    992   1.1   thorpej 		fin6->fi6_proto = ip6->ip6_nxt;
    993   1.1   thorpej 		fin6->fi6_tclass   = (ntohl(ip6->ip6_flow) >> 20) & 0xff;
    994   1.1   thorpej 
    995   1.1   thorpej 		fin6->fi6_flowlabel = ip6->ip6_flow & htonl(0x000fffff);
    996   1.1   thorpej 		fin6->fi6_src = ip6->ip6_src;
    997   1.1   thorpej 		fin6->fi6_dst = ip6->ip6_dst;
    998   1.1   thorpej 
    999   1.1   thorpej 		if ((filt_bmask & FIMB6_PORTS) ||
   1000   1.1   thorpej 		    ((filt_bmask & FIMB6_PROTO)
   1001   1.1   thorpej 		     && ip6->ip6_nxt > IPPROTO_IPV6))
   1002   1.1   thorpej 			/*
   1003   1.1   thorpej 			 * if port info is required, or proto is required
   1004   1.1   thorpej 			 * but there are option headers, extract port
   1005   1.1   thorpej 			 * and protocol numbers.
   1006   1.1   thorpej 			 */
   1007   1.1   thorpej 			extract_ports6(m, ip6, fin6);
   1008   1.1   thorpej 		else {
   1009   1.1   thorpej 			fin6->fi6_sport = 0;
   1010   1.1   thorpej 			fin6->fi6_dport = 0;
   1011   1.1   thorpej 			fin6->fi6_gpi = 0;
   1012   1.1   thorpej 		}
   1013   1.1   thorpej 		return (1);
   1014   1.1   thorpej 	}
   1015   1.1   thorpej #endif /* INET6 */
   1016   1.1   thorpej 
   1017   1.1   thorpej 	default:
   1018   1.1   thorpej 		break;
   1019   1.1   thorpej 	}
   1020   1.1   thorpej 
   1021   1.1   thorpej 	/* failed */
   1022   1.1   thorpej 	flow->fi_len = sizeof(struct flowinfo);
   1023   1.1   thorpej 	flow->fi_family = AF_UNSPEC;
   1024   1.1   thorpej 	return (0);
   1025   1.1   thorpej }
   1026   1.1   thorpej 
   1027   1.1   thorpej /*
   1028   1.1   thorpej  * helper routine to extract port numbers
   1029   1.1   thorpej  */
   1030   1.1   thorpej /* structure for ipsec and ipv6 option header template */
   1031   1.1   thorpej struct _opt6 {
   1032   1.1   thorpej 	u_int8_t	opt6_nxt;	/* next header */
   1033   1.1   thorpej 	u_int8_t	opt6_hlen;	/* header extension length */
   1034   1.1   thorpej 	u_int16_t	_pad;
   1035   1.1   thorpej 	u_int32_t	ah_spi;		/* security parameter index
   1036   1.1   thorpej 					   for authentication header */
   1037   1.1   thorpej };
   1038   1.1   thorpej 
   1039   1.1   thorpej /*
   1040   1.1   thorpej  * extract port numbers from a ipv4 packet.
   1041   1.1   thorpej  */
   1042   1.1   thorpej static int
   1043  1.16     peter extract_ports4(struct mbuf *m, struct ip *ip, struct flowinfo_in *fin)
   1044   1.1   thorpej {
   1045   1.1   thorpej 	struct mbuf *m0;
   1046   1.1   thorpej 	u_short ip_off;
   1047   1.1   thorpej 	u_int8_t proto;
   1048   1.1   thorpej 	int 	off;
   1049   1.8    itojun 
   1050   1.1   thorpej 	fin->fi_sport = 0;
   1051   1.1   thorpej 	fin->fi_dport = 0;
   1052   1.1   thorpej 	fin->fi_gpi = 0;
   1053   1.8    itojun 
   1054   1.1   thorpej 	ip_off = ntohs(ip->ip_off);
   1055   1.1   thorpej 	/* if it is a fragment, try cached fragment info */
   1056   1.1   thorpej 	if (ip_off & IP_OFFMASK) {
   1057   1.1   thorpej 		ip4f_lookup(ip, fin);
   1058   1.1   thorpej 		return (1);
   1059   1.1   thorpej 	}
   1060   1.1   thorpej 
   1061   1.1   thorpej 	/* locate the mbuf containing the protocol header */
   1062   1.1   thorpej 	for (m0 = m; m0 != NULL; m0 = m0->m_next)
   1063   1.1   thorpej 		if (((caddr_t)ip >= m0->m_data) &&
   1064   1.1   thorpej 		    ((caddr_t)ip < m0->m_data + m0->m_len))
   1065   1.1   thorpej 			break;
   1066   1.1   thorpej 	if (m0 == NULL) {
   1067   1.1   thorpej #ifdef ALTQ_DEBUG
   1068   1.1   thorpej 		printf("extract_ports4: can't locate header! ip=%p\n", ip);
   1069   1.1   thorpej #endif
   1070   1.1   thorpej 		return (0);
   1071   1.1   thorpej 	}
   1072   1.1   thorpej 	off = ((caddr_t)ip - m0->m_data) + (ip->ip_hl << 2);
   1073   1.1   thorpej 	proto = ip->ip_p;
   1074   1.1   thorpej 
   1075   1.1   thorpej #ifdef ALTQ_IPSEC
   1076   1.1   thorpej  again:
   1077   1.1   thorpej #endif
   1078   1.1   thorpej 	while (off >= m0->m_len) {
   1079   1.1   thorpej 		off -= m0->m_len;
   1080   1.1   thorpej 		m0 = m0->m_next;
   1081   1.8    itojun 		if (m0 == NULL)
   1082   1.8    itojun 			return (0);  /* bogus ip_hl! */
   1083   1.1   thorpej 	}
   1084   1.8    itojun 	if (m0->m_len < off + 4)
   1085   1.8    itojun 		return (0);
   1086   1.1   thorpej 
   1087   1.1   thorpej 	switch (proto) {
   1088   1.1   thorpej 	case IPPROTO_TCP:
   1089   1.1   thorpej 	case IPPROTO_UDP: {
   1090   1.1   thorpej 		struct udphdr *udp;
   1091   1.8    itojun 
   1092   1.1   thorpej 		udp = (struct udphdr *)(mtod(m0, caddr_t) + off);
   1093   1.1   thorpej 		fin->fi_sport = udp->uh_sport;
   1094   1.1   thorpej 		fin->fi_dport = udp->uh_dport;
   1095   1.1   thorpej 		fin->fi_proto = proto;
   1096   1.1   thorpej 		}
   1097   1.1   thorpej 		break;
   1098   1.1   thorpej 
   1099   1.1   thorpej #ifdef ALTQ_IPSEC
   1100   1.1   thorpej 	case IPPROTO_ESP:
   1101   1.1   thorpej 		if (fin->fi_gpi == 0){
   1102   1.1   thorpej 			u_int32_t *gpi;
   1103   1.8    itojun 
   1104   1.1   thorpej 			gpi = (u_int32_t *)(mtod(m0, caddr_t) + off);
   1105   1.1   thorpej 			fin->fi_gpi   = *gpi;
   1106   1.1   thorpej 		}
   1107   1.1   thorpej 		fin->fi_proto = proto;
   1108   1.1   thorpej 		break;
   1109   1.1   thorpej 
   1110   1.1   thorpej 	case IPPROTO_AH: {
   1111   1.1   thorpej 			/* get next header and header length */
   1112   1.1   thorpej 			struct _opt6 *opt6;
   1113   1.1   thorpej 
   1114   1.1   thorpej 			opt6 = (struct _opt6 *)(mtod(m0, caddr_t) + off);
   1115   1.1   thorpej 			proto = opt6->opt6_nxt;
   1116   1.1   thorpej 			off += 8 + (opt6->opt6_hlen * 4);
   1117   1.8    itojun 			if (fin->fi_gpi == 0 && m0->m_len >= off + 8)
   1118   1.1   thorpej 				fin->fi_gpi = opt6->ah_spi;
   1119   1.1   thorpej 		}
   1120   1.1   thorpej 		/* goto the next header */
   1121   1.1   thorpej 		goto again;
   1122   1.1   thorpej #endif  /* ALTQ_IPSEC */
   1123   1.1   thorpej 
   1124   1.1   thorpej 	default:
   1125   1.1   thorpej 		fin->fi_proto = proto;
   1126   1.1   thorpej 		return (0);
   1127   1.1   thorpej 	}
   1128   1.1   thorpej 
   1129   1.1   thorpej 	/* if this is a first fragment, cache it. */
   1130   1.1   thorpej 	if (ip_off & IP_MF)
   1131   1.1   thorpej 		ip4f_cache(ip, fin);
   1132   1.1   thorpej 
   1133   1.1   thorpej 	return (1);
   1134   1.1   thorpej }
   1135   1.1   thorpej 
   1136   1.1   thorpej #ifdef INET6
   1137   1.1   thorpej static int
   1138  1.16     peter extract_ports6(struct mbuf *m, struct ip6_hdr *ip6, struct flowinfo_in6 *fin6)
   1139   1.1   thorpej {
   1140   1.1   thorpej 	struct mbuf *m0;
   1141   1.1   thorpej 	int	off;
   1142   1.1   thorpej 	u_int8_t proto;
   1143   1.8    itojun 
   1144   1.1   thorpej 	fin6->fi6_gpi   = 0;
   1145   1.1   thorpej 	fin6->fi6_sport = 0;
   1146   1.1   thorpej 	fin6->fi6_dport = 0;
   1147   1.8    itojun 
   1148   1.1   thorpej 	/* locate the mbuf containing the protocol header */
   1149   1.1   thorpej 	for (m0 = m; m0 != NULL; m0 = m0->m_next)
   1150   1.1   thorpej 		if (((caddr_t)ip6 >= m0->m_data) &&
   1151   1.1   thorpej 		    ((caddr_t)ip6 < m0->m_data + m0->m_len))
   1152   1.1   thorpej 			break;
   1153   1.1   thorpej 	if (m0 == NULL) {
   1154   1.1   thorpej #ifdef ALTQ_DEBUG
   1155   1.1   thorpej 		printf("extract_ports6: can't locate header! ip6=%p\n", ip6);
   1156   1.1   thorpej #endif
   1157   1.1   thorpej 		return (0);
   1158   1.1   thorpej 	}
   1159   1.1   thorpej 	off = ((caddr_t)ip6 - m0->m_data) + sizeof(struct ip6_hdr);
   1160   1.1   thorpej 
   1161   1.1   thorpej 	proto = ip6->ip6_nxt;
   1162   1.1   thorpej 	do {
   1163   1.1   thorpej 		while (off >= m0->m_len) {
   1164   1.1   thorpej 			off -= m0->m_len;
   1165   1.1   thorpej 			m0 = m0->m_next;
   1166   1.8    itojun 			if (m0 == NULL)
   1167   1.8    itojun 				return (0);
   1168   1.1   thorpej 		}
   1169   1.8    itojun 		if (m0->m_len < off + 4)
   1170   1.8    itojun 			return (0);
   1171   1.1   thorpej 
   1172   1.1   thorpej 		switch (proto) {
   1173   1.1   thorpej 		case IPPROTO_TCP:
   1174   1.1   thorpej 		case IPPROTO_UDP: {
   1175   1.1   thorpej 			struct udphdr *udp;
   1176   1.8    itojun 
   1177   1.1   thorpej 			udp = (struct udphdr *)(mtod(m0, caddr_t) + off);
   1178   1.1   thorpej 			fin6->fi6_sport = udp->uh_sport;
   1179   1.1   thorpej 			fin6->fi6_dport = udp->uh_dport;
   1180   1.1   thorpej 			fin6->fi6_proto = proto;
   1181   1.1   thorpej 			}
   1182   1.1   thorpej 			return (1);
   1183   1.8    itojun 
   1184   1.1   thorpej 		case IPPROTO_ESP:
   1185   1.1   thorpej 			if (fin6->fi6_gpi == 0) {
   1186   1.1   thorpej 				u_int32_t *gpi;
   1187   1.8    itojun 
   1188   1.1   thorpej 				gpi = (u_int32_t *)(mtod(m0, caddr_t) + off);
   1189   1.1   thorpej 				fin6->fi6_gpi   = *gpi;
   1190   1.1   thorpej 			}
   1191   1.1   thorpej 			fin6->fi6_proto = proto;
   1192   1.1   thorpej 			return (1);
   1193   1.1   thorpej 
   1194   1.1   thorpej 		case IPPROTO_AH: {
   1195   1.1   thorpej 			/* get next header and header length */
   1196   1.1   thorpej 			struct _opt6 *opt6;
   1197   1.1   thorpej 
   1198   1.1   thorpej 			opt6 = (struct _opt6 *)(mtod(m0, caddr_t) + off);
   1199   1.8    itojun 			if (fin6->fi6_gpi == 0 && m0->m_len >= off + 8)
   1200   1.1   thorpej 				fin6->fi6_gpi = opt6->ah_spi;
   1201   1.1   thorpej 			proto = opt6->opt6_nxt;
   1202   1.1   thorpej 			off += 8 + (opt6->opt6_hlen * 4);
   1203   1.1   thorpej 			/* goto the next header */
   1204   1.1   thorpej 			break;
   1205   1.1   thorpej 			}
   1206   1.1   thorpej 
   1207   1.1   thorpej 		case IPPROTO_HOPOPTS:
   1208   1.1   thorpej 		case IPPROTO_ROUTING:
   1209   1.1   thorpej 		case IPPROTO_DSTOPTS: {
   1210   1.1   thorpej 			/* get next header and header length */
   1211   1.1   thorpej 			struct _opt6 *opt6;
   1212   1.1   thorpej 
   1213   1.1   thorpej 			opt6 = (struct _opt6 *)(mtod(m0, caddr_t) + off);
   1214   1.1   thorpej 			proto = opt6->opt6_nxt;
   1215   1.1   thorpej 			off += (opt6->opt6_hlen + 1) * 8;
   1216   1.1   thorpej 			/* goto the next header */
   1217   1.1   thorpej 			break;
   1218   1.1   thorpej 			}
   1219   1.8    itojun 
   1220   1.1   thorpej 		case IPPROTO_FRAGMENT:
   1221   1.1   thorpej 			/* ipv6 fragmentations are not supported yet */
   1222   1.1   thorpej 		default:
   1223   1.1   thorpej 			fin6->fi6_proto = proto;
   1224   1.1   thorpej 			return (0);
   1225   1.1   thorpej 		}
   1226   1.1   thorpej 	} while (1);
   1227   1.1   thorpej 	/*NOTREACHED*/
   1228   1.1   thorpej }
   1229   1.1   thorpej #endif /* INET6 */
   1230   1.1   thorpej 
   1231   1.1   thorpej /*
   1232   1.1   thorpej  * altq common classifier
   1233   1.1   thorpej  */
   1234   1.1   thorpej int
   1235  1.16     peter acc_add_filter(struct acc_classifier *classifier, struct flow_filter *filter,
   1236  1.16     peter     void *class, u_long *phandle)
   1237   1.1   thorpej {
   1238   1.1   thorpej 	struct acc_filter *afp, *prev, *tmp;
   1239   1.1   thorpej 	int	i, s;
   1240   1.1   thorpej 
   1241   1.1   thorpej #ifdef INET6
   1242   1.1   thorpej 	if (filter->ff_flow.fi_family != AF_INET &&
   1243   1.1   thorpej 	    filter->ff_flow.fi_family != AF_INET6)
   1244   1.1   thorpej 		return (EINVAL);
   1245   1.1   thorpej #else
   1246   1.1   thorpej 	if (filter->ff_flow.fi_family != AF_INET)
   1247   1.1   thorpej 		return (EINVAL);
   1248   1.1   thorpej #endif
   1249   1.8    itojun 
   1250  1.14  christos 	afp = malloc(sizeof(struct acc_filter), M_DEVBUF, M_WAITOK|M_ZERO);
   1251   1.1   thorpej 	if (afp == NULL)
   1252   1.1   thorpej 		return (ENOMEM);
   1253   1.1   thorpej 
   1254   1.1   thorpej 	afp->f_filter = *filter;
   1255   1.1   thorpej 	afp->f_class = class;
   1256   1.1   thorpej 
   1257   1.1   thorpej 	i = ACC_WILDCARD_INDEX;
   1258   1.1   thorpej 	if (filter->ff_flow.fi_family == AF_INET) {
   1259   1.1   thorpej 		struct flow_filter *filter4 = &afp->f_filter;
   1260   1.8    itojun 
   1261   1.1   thorpej 		/*
   1262   1.1   thorpej 		 * if address is 0, it's a wildcard.  if address mask
   1263   1.1   thorpej 		 * isn't set, use full mask.
   1264   1.1   thorpej 		 */
   1265   1.1   thorpej 		if (filter4->ff_flow.fi_dst.s_addr == 0)
   1266   1.1   thorpej 			filter4->ff_mask.mask_dst.s_addr = 0;
   1267   1.1   thorpej 		else if (filter4->ff_mask.mask_dst.s_addr == 0)
   1268   1.1   thorpej 			filter4->ff_mask.mask_dst.s_addr = 0xffffffff;
   1269   1.1   thorpej 		if (filter4->ff_flow.fi_src.s_addr == 0)
   1270   1.1   thorpej 			filter4->ff_mask.mask_src.s_addr = 0;
   1271   1.1   thorpej 		else if (filter4->ff_mask.mask_src.s_addr == 0)
   1272   1.1   thorpej 			filter4->ff_mask.mask_src.s_addr = 0xffffffff;
   1273   1.1   thorpej 
   1274   1.1   thorpej 		/* clear extra bits in addresses  */
   1275   1.1   thorpej 		   filter4->ff_flow.fi_dst.s_addr &=
   1276   1.1   thorpej 		       filter4->ff_mask.mask_dst.s_addr;
   1277   1.1   thorpej 		   filter4->ff_flow.fi_src.s_addr &=
   1278   1.1   thorpej 		       filter4->ff_mask.mask_src.s_addr;
   1279   1.1   thorpej 
   1280   1.1   thorpej 		/*
   1281   1.1   thorpej 		 * if dst address is a wildcard, use hash-entry
   1282   1.1   thorpej 		 * ACC_WILDCARD_INDEX.
   1283   1.1   thorpej 		 */
   1284   1.1   thorpej 		if (filter4->ff_mask.mask_dst.s_addr != 0xffffffff)
   1285   1.1   thorpej 			i = ACC_WILDCARD_INDEX;
   1286   1.1   thorpej 		else
   1287   1.1   thorpej 			i = ACC_GET_HASH_INDEX(filter4->ff_flow.fi_dst.s_addr);
   1288   1.1   thorpej 	}
   1289   1.1   thorpej #ifdef INET6
   1290   1.1   thorpej 	else if (filter->ff_flow.fi_family == AF_INET6) {
   1291   1.1   thorpej 		struct flow_filter6 *filter6 =
   1292   1.1   thorpej 			(struct flow_filter6 *)&afp->f_filter;
   1293   1.1   thorpej #ifndef IN6MASK0 /* taken from kame ipv6 */
   1294   1.1   thorpej #define	IN6MASK0	{{{ 0, 0, 0, 0 }}}
   1295   1.1   thorpej #define	IN6MASK128	{{{ 0xffffffff, 0xffffffff, 0xffffffff, 0xffffffff }}}
   1296   1.1   thorpej 		const struct in6_addr in6mask0 = IN6MASK0;
   1297   1.1   thorpej 		const struct in6_addr in6mask128 = IN6MASK128;
   1298   1.1   thorpej #endif
   1299   1.1   thorpej 
   1300   1.1   thorpej 		if (IN6_IS_ADDR_UNSPECIFIED(&filter6->ff_flow6.fi6_dst))
   1301   1.1   thorpej 			filter6->ff_mask6.mask6_dst = in6mask0;
   1302   1.1   thorpej 		else if (IN6_IS_ADDR_UNSPECIFIED(&filter6->ff_mask6.mask6_dst))
   1303   1.1   thorpej 			filter6->ff_mask6.mask6_dst = in6mask128;
   1304   1.1   thorpej 		if (IN6_IS_ADDR_UNSPECIFIED(&filter6->ff_flow6.fi6_src))
   1305   1.1   thorpej 			filter6->ff_mask6.mask6_src = in6mask0;
   1306   1.1   thorpej 		else if (IN6_IS_ADDR_UNSPECIFIED(&filter6->ff_mask6.mask6_src))
   1307   1.1   thorpej 			filter6->ff_mask6.mask6_src = in6mask128;
   1308   1.1   thorpej 
   1309   1.1   thorpej 		/* clear extra bits in addresses  */
   1310   1.1   thorpej 		for (i = 0; i < 16; i++)
   1311   1.1   thorpej 			filter6->ff_flow6.fi6_dst.s6_addr[i] &=
   1312   1.1   thorpej 			    filter6->ff_mask6.mask6_dst.s6_addr[i];
   1313   1.1   thorpej 		for (i = 0; i < 16; i++)
   1314   1.1   thorpej 			filter6->ff_flow6.fi6_src.s6_addr[i] &=
   1315   1.1   thorpej 			    filter6->ff_mask6.mask6_src.s6_addr[i];
   1316   1.8    itojun 
   1317   1.1   thorpej 		if (filter6->ff_flow6.fi6_flowlabel == 0)
   1318   1.1   thorpej 			i = ACC_WILDCARD_INDEX;
   1319   1.1   thorpej 		else
   1320   1.1   thorpej 			i = ACC_GET_HASH_INDEX(filter6->ff_flow6.fi6_flowlabel);
   1321   1.1   thorpej 	}
   1322   1.1   thorpej #endif /* INET6 */
   1323   1.1   thorpej 
   1324   1.1   thorpej 	afp->f_handle = get_filt_handle(classifier, i);
   1325   1.1   thorpej 
   1326   1.1   thorpej 	/* update filter bitmask */
   1327   1.1   thorpej 	afp->f_fbmask = filt2fibmask(filter);
   1328   1.1   thorpej 	classifier->acc_fbmask |= afp->f_fbmask;
   1329   1.1   thorpej 
   1330   1.1   thorpej 	/*
   1331   1.1   thorpej 	 * add this filter to the filter list.
   1332   1.1   thorpej 	 * filters are ordered from the highest rule number.
   1333   1.1   thorpej 	 */
   1334   1.5   thorpej 	s = splnet();
   1335   1.1   thorpej 	prev = NULL;
   1336   1.1   thorpej 	LIST_FOREACH(tmp, &classifier->acc_filters[i], f_chain) {
   1337   1.1   thorpej 		if (tmp->f_filter.ff_ruleno > afp->f_filter.ff_ruleno)
   1338   1.1   thorpej 			prev = tmp;
   1339   1.1   thorpej 		else
   1340   1.1   thorpej 			break;
   1341   1.1   thorpej 	}
   1342   1.1   thorpej 	if (prev == NULL)
   1343   1.1   thorpej 		LIST_INSERT_HEAD(&classifier->acc_filters[i], afp, f_chain);
   1344   1.1   thorpej 	else
   1345   1.1   thorpej 		LIST_INSERT_AFTER(prev, afp, f_chain);
   1346   1.1   thorpej 	splx(s);
   1347   1.1   thorpej 
   1348   1.1   thorpej 	*phandle = afp->f_handle;
   1349   1.1   thorpej 	return (0);
   1350   1.1   thorpej }
   1351   1.1   thorpej 
   1352   1.1   thorpej int
   1353  1.16     peter acc_delete_filter(struct acc_classifier *classifier, u_long handle)
   1354   1.1   thorpej {
   1355   1.1   thorpej 	struct acc_filter *afp;
   1356   1.1   thorpej 	int	s;
   1357   1.1   thorpej 
   1358   1.1   thorpej 	if ((afp = filth_to_filtp(classifier, handle)) == NULL)
   1359   1.1   thorpej 		return (EINVAL);
   1360   1.1   thorpej 
   1361   1.5   thorpej 	s = splnet();
   1362   1.1   thorpej 	LIST_REMOVE(afp, f_chain);
   1363   1.1   thorpej 	splx(s);
   1364   1.1   thorpej 
   1365  1.14  christos 	free(afp, M_DEVBUF);
   1366   1.1   thorpej 
   1367   1.1   thorpej 	/* todo: update filt_bmask */
   1368   1.1   thorpej 
   1369   1.1   thorpej 	return (0);
   1370   1.1   thorpej }
   1371   1.1   thorpej 
   1372   1.1   thorpej /*
   1373   1.1   thorpej  * delete filters referencing to the specified class.
   1374   1.1   thorpej  * if the all flag is not 0, delete all the filters.
   1375   1.1   thorpej  */
   1376   1.1   thorpej int
   1377  1.16     peter acc_discard_filters(struct acc_classifier *classifier, void *class, int all)
   1378   1.1   thorpej {
   1379   1.1   thorpej 	struct acc_filter *afp;
   1380   1.1   thorpej 	int	i, s;
   1381   1.1   thorpej 
   1382   1.5   thorpej 	s = splnet();
   1383   1.1   thorpej 	for (i = 0; i < ACC_FILTER_TABLESIZE; i++) {
   1384   1.1   thorpej 		do {
   1385   1.1   thorpej 			LIST_FOREACH(afp, &classifier->acc_filters[i], f_chain)
   1386   1.1   thorpej 				if (all || afp->f_class == class) {
   1387   1.1   thorpej 					LIST_REMOVE(afp, f_chain);
   1388  1.14  christos 					free(afp, M_DEVBUF);
   1389   1.1   thorpej 					/* start again from the head */
   1390   1.1   thorpej 					break;
   1391   1.1   thorpej 				}
   1392   1.1   thorpej 		} while (afp != NULL);
   1393   1.1   thorpej 	}
   1394   1.1   thorpej 	splx(s);
   1395   1.1   thorpej 
   1396   1.1   thorpej 	if (all)
   1397   1.1   thorpej 		classifier->acc_fbmask = 0;
   1398   1.1   thorpej 
   1399   1.1   thorpej 	return (0);
   1400   1.1   thorpej }
   1401   1.1   thorpej 
   1402   1.1   thorpej void *
   1403  1.16     peter acc_classify(void *clfier, struct mbuf *m, int af)
   1404   1.1   thorpej {
   1405   1.1   thorpej 	struct acc_classifier *classifier;
   1406   1.1   thorpej 	struct flowinfo flow;
   1407   1.1   thorpej 	struct acc_filter *afp;
   1408   1.1   thorpej 	int	i;
   1409   1.1   thorpej 
   1410   1.1   thorpej 	classifier = (struct acc_classifier *)clfier;
   1411   1.1   thorpej 	altq_extractflow(m, af, &flow, classifier->acc_fbmask);
   1412   1.1   thorpej 
   1413   1.1   thorpej 	if (flow.fi_family == AF_INET) {
   1414   1.1   thorpej 		struct flowinfo_in *fp = (struct flowinfo_in *)&flow;
   1415   1.8    itojun 
   1416   1.1   thorpej 		if ((classifier->acc_fbmask & FIMB4_ALL) == FIMB4_TOS) {
   1417   1.1   thorpej 			/* only tos is used */
   1418   1.1   thorpej 			LIST_FOREACH(afp,
   1419   1.1   thorpej 				 &classifier->acc_filters[ACC_WILDCARD_INDEX],
   1420   1.1   thorpej 				 f_chain)
   1421   1.1   thorpej 				if (apply_tosfilter4(afp->f_fbmask,
   1422   1.1   thorpej 						     &afp->f_filter, fp))
   1423   1.1   thorpej 					/* filter matched */
   1424   1.1   thorpej 					return (afp->f_class);
   1425   1.1   thorpej 		} else if ((classifier->acc_fbmask &
   1426   1.1   thorpej 			(~(FIMB4_PROTO|FIMB4_SPORT|FIMB4_DPORT) & FIMB4_ALL))
   1427   1.1   thorpej 		    == 0) {
   1428   1.1   thorpej 			/* only proto and ports are used */
   1429   1.1   thorpej 			LIST_FOREACH(afp,
   1430   1.1   thorpej 				 &classifier->acc_filters[ACC_WILDCARD_INDEX],
   1431   1.1   thorpej 				 f_chain)
   1432   1.1   thorpej 				if (apply_ppfilter4(afp->f_fbmask,
   1433   1.1   thorpej 						    &afp->f_filter, fp))
   1434   1.1   thorpej 					/* filter matched */
   1435   1.1   thorpej 					return (afp->f_class);
   1436   1.1   thorpej 		} else {
   1437   1.1   thorpej 			/* get the filter hash entry from its dest address */
   1438   1.1   thorpej 			i = ACC_GET_HASH_INDEX(fp->fi_dst.s_addr);
   1439   1.1   thorpej 			do {
   1440   1.1   thorpej 				/*
   1441   1.1   thorpej 				 * go through this loop twice.  first for dst
   1442   1.1   thorpej 				 * hash, second for wildcards.
   1443   1.1   thorpej 				 */
   1444   1.1   thorpej 				LIST_FOREACH(afp, &classifier->acc_filters[i],
   1445   1.1   thorpej 					     f_chain)
   1446   1.1   thorpej 					if (apply_filter4(afp->f_fbmask,
   1447   1.1   thorpej 							  &afp->f_filter, fp))
   1448   1.1   thorpej 						/* filter matched */
   1449   1.1   thorpej 						return (afp->f_class);
   1450   1.8    itojun 
   1451   1.1   thorpej 				/*
   1452   1.1   thorpej 				 * check again for filters with a dst addr
   1453   1.1   thorpej 				 * wildcard.
   1454   1.1   thorpej 				 * (daddr == 0 || dmask != 0xffffffff).
   1455   1.1   thorpej 				 */
   1456   1.1   thorpej 				if (i != ACC_WILDCARD_INDEX)
   1457   1.1   thorpej 					i = ACC_WILDCARD_INDEX;
   1458   1.1   thorpej 				else
   1459   1.1   thorpej 					break;
   1460   1.1   thorpej 			} while (1);
   1461   1.1   thorpej 		}
   1462   1.1   thorpej 	}
   1463   1.1   thorpej #ifdef INET6
   1464   1.1   thorpej 	else if (flow.fi_family == AF_INET6) {
   1465   1.1   thorpej 		struct flowinfo_in6 *fp6 = (struct flowinfo_in6 *)&flow;
   1466   1.8    itojun 
   1467   1.1   thorpej 		/* get the filter hash entry from its flow ID */
   1468   1.1   thorpej 		if (fp6->fi6_flowlabel != 0)
   1469   1.1   thorpej 			i = ACC_GET_HASH_INDEX(fp6->fi6_flowlabel);
   1470   1.1   thorpej 		else
   1471   1.1   thorpej 			/* flowlable can be zero */
   1472   1.1   thorpej 			i = ACC_WILDCARD_INDEX;
   1473   1.1   thorpej 
   1474   1.1   thorpej 		/* go through this loop twice.  first for flow hash, second
   1475   1.1   thorpej 		   for wildcards. */
   1476   1.1   thorpej 		do {
   1477   1.1   thorpej 			LIST_FOREACH(afp, &classifier->acc_filters[i], f_chain)
   1478   1.1   thorpej 				if (apply_filter6(afp->f_fbmask,
   1479   1.1   thorpej 					(struct flow_filter6 *)&afp->f_filter,
   1480   1.1   thorpej 					fp6))
   1481   1.1   thorpej 					/* filter matched */
   1482   1.1   thorpej 					return (afp->f_class);
   1483   1.1   thorpej 
   1484   1.1   thorpej 			/*
   1485   1.1   thorpej 			 * check again for filters with a wildcard.
   1486   1.1   thorpej 			 */
   1487   1.1   thorpej 			if (i != ACC_WILDCARD_INDEX)
   1488   1.1   thorpej 				i = ACC_WILDCARD_INDEX;
   1489   1.1   thorpej 			else
   1490   1.1   thorpej 				break;
   1491   1.1   thorpej 		} while (1);
   1492   1.1   thorpej 	}
   1493   1.1   thorpej #endif /* INET6 */
   1494   1.1   thorpej 
   1495   1.1   thorpej 	/* no filter matched */
   1496   1.1   thorpej 	return (NULL);
   1497   1.1   thorpej }
   1498   1.1   thorpej 
   1499   1.1   thorpej static int
   1500  1.16     peter apply_filter4(u_int32_t fbmask, struct flow_filter *filt,
   1501  1.16     peter     struct flowinfo_in *pkt)
   1502   1.1   thorpej {
   1503   1.1   thorpej 	if (filt->ff_flow.fi_family != AF_INET)
   1504   1.1   thorpej 		return (0);
   1505   1.1   thorpej 	if ((fbmask & FIMB4_SPORT) && filt->ff_flow.fi_sport != pkt->fi_sport)
   1506   1.1   thorpej 		return (0);
   1507   1.1   thorpej 	if ((fbmask & FIMB4_DPORT) && filt->ff_flow.fi_dport != pkt->fi_dport)
   1508   1.1   thorpej 		return (0);
   1509   1.1   thorpej 	if ((fbmask & FIMB4_DADDR) &&
   1510   1.1   thorpej 	    filt->ff_flow.fi_dst.s_addr !=
   1511   1.1   thorpej 	    (pkt->fi_dst.s_addr & filt->ff_mask.mask_dst.s_addr))
   1512   1.1   thorpej 		return (0);
   1513   1.1   thorpej 	if ((fbmask & FIMB4_SADDR) &&
   1514   1.1   thorpej 	    filt->ff_flow.fi_src.s_addr !=
   1515   1.1   thorpej 	    (pkt->fi_src.s_addr & filt->ff_mask.mask_src.s_addr))
   1516   1.1   thorpej 		return (0);
   1517   1.1   thorpej 	if ((fbmask & FIMB4_PROTO) && filt->ff_flow.fi_proto != pkt->fi_proto)
   1518   1.1   thorpej 		return (0);
   1519   1.1   thorpej 	if ((fbmask & FIMB4_TOS) && filt->ff_flow.fi_tos !=
   1520   1.1   thorpej 	    (pkt->fi_tos & filt->ff_mask.mask_tos))
   1521   1.1   thorpej 		return (0);
   1522   1.1   thorpej 	if ((fbmask & FIMB4_GPI) && filt->ff_flow.fi_gpi != (pkt->fi_gpi))
   1523   1.1   thorpej 		return (0);
   1524   1.1   thorpej 	/* match */
   1525   1.1   thorpej 	return (1);
   1526   1.1   thorpej }
   1527   1.1   thorpej 
   1528   1.1   thorpej /*
   1529   1.1   thorpej  * filter matching function optimized for a common case that checks
   1530   1.1   thorpej  * only protocol and port numbers
   1531   1.1   thorpej  */
   1532   1.1   thorpej static int
   1533  1.16     peter apply_ppfilter4(u_int32_t fbmask, struct flow_filter *filt,
   1534  1.16     peter     struct flowinfo_in *pkt)
   1535   1.1   thorpej {
   1536   1.1   thorpej 	if (filt->ff_flow.fi_family != AF_INET)
   1537   1.1   thorpej 		return (0);
   1538   1.1   thorpej 	if ((fbmask & FIMB4_SPORT) && filt->ff_flow.fi_sport != pkt->fi_sport)
   1539   1.1   thorpej 		return (0);
   1540   1.1   thorpej 	if ((fbmask & FIMB4_DPORT) && filt->ff_flow.fi_dport != pkt->fi_dport)
   1541   1.1   thorpej 		return (0);
   1542   1.1   thorpej 	if ((fbmask & FIMB4_PROTO) && filt->ff_flow.fi_proto != pkt->fi_proto)
   1543   1.1   thorpej 		return (0);
   1544   1.1   thorpej 	/* match */
   1545   1.1   thorpej 	return (1);
   1546   1.1   thorpej }
   1547   1.1   thorpej 
   1548   1.1   thorpej /*
   1549   1.1   thorpej  * filter matching function only for tos field.
   1550   1.1   thorpej  */
   1551   1.1   thorpej static int
   1552  1.16     peter apply_tosfilter4(u_int32_t fbmask, struct flow_filter *filt,
   1553  1.16     peter     struct flowinfo_in *pkt)
   1554   1.1   thorpej {
   1555   1.1   thorpej 	if (filt->ff_flow.fi_family != AF_INET)
   1556   1.1   thorpej 		return (0);
   1557   1.1   thorpej 	if ((fbmask & FIMB4_TOS) && filt->ff_flow.fi_tos !=
   1558   1.1   thorpej 	    (pkt->fi_tos & filt->ff_mask.mask_tos))
   1559   1.1   thorpej 		return (0);
   1560   1.1   thorpej 	/* match */
   1561   1.1   thorpej 	return (1);
   1562   1.1   thorpej }
   1563   1.1   thorpej 
   1564   1.1   thorpej #ifdef INET6
   1565   1.1   thorpej static int
   1566  1.16     peter apply_filter6(u_int32_t fbmask, struct flow_filter6 *filt,
   1567  1.16     peter     struct flowinfo_in6 *pkt)
   1568   1.1   thorpej {
   1569   1.1   thorpej 	int i;
   1570   1.1   thorpej 
   1571   1.1   thorpej 	if (filt->ff_flow6.fi6_family != AF_INET6)
   1572   1.1   thorpej 		return (0);
   1573   1.1   thorpej 	if ((fbmask & FIMB6_FLABEL) &&
   1574   1.1   thorpej 	    filt->ff_flow6.fi6_flowlabel != pkt->fi6_flowlabel)
   1575   1.1   thorpej 		return (0);
   1576   1.1   thorpej 	if ((fbmask & FIMB6_PROTO) &&
   1577   1.1   thorpej 	    filt->ff_flow6.fi6_proto != pkt->fi6_proto)
   1578   1.1   thorpej 		return (0);
   1579   1.1   thorpej 	if ((fbmask & FIMB6_SPORT) &&
   1580   1.1   thorpej 	    filt->ff_flow6.fi6_sport != pkt->fi6_sport)
   1581   1.1   thorpej 		return (0);
   1582   1.1   thorpej 	if ((fbmask & FIMB6_DPORT) &&
   1583   1.1   thorpej 	    filt->ff_flow6.fi6_dport != pkt->fi6_dport)
   1584   1.1   thorpej 		return (0);
   1585   1.1   thorpej 	if (fbmask & FIMB6_SADDR) {
   1586   1.1   thorpej 		for (i = 0; i < 4; i++)
   1587   1.1   thorpej 			if (filt->ff_flow6.fi6_src.s6_addr32[i] !=
   1588   1.1   thorpej 			    (pkt->fi6_src.s6_addr32[i] &
   1589   1.1   thorpej 			     filt->ff_mask6.mask6_src.s6_addr32[i]))
   1590   1.1   thorpej 				return (0);
   1591   1.1   thorpej 	}
   1592   1.1   thorpej 	if (fbmask & FIMB6_DADDR) {
   1593   1.1   thorpej 		for (i = 0; i < 4; i++)
   1594   1.1   thorpej 			if (filt->ff_flow6.fi6_dst.s6_addr32[i] !=
   1595   1.1   thorpej 			    (pkt->fi6_dst.s6_addr32[i] &
   1596   1.1   thorpej 			     filt->ff_mask6.mask6_dst.s6_addr32[i]))
   1597   1.1   thorpej 				return (0);
   1598   1.1   thorpej 	}
   1599   1.1   thorpej 	if ((fbmask & FIMB6_TCLASS) &&
   1600   1.1   thorpej 	    filt->ff_flow6.fi6_tclass !=
   1601   1.1   thorpej 	    (pkt->fi6_tclass & filt->ff_mask6.mask6_tclass))
   1602   1.1   thorpej 		return (0);
   1603   1.1   thorpej 	if ((fbmask & FIMB6_GPI) &&
   1604   1.1   thorpej 	    filt->ff_flow6.fi6_gpi != pkt->fi6_gpi)
   1605   1.1   thorpej 		return (0);
   1606   1.1   thorpej 	/* match */
   1607   1.1   thorpej 	return (1);
   1608   1.1   thorpej }
   1609   1.1   thorpej #endif /* INET6 */
   1610   1.1   thorpej 
   1611   1.1   thorpej /*
   1612   1.1   thorpej  *  filter handle:
   1613   1.1   thorpej  *	bit 20-28: index to the filter hash table
   1614   1.1   thorpej  *	bit  0-19: unique id in the hash bucket.
   1615   1.1   thorpej  */
   1616   1.1   thorpej static u_long
   1617  1.16     peter get_filt_handle(struct acc_classifier *classifier, int i)
   1618   1.1   thorpej {
   1619   1.1   thorpej 	static u_long handle_number = 1;
   1620   1.1   thorpej 	u_long 	handle;
   1621   1.1   thorpej 	struct acc_filter *afp;
   1622   1.1   thorpej 
   1623   1.1   thorpej 	while (1) {
   1624   1.1   thorpej 		handle = handle_number++ & 0x000fffff;
   1625   1.1   thorpej 
   1626   1.1   thorpej 		if (LIST_EMPTY(&classifier->acc_filters[i]))
   1627   1.1   thorpej 			break;
   1628   1.1   thorpej 
   1629   1.1   thorpej 		LIST_FOREACH(afp, &classifier->acc_filters[i], f_chain)
   1630   1.1   thorpej 			if ((afp->f_handle & 0x000fffff) == handle)
   1631   1.1   thorpej 				break;
   1632   1.1   thorpej 		if (afp == NULL)
   1633   1.1   thorpej 			break;
   1634   1.1   thorpej 		/* this handle is already used, try again */
   1635   1.1   thorpej 	}
   1636   1.1   thorpej 
   1637   1.1   thorpej 	return ((i << 20) | handle);
   1638   1.1   thorpej }
   1639   1.1   thorpej 
   1640   1.1   thorpej /* convert filter handle to filter pointer */
   1641   1.1   thorpej static struct acc_filter *
   1642  1.16     peter filth_to_filtp(struct acc_classifier *classifier, u_long handle)
   1643   1.1   thorpej {
   1644   1.1   thorpej 	struct acc_filter *afp;
   1645   1.1   thorpej 	int	i;
   1646   1.1   thorpej 
   1647   1.1   thorpej 	i = ACC_GET_HINDEX(handle);
   1648   1.1   thorpej 
   1649   1.1   thorpej 	LIST_FOREACH(afp, &classifier->acc_filters[i], f_chain)
   1650   1.1   thorpej 		if (afp->f_handle == handle)
   1651   1.1   thorpej 			return (afp);
   1652   1.1   thorpej 
   1653   1.1   thorpej 	return (NULL);
   1654   1.1   thorpej }
   1655   1.1   thorpej 
   1656   1.1   thorpej /* create flowinfo bitmask */
   1657   1.1   thorpej static u_int32_t
   1658  1.16     peter filt2fibmask(struct flow_filter *filt)
   1659   1.1   thorpej {
   1660   1.1   thorpej 	u_int32_t mask = 0;
   1661   1.1   thorpej #ifdef INET6
   1662   1.1   thorpej 	struct flow_filter6 *filt6;
   1663   1.1   thorpej #endif
   1664   1.1   thorpej 
   1665   1.1   thorpej 	switch (filt->ff_flow.fi_family) {
   1666   1.1   thorpej 	case AF_INET:
   1667   1.1   thorpej 		if (filt->ff_flow.fi_proto != 0)
   1668   1.1   thorpej 			mask |= FIMB4_PROTO;
   1669   1.1   thorpej 		if (filt->ff_flow.fi_tos != 0)
   1670   1.1   thorpej 			mask |= FIMB4_TOS;
   1671   1.1   thorpej 		if (filt->ff_flow.fi_dst.s_addr != 0)
   1672   1.1   thorpej 			mask |= FIMB4_DADDR;
   1673   1.1   thorpej 		if (filt->ff_flow.fi_src.s_addr != 0)
   1674   1.1   thorpej 			mask |= FIMB4_SADDR;
   1675   1.1   thorpej 		if (filt->ff_flow.fi_sport != 0)
   1676   1.1   thorpej 			mask |= FIMB4_SPORT;
   1677   1.1   thorpej 		if (filt->ff_flow.fi_dport != 0)
   1678   1.1   thorpej 			mask |= FIMB4_DPORT;
   1679   1.1   thorpej 		if (filt->ff_flow.fi_gpi != 0)
   1680   1.1   thorpej 			mask |= FIMB4_GPI;
   1681   1.1   thorpej 		break;
   1682   1.1   thorpej #ifdef INET6
   1683   1.1   thorpej 	case AF_INET6:
   1684   1.1   thorpej 		filt6 = (struct flow_filter6 *)filt;
   1685   1.1   thorpej 
   1686   1.1   thorpej 		if (filt6->ff_flow6.fi6_proto != 0)
   1687   1.1   thorpej 			mask |= FIMB6_PROTO;
   1688   1.1   thorpej 		if (filt6->ff_flow6.fi6_tclass != 0)
   1689   1.1   thorpej 			mask |= FIMB6_TCLASS;
   1690   1.1   thorpej 		if (!IN6_IS_ADDR_UNSPECIFIED(&filt6->ff_flow6.fi6_dst))
   1691   1.1   thorpej 			mask |= FIMB6_DADDR;
   1692   1.1   thorpej 		if (!IN6_IS_ADDR_UNSPECIFIED(&filt6->ff_flow6.fi6_src))
   1693   1.1   thorpej 			mask |= FIMB6_SADDR;
   1694   1.1   thorpej 		if (filt6->ff_flow6.fi6_sport != 0)
   1695   1.1   thorpej 			mask |= FIMB6_SPORT;
   1696   1.1   thorpej 		if (filt6->ff_flow6.fi6_dport != 0)
   1697   1.1   thorpej 			mask |= FIMB6_DPORT;
   1698   1.1   thorpej 		if (filt6->ff_flow6.fi6_gpi != 0)
   1699   1.1   thorpej 			mask |= FIMB6_GPI;
   1700   1.1   thorpej 		if (filt6->ff_flow6.fi6_flowlabel != 0)
   1701   1.1   thorpej 			mask |= FIMB6_FLABEL;
   1702   1.1   thorpej 		break;
   1703   1.1   thorpej #endif /* INET6 */
   1704   1.1   thorpej 	}
   1705   1.1   thorpej 	return (mask);
   1706   1.1   thorpej }
   1707   1.1   thorpej 
   1708   1.1   thorpej 
   1709   1.1   thorpej /*
   1710   1.1   thorpej  * helper functions to handle IPv4 fragments.
   1711   1.1   thorpej  * currently only in-sequence fragments are handled.
   1712   1.1   thorpej  *	- fragment info is cached in a LRU list.
   1713   1.1   thorpej  *	- when a first fragment is found, cache its flow info.
   1714   1.1   thorpej  *	- when a non-first fragment is found, lookup the cache.
   1715   1.1   thorpej  */
   1716   1.1   thorpej 
   1717   1.1   thorpej struct ip4_frag {
   1718   1.1   thorpej     TAILQ_ENTRY(ip4_frag) ip4f_chain;
   1719   1.1   thorpej     char    ip4f_valid;
   1720   1.1   thorpej     u_short ip4f_id;
   1721   1.1   thorpej     struct flowinfo_in ip4f_info;
   1722   1.1   thorpej };
   1723   1.1   thorpej 
   1724   1.1   thorpej static TAILQ_HEAD(ip4f_list, ip4_frag) ip4f_list; /* IPv4 fragment cache */
   1725   1.1   thorpej 
   1726   1.1   thorpej #define	IP4F_TABSIZE		16	/* IPv4 fragment cache size */
   1727   1.1   thorpej 
   1728   1.1   thorpej 
   1729   1.1   thorpej static void
   1730  1.16     peter ip4f_cache(struct ip *ip, struct flowinfo_in *fin)
   1731   1.1   thorpej {
   1732   1.1   thorpej 	struct ip4_frag *fp;
   1733   1.1   thorpej 
   1734   1.1   thorpej 	if (TAILQ_EMPTY(&ip4f_list)) {
   1735   1.1   thorpej 		/* first time call, allocate fragment cache entries. */
   1736   1.1   thorpej 		if (ip4f_init() < 0)
   1737   1.1   thorpej 			/* allocation failed! */
   1738   1.1   thorpej 			return;
   1739   1.1   thorpej 	}
   1740   1.1   thorpej 
   1741   1.1   thorpej 	fp = ip4f_alloc();
   1742   1.1   thorpej 	fp->ip4f_id = ip->ip_id;
   1743   1.6    itojun 	fp->ip4f_info.fi_proto = ip->ip_p;
   1744   1.6    itojun 	fp->ip4f_info.fi_src.s_addr = ip->ip_src.s_addr;
   1745   1.6    itojun 	fp->ip4f_info.fi_dst.s_addr = ip->ip_dst.s_addr;
   1746   1.1   thorpej 
   1747   1.1   thorpej 	/* save port numbers */
   1748   1.1   thorpej 	fp->ip4f_info.fi_sport = fin->fi_sport;
   1749   1.1   thorpej 	fp->ip4f_info.fi_dport = fin->fi_dport;
   1750   1.1   thorpej 	fp->ip4f_info.fi_gpi   = fin->fi_gpi;
   1751   1.1   thorpej }
   1752   1.1   thorpej 
   1753   1.1   thorpej static int
   1754  1.16     peter ip4f_lookup(struct ip *ip, struct flowinfo_in *fin)
   1755   1.1   thorpej {
   1756   1.1   thorpej 	struct ip4_frag *fp;
   1757   1.1   thorpej 
   1758   1.1   thorpej 	for (fp = TAILQ_FIRST(&ip4f_list); fp != NULL && fp->ip4f_valid;
   1759   1.1   thorpej 	     fp = TAILQ_NEXT(fp, ip4f_chain))
   1760   1.1   thorpej 		if (ip->ip_id == fp->ip4f_id &&
   1761   1.1   thorpej 		    ip->ip_src.s_addr == fp->ip4f_info.fi_src.s_addr &&
   1762   1.1   thorpej 		    ip->ip_dst.s_addr == fp->ip4f_info.fi_dst.s_addr &&
   1763   1.1   thorpej 		    ip->ip_p == fp->ip4f_info.fi_proto) {
   1764   1.1   thorpej 
   1765   1.1   thorpej 			/* found the matching entry */
   1766   1.1   thorpej 			fin->fi_sport = fp->ip4f_info.fi_sport;
   1767   1.1   thorpej 			fin->fi_dport = fp->ip4f_info.fi_dport;
   1768   1.1   thorpej 			fin->fi_gpi   = fp->ip4f_info.fi_gpi;
   1769   1.1   thorpej 
   1770   1.1   thorpej 			if ((ntohs(ip->ip_off) & IP_MF) == 0)
   1771   1.1   thorpej 				/* this is the last fragment,
   1772   1.1   thorpej 				   release the entry. */
   1773   1.1   thorpej 				ip4f_free(fp);
   1774   1.1   thorpej 
   1775   1.1   thorpej 			return (1);
   1776   1.1   thorpej 		}
   1777   1.1   thorpej 
   1778   1.1   thorpej 	/* no matching entry found */
   1779   1.1   thorpej 	return (0);
   1780   1.1   thorpej }
   1781   1.1   thorpej 
   1782   1.1   thorpej static int
   1783   1.1   thorpej ip4f_init(void)
   1784   1.1   thorpej {
   1785   1.1   thorpej 	struct ip4_frag *fp;
   1786   1.1   thorpej 	int i;
   1787   1.8    itojun 
   1788   1.1   thorpej 	TAILQ_INIT(&ip4f_list);
   1789   1.1   thorpej 	for (i=0; i<IP4F_TABSIZE; i++) {
   1790  1.14  christos 		fp = malloc(sizeof(struct ip4_frag), M_DEVBUF, M_NOWAIT);
   1791   1.1   thorpej 		if (fp == NULL) {
   1792   1.1   thorpej 			printf("ip4f_init: can't alloc %dth entry!\n", i);
   1793   1.1   thorpej 			if (i == 0)
   1794   1.1   thorpej 				return (-1);
   1795   1.1   thorpej 			return (0);
   1796   1.1   thorpej 		}
   1797   1.1   thorpej 		fp->ip4f_valid = 0;
   1798   1.1   thorpej 		TAILQ_INSERT_TAIL(&ip4f_list, fp, ip4f_chain);
   1799   1.1   thorpej 	}
   1800   1.1   thorpej 	return (0);
   1801   1.1   thorpej }
   1802   1.1   thorpej 
   1803   1.1   thorpej static struct ip4_frag *
   1804   1.1   thorpej ip4f_alloc(void)
   1805   1.1   thorpej {
   1806   1.1   thorpej 	struct ip4_frag *fp;
   1807   1.1   thorpej 
   1808   1.1   thorpej 	/* reclaim an entry at the tail, put it at the head */
   1809   1.1   thorpej 	fp = TAILQ_LAST(&ip4f_list, ip4f_list);
   1810   1.1   thorpej 	TAILQ_REMOVE(&ip4f_list, fp, ip4f_chain);
   1811   1.1   thorpej 	fp->ip4f_valid = 1;
   1812   1.1   thorpej 	TAILQ_INSERT_HEAD(&ip4f_list, fp, ip4f_chain);
   1813   1.1   thorpej 	return (fp);
   1814   1.1   thorpej }
   1815   1.1   thorpej 
   1816   1.1   thorpej static void
   1817  1.16     peter ip4f_free(struct ip4_frag *fp)
   1818   1.1   thorpej {
   1819   1.1   thorpej 	TAILQ_REMOVE(&ip4f_list, fp, ip4f_chain);
   1820   1.1   thorpej 	fp->ip4f_valid = 0;
   1821   1.1   thorpej 	TAILQ_INSERT_TAIL(&ip4f_list, fp, ip4f_chain);
   1822   1.1   thorpej }
   1823   1.1   thorpej 
   1824  1.16     peter #endif /* ALTQ3_CLFIER_COMPAT */
   1825