Home | History | Annotate | Line # | Download | only in netinet6
ip6_flow.c revision 1.23.2.1
      1  1.23.2.1       snj /*	$NetBSD: ip6_flow.c,v 1.23.2.1 2017/05/12 05:44:10 snj Exp $	*/
      2       1.1  liamjfoy 
      3       1.1  liamjfoy /*-
      4       1.1  liamjfoy  * Copyright (c) 2007 The NetBSD Foundation, Inc.
      5       1.1  liamjfoy  * All rights reserved.
      6       1.1  liamjfoy  *
      7       1.1  liamjfoy  * This code is derived from software contributed to The NetBSD Foundation
      8       1.1  liamjfoy  * by the 3am Software Foundry ("3am").  It was developed by Liam J. Foy
      9       1.1  liamjfoy  * <liamjfoy (at) netbsd.org> and Matt Thomas <matt (at) netbsd.org>.
     10       1.1  liamjfoy  *
     11       1.1  liamjfoy  * Redistribution and use in source and binary forms, with or without
     12       1.1  liamjfoy  * modification, are permitted provided that the following conditions
     13       1.1  liamjfoy  * are met:
     14       1.1  liamjfoy  * 1. Redistributions of source code must retain the above copyright
     15       1.1  liamjfoy  *    notice, this list of conditions and the following disclaimer.
     16       1.1  liamjfoy  * 2. Redistributions in binary form must reproduce the above copyright
     17       1.1  liamjfoy  *    notice, this list of conditions and the following disclaimer in the
     18       1.1  liamjfoy  *    documentation and/or other materials provided with the distribution.
     19       1.1  liamjfoy  *
     20       1.1  liamjfoy  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     21       1.1  liamjfoy  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     22       1.1  liamjfoy  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     23       1.1  liamjfoy  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     24       1.1  liamjfoy  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     25       1.1  liamjfoy  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     26       1.1  liamjfoy  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     27       1.1  liamjfoy  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     28       1.1  liamjfoy  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     29       1.1  liamjfoy  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     30       1.1  liamjfoy  * POSSIBILITY OF SUCH DAMAGE.
     31       1.1  liamjfoy  *
     32       1.1  liamjfoy  * IPv6 version was developed by Liam J. Foy. Original source existed in IPv4
     33       1.1  liamjfoy  * format developed by Matt Thomas. Thanks to Joerg Sonnenberger, Matt
     34       1.1  liamjfoy  * Thomas and Christos Zoulas.
     35       1.1  liamjfoy  *
     36       1.1  liamjfoy  * Thanks to Liverpool John Moores University, especially Dr. David Llewellyn-Jones
     37       1.1  liamjfoy  * for providing resources (to test) and Professor Madjid Merabti.
     38       1.1  liamjfoy  */
     39       1.1  liamjfoy 
     40       1.1  liamjfoy #include <sys/cdefs.h>
     41  1.23.2.1       snj __KERNEL_RCSID(0, "$NetBSD: ip6_flow.c,v 1.23.2.1 2017/05/12 05:44:10 snj Exp $");
     42       1.1  liamjfoy 
     43       1.1  liamjfoy #include <sys/param.h>
     44       1.1  liamjfoy #include <sys/systm.h>
     45       1.1  liamjfoy #include <sys/malloc.h>
     46       1.1  liamjfoy #include <sys/mbuf.h>
     47       1.1  liamjfoy #include <sys/domain.h>
     48       1.1  liamjfoy #include <sys/protosw.h>
     49       1.1  liamjfoy #include <sys/socket.h>
     50       1.1  liamjfoy #include <sys/socketvar.h>
     51       1.1  liamjfoy #include <sys/time.h>
     52       1.1  liamjfoy #include <sys/kernel.h>
     53       1.1  liamjfoy #include <sys/pool.h>
     54       1.1  liamjfoy #include <sys/sysctl.h>
     55  1.23.2.1       snj #include <sys/workqueue.h>
     56       1.1  liamjfoy 
     57       1.1  liamjfoy #include <net/if.h>
     58       1.1  liamjfoy #include <net/if_dl.h>
     59       1.1  liamjfoy #include <net/route.h>
     60       1.1  liamjfoy #include <net/pfil.h>
     61       1.1  liamjfoy 
     62       1.1  liamjfoy #include <netinet/in.h>
     63       1.1  liamjfoy #include <netinet6/in6_var.h>
     64       1.1  liamjfoy #include <netinet/in_systm.h>
     65       1.1  liamjfoy #include <netinet/ip6.h>
     66       1.1  liamjfoy #include <netinet6/ip6_var.h>
     67      1.15   thorpej #include <netinet6/ip6_private.h>
     68       1.1  liamjfoy 
     69       1.1  liamjfoy /*
     70       1.1  liamjfoy  * IPv6 Fast Forward caches/hashes flows from one source to destination.
     71       1.1  liamjfoy  *
     72       1.1  liamjfoy  * Upon a successful forward IPv6FF caches and hashes details such as the
     73       1.1  liamjfoy  * route, source and destination. Once another packet is received matching
     74       1.1  liamjfoy  * the source and destination the packet is forwarded straight onto if_output
     75       1.1  liamjfoy  * using the cached details.
     76       1.1  liamjfoy  *
     77       1.1  liamjfoy  * Example:
     78      1.20  christos  * ether/fddi_input -> ip6flow_fastforward -> if_output
     79       1.1  liamjfoy  */
     80       1.1  liamjfoy 
/* Pool that struct ip6flow entries are allocated from (see ip6flow_poolinit). */
static struct pool ip6flow_pool;

/* List head type used both for the hash buckets and for the global list. */
LIST_HEAD(ip6flowhead, ip6flow);

/*
 * We could use IPv4 defines (IPFLOW_HASHBITS) but we'll
 * use our own (possibly for future expansion).
 *
 * IP6FLOW_TIMER is the value a flow's ip6f_timer is armed with each time
 * the flow is created or used; IP6FLOW_DEFAULT_HASHSIZE is the initial
 * number of hash buckets.
 */
#define	IP6FLOW_TIMER		(5 * PR_SLOWHZ)
#define	IP6FLOW_DEFAULT_HASHSIZE	(1 << IP6FLOW_HASHBITS)

/* Hash table: an array of ip6_hashsize buckets allocated by ip6flow_init. */
static struct ip6flowhead *ip6flowtable = NULL;
/* Every cached flow, linked through ip6f_list regardless of its bucket. */
static struct ip6flowhead ip6flowlist;
/* Number of flow entries currently allocated from ip6flow_pool. */
static int ip6flow_inuse;

/*
 * The periodic expiry scan is deferred to a workqueue: ip6flow_slowtimo
 * enqueues ip6flow_slowtimo_wk and ip6flow_slowtimo_work does the scan.
 */
static void ip6flow_slowtimo_work(struct work *, void *);
static struct workqueue	*ip6flow_slowtimo_wq;
static struct work	ip6flow_slowtimo_wk;

/*
 * Insert an ip6flow into the list.
 * The flow is linked at the head of both its hash bucket and the
 * global ip6flowlist.
 */
#define	IP6FLOW_INSERT(bucket, ip6f) \
do { \
	LIST_INSERT_HEAD((bucket), (ip6f), ip6f_hash); \
	LIST_INSERT_HEAD(&ip6flowlist, (ip6f), ip6f_list); \
} while (/*CONSTCOND*/ 0)

/*
 * Remove an ip6flow from the list.
 * The flow is unlinked from both its hash bucket and the global
 * ip6flowlist; the entry itself is not freed.
 */
#define	IP6FLOW_REMOVE(ip6f) \
do { \
	LIST_REMOVE((ip6f), ip6f_hash); \
	LIST_REMOVE((ip6f), ip6f_list); \
} while (/*CONSTCOND*/ 0)

/* Default flow limit; may be overridden at build time. */
#ifndef IP6FLOW_DEFAULT
#define	IP6FLOW_DEFAULT		256
#endif

/* Maximum number of cached flows; 0 disables flow creation. */
int ip6_maxflows = IP6FLOW_DEFAULT;
/* Current number of buckets in ip6flowtable. */
int ip6_hashsize = IP6FLOW_DEFAULT_HASHSIZE;
    124       1.1  liamjfoy 
    125       1.1  liamjfoy /*
    126       1.1  liamjfoy  * Calculate hash table position.
    127       1.1  liamjfoy  */
    128       1.1  liamjfoy static size_t
    129      1.13    dyoung ip6flow_hash(const struct ip6_hdr *ip6)
    130       1.1  liamjfoy {
    131       1.1  liamjfoy 	size_t hash;
    132       1.1  liamjfoy 	uint32_t dst_sum, src_sum;
    133       1.6  liamjfoy 	size_t idx;
    134       1.1  liamjfoy 
    135       1.1  liamjfoy 	src_sum = ip6->ip6_src.s6_addr32[0] + ip6->ip6_src.s6_addr32[1]
    136       1.1  liamjfoy 	    + ip6->ip6_src.s6_addr32[2] + ip6->ip6_src.s6_addr32[3];
    137       1.1  liamjfoy 	dst_sum = ip6->ip6_dst.s6_addr32[0] + ip6->ip6_dst.s6_addr32[1]
    138       1.1  liamjfoy 	    + ip6->ip6_dst.s6_addr32[2] + ip6->ip6_dst.s6_addr32[3];
    139       1.1  liamjfoy 
    140       1.1  liamjfoy 	hash = ip6->ip6_flow;
    141       1.1  liamjfoy 
    142       1.1  liamjfoy 	for (idx = 0; idx < 32; idx += IP6FLOW_HASHBITS)
    143       1.1  liamjfoy 		hash += (dst_sum >> (32 - idx)) + (src_sum >> idx);
    144       1.1  liamjfoy 
    145       1.4  liamjfoy 	return hash & (ip6_hashsize-1);
    146       1.1  liamjfoy }
    147       1.1  liamjfoy 
    148       1.1  liamjfoy /*
    149       1.1  liamjfoy  * Check to see if a flow already exists - if so return it.
    150       1.1  liamjfoy  */
    151       1.1  liamjfoy static struct ip6flow *
    152      1.13    dyoung ip6flow_lookup(const struct ip6_hdr *ip6)
    153       1.1  liamjfoy {
    154       1.1  liamjfoy 	size_t hash;
    155       1.1  liamjfoy 	struct ip6flow *ip6f;
    156       1.1  liamjfoy 
    157       1.1  liamjfoy 	hash = ip6flow_hash(ip6);
    158       1.1  liamjfoy 
    159       1.2  liamjfoy 	LIST_FOREACH(ip6f, &ip6flowtable[hash], ip6f_hash) {
    160       1.1  liamjfoy 		if (IN6_ARE_ADDR_EQUAL(&ip6->ip6_dst, &ip6f->ip6f_dst)
    161       1.1  liamjfoy 		    && IN6_ARE_ADDR_EQUAL(&ip6->ip6_src, &ip6f->ip6f_src)
    162       1.1  liamjfoy 		    && ip6f->ip6f_flow == ip6->ip6_flow) {
    163       1.1  liamjfoy 		    	/* A cached flow has been found. */
    164       1.1  liamjfoy 			return ip6f;
    165       1.1  liamjfoy 		}
    166       1.1  liamjfoy 	}
    167       1.1  liamjfoy 
    168       1.1  liamjfoy 	return NULL;
    169       1.1  liamjfoy }
    170       1.1  liamjfoy 
    171      1.18  liamjfoy void
    172      1.18  liamjfoy ip6flow_poolinit(void)
    173      1.18  liamjfoy {
    174      1.18  liamjfoy 
    175      1.18  liamjfoy 	pool_init(&ip6flow_pool, sizeof(struct ip6flow), 0, 0, 0, "ip6flowpl",
    176      1.18  liamjfoy 			NULL, IPL_NET);
    177      1.18  liamjfoy }
    178      1.18  liamjfoy 
    179       1.1  liamjfoy /*
    180       1.4  liamjfoy  * Allocate memory and initialise lists. This function is called
    181       1.4  liamjfoy  * from ip6_init and called there after to resize the hash table.
    182       1.4  liamjfoy  * If a newly sized table cannot be malloc'ed we just continue
    183       1.4  liamjfoy  * to use the old one.
    184       1.1  liamjfoy  */
    185       1.4  liamjfoy int
    186       1.4  liamjfoy ip6flow_init(int table_size)
    187       1.1  liamjfoy {
    188       1.4  liamjfoy 	struct ip6flowhead *new_table;
    189       1.1  liamjfoy 	size_t i;
    190  1.23.2.1       snj 	int error;
    191  1.23.2.1       snj 
    192  1.23.2.1       snj 	error = workqueue_create(&ip6flow_slowtimo_wq, "ip6flow_slowtimo",
    193  1.23.2.1       snj 	    ip6flow_slowtimo_work, NULL, PRI_SOFTNET, IPL_NET, WQ_MPSAFE);
    194  1.23.2.1       snj 	if (error != 0)
    195  1.23.2.1       snj 		panic("%s: workqueue_create failed (%d)\n", __func__, error);
    196       1.1  liamjfoy 
    197       1.4  liamjfoy 	new_table = (struct ip6flowhead *)malloc(sizeof(struct ip6flowhead) *
    198       1.4  liamjfoy 	    table_size, M_RTABLE, M_NOWAIT);
    199       1.4  liamjfoy 
    200       1.4  liamjfoy 	if (new_table == NULL)
    201       1.4  liamjfoy 		return 1;
    202       1.4  liamjfoy 
    203       1.4  liamjfoy 	if (ip6flowtable != NULL)
    204       1.4  liamjfoy 		free(ip6flowtable, M_RTABLE);
    205       1.4  liamjfoy 
    206       1.4  liamjfoy 	ip6flowtable = new_table;
    207       1.4  liamjfoy 	ip6_hashsize = table_size;
    208       1.4  liamjfoy 
    209       1.1  liamjfoy 	LIST_INIT(&ip6flowlist);
    210       1.4  liamjfoy 	for (i = 0; i < ip6_hashsize; i++)
    211       1.1  liamjfoy 		LIST_INIT(&ip6flowtable[i]);
    212       1.4  liamjfoy 
    213       1.4  liamjfoy 	return 0;
    214       1.1  liamjfoy }
    215       1.1  liamjfoy 
    216       1.1  liamjfoy /*
    217       1.1  liamjfoy  * IPv6 Fast Forward routine. Attempt to forward the packet -
    218       1.1  liamjfoy  * if any problems are found return to the main IPv6 input
    219       1.1  liamjfoy  * routine to deal with.
    220       1.1  liamjfoy  */
    221       1.1  liamjfoy int
    222      1.20  christos ip6flow_fastforward(struct mbuf **mp)
    223       1.1  liamjfoy {
    224       1.1  liamjfoy 	struct ip6flow *ip6f;
    225       1.1  liamjfoy 	struct ip6_hdr *ip6;
    226       1.1  liamjfoy 	struct rtentry *rt;
    227      1.20  christos 	struct mbuf *m;
    228       1.7    dyoung 	const struct sockaddr *dst;
    229       1.1  liamjfoy 	int error;
    230       1.1  liamjfoy 
    231       1.1  liamjfoy 	/*
    232       1.1  liamjfoy 	 * Are we forwarding packets and have flows?
    233       1.1  liamjfoy 	 */
    234       1.1  liamjfoy 	if (!ip6_forwarding || ip6flow_inuse == 0)
    235       1.1  liamjfoy 		return 0;
    236       1.1  liamjfoy 
    237      1.20  christos 	m = *mp;
    238       1.1  liamjfoy 	/*
    239       1.1  liamjfoy 	 * At least size of IPv6 Header?
    240       1.1  liamjfoy 	 */
    241       1.1  liamjfoy 	if (m->m_len < sizeof(struct ip6_hdr))
    242       1.1  liamjfoy 		return 0;
    243       1.1  liamjfoy 	/*
    244       1.1  liamjfoy 	 * Was packet received as a link-level multicast or broadcast?
    245       1.1  liamjfoy 	 * If so, don't try to fast forward.
    246       1.1  liamjfoy 	 */
    247       1.1  liamjfoy 	if ((m->m_flags & (M_BCAST|M_MCAST)) != 0)
    248       1.1  liamjfoy 		return 0;
    249       1.1  liamjfoy 
    250      1.13    dyoung 	if (IP6_HDR_ALIGNED_P(mtod(m, const void *)) == 0) {
    251       1.1  liamjfoy 		if ((m = m_copyup(m, sizeof(struct ip6_hdr),
    252       1.1  liamjfoy 				(max_linkhdr + 3) & ~3)) == NULL) {
    253       1.1  liamjfoy 			return 0;
    254       1.1  liamjfoy 		}
    255      1.20  christos 		*mp = m;
    256       1.1  liamjfoy 	} else if (__predict_false(m->m_len < sizeof(struct ip6_hdr))) {
    257       1.1  liamjfoy 		if ((m = m_pullup(m, sizeof(struct ip6_hdr))) == NULL) {
    258       1.1  liamjfoy 			return 0;
    259       1.1  liamjfoy 		}
    260      1.20  christos 		*mp = m;
    261       1.1  liamjfoy 	}
    262       1.1  liamjfoy 
    263       1.1  liamjfoy 	ip6 = mtod(m, struct ip6_hdr *);
    264       1.1  liamjfoy 
    265       1.1  liamjfoy 	if ((ip6->ip6_vfc & IPV6_VERSION_MASK) != IPV6_VERSION) {
    266       1.1  liamjfoy 		/* Bad version. */
    267       1.1  liamjfoy 		return 0;
    268       1.1  liamjfoy 	}
    269       1.1  liamjfoy 
    270       1.1  liamjfoy 	/*
    271       1.1  liamjfoy 	 * If we have a hop-by-hop extension we must process it.
    272       1.1  liamjfoy 	 * We just leave this up to ip6_input to deal with.
    273       1.1  liamjfoy 	 */
    274       1.1  liamjfoy 	if (ip6->ip6_nxt == IPPROTO_HOPOPTS)
    275       1.1  liamjfoy 		return 0;
    276       1.1  liamjfoy 
    277       1.1  liamjfoy 	/*
    278       1.1  liamjfoy 	 * Attempt to find a flow.
    279       1.1  liamjfoy 	 */
    280       1.1  liamjfoy 	if ((ip6f = ip6flow_lookup(ip6)) == NULL) {
    281       1.1  liamjfoy 		/* No flow found. */
    282       1.1  liamjfoy 		return 0;
    283       1.1  liamjfoy 	}
    284       1.1  liamjfoy 
    285       1.1  liamjfoy 	/*
    286       1.1  liamjfoy 	 * Route and interface still up?
    287       1.1  liamjfoy 	 */
    288      1.12    dyoung 	if ((rt = rtcache_validate(&ip6f->ip6f_ro)) == NULL ||
    289       1.9    dyoung 	    (rt->rt_ifp->if_flags & IFF_UP) == 0) {
    290       1.1  liamjfoy 	    	/* Route or interface is down */
    291       1.1  liamjfoy 		return 0;
    292       1.1  liamjfoy 	}
    293       1.1  liamjfoy 
    294       1.1  liamjfoy 	/*
    295       1.1  liamjfoy 	 * Packet size greater than MTU?
    296       1.1  liamjfoy 	 */
    297       1.1  liamjfoy 	if (m->m_pkthdr.len > rt->rt_ifp->if_mtu) {
    298       1.1  liamjfoy 		/* Return to main IPv6 input function. */
    299       1.1  liamjfoy 		return 0;
    300       1.1  liamjfoy 	}
    301       1.1  liamjfoy 
    302      1.21   msaitoh 	/*
    303      1.21   msaitoh 	 * Clear any in-bound checksum flags for this packet.
    304      1.21   msaitoh 	 */
    305      1.21   msaitoh 	m->m_pkthdr.csum_flags = 0;
    306      1.21   msaitoh 
    307       1.1  liamjfoy 	if (ip6->ip6_hlim <= IPV6_HLIMDEC)
    308       1.1  liamjfoy 		return 0;
    309       1.1  liamjfoy 
    310       1.1  liamjfoy 	/* Decrement hop limit (same as TTL) */
    311       1.1  liamjfoy 	ip6->ip6_hlim -= IPV6_HLIMDEC;
    312       1.1  liamjfoy 
    313       1.1  liamjfoy 	if (rt->rt_flags & RTF_GATEWAY)
    314       1.7    dyoung 		dst = rt->rt_gateway;
    315       1.1  liamjfoy 	else
    316       1.7    dyoung 		dst = rtcache_getdst(&ip6f->ip6f_ro);
    317       1.1  liamjfoy 
    318       1.1  liamjfoy 	PRT_SLOW_ARM(ip6f->ip6f_timer, IP6FLOW_TIMER);
    319       1.1  liamjfoy 
    320       1.1  liamjfoy 	ip6f->ip6f_uses++;
    321       1.1  liamjfoy 
    322      1.23    bouyer 	KERNEL_LOCK(1, NULL);
    323       1.1  liamjfoy 	/* Send on its way - straight to the interface output routine. */
    324       1.7    dyoung 	if ((error = (*rt->rt_ifp->if_output)(rt->rt_ifp, m, dst, rt)) != 0) {
    325       1.1  liamjfoy 		ip6f->ip6f_dropped++;
    326       1.1  liamjfoy 	} else {
    327       1.1  liamjfoy 		ip6f->ip6f_forwarded++;
    328       1.1  liamjfoy 	}
    329      1.23    bouyer 	KERNEL_UNLOCK_ONE(NULL);
    330       1.1  liamjfoy 	return 1;
    331       1.1  liamjfoy }
    332       1.1  liamjfoy 
    333       1.1  liamjfoy /*
    334       1.1  liamjfoy  * Add the IPv6 flow statistics to the main IPv6 statistics.
    335       1.1  liamjfoy  */
    336       1.1  liamjfoy static void
    337      1.13    dyoung ip6flow_addstats(const struct ip6flow *ip6f)
    338       1.1  liamjfoy {
    339      1.11    dyoung 	struct rtentry *rt;
    340      1.15   thorpej 	uint64_t *ip6s;
    341      1.11    dyoung 
    342      1.12    dyoung 	if ((rt = rtcache_validate(&ip6f->ip6f_ro)) != NULL)
    343      1.11    dyoung 		rt->rt_use += ip6f->ip6f_uses;
    344      1.15   thorpej 	ip6s = IP6_STAT_GETREF();
    345      1.15   thorpej 	ip6s[IP6_STAT_FASTFORWARDFLOWS] = ip6flow_inuse;
    346      1.15   thorpej 	ip6s[IP6_STAT_CANTFORWARD] += ip6f->ip6f_dropped;
    347      1.15   thorpej 	ip6s[IP6_STAT_ODROPPED] += ip6f->ip6f_dropped;
    348      1.15   thorpej 	ip6s[IP6_STAT_TOTAL] += ip6f->ip6f_uses;
    349      1.15   thorpej 	ip6s[IP6_STAT_FORWARD] += ip6f->ip6f_forwarded;
    350      1.15   thorpej 	ip6s[IP6_STAT_FASTFORWARD] += ip6f->ip6f_forwarded;
    351      1.15   thorpej 	IP6_STAT_PUTREF();
    352       1.1  liamjfoy }
    353       1.1  liamjfoy 
    354       1.1  liamjfoy /*
    355       1.1  liamjfoy  * Add statistics and free the flow.
    356       1.1  liamjfoy  */
    357       1.1  liamjfoy static void
    358       1.1  liamjfoy ip6flow_free(struct ip6flow *ip6f)
    359       1.1  liamjfoy {
    360       1.1  liamjfoy 	int s;
    361       1.1  liamjfoy 
    362       1.1  liamjfoy 	/*
    363       1.1  liamjfoy 	 * Remove the flow from the hash table (at elevated IPL).
    364       1.1  liamjfoy 	 * Once it's off the list, we can deal with it at normal
    365       1.1  liamjfoy 	 * network IPL.
    366       1.1  liamjfoy 	 */
    367       1.1  liamjfoy 	s = splnet();
    368       1.1  liamjfoy 	IP6FLOW_REMOVE(ip6f);
    369       1.1  liamjfoy 	splx(s);
    370       1.1  liamjfoy 	ip6flow_inuse--;
    371       1.1  liamjfoy 	ip6flow_addstats(ip6f);
    372       1.7    dyoung 	rtcache_free(&ip6f->ip6f_ro);
    373       1.1  liamjfoy 	pool_put(&ip6flow_pool, ip6f);
    374       1.1  liamjfoy }
    375       1.1  liamjfoy 
    376       1.1  liamjfoy /*
    377       1.1  liamjfoy  * Reap one or more flows - ip6flow_reap may remove
    378       1.1  liamjfoy  * multiple flows if net.inet6.ip6.maxflows is reduced.
    379       1.1  liamjfoy  */
    380       1.1  liamjfoy struct ip6flow *
    381       1.1  liamjfoy ip6flow_reap(int just_one)
    382       1.1  liamjfoy {
    383       1.1  liamjfoy 	while (just_one || ip6flow_inuse > ip6_maxflows) {
    384       1.1  liamjfoy 		struct ip6flow *ip6f, *maybe_ip6f = NULL;
    385       1.1  liamjfoy 		int s;
    386       1.1  liamjfoy 
    387       1.1  liamjfoy 		ip6f = LIST_FIRST(&ip6flowlist);
    388       1.1  liamjfoy 		while (ip6f != NULL) {
    389       1.1  liamjfoy 			/*
    390       1.1  liamjfoy 			 * If this no longer points to a valid route -
    391       1.1  liamjfoy 			 * reclaim it.
    392       1.1  liamjfoy 			 */
    393      1.12    dyoung 			if (rtcache_validate(&ip6f->ip6f_ro) == NULL)
    394       1.1  liamjfoy 				goto done;
    395       1.1  liamjfoy 			/*
    396       1.1  liamjfoy 			 * choose the one that's been least recently
    397       1.1  liamjfoy 			 * used or has had the least uses in the
    398       1.1  liamjfoy 			 * last 1.5 intervals.
    399       1.1  liamjfoy 			 */
    400       1.1  liamjfoy 			if (maybe_ip6f == NULL ||
    401       1.1  liamjfoy 			    ip6f->ip6f_timer < maybe_ip6f->ip6f_timer ||
    402       1.1  liamjfoy 			    (ip6f->ip6f_timer == maybe_ip6f->ip6f_timer &&
    403       1.1  liamjfoy 			     ip6f->ip6f_last_uses + ip6f->ip6f_uses <
    404       1.1  liamjfoy 			         maybe_ip6f->ip6f_last_uses +
    405       1.1  liamjfoy 			         maybe_ip6f->ip6f_uses))
    406       1.1  liamjfoy 				maybe_ip6f = ip6f;
    407       1.1  liamjfoy 			ip6f = LIST_NEXT(ip6f, ip6f_list);
    408       1.1  liamjfoy 		}
    409       1.1  liamjfoy 		ip6f = maybe_ip6f;
    410       1.1  liamjfoy 	    done:
    411       1.1  liamjfoy 		/*
    412       1.1  liamjfoy 		 * Remove the entry from the flow table
    413       1.1  liamjfoy 		 */
    414       1.1  liamjfoy 		s = splnet();
    415       1.1  liamjfoy 		IP6FLOW_REMOVE(ip6f);
    416       1.1  liamjfoy 		splx(s);
    417       1.7    dyoung 		rtcache_free(&ip6f->ip6f_ro);
    418       1.1  liamjfoy 		if (just_one) {
    419       1.1  liamjfoy 			ip6flow_addstats(ip6f);
    420       1.1  liamjfoy 			return ip6f;
    421       1.1  liamjfoy 		}
    422       1.1  liamjfoy 		ip6flow_inuse--;
    423       1.1  liamjfoy 		ip6flow_addstats(ip6f);
    424       1.1  liamjfoy 		pool_put(&ip6flow_pool, ip6f);
    425       1.1  liamjfoy 	}
    426       1.1  liamjfoy 	return NULL;
    427       1.1  liamjfoy }
    428       1.1  liamjfoy 
    429  1.23.2.1       snj static bool ip6flow_work_enqueued = false;
    430  1.23.2.1       snj 
    431       1.1  liamjfoy void
    432  1.23.2.1       snj ip6flow_slowtimo_work(struct work *wk, void *arg)
    433       1.1  liamjfoy {
    434       1.1  liamjfoy 	struct ip6flow *ip6f, *next_ip6f;
    435       1.1  liamjfoy 
    436      1.16        ad 	mutex_enter(softnet_lock);
    437      1.16        ad 	KERNEL_LOCK(1, NULL);
    438      1.16        ad 
    439       1.1  liamjfoy 	for (ip6f = LIST_FIRST(&ip6flowlist); ip6f != NULL; ip6f = next_ip6f) {
    440       1.1  liamjfoy 		next_ip6f = LIST_NEXT(ip6f, ip6f_list);
    441       1.1  liamjfoy 		if (PRT_SLOW_ISEXPIRED(ip6f->ip6f_timer) ||
    442      1.12    dyoung 		    rtcache_validate(&ip6f->ip6f_ro) == NULL) {
    443       1.1  liamjfoy 			ip6flow_free(ip6f);
    444       1.1  liamjfoy 		} else {
    445       1.1  liamjfoy 			ip6f->ip6f_last_uses = ip6f->ip6f_uses;
    446       1.1  liamjfoy 			ip6flow_addstats(ip6f);
    447       1.1  liamjfoy 			ip6f->ip6f_uses = 0;
    448       1.1  liamjfoy 			ip6f->ip6f_dropped = 0;
    449       1.1  liamjfoy 			ip6f->ip6f_forwarded = 0;
    450       1.1  liamjfoy 		}
    451       1.1  liamjfoy 	}
    452  1.23.2.1       snj 	ip6flow_work_enqueued = false;
    453      1.16        ad 
    454      1.16        ad 	KERNEL_UNLOCK_ONE(NULL);
    455      1.16        ad 	mutex_exit(softnet_lock);
    456       1.1  liamjfoy }
    457       1.1  liamjfoy 
    458  1.23.2.1       snj void
    459  1.23.2.1       snj ip6flow_slowtimo(void)
    460  1.23.2.1       snj {
    461  1.23.2.1       snj 
    462  1.23.2.1       snj 	/* Avoid enqueuing another work when one is already enqueued */
    463  1.23.2.1       snj 	KERNEL_LOCK(1, NULL);
    464  1.23.2.1       snj 	if (ip6flow_work_enqueued) {
    465  1.23.2.1       snj 		KERNEL_UNLOCK_ONE(NULL);
    466  1.23.2.1       snj 		return;
    467  1.23.2.1       snj 	}
    468  1.23.2.1       snj 	ip6flow_work_enqueued = true;
    469  1.23.2.1       snj 	KERNEL_UNLOCK_ONE(NULL);
    470  1.23.2.1       snj 
    471  1.23.2.1       snj 	workqueue_enqueue(ip6flow_slowtimo_wq, &ip6flow_slowtimo_wk, NULL);
    472  1.23.2.1       snj }
    473  1.23.2.1       snj 
    474       1.1  liamjfoy /*
    475       1.1  liamjfoy  * We have successfully forwarded a packet using the normal
    476       1.1  liamjfoy  * IPv6 stack. Now create/update a flow.
    477       1.1  liamjfoy  */
    478       1.1  liamjfoy void
    479       1.7    dyoung ip6flow_create(const struct route *ro, struct mbuf *m)
    480       1.1  liamjfoy {
    481      1.13    dyoung 	const struct ip6_hdr *ip6;
    482       1.1  liamjfoy 	struct ip6flow *ip6f;
    483       1.1  liamjfoy 	size_t hash;
    484       1.1  liamjfoy 	int s;
    485       1.1  liamjfoy 
    486      1.13    dyoung 	ip6 = mtod(m, const struct ip6_hdr *);
    487       1.1  liamjfoy 
    488       1.1  liamjfoy 	/*
    489       1.1  liamjfoy 	 * If IPv6 Fast Forward is disabled, don't create a flow.
    490       1.1  liamjfoy 	 * It can be disabled by setting net.inet6.ip6.maxflows to 0.
    491       1.1  liamjfoy 	 *
    492       1.1  liamjfoy 	 * Don't create a flow for ICMPv6 messages.
    493       1.1  liamjfoy 	 */
    494       1.1  liamjfoy 	if (ip6_maxflows == 0 || ip6->ip6_nxt == IPPROTO_IPV6_ICMP)
    495       1.1  liamjfoy 		return;
    496       1.1  liamjfoy 
    497      1.22     pooka 	KERNEL_LOCK(1, NULL);
    498      1.22     pooka 
    499       1.1  liamjfoy 	/*
    500       1.1  liamjfoy 	 * See if an existing flow exists.  If so:
    501       1.1  liamjfoy 	 *	- Remove the flow
    502       1.1  liamjfoy 	 *	- Add flow statistics
    503       1.1  liamjfoy 	 *	- Free the route
    504       1.1  liamjfoy 	 *	- Reset statistics
    505       1.1  liamjfoy 	 *
    506       1.1  liamjfoy 	 * If a flow doesn't exist allocate a new one if
    507       1.1  liamjfoy 	 * ip6_maxflows hasn't reached its limit. If it has
    508       1.1  liamjfoy 	 * been reached, reap some flows.
    509       1.1  liamjfoy 	 */
    510       1.1  liamjfoy 	ip6f = ip6flow_lookup(ip6);
    511       1.1  liamjfoy 	if (ip6f == NULL) {
    512       1.1  liamjfoy 		if (ip6flow_inuse >= ip6_maxflows) {
    513       1.1  liamjfoy 			ip6f = ip6flow_reap(1);
    514       1.1  liamjfoy 		} else {
    515       1.1  liamjfoy 			ip6f = pool_get(&ip6flow_pool, PR_NOWAIT);
    516       1.1  liamjfoy 			if (ip6f == NULL)
    517      1.22     pooka 				goto out;
    518       1.1  liamjfoy 			ip6flow_inuse++;
    519       1.1  liamjfoy 		}
    520       1.1  liamjfoy 		memset(ip6f, 0, sizeof(*ip6f));
    521       1.1  liamjfoy 	} else {
    522       1.1  liamjfoy 		s = splnet();
    523       1.1  liamjfoy 		IP6FLOW_REMOVE(ip6f);
    524       1.1  liamjfoy 		splx(s);
    525       1.1  liamjfoy 		ip6flow_addstats(ip6f);
    526       1.7    dyoung 		rtcache_free(&ip6f->ip6f_ro);
    527       1.1  liamjfoy 		ip6f->ip6f_uses = 0;
    528       1.1  liamjfoy 		ip6f->ip6f_last_uses = 0;
    529       1.1  liamjfoy 		ip6f->ip6f_dropped = 0;
    530       1.1  liamjfoy 		ip6f->ip6f_forwarded = 0;
    531       1.1  liamjfoy 	}
    532       1.1  liamjfoy 
    533       1.1  liamjfoy 	/*
    534       1.1  liamjfoy 	 * Fill in the updated/new details.
    535       1.1  liamjfoy 	 */
    536       1.7    dyoung 	rtcache_copy(&ip6f->ip6f_ro, ro);
    537       1.1  liamjfoy 	ip6f->ip6f_dst = ip6->ip6_dst;
    538       1.1  liamjfoy 	ip6f->ip6f_src = ip6->ip6_src;
    539       1.1  liamjfoy 	ip6f->ip6f_flow = ip6->ip6_flow;
    540       1.1  liamjfoy 	PRT_SLOW_ARM(ip6f->ip6f_timer, IP6FLOW_TIMER);
    541       1.1  liamjfoy 
    542       1.1  liamjfoy 	/*
    543       1.1  liamjfoy 	 * Insert into the approriate bucket of the flow table.
    544       1.1  liamjfoy 	 */
    545       1.1  liamjfoy 	hash = ip6flow_hash(ip6);
    546       1.1  liamjfoy 	s = splnet();
    547       1.1  liamjfoy 	IP6FLOW_INSERT(&ip6flowtable[hash], ip6f);
    548       1.1  liamjfoy 	splx(s);
    549      1.22     pooka 
    550      1.22     pooka  out:
    551      1.22     pooka 	KERNEL_UNLOCK_ONE(NULL);
    552       1.1  liamjfoy }
    553       1.1  liamjfoy 
    554       1.1  liamjfoy /*
    555       1.4  liamjfoy  * Invalidate/remove all flows - if new_size is positive we
    556       1.4  liamjfoy  * resize the hash table.
    557       1.1  liamjfoy  */
    558       1.4  liamjfoy int
    559       1.4  liamjfoy ip6flow_invalidate_all(int new_size)
    560       1.1  liamjfoy {
    561       1.1  liamjfoy 	struct ip6flow *ip6f, *next_ip6f;
    562       1.4  liamjfoy 	int s, error;
    563       1.1  liamjfoy 
    564       1.4  liamjfoy 	error = 0;
    565       1.1  liamjfoy 	s = splnet();
    566       1.1  liamjfoy 	for (ip6f = LIST_FIRST(&ip6flowlist); ip6f != NULL; ip6f = next_ip6f) {
    567       1.1  liamjfoy 		next_ip6f = LIST_NEXT(ip6f, ip6f_list);
    568       1.1  liamjfoy 		ip6flow_free(ip6f);
    569       1.1  liamjfoy 	}
    570       1.4  liamjfoy 
    571       1.4  liamjfoy 	if (new_size)
    572       1.4  liamjfoy 		error = ip6flow_init(new_size);
    573       1.1  liamjfoy 	splx(s);
    574       1.4  liamjfoy 
    575       1.4  liamjfoy 	return error;
    576       1.1  liamjfoy }
    577