Home | History | Annotate | Line # | Download | only in npf
npf_handler.c revision 1.35
      1  1.34     rmind /*	$NetBSD: npf_handler.c,v 1.35 2016/12/26 23:05:06 christos Exp $	*/
      2   1.1     rmind 
      3   1.1     rmind /*-
      4  1.26     rmind  * Copyright (c) 2009-2013 The NetBSD Foundation, Inc.
      5   1.1     rmind  * All rights reserved.
      6   1.1     rmind  *
      7   1.1     rmind  * This material is based upon work partially supported by The
      8   1.1     rmind  * NetBSD Foundation under a contract with Mindaugas Rasiukevicius.
      9   1.1     rmind  *
     10   1.1     rmind  * Redistribution and use in source and binary forms, with or without
     11   1.1     rmind  * modification, are permitted provided that the following conditions
     12   1.1     rmind  * are met:
     13   1.1     rmind  * 1. Redistributions of source code must retain the above copyright
     14   1.1     rmind  *    notice, this list of conditions and the following disclaimer.
     15   1.1     rmind  * 2. Redistributions in binary form must reproduce the above copyright
     16   1.1     rmind  *    notice, this list of conditions and the following disclaimer in the
     17   1.1     rmind  *    documentation and/or other materials provided with the distribution.
     18   1.1     rmind  *
     19   1.1     rmind  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20   1.1     rmind  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21   1.1     rmind  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22   1.1     rmind  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23   1.1     rmind  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24   1.1     rmind  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25   1.1     rmind  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26   1.1     rmind  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27   1.1     rmind  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28   1.1     rmind  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29   1.1     rmind  * POSSIBILITY OF SUCH DAMAGE.
     30   1.1     rmind  */
     31   1.1     rmind 
     32   1.1     rmind /*
     33   1.1     rmind  * NPF packet handler.
     34  1.28     rmind  *
     35  1.28     rmind  * Note: pfil(9) hooks are currently locked by softnet_lock and kernel-lock.
     36   1.1     rmind  */
     37   1.1     rmind 
     38  1.35  christos #ifdef _KERNEL
     39   1.1     rmind #include <sys/cdefs.h>
     40  1.34     rmind __KERNEL_RCSID(0, "$NetBSD: npf_handler.c,v 1.35 2016/12/26 23:05:06 christos Exp $");
     41   1.1     rmind 
     42  1.14     rmind #include <sys/types.h>
     43   1.1     rmind #include <sys/param.h>
     44   1.1     rmind 
     45   1.1     rmind #include <sys/mbuf.h>
     46   1.1     rmind #include <sys/mutex.h>
     47   1.1     rmind #include <net/if.h>
     48   1.1     rmind #include <net/pfil.h>
     49   1.1     rmind #include <sys/socketvar.h>
     50   1.1     rmind 
     51   1.4     rmind #include <netinet/in_systm.h>
     52   1.4     rmind #include <netinet/in.h>
     53   1.4     rmind #include <netinet/ip_var.h>
     54   1.8    zoltan #include <netinet/ip6.h>
     55   1.8    zoltan #include <netinet6/ip6_var.h>
     56  1.35  christos #endif
     57   1.4     rmind 
     58   1.1     rmind #include "npf_impl.h"
     59  1.31     rmind #include "npf_conn.h"
     60   1.1     rmind 
/*
 * mbuf helpers.
 *
 * In the standalone build, m_freem() is routed through the mbuf
 * operations of the NPF instance.  Note: that expansion refers to a
 * variable named "npf", which must be in scope wherever the macro is
 * used.  m_clear_flag() is a no-op in the standalone build; otherwise
 * it clears the given bits in the m_flags member of the mbuf.
 *
 * Every replacement list is fully parenthesised, so that each macro
 * behaves as a single expression regardless of the surrounding
 * operators.
 */
#if defined(_NPF_STANDALONE)
#define	m_freem(m)		(npf->mbufops->free(m))
#define	m_clear_flag(m,f)	((void)0)
#else
#define	m_clear_flag(m,f)	((m)->m_flags &= ~(f))
#endif

/*
 * Without INET6 there is no IPv6 reassembly: the call is replaced by
 * the ENOTSUP error code and its arguments are not evaluated.
 */
#ifndef INET6
#define ip6_reass_packet(x, y)	(ENOTSUP)
#endif
     71  1.26     rmind 
     72  1.24     rmind static int
     73  1.35  christos npf_reassembly(npf_t *npf, npf_cache_t *npc, struct mbuf **mp)
     74  1.24     rmind {
     75  1.32     rmind 	nbuf_t *nbuf = npc->npc_nbuf;
     76  1.24     rmind 	int error = EINVAL;
     77  1.24     rmind 
     78  1.24     rmind 	/* Reset the mbuf as it may have changed. */
     79  1.24     rmind 	*mp = nbuf_head_mbuf(nbuf);
     80  1.24     rmind 	nbuf_reset(nbuf);
     81  1.24     rmind 
     82  1.24     rmind 	if (npf_iscached(npc, NPC_IP4)) {
     83  1.24     rmind 		struct ip *ip = nbuf_dataptr(nbuf);
     84  1.24     rmind 		error = ip_reass_packet(mp, ip);
     85  1.24     rmind 	} else if (npf_iscached(npc, NPC_IP6)) {
     86  1.24     rmind 		/*
     87  1.24     rmind 		 * Note: ip6_reass_packet() offset is the start of
     88  1.24     rmind 		 * the fragment header.
     89  1.24     rmind 		 */
     90  1.26     rmind 		error = ip6_reass_packet(mp, npc->npc_hlen);
     91  1.25     rmind 		if (error && *mp == NULL) {
     92  1.25     rmind 			memset(nbuf, 0, sizeof(nbuf_t));
     93  1.25     rmind 		}
     94  1.24     rmind 	}
     95  1.24     rmind 	if (error) {
     96  1.35  christos 		npf_stats_inc(npf, NPF_STAT_REASSFAIL);
     97  1.24     rmind 		return error;
     98  1.24     rmind 	}
     99  1.24     rmind 	if (*mp == NULL) {
    100  1.24     rmind 		/* More fragments should come. */
    101  1.35  christos 		npf_stats_inc(npf, NPF_STAT_FRAGMENTS);
    102  1.24     rmind 		return 0;
    103  1.24     rmind 	}
    104  1.24     rmind 
    105  1.24     rmind 	/*
    106  1.24     rmind 	 * Reassembly is complete, we have the final packet.
    107  1.24     rmind 	 * Cache again, since layer 4 data is accessible now.
    108  1.24     rmind 	 */
    109  1.35  christos 	nbuf_init(npf, nbuf, *mp, nbuf->nb_ifp);
    110  1.24     rmind 	npc->npc_info = 0;
    111  1.24     rmind 
    112  1.32     rmind 	if (npf_cache_all(npc) & NPC_IPFRAG) {
    113  1.24     rmind 		return EINVAL;
    114  1.24     rmind 	}
    115  1.35  christos 	npf_stats_inc(npf, NPF_STAT_REASSEMBLY);
    116  1.24     rmind 	return 0;
    117  1.24     rmind }
    118  1.24     rmind 
    119   1.1     rmind /*
    120   1.2     rmind  * npf_packet_handler: main packet handling routine for layer 3.
    121   1.1     rmind  *
    122   1.1     rmind  * Note: packet flow and inspection logic is in strict order.
    123   1.1     rmind  */
    124  1.35  christos __dso_public int
    125  1.35  christos npf_packet_handler(npf_t *npf, struct mbuf **mp, ifnet_t *ifp, int di)
    126   1.1     rmind {
    127  1.24     rmind 	nbuf_t nbuf;
    128   1.1     rmind 	npf_cache_t npc;
    129  1.31     rmind 	npf_conn_t *con;
    130   1.1     rmind 	npf_rule_t *rl;
    131   1.5     rmind 	npf_rproc_t *rp;
    132  1.14     rmind 	int error, retfl;
    133  1.34     rmind 	uint32_t ntag;
    134  1.14     rmind 	int decision;
    135   1.1     rmind 
    136  1.35  christos 	/* QSBR checkpoint. */
    137  1.35  christos 	pserialize_checkpoint(npf->qsbr);
    138  1.35  christos 	KASSERT(ifp != NULL);
    139  1.35  christos 
    140   1.1     rmind 	/*
    141   1.1     rmind 	 * Initialise packet information cache.
    142   1.1     rmind 	 * Note: it is enough to clear the info bits.
    143   1.1     rmind 	 */
    144  1.35  christos 	npc.npc_ctx = npf;
    145  1.35  christos 	nbuf_init(npf, &nbuf, *mp, ifp);
    146  1.32     rmind 	npc.npc_nbuf = &nbuf;
    147   1.1     rmind 	npc.npc_info = 0;
    148  1.32     rmind 
    149  1.14     rmind 	decision = NPF_DECISION_BLOCK;
    150   1.2     rmind 	error = 0;
    151   1.2     rmind 	retfl = 0;
    152   1.5     rmind 	rp = NULL;
    153   1.1     rmind 
    154  1.10     rmind 	/* Cache everything.  Determine whether it is an IP fragment. */
    155  1.32     rmind 	if (__predict_false(npf_cache_all(&npc) & NPC_IPFRAG)) {
    156  1.18     rmind 		/*
    157  1.18     rmind 		 * Pass to IPv4 or IPv6 reassembly mechanism.
    158  1.18     rmind 		 */
    159  1.35  christos 		error = npf_reassembly(npf, &npc, mp);
    160  1.18     rmind 		if (error) {
    161  1.31     rmind 			con = NULL;
    162   1.4     rmind 			goto out;
    163   1.4     rmind 		}
    164   1.4     rmind 		if (*mp == NULL) {
    165   1.4     rmind 			/* More fragments should come; return. */
    166   1.4     rmind 			return 0;
    167   1.4     rmind 		}
    168   1.4     rmind 	}
    169   1.4     rmind 
    170  1.34     rmind 	/* Just pass-through if specially tagged. */
    171  1.34     rmind 	if (nbuf_find_tag(&nbuf, &ntag) == 0 && (ntag & NPF_NTAG_PASS) != 0) {
    172  1.34     rmind 		con = NULL;
    173  1.34     rmind 		goto pass;
    174  1.34     rmind 	}
    175  1.34     rmind 
    176  1.31     rmind 	/* Inspect the list of connections (if found, acquires a reference). */
    177  1.32     rmind 	con = npf_conn_inspect(&npc, di, &error);
    178   1.2     rmind 
    179  1.31     rmind 	/* If "passing" connection found - skip the ruleset inspection. */
    180  1.31     rmind 	if (con && npf_conn_pass(con, &rp)) {
    181  1.35  christos 		npf_stats_inc(npf, NPF_STAT_PASS_CONN);
    182  1.14     rmind 		KASSERT(error == 0);
    183   1.2     rmind 		goto pass;
    184  1.14     rmind 	}
    185  1.32     rmind 	if (__predict_false(error)) {
    186  1.24     rmind 		if (error == ENETUNREACH)
    187  1.24     rmind 			goto block;
    188  1.24     rmind 		goto out;
    189   1.2     rmind 	}
    190   1.1     rmind 
    191   1.7     rmind 	/* Acquire the lock, inspect the ruleset using this packet. */
    192  1.26     rmind 	int slock = npf_config_read_enter();
    193  1.35  christos 	npf_ruleset_t *rlset = npf_config_ruleset(npf);
    194  1.26     rmind 
    195  1.32     rmind 	rl = npf_ruleset_inspect(&npc, rlset, di, NPF_LAYER_3);
    196  1.32     rmind 	if (__predict_false(rl == NULL)) {
    197  1.35  christos 		const bool pass = npf_default_pass(npf);
    198  1.26     rmind 		npf_config_read_exit(slock);
    199  1.14     rmind 
    200  1.26     rmind 		if (pass) {
    201  1.35  christos 			npf_stats_inc(npf, NPF_STAT_PASS_DEFAULT);
    202   1.2     rmind 			goto pass;
    203   1.2     rmind 		}
    204  1.35  christos 		npf_stats_inc(npf, NPF_STAT_BLOCK_DEFAULT);
    205   1.6     rmind 		goto block;
    206   1.1     rmind 	}
    207   1.1     rmind 
    208  1.13     rmind 	/*
    209  1.24     rmind 	 * Get the rule procedure (acquires a reference) for association
    210  1.31     rmind 	 * with a connection (if any) and execution.
    211  1.13     rmind 	 */
    212   1.6     rmind 	KASSERT(rp == NULL);
    213  1.13     rmind 	rp = npf_rule_getrproc(rl);
    214   1.6     rmind 
    215  1.26     rmind 	/* Conclude with the rule and release the lock. */
    216  1.26     rmind 	error = npf_rule_conclude(rl, &retfl);
    217  1.26     rmind 	npf_config_read_exit(slock);
    218  1.26     rmind 
    219   1.2     rmind 	if (error) {
    220  1.35  christos 		npf_stats_inc(npf, NPF_STAT_BLOCK_RULESET);
    221   1.6     rmind 		goto block;
    222   1.1     rmind 	}
    223  1.35  christos 	npf_stats_inc(npf, NPF_STAT_PASS_RULESET);
    224   1.1     rmind 
    225  1.14     rmind 	/*
    226  1.31     rmind 	 * Establish a "pass" connection, if required.  Just proceed if
    227  1.31     rmind 	 * connection creation fails (e.g. due to unsupported protocol).
    228  1.14     rmind 	 */
    229  1.31     rmind 	if ((retfl & NPF_RULE_STATEFUL) != 0 && !con) {
    230  1.32     rmind 		con = npf_conn_establish(&npc, di,
    231  1.29     rmind 		    (retfl & NPF_RULE_MULTIENDS) == 0);
    232  1.31     rmind 		if (con) {
    233  1.26     rmind 			/*
    234  1.26     rmind 			 * Note: the reference on the rule procedure is
    235  1.31     rmind 			 * transfered to the connection.  It will be
    236  1.31     rmind 			 * released on connection destruction.
    237  1.26     rmind 			 */
    238  1.31     rmind 			npf_conn_setpass(con, rp);
    239   1.2     rmind 		}
    240   1.1     rmind 	}
    241   1.2     rmind pass:
    242  1.14     rmind 	decision = NPF_DECISION_PASS;
    243   1.2     rmind 	KASSERT(error == 0);
    244   1.5     rmind 	/*
    245   1.6     rmind 	 * Perform NAT.
    246   1.6     rmind 	 */
    247  1.32     rmind 	error = npf_do_nat(&npc, con, di);
    248   1.6     rmind block:
    249   1.6     rmind 	/*
    250  1.22     rmind 	 * Execute the rule procedure, if any is associated.
    251  1.22     rmind 	 * It may reverse the decision from pass to block.
    252   1.5     rmind 	 */
    253  1.32     rmind 	if (rp && !npf_rproc_run(&npc, rp, &decision)) {
    254  1.31     rmind 		if (con) {
    255  1.31     rmind 			npf_conn_release(con);
    256  1.30  jakllsch 		}
    257  1.30  jakllsch 		npf_rproc_release(rp);
    258  1.30  jakllsch 		*mp = NULL;
    259  1.30  jakllsch 		return 0;
    260   1.5     rmind 	}
    261   1.1     rmind out:
    262  1.13     rmind 	/*
    263  1.31     rmind 	 * Release the reference on a connection.  Release the reference
    264  1.31     rmind 	 * on a rule procedure only if there was no association.
    265  1.13     rmind 	 */
    266  1.31     rmind 	if (con) {
    267  1.31     rmind 		npf_conn_release(con);
    268   1.6     rmind 	} else if (rp) {
    269  1.13     rmind 		npf_rproc_release(rp);
    270   1.1     rmind 	}
    271   1.1     rmind 
    272  1.24     rmind 	/* Reset mbuf pointer before returning to the caller. */
    273  1.24     rmind 	if ((*mp = nbuf_head_mbuf(&nbuf)) == NULL) {
    274  1.25     rmind 		return error ? error : ENOMEM;
    275  1.24     rmind 	}
    276  1.24     rmind 
    277  1.14     rmind 	/* Pass the packet if decided and there is no error. */
    278  1.14     rmind 	if (decision == NPF_DECISION_PASS && !error) {
    279   1.3     rmind 		/*
    280   1.3     rmind 		 * XXX: Disable for now, it will be set accordingly later,
    281   1.3     rmind 		 * for optimisations (to reduce inspection).
    282   1.3     rmind 		 */
    283  1.35  christos 		m_clear_flag(*mp, M_CANFASTFWD);
    284  1.13     rmind 		return 0;
    285   1.1     rmind 	}
    286  1.13     rmind 
    287  1.13     rmind 	/*
    288  1.13     rmind 	 * Block the packet.  ENETUNREACH is used to indicate blocking.
    289  1.13     rmind 	 * Depending on the flags and protocol, return TCP reset (RST) or
    290  1.13     rmind 	 * ICMP destination unreachable.
    291  1.13     rmind 	 */
    292  1.32     rmind 	if (retfl && npf_return_block(&npc, retfl)) {
    293  1.16     rmind 		*mp = NULL;
    294  1.13     rmind 	}
    295  1.16     rmind 
    296  1.20     rmind 	if (!error) {
    297  1.14     rmind 		error = ENETUNREACH;
    298  1.13     rmind 	}
    299  1.13     rmind 
    300  1.16     rmind 	if (*mp) {
    301  1.35  christos 		/* Free the mbuf chain. */
    302  1.16     rmind 		m_freem(*mp);
    303  1.16     rmind 		*mp = NULL;
    304  1.16     rmind 	}
    305   1.1     rmind 	return error;
    306   1.1     rmind }
    307