npf.c revision 1.7.2.3 1 1.7.2.3 riz /* $NetBSD: npf.c,v 1.7.2.3 2012/07/16 22:13:27 riz Exp $ */
2 1.1 rmind
3 1.1 rmind /*-
4 1.1 rmind * Copyright (c) 2009-2010 The NetBSD Foundation, Inc.
5 1.1 rmind * All rights reserved.
6 1.1 rmind *
7 1.1 rmind * This material is based upon work partially supported by The
8 1.1 rmind * NetBSD Foundation under a contract with Mindaugas Rasiukevicius.
9 1.1 rmind *
10 1.1 rmind * Redistribution and use in source and binary forms, with or without
11 1.1 rmind * modification, are permitted provided that the following conditions
12 1.1 rmind * are met:
13 1.1 rmind * 1. Redistributions of source code must retain the above copyright
14 1.1 rmind * notice, this list of conditions and the following disclaimer.
15 1.1 rmind * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 rmind * notice, this list of conditions and the following disclaimer in the
17 1.1 rmind * documentation and/or other materials provided with the distribution.
18 1.1 rmind *
19 1.1 rmind * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.1 rmind * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.1 rmind * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.1 rmind * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.1 rmind * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.1 rmind * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.1 rmind * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.1 rmind * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.1 rmind * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.1 rmind * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.1 rmind * POSSIBILITY OF SUCH DAMAGE.
30 1.1 rmind */
31 1.1 rmind
32 1.1 rmind /*
33 1.1 rmind * NPF main: dynamic load/initialisation and unload routines.
34 1.1 rmind */
35 1.1 rmind
36 1.1 rmind #include <sys/cdefs.h>
37 1.7.2.3 riz __KERNEL_RCSID(0, "$NetBSD: npf.c,v 1.7.2.3 2012/07/16 22:13:27 riz Exp $");
38 1.1 rmind
39 1.1 rmind #include <sys/param.h>
40 1.1 rmind #include <sys/types.h>
41 1.1 rmind
42 1.2 rmind #include <sys/atomic.h>
43 1.1 rmind #include <sys/conf.h>
44 1.1 rmind #include <sys/kauth.h>
45 1.2 rmind #include <sys/kmem.h>
46 1.1 rmind #include <sys/lwp.h>
47 1.1 rmind #include <sys/module.h>
48 1.2 rmind #include <sys/percpu.h>
49 1.2 rmind #include <sys/rwlock.h>
50 1.1 rmind #include <sys/socketvar.h>
51 1.7.2.2 riz #include <sys/sysctl.h>
52 1.1 rmind #include <sys/uio.h>
53 1.1 rmind
54 1.1 rmind #include "npf_impl.h"
55 1.1 rmind
56 1.1 rmind /*
57 1.1 rmind * Module and device structures.
58 1.1 rmind */
59 1.6 tron MODULE(MODULE_CLASS_DRIVER, npf, NULL);
60 1.1 rmind
61 1.1 rmind void npfattach(int);
62 1.1 rmind
63 1.5 yamt static int npf_fini(void);
64 1.1 rmind static int npf_dev_open(dev_t, int, int, lwp_t *);
65 1.1 rmind static int npf_dev_close(dev_t, int, int, lwp_t *);
66 1.1 rmind static int npf_dev_ioctl(dev_t, u_long, void *, int, lwp_t *);
67 1.1 rmind static int npf_dev_poll(dev_t, int, lwp_t *);
68 1.1 rmind static int npf_dev_read(dev_t, struct uio *, int);
69 1.1 rmind
70 1.2 rmind typedef struct {
71 1.2 rmind npf_ruleset_t * n_rules;
72 1.2 rmind npf_tableset_t * n_tables;
73 1.2 rmind npf_ruleset_t * n_nat_rules;
74 1.7.2.1 riz prop_dictionary_t n_dict;
75 1.7.2.1 riz bool n_default_pass;
76 1.2 rmind } npf_core_t;
77 1.2 rmind
78 1.2 rmind static void npf_core_destroy(npf_core_t *);
79 1.2 rmind static int npfctl_stats(void *);
80 1.2 rmind
81 1.2 rmind static krwlock_t npf_lock __cacheline_aligned;
82 1.2 rmind static npf_core_t * npf_core __cacheline_aligned;
83 1.2 rmind static percpu_t * npf_stats_percpu __read_mostly;
84 1.7.2.2 riz static struct sysctllog * npf_sysctl __read_mostly;
85 1.2 rmind
86 1.1 rmind const struct cdevsw npf_cdevsw = {
87 1.1 rmind npf_dev_open, npf_dev_close, npf_dev_read, nowrite, npf_dev_ioctl,
88 1.1 rmind nostop, notty, npf_dev_poll, nommap, nokqfilter, D_OTHER | D_MPSAFE
89 1.1 rmind };
90 1.1 rmind
91 1.1 rmind static int
92 1.1 rmind npf_init(void)
93 1.1 rmind {
94 1.1 rmind #ifdef _MODULE
95 1.1 rmind devmajor_t bmajor = NODEVMAJOR, cmajor = NODEVMAJOR;
96 1.1 rmind #endif
97 1.2 rmind npf_ruleset_t *rset, *nset;
98 1.2 rmind npf_tableset_t *tset;
99 1.7.2.1 riz prop_dictionary_t dict;
100 1.2 rmind int error = 0;
101 1.2 rmind
102 1.2 rmind rw_init(&npf_lock);
103 1.2 rmind npf_stats_percpu = percpu_alloc(NPF_STATS_SIZE);
104 1.7.2.2 riz npf_sysctl = NULL;
105 1.7.2.2 riz
106 1.2 rmind npf_tableset_sysinit();
107 1.2 rmind npf_session_sysinit();
108 1.1 rmind npf_nat_sysinit();
109 1.1 rmind npf_alg_sysinit();
110 1.2 rmind npflogattach(1);
111 1.2 rmind
112 1.2 rmind /* Load empty configuration. */
113 1.7.2.1 riz dict = prop_dictionary_create();
114 1.2 rmind rset = npf_ruleset_create();
115 1.2 rmind tset = npf_tableset_create();
116 1.2 rmind nset = npf_ruleset_create();
117 1.7.2.1 riz npf_reload(dict, rset, tset, nset, true);
118 1.2 rmind KASSERT(npf_core != NULL);
119 1.1 rmind
120 1.1 rmind #ifdef _MODULE
121 1.1 rmind /* Attach /dev/npf device. */
122 1.1 rmind error = devsw_attach("npf", NULL, &bmajor, &npf_cdevsw, &cmajor);
123 1.1 rmind if (error) {
124 1.2 rmind /* It will call devsw_detach(), which is safe. */
125 1.2 rmind (void)npf_fini();
126 1.1 rmind }
127 1.1 rmind #endif
128 1.1 rmind return error;
129 1.1 rmind }
130 1.1 rmind
131 1.1 rmind static int
132 1.1 rmind npf_fini(void)
133 1.1 rmind {
134 1.1 rmind
135 1.7.2.1 riz /* At first, detach device and remove pfil hooks. */
136 1.1 rmind #ifdef _MODULE
137 1.1 rmind devsw_detach(NULL, &npf_cdevsw);
138 1.1 rmind #endif
139 1.2 rmind npflogdetach();
140 1.7.2.1 riz npf_pfil_unregister();
141 1.2 rmind
142 1.7.2.1 riz /* Flush all sessions, destroy configuration (ruleset, etc). */
143 1.7.2.1 riz npf_session_tracking(false);
144 1.7.2.1 riz npf_core_destroy(npf_core);
145 1.7.2.1 riz
146 1.7.2.1 riz /* Finally, safe to destroy the subsystems. */
147 1.1 rmind npf_alg_sysfini();
148 1.7.2.1 riz npf_nat_sysfini();
149 1.1 rmind npf_session_sysfini();
150 1.1 rmind npf_tableset_sysfini();
151 1.7.2.2 riz
152 1.7.2.2 riz if (npf_sysctl) {
153 1.7.2.2 riz sysctl_teardown(&npf_sysctl);
154 1.7.2.2 riz }
155 1.2 rmind percpu_free(npf_stats_percpu, NPF_STATS_SIZE);
156 1.2 rmind rw_destroy(&npf_lock);
157 1.1 rmind
158 1.1 rmind return 0;
159 1.1 rmind }
160 1.1 rmind
161 1.1 rmind /*
162 1.1 rmind * Module interface.
163 1.1 rmind */
164 1.1 rmind static int
165 1.1 rmind npf_modcmd(modcmd_t cmd, void *arg)
166 1.1 rmind {
167 1.1 rmind
168 1.1 rmind switch (cmd) {
169 1.1 rmind case MODULE_CMD_INIT:
170 1.1 rmind return npf_init();
171 1.1 rmind case MODULE_CMD_FINI:
172 1.1 rmind return npf_fini();
173 1.7.2.3 riz case MODULE_CMD_AUTOUNLOAD:
174 1.7.2.3 riz if (npf_pfil_registered_p() || !npf_default_pass()) {
175 1.7.2.3 riz return EBUSY;
176 1.7.2.3 riz }
177 1.7.2.3 riz break;
178 1.1 rmind default:
179 1.1 rmind return ENOTTY;
180 1.1 rmind }
181 1.1 rmind return 0;
182 1.1 rmind }
183 1.1 rmind
/*
 * npfattach: attach hook.  Nothing to do here; initialisation is
 * performed by npf_init() through the module interface.
 */
void
npfattach(int nunits)
{
	/* Intentionally empty. */
}
190 1.1 rmind
191 1.1 rmind static int
192 1.1 rmind npf_dev_open(dev_t dev, int flag, int mode, lwp_t *l)
193 1.1 rmind {
194 1.1 rmind
195 1.1 rmind /* Available only for super-user. */
196 1.1 rmind if (kauth_authorize_generic(l->l_cred, KAUTH_GENERIC_ISSUSER, NULL)) {
197 1.1 rmind return EPERM;
198 1.1 rmind }
199 1.1 rmind return 0;
200 1.1 rmind }
201 1.1 rmind
202 1.1 rmind static int
203 1.1 rmind npf_dev_close(dev_t dev, int flag, int mode, lwp_t *l)
204 1.1 rmind {
205 1.1 rmind
206 1.1 rmind return 0;
207 1.1 rmind }
208 1.1 rmind
209 1.1 rmind static int
210 1.1 rmind npf_dev_ioctl(dev_t dev, u_long cmd, void *data, int flag, lwp_t *l)
211 1.1 rmind {
212 1.1 rmind int error;
213 1.1 rmind
214 1.1 rmind /* Available only for super-user. */
215 1.1 rmind if (kauth_authorize_generic(l->l_cred, KAUTH_GENERIC_ISSUSER, NULL)) {
216 1.1 rmind return EPERM;
217 1.1 rmind }
218 1.1 rmind
219 1.1 rmind switch (cmd) {
220 1.1 rmind case IOC_NPF_VERSION:
221 1.1 rmind *(int *)data = NPF_VERSION;
222 1.1 rmind error = 0;
223 1.1 rmind break;
224 1.1 rmind case IOC_NPF_SWITCH:
225 1.1 rmind error = npfctl_switch(data);
226 1.1 rmind break;
227 1.1 rmind case IOC_NPF_RELOAD:
228 1.1 rmind error = npfctl_reload(cmd, data);
229 1.1 rmind break;
230 1.7.2.1 riz case IOC_NPF_GETCONF:
231 1.7.2.1 riz error = npfctl_getconf(cmd, data);
232 1.7.2.1 riz break;
233 1.1 rmind case IOC_NPF_TABLE:
234 1.1 rmind error = npfctl_table(data);
235 1.1 rmind break;
236 1.2 rmind case IOC_NPF_STATS:
237 1.2 rmind error = npfctl_stats(data);
238 1.2 rmind break;
239 1.2 rmind case IOC_NPF_SESSIONS_SAVE:
240 1.2 rmind error = npfctl_sessions_save(cmd, data);
241 1.2 rmind break;
242 1.2 rmind case IOC_NPF_SESSIONS_LOAD:
243 1.2 rmind error = npfctl_sessions_load(cmd, data);
244 1.2 rmind break;
245 1.4 rmind case IOC_NPF_UPDATE_RULE:
246 1.4 rmind error = npfctl_update_rule(cmd, data);
247 1.4 rmind break;
248 1.1 rmind default:
249 1.1 rmind error = ENOTTY;
250 1.1 rmind break;
251 1.1 rmind }
252 1.1 rmind return error;
253 1.1 rmind }
254 1.1 rmind
255 1.1 rmind static int
256 1.1 rmind npf_dev_poll(dev_t dev, int events, lwp_t *l)
257 1.1 rmind {
258 1.1 rmind
259 1.1 rmind return ENOTSUP;
260 1.1 rmind }
261 1.1 rmind
262 1.1 rmind static int
263 1.1 rmind npf_dev_read(dev_t dev, struct uio *uio, int flag)
264 1.1 rmind {
265 1.1 rmind
266 1.1 rmind return ENOTSUP;
267 1.1 rmind }
268 1.2 rmind
269 1.2 rmind /*
270 1.2 rmind * NPF core loading/reloading/unloading mechanism.
271 1.2 rmind */
272 1.2 rmind
273 1.2 rmind static void
274 1.2 rmind npf_core_destroy(npf_core_t *nc)
275 1.2 rmind {
276 1.2 rmind
277 1.7.2.1 riz prop_object_release(nc->n_dict);
278 1.2 rmind npf_ruleset_destroy(nc->n_rules);
279 1.2 rmind npf_ruleset_destroy(nc->n_nat_rules);
280 1.3 rmind npf_tableset_destroy(nc->n_tables);
281 1.2 rmind kmem_free(nc, sizeof(npf_core_t));
282 1.2 rmind }
283 1.2 rmind
284 1.2 rmind /*
285 1.2 rmind * npf_reload: atomically load new ruleset, tableset and NAT policies.
286 1.2 rmind * Then destroy old (unloaded) structures.
287 1.2 rmind */
288 1.2 rmind void
289 1.7.2.1 riz npf_reload(prop_dictionary_t dict, npf_ruleset_t *rset,
290 1.7.2.1 riz npf_tableset_t *tset, npf_ruleset_t *nset, bool flush)
291 1.2 rmind {
292 1.2 rmind npf_core_t *nc, *onc;
293 1.2 rmind
294 1.2 rmind /* Setup a new core structure. */
295 1.7.2.1 riz nc = kmem_zalloc(sizeof(npf_core_t), KM_SLEEP);
296 1.2 rmind nc->n_rules = rset;
297 1.2 rmind nc->n_tables = tset;
298 1.2 rmind nc->n_nat_rules = nset;
299 1.7.2.1 riz nc->n_dict = dict;
300 1.7.2.1 riz nc->n_default_pass = flush;
301 1.2 rmind
302 1.2 rmind /* Lock and load the core structure. */
303 1.2 rmind rw_enter(&npf_lock, RW_WRITER);
304 1.2 rmind onc = atomic_swap_ptr(&npf_core, nc);
305 1.2 rmind if (onc) {
306 1.2 rmind /* Reload only necessary NAT policies. */
307 1.2 rmind npf_ruleset_natreload(nset, onc->n_nat_rules);
308 1.2 rmind }
309 1.2 rmind /* Unlock. Everything goes "live" now. */
310 1.2 rmind rw_exit(&npf_lock);
311 1.2 rmind
312 1.2 rmind if (onc) {
313 1.2 rmind /* Destroy unloaded structures. */
314 1.2 rmind npf_core_destroy(onc);
315 1.2 rmind }
316 1.2 rmind }
317 1.2 rmind
318 1.2 rmind void
319 1.2 rmind npf_core_enter(void)
320 1.2 rmind {
321 1.2 rmind rw_enter(&npf_lock, RW_READER);
322 1.2 rmind }
323 1.2 rmind
324 1.2 rmind npf_ruleset_t *
325 1.2 rmind npf_core_ruleset(void)
326 1.2 rmind {
327 1.2 rmind KASSERT(rw_lock_held(&npf_lock));
328 1.2 rmind return npf_core->n_rules;
329 1.2 rmind }
330 1.2 rmind
331 1.2 rmind npf_ruleset_t *
332 1.2 rmind npf_core_natset(void)
333 1.2 rmind {
334 1.2 rmind KASSERT(rw_lock_held(&npf_lock));
335 1.2 rmind return npf_core->n_nat_rules;
336 1.2 rmind }
337 1.2 rmind
338 1.2 rmind npf_tableset_t *
339 1.2 rmind npf_core_tableset(void)
340 1.2 rmind {
341 1.2 rmind KASSERT(rw_lock_held(&npf_lock));
342 1.2 rmind return npf_core->n_tables;
343 1.2 rmind }
344 1.2 rmind
345 1.2 rmind void
346 1.2 rmind npf_core_exit(void)
347 1.2 rmind {
348 1.2 rmind rw_exit(&npf_lock);
349 1.2 rmind }
350 1.2 rmind
351 1.2 rmind bool
352 1.2 rmind npf_core_locked(void)
353 1.2 rmind {
354 1.2 rmind return rw_lock_held(&npf_lock);
355 1.2 rmind }
356 1.2 rmind
357 1.7.2.1 riz prop_dictionary_t
358 1.7.2.1 riz npf_core_dict(void)
359 1.7.2.1 riz {
360 1.7.2.1 riz KASSERT(rw_lock_held(&npf_lock));
361 1.7.2.1 riz return npf_core->n_dict;
362 1.7.2.1 riz }
363 1.7.2.1 riz
364 1.7.2.1 riz bool
365 1.7.2.1 riz npf_default_pass(void)
366 1.7.2.1 riz {
367 1.7.2.1 riz KASSERT(rw_lock_held(&npf_lock));
368 1.7.2.1 riz return npf_core->n_default_pass;
369 1.7.2.1 riz }
370 1.7.2.1 riz
371 1.2 rmind /*
372 1.2 rmind * NPF statistics interface.
373 1.2 rmind */
374 1.2 rmind
375 1.2 rmind void
376 1.2 rmind npf_stats_inc(npf_stats_t st)
377 1.2 rmind {
378 1.2 rmind uint64_t *stats = percpu_getref(npf_stats_percpu);
379 1.2 rmind stats[st]++;
380 1.2 rmind percpu_putref(npf_stats_percpu);
381 1.2 rmind }
382 1.2 rmind
383 1.2 rmind void
384 1.2 rmind npf_stats_dec(npf_stats_t st)
385 1.2 rmind {
386 1.2 rmind uint64_t *stats = percpu_getref(npf_stats_percpu);
387 1.2 rmind stats[st]--;
388 1.2 rmind percpu_putref(npf_stats_percpu);
389 1.2 rmind }
390 1.2 rmind
391 1.2 rmind static void
392 1.2 rmind npf_stats_collect(void *mem, void *arg, struct cpu_info *ci)
393 1.2 rmind {
394 1.2 rmind uint64_t *percpu_stats = mem, *full_stats = arg;
395 1.2 rmind int i;
396 1.2 rmind
397 1.2 rmind for (i = 0; i < NPF_STATS_COUNT; i++) {
398 1.2 rmind full_stats[i] += percpu_stats[i];
399 1.2 rmind }
400 1.2 rmind }
401 1.2 rmind
402 1.2 rmind /*
403 1.2 rmind * npfctl_stats: export collected statistics.
404 1.2 rmind */
405 1.2 rmind static int
406 1.2 rmind npfctl_stats(void *data)
407 1.2 rmind {
408 1.2 rmind uint64_t *fullst, *uptr = *(uint64_t **)data;
409 1.2 rmind int error;
410 1.2 rmind
411 1.2 rmind fullst = kmem_zalloc(NPF_STATS_SIZE, KM_SLEEP);
412 1.2 rmind percpu_foreach(npf_stats_percpu, npf_stats_collect, fullst);
413 1.2 rmind error = copyout(fullst, uptr, NPF_STATS_SIZE);
414 1.2 rmind kmem_free(fullst, NPF_STATS_SIZE);
415 1.2 rmind return error;
416 1.2 rmind }
417