if_pfsync.c revision 1.1.1.1 1 /* $OpenBSD: if_pfsync.c,v 1.26 2004/03/28 18:14:20 mcbride Exp $ */
2
3 /*
4 * Copyright (c) 2002 Michael Shalayeff
5 * All rights reserved.
6 *
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
9 * are met:
10 * 1. Redistributions of source code must retain the above copyright
11 * notice, this list of conditions and the following disclaimer.
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 *
16 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
17 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
18 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
19 * IN NO EVENT SHALL THE AUTHOR OR HIS RELATIVES BE LIABLE FOR ANY DIRECT,
20 * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
21 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
22 * SERVICES; LOSS OF MIND, USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
24 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
25 * IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
26 * THE POSSIBILITY OF SUCH DAMAGE.
27 */
28
29 #include "bpfilter.h"
30 #include "pfsync.h"
31
32 #include <sys/param.h>
33 #include <sys/proc.h>
34 #include <sys/systm.h>
35 #include <sys/time.h>
36 #include <sys/mbuf.h>
37 #include <sys/socket.h>
38 #include <sys/ioctl.h>
39 #include <sys/timeout.h>
40
41 #include <net/if.h>
42 #include <net/if_types.h>
43 #include <net/route.h>
44 #include <net/bpf.h>
45
46 #ifdef INET
47 #include <netinet/in.h>
48 #include <netinet/in_systm.h>
49 #include <netinet/in_var.h>
50 #include <netinet/ip.h>
51 #include <netinet/ip_var.h>
52 #endif
53
54 #ifdef INET6
55 #ifndef INET
56 #include <netinet/in.h>
57 #endif
58 #include <netinet6/nd6.h>
59 #endif /* INET6 */
60
61 #include <net/pfvar.h>
62 #include <net/if_pfsync.h>
63
/* Smallest MTU accepted by SIOCSIFMTU: one header plus one pf state. */
#define PFSYNC_MINMTU	\
	(sizeof(struct pfsync_header) + sizeof(struct pf_state))

/*
 * Debug output.  The argument is a complete, parenthesized printf()
 * argument list.  Without PFSYNCDEBUG the macro expands to nothing.
 */
#ifndef PFSYNCDEBUG
#define DPRINTF(x)
#else
int	pfsyncdebug;
#define DPRINTF(x)	do { if (pfsyncdebug) printf x ; } while (0)
#endif
73
74 struct pfsync_softc pfsyncif;
75 int pfsync_sync_ok;
76 struct pfsyncstats pfsyncstats;
77
78 void pfsyncattach(int);
79 void pfsync_setmtu(struct pfsync_softc *, int);
80 int pfsync_insert_net_state(struct pfsync_state *);
81 int pfsyncoutput(struct ifnet *, struct mbuf *, struct sockaddr *,
82 struct rtentry *);
83 int pfsyncioctl(struct ifnet *, u_long, caddr_t);
84 void pfsyncstart(struct ifnet *);
85
86 struct mbuf *pfsync_get_mbuf(struct pfsync_softc *, u_int8_t, void **);
87 int pfsync_request_update(struct pfsync_state_upd *, struct in_addr *);
88 int pfsync_sendout(struct pfsync_softc *);
89 void pfsync_timeout(void *);
90 void pfsync_send_bus(struct pfsync_softc *, u_int8_t);
91 void pfsync_bulk_update(void *);
92 void pfsync_bulkfail(void *);
93
94 extern int ifqmaxlen;
95 extern struct timeval time;
96 extern struct timeval mono_time;
97 extern int hz;
98
99 void
100 pfsyncattach(int npfsync)
101 {
102 struct ifnet *ifp;
103
104 pfsync_sync_ok = 1;
105 bzero(&pfsyncif, sizeof(pfsyncif));
106 pfsyncif.sc_mbuf = NULL;
107 pfsyncif.sc_mbuf_net = NULL;
108 pfsyncif.sc_statep.s = NULL;
109 pfsyncif.sc_statep_net.s = NULL;
110 pfsyncif.sc_maxupdates = 128;
111 pfsyncif.sc_sendaddr.s_addr = INADDR_PFSYNC_GROUP;
112 pfsyncif.sc_ureq_received = 0;
113 pfsyncif.sc_ureq_sent = 0;
114 ifp = &pfsyncif.sc_if;
115 strlcpy(ifp->if_xname, "pfsync0", sizeof ifp->if_xname);
116 ifp->if_softc = &pfsyncif;
117 ifp->if_ioctl = pfsyncioctl;
118 ifp->if_output = pfsyncoutput;
119 ifp->if_start = pfsyncstart;
120 ifp->if_type = IFT_PFSYNC;
121 ifp->if_snd.ifq_maxlen = ifqmaxlen;
122 ifp->if_hdrlen = PFSYNC_HDRLEN;
123 pfsync_setmtu(&pfsyncif, MCLBYTES);
124 timeout_set(&pfsyncif.sc_tmo, pfsync_timeout, &pfsyncif);
125 timeout_set(&pfsyncif.sc_bulk_tmo, pfsync_bulk_update, &pfsyncif);
126 timeout_set(&pfsyncif.sc_bulkfail_tmo, pfsync_bulkfail, &pfsyncif);
127 if_attach(ifp);
128 if_alloc_sadl(ifp);
129
130 #if NBPFILTER > 0
131 bpfattach(&pfsyncif.sc_if.if_bpf, ifp, DLT_PFSYNC, PFSYNC_HDRLEN);
132 #endif
133 }
134
135 /*
136 * Start output on the pfsync interface.
137 */
138 void
139 pfsyncstart(struct ifnet *ifp)
140 {
141 struct mbuf *m;
142 int s;
143
144 for (;;) {
145 s = splimp();
146 IF_DROP(&ifp->if_snd);
147 IF_DEQUEUE(&ifp->if_snd, m);
148 splx(s);
149
150 if (m == NULL)
151 return;
152 else
153 m_freem(m);
154 }
155 }
156
157 int
158 pfsync_insert_net_state(struct pfsync_state *sp)
159 {
160 struct pf_state *st = NULL;
161 struct pf_rule *r = NULL;
162 struct pfi_kif *kif;
163
164 if (sp->creatorid == 0 && pf_status.debug >= PF_DEBUG_MISC) {
165 printf("pfsync_insert_net_state: invalid creator id:"
166 " %08x\n", ntohl(sp->creatorid));
167 return (EINVAL);
168 }
169
170 kif = pfi_lookup_create(sp->ifname);
171 if (kif == NULL) {
172 if (pf_status.debug >= PF_DEBUG_MISC)
173 printf("pfsync_insert_net_state: "
174 "unknown interface: %s\n", sp->ifname);
175 /* skip this state */
176 return (0);
177 }
178
179 /*
180 * Just use the default rule until we have infrastructure to find the
181 * best matching rule.
182 */
183 r = &pf_default_rule;
184
185 if (!r->max_states || r->states < r->max_states)
186 st = pool_get(&pf_state_pl, PR_NOWAIT);
187 if (st == NULL) {
188 pfi_maybe_destroy(kif);
189 return (ENOMEM);
190 }
191 bzero(st, sizeof(*st));
192
193 st->rule.ptr = r;
194 /* XXX get pointers to nat_rule and anchor */
195
196 /* fill in the rest of the state entry */
197 pf_state_host_ntoh(&sp->lan, &st->lan);
198 pf_state_host_ntoh(&sp->gwy, &st->gwy);
199 pf_state_host_ntoh(&sp->ext, &st->ext);
200
201 pf_state_peer_ntoh(&sp->src, &st->src);
202 pf_state_peer_ntoh(&sp->dst, &st->dst);
203
204 bcopy(&sp->rt_addr, &st->rt_addr, sizeof(st->rt_addr));
205 st->creation = ntohl(sp->creation) + time.tv_sec;
206 st->expire = ntohl(sp->expire) + time.tv_sec;
207
208 st->af = sp->af;
209 st->proto = sp->proto;
210 st->direction = sp->direction;
211 st->log = sp->log;
212 st->timeout = sp->timeout;
213 st->allow_opts = sp->allow_opts;
214
215 bcopy(sp->id, &st->id, sizeof(st->id));
216 st->creatorid = sp->creatorid;
217 st->sync_flags = sp->sync_flags | PFSTATE_FROMSYNC;
218
219
220 if (pf_insert_state(kif, st)) {
221 pfi_maybe_destroy(kif);
222 pool_put(&pf_state_pl, st);
223 return (EINVAL);
224 }
225
226 return (0);
227 }
228
229 void
230 pfsync_input(struct mbuf *m, ...)
231 {
232 struct ip *ip = mtod(m, struct ip *);
233 struct pfsync_header *ph;
234 struct pfsync_softc *sc = &pfsyncif;
235 struct pf_state *st, key;
236 struct pfsync_state *sp;
237 struct pfsync_state_upd *up;
238 struct pfsync_state_del *dp;
239 struct pfsync_state_clr *cp;
240 struct pfsync_state_upd_req *rup;
241 struct pfsync_state_bus *bus;
242 struct in_addr src;
243 struct mbuf *mp;
244 int iplen, action, error, i, s, count, offp;
245
246 pfsyncstats.pfsyncs_ipackets++;
247
248 /* verify that we have a sync interface configured */
249 if (!sc->sc_sync_ifp || !pf_status.running)
250 goto done;
251
252 /* verify that the packet came in on the right interface */
253 if (sc->sc_sync_ifp != m->m_pkthdr.rcvif) {
254 pfsyncstats.pfsyncs_badif++;
255 goto done;
256 }
257
258 /* verify that the IP TTL is 255. */
259 if (ip->ip_ttl != PFSYNC_DFLTTL) {
260 pfsyncstats.pfsyncs_badttl++;
261 goto done;
262 }
263
264 iplen = ip->ip_hl << 2;
265
266 if (m->m_pkthdr.len < iplen + sizeof(*ph)) {
267 pfsyncstats.pfsyncs_hdrops++;
268 goto done;
269 }
270
271 if (iplen + sizeof(*ph) > m->m_len) {
272 if ((m = m_pullup(m, iplen + sizeof(*ph))) == NULL) {
273 pfsyncstats.pfsyncs_hdrops++;
274 goto done;
275 }
276 ip = mtod(m, struct ip *);
277 }
278 ph = (struct pfsync_header *)((char *)ip + iplen);
279
280 /* verify the version */
281 if (ph->version != PFSYNC_VERSION) {
282 pfsyncstats.pfsyncs_badver++;
283 goto done;
284 }
285
286 action = ph->action;
287 count = ph->count;
288
289 /* make sure it's a valid action code */
290 if (action >= PFSYNC_ACT_MAX) {
291 pfsyncstats.pfsyncs_badact++;
292 goto done;
293 }
294
295 /* Cheaper to grab this now than having to mess with mbufs later */
296 src = ip->ip_src;
297
298 switch (action) {
299 case PFSYNC_ACT_CLR: {
300 struct pfi_kif *kif;
301 u_int32_t creatorid;
302 if ((mp = m_pulldown(m, iplen + sizeof(*ph),
303 sizeof(*cp), &offp)) == NULL) {
304 pfsyncstats.pfsyncs_badlen++;
305 return;
306 }
307 cp = (struct pfsync_state_clr *)(mp->m_data + offp);
308 creatorid = cp->creatorid;
309
310 s = splsoftnet();
311 if (cp->ifname[0] == '\0') {
312 RB_FOREACH(st, pf_state_tree_id, &tree_id) {
313 if (st->creatorid == creatorid)
314 st->timeout = PFTM_PURGE;
315 }
316 } else {
317 kif = pfi_lookup_if(cp->ifname);
318 if (kif == NULL) {
319 if (pf_status.debug >= PF_DEBUG_MISC)
320 printf("pfsync_input: PFSYNC_ACT_CLR "
321 "bad interface: %s\n", cp->ifname);
322 splx(s);
323 goto done;
324 }
325 RB_FOREACH(st, pf_state_tree_lan_ext,
326 &kif->pfik_lan_ext) {
327 if (st->creatorid == creatorid)
328 st->timeout = PFTM_PURGE;
329 }
330 }
331 pf_purge_expired_states();
332 splx(s);
333
334 break;
335 }
336 case PFSYNC_ACT_INS:
337 if ((mp = m_pulldown(m, iplen + sizeof(*ph),
338 count * sizeof(*sp), &offp)) == NULL) {
339 pfsyncstats.pfsyncs_badlen++;
340 return;
341 }
342
343 s = splsoftnet();
344 for (i = 0, sp = (struct pfsync_state *)(mp->m_data + offp);
345 i < count; i++, sp++) {
346 /* check for invalid values */
347 if (sp->timeout >= PFTM_MAX ||
348 sp->src.state > PF_TCPS_PROXY_DST ||
349 sp->dst.state > PF_TCPS_PROXY_DST ||
350 sp->direction > PF_OUT ||
351 (sp->af != AF_INET && sp->af != AF_INET6)) {
352 if (pf_status.debug >= PF_DEBUG_MISC)
353 printf("pfsync_insert: PFSYNC_ACT_INS: "
354 "invalid value\n");
355 pfsyncstats.pfsyncs_badstate++;
356 continue;
357 }
358
359 if ((error = pfsync_insert_net_state(sp))) {
360 if (error == ENOMEM) {
361 splx(s);
362 goto done;
363 }
364 continue;
365 }
366 }
367 splx(s);
368 break;
369 case PFSYNC_ACT_UPD:
370 if ((mp = m_pulldown(m, iplen + sizeof(*ph),
371 count * sizeof(*sp), &offp)) == NULL) {
372 pfsyncstats.pfsyncs_badlen++;
373 return;
374 }
375
376 s = splsoftnet();
377 for (i = 0, sp = (struct pfsync_state *)(mp->m_data + offp);
378 i < count; i++, sp++) {
379 /* check for invalid values */
380 if (sp->timeout >= PFTM_MAX ||
381 sp->src.state > PF_TCPS_PROXY_DST ||
382 sp->dst.state > PF_TCPS_PROXY_DST) {
383 if (pf_status.debug >= PF_DEBUG_MISC)
384 printf("pfsync_insert: PFSYNC_ACT_UPD: "
385 "invalid value\n");
386 pfsyncstats.pfsyncs_badstate++;
387 continue;
388 }
389
390 bcopy(sp->id, &key.id, sizeof(key.id));
391 key.creatorid = sp->creatorid;
392
393 st = pf_find_state_byid(&key);
394 if (st == NULL) {
395 /* insert the update */
396 if (pfsync_insert_net_state(sp))
397 pfsyncstats.pfsyncs_badstate++;
398 continue;
399 }
400 pf_state_peer_ntoh(&sp->src, &st->src);
401 pf_state_peer_ntoh(&sp->dst, &st->dst);
402 st->expire = ntohl(sp->expire) + time.tv_sec;
403 st->timeout = sp->timeout;
404
405 }
406 splx(s);
407 break;
408 /*
409 * It's not strictly necessary for us to support the "uncompressed"
410 * delete action, but it's relatively simple and maintains consistency.
411 */
412 case PFSYNC_ACT_DEL:
413 if ((mp = m_pulldown(m, iplen + sizeof(*ph),
414 count * sizeof(*sp), &offp)) == NULL) {
415 pfsyncstats.pfsyncs_badlen++;
416 return;
417 }
418
419 s = splsoftnet();
420 for (i = 0, sp = (struct pfsync_state *)(mp->m_data + offp);
421 i < count; i++, sp++) {
422 bcopy(sp->id, &key.id, sizeof(key.id));
423 key.creatorid = sp->creatorid;
424
425 st = pf_find_state_byid(&key);
426 if (st == NULL) {
427 pfsyncstats.pfsyncs_badstate++;
428 continue;
429 }
430 /*
431 * XXX
432 * pf_purge_expired_states() is expensive,
433 * we really want to purge the state directly.
434 */
435 st->timeout = PFTM_PURGE;
436 st->sync_flags |= PFSTATE_FROMSYNC;
437 }
438 pf_purge_expired_states();
439 splx(s);
440 break;
441 case PFSYNC_ACT_UPD_C: {
442 int update_requested = 0;
443
444 if ((mp = m_pulldown(m, iplen + sizeof(*ph),
445 count * sizeof(*up), &offp)) == NULL) {
446 pfsyncstats.pfsyncs_badlen++;
447 return;
448 }
449
450 s = splsoftnet();
451 for (i = 0, up = (struct pfsync_state_upd *)(mp->m_data + offp);
452 i < count; i++, up++) {
453 /* check for invalid values */
454 if (up->timeout >= PFTM_MAX ||
455 up->src.state > PF_TCPS_PROXY_DST ||
456 up->dst.state > PF_TCPS_PROXY_DST) {
457 if (pf_status.debug >= PF_DEBUG_MISC)
458 printf("pfsync_insert: "
459 "PFSYNC_ACT_UPD_C: "
460 "invalid value\n");
461 pfsyncstats.pfsyncs_badstate++;
462 continue;
463 }
464
465 bcopy(up->id, &key.id, sizeof(key.id));
466 key.creatorid = up->creatorid;
467
468 st = pf_find_state_byid(&key);
469 if (st == NULL) {
470 /* We don't have this state. Ask for it. */
471 pfsync_request_update(up, &src);
472 update_requested = 1;
473 pfsyncstats.pfsyncs_badstate++;
474 continue;
475 }
476 pf_state_peer_ntoh(&up->src, &st->src);
477 pf_state_peer_ntoh(&up->dst, &st->dst);
478 st->expire = ntohl(up->expire) + time.tv_sec;
479 st->timeout = up->timeout;
480 }
481 if (update_requested)
482 pfsync_sendout(sc);
483 splx(s);
484 break;
485 }
486 case PFSYNC_ACT_DEL_C:
487 if ((mp = m_pulldown(m, iplen + sizeof(*ph),
488 count * sizeof(*dp), &offp)) == NULL) {
489 pfsyncstats.pfsyncs_badlen++;
490 return;
491 }
492
493 s = splsoftnet();
494 for (i = 0, dp = (struct pfsync_state_del *)(mp->m_data + offp);
495 i < count; i++, dp++) {
496 bcopy(dp->id, &key.id, sizeof(key.id));
497 key.creatorid = dp->creatorid;
498
499 st = pf_find_state_byid(&key);
500 if (st == NULL) {
501 pfsyncstats.pfsyncs_badstate++;
502 continue;
503 }
504 /*
505 * XXX
506 * pf_purge_expired_states() is expensive,
507 * we really want to purge the state directly.
508 */
509 st->timeout = PFTM_PURGE;
510 st->sync_flags |= PFSTATE_FROMSYNC;
511 }
512 pf_purge_expired_states();
513 splx(s);
514 break;
515 case PFSYNC_ACT_INS_F:
516 case PFSYNC_ACT_DEL_F:
517 /* not implemented */
518 break;
519 case PFSYNC_ACT_UREQ:
520 if ((mp = m_pulldown(m, iplen + sizeof(*ph),
521 count * sizeof(*rup), &offp)) == NULL) {
522 pfsyncstats.pfsyncs_badlen++;
523 return;
524 }
525
526 s = splsoftnet();
527 /* XXX send existing. pfsync_pack_state should handle this. */
528 if (sc->sc_mbuf != NULL)
529 pfsync_sendout(sc);
530 for (i = 0,
531 rup = (struct pfsync_state_upd_req *)(mp->m_data + offp);
532 i < count; i++, rup++) {
533 bcopy(rup->id, &key.id, sizeof(key.id));
534 key.creatorid = rup->creatorid;
535
536 if (key.id == 0 && key.creatorid == 0) {
537 sc->sc_ureq_received = mono_time.tv_sec;
538 if (pf_status.debug >= PF_DEBUG_MISC)
539 printf("pfsync: received "
540 "bulk update request\n");
541 pfsync_send_bus(sc, PFSYNC_BUS_START);
542 timeout_add(&sc->sc_bulk_tmo, 1 * hz);
543 } else {
544 st = pf_find_state_byid(&key);
545 if (st == NULL) {
546 pfsyncstats.pfsyncs_badstate++;
547 continue;
548 }
549 pfsync_pack_state(PFSYNC_ACT_UPD, st, 0);
550 }
551 }
552 if (sc->sc_mbuf != NULL)
553 pfsync_sendout(sc);
554 splx(s);
555 break;
556 case PFSYNC_ACT_BUS:
557 /* If we're not waiting for a bulk update, who cares. */
558 if (sc->sc_ureq_sent == 0)
559 break;
560
561 if ((mp = m_pulldown(m, iplen + sizeof(*ph),
562 sizeof(*bus), &offp)) == NULL) {
563 pfsyncstats.pfsyncs_badlen++;
564 return;
565 }
566 bus = (struct pfsync_state_bus *)(mp->m_data + offp);
567 switch (bus->status) {
568 case PFSYNC_BUS_START:
569 timeout_add(&sc->sc_bulkfail_tmo,
570 pf_pool_limits[PF_LIMIT_STATES].limit /
571 (PFSYNC_BULKPACKETS * sc->sc_maxcount));
572 if (pf_status.debug >= PF_DEBUG_MISC)
573 printf("pfsync: received bulk "
574 "update start\n");
575 break;
576 case PFSYNC_BUS_END:
577 if (mono_time.tv_sec - ntohl(bus->endtime) >=
578 sc->sc_ureq_sent) {
579 /* that's it, we're happy */
580 sc->sc_ureq_sent = 0;
581 sc->sc_bulk_tries = 0;
582 timeout_del(&sc->sc_bulkfail_tmo);
583 pfsync_sync_ok = 1;
584 if (pf_status.debug >= PF_DEBUG_MISC)
585 printf("pfsync: received valid "
586 "bulk update end\n");
587 } else {
588 if (pf_status.debug >= PF_DEBUG_MISC)
589 printf("pfsync: received invalid "
590 "bulk update end: bad timestamp\n");
591 }
592 break;
593 }
594 break;
595 }
596
597 done:
598 if (m)
599 m_freem(m);
600 }
601
/*
 * if_output handler.  Packets handed to the interface output path are not
 * transmitted: the mbuf chain is freed and 0 is returned.
 */
/* ARGSUSED */
int
pfsyncoutput(struct ifnet *ifp, struct mbuf *m, struct sockaddr *dst,
    struct rtentry *rt)
{
	m_freem(m);

	return (0);
}
609
610 /* ARGSUSED */
611 int
612 pfsyncioctl(struct ifnet *ifp, u_long cmd, caddr_t data)
613 {
614 struct proc *p = curproc;
615 struct pfsync_softc *sc = ifp->if_softc;
616 struct ifreq *ifr = (struct ifreq *)data;
617 struct ip_moptions *imo = &sc->sc_imo;
618 struct pfsyncreq pfsyncr;
619 struct ifnet *sifp;
620 int s, error;
621
622 switch (cmd) {
623 case SIOCSIFADDR:
624 case SIOCAIFADDR:
625 case SIOCSIFDSTADDR:
626 case SIOCSIFFLAGS:
627 if (ifp->if_flags & IFF_UP)
628 ifp->if_flags |= IFF_RUNNING;
629 else
630 ifp->if_flags &= ~IFF_RUNNING;
631 break;
632 case SIOCSIFMTU:
633 if (ifr->ifr_mtu < PFSYNC_MINMTU)
634 return (EINVAL);
635 if (ifr->ifr_mtu > MCLBYTES)
636 ifr->ifr_mtu = MCLBYTES;
637 s = splnet();
638 if (ifr->ifr_mtu < ifp->if_mtu)
639 pfsync_sendout(sc);
640 pfsync_setmtu(sc, ifr->ifr_mtu);
641 splx(s);
642 break;
643 case SIOCGETPFSYNC:
644 bzero(&pfsyncr, sizeof(pfsyncr));
645 if (sc->sc_sync_ifp)
646 strlcpy(pfsyncr.pfsyncr_syncif,
647 sc->sc_sync_ifp->if_xname, IFNAMSIZ);
648 pfsyncr.pfsyncr_maxupdates = sc->sc_maxupdates;
649 if ((error = copyout(&pfsyncr, ifr->ifr_data, sizeof(pfsyncr))))
650 return (error);
651 break;
652 case SIOCSETPFSYNC:
653 if ((error = suser(p, p->p_acflag)) != 0)
654 return (error);
655 if ((error = copyin(ifr->ifr_data, &pfsyncr, sizeof(pfsyncr))))
656 return (error);
657
658 if (pfsyncr.pfsyncr_maxupdates > 255)
659 return (EINVAL);
660 sc->sc_maxupdates = pfsyncr.pfsyncr_maxupdates;
661
662 if (pfsyncr.pfsyncr_syncif[0] == 0) {
663 sc->sc_sync_ifp = NULL;
664 if (sc->sc_mbuf_net != NULL) {
665 /* Don't keep stale pfsync packets around. */
666 s = splnet();
667 m_freem(sc->sc_mbuf_net);
668 sc->sc_mbuf_net = NULL;
669 sc->sc_statep_net.s = NULL;
670 splx(s);
671 }
672 break;
673 }
674 if ((sifp = ifunit(pfsyncr.pfsyncr_syncif)) == NULL)
675 return (EINVAL);
676 else if (sifp == sc->sc_sync_ifp)
677 break;
678
679 s = splnet();
680 if (sifp->if_mtu < sc->sc_if.if_mtu ||
681 (sc->sc_sync_ifp != NULL &&
682 sifp->if_mtu < sc->sc_sync_ifp->if_mtu) ||
683 sifp->if_mtu < MCLBYTES - sizeof(struct ip))
684 pfsync_sendout(sc);
685 sc->sc_sync_ifp = sifp;
686
687 pfsync_setmtu(sc, sc->sc_if.if_mtu);
688
689 if (imo->imo_num_memberships > 0) {
690 in_delmulti(imo->imo_membership[--imo->imo_num_memberships]);
691 imo->imo_multicast_ifp = NULL;
692 }
693
694 if (sc->sc_sync_ifp) {
695 struct in_addr addr;
696
697 addr.s_addr = INADDR_PFSYNC_GROUP;
698 if ((imo->imo_membership[0] =
699 in_addmulti(&addr, sc->sc_sync_ifp)) == NULL) {
700 splx(s);
701 return (ENOBUFS);
702 }
703 imo->imo_num_memberships++;
704 imo->imo_multicast_ifp = sc->sc_sync_ifp;
705 imo->imo_multicast_ttl = PFSYNC_DFLTTL;
706 imo->imo_multicast_loop = 0;
707
708 /* Request a full state table update. */
709 sc->sc_ureq_sent = mono_time.tv_sec;
710 pfsync_sync_ok = 0;
711 if (pf_status.debug >= PF_DEBUG_MISC)
712 printf("pfsync: requesting bulk update\n");
713 timeout_add(&sc->sc_bulkfail_tmo, 5 * hz);
714 pfsync_request_update(NULL, NULL);
715 pfsync_sendout(sc);
716 }
717 splx(s);
718
719 break;
720
721 default:
722 return (ENOTTY);
723 }
724
725 return (0);
726 }
727
728 void
729 pfsync_setmtu(struct pfsync_softc *sc, int mtu_req)
730 {
731 int mtu;
732
733 if (sc->sc_sync_ifp && sc->sc_sync_ifp->if_mtu < mtu_req)
734 mtu = sc->sc_sync_ifp->if_mtu;
735 else
736 mtu = mtu_req;
737
738 sc->sc_maxcount = (mtu - sizeof(struct pfsync_header)) /
739 sizeof(struct pfsync_state);
740 if (sc->sc_maxcount > 254)
741 sc->sc_maxcount = 254;
742 sc->sc_if.if_mtu = sizeof(struct pfsync_header) +
743 sc->sc_maxcount * sizeof(struct pfsync_state);
744 }
745
746 struct mbuf *
747 pfsync_get_mbuf(struct pfsync_softc *sc, u_int8_t action, void **sp)
748 {
749 struct pfsync_header *h;
750 struct mbuf *m;
751 int len;
752
753 MGETHDR(m, M_DONTWAIT, MT_DATA);
754 if (m == NULL) {
755 sc->sc_if.if_oerrors++;
756 return (NULL);
757 }
758
759 switch (action) {
760 case PFSYNC_ACT_CLR:
761 len = sizeof(struct pfsync_header) +
762 sizeof(struct pfsync_state_clr);
763 break;
764 case PFSYNC_ACT_UPD_C:
765 len = (sc->sc_maxcount * sizeof(struct pfsync_state_upd)) +
766 sizeof(struct pfsync_header);
767 break;
768 case PFSYNC_ACT_DEL_C:
769 len = (sc->sc_maxcount * sizeof(struct pfsync_state_del)) +
770 sizeof(struct pfsync_header);
771 break;
772 case PFSYNC_ACT_UREQ:
773 len = (sc->sc_maxcount * sizeof(struct pfsync_state_upd_req)) +
774 sizeof(struct pfsync_header);
775 break;
776 case PFSYNC_ACT_BUS:
777 len = sizeof(struct pfsync_header) +
778 sizeof(struct pfsync_state_bus);
779 break;
780 default:
781 len = (sc->sc_maxcount * sizeof(struct pfsync_state)) +
782 sizeof(struct pfsync_header);
783 break;
784 }
785
786 if (len > MHLEN) {
787 MCLGET(m, M_DONTWAIT);
788 if ((m->m_flags & M_EXT) == 0) {
789 m_free(m);
790 sc->sc_if.if_oerrors++;
791 return (NULL);
792 }
793 m->m_data += (MCLBYTES - len) &~ (sizeof(long) - 1);
794 } else
795 MH_ALIGN(m, len);
796
797 m->m_pkthdr.rcvif = NULL;
798 m->m_pkthdr.len = m->m_len = sizeof(struct pfsync_header);
799 h = mtod(m, struct pfsync_header *);
800 h->version = PFSYNC_VERSION;
801 h->af = 0;
802 h->count = 0;
803 h->action = action;
804
805 *sp = (void *)((char *)h + PFSYNC_HDRLEN);
806 timeout_add(&sc->sc_tmo, hz);
807 return (m);
808 }
809
810 int
811 pfsync_pack_state(u_int8_t action, struct pf_state *st, int compress)
812 {
813 struct ifnet *ifp = &pfsyncif.sc_if;
814 struct pfsync_softc *sc = ifp->if_softc;
815 struct pfsync_header *h, *h_net;
816 struct pfsync_state *sp = NULL;
817 struct pfsync_state_upd *up = NULL;
818 struct pfsync_state_del *dp = NULL;
819 struct pf_rule *r;
820 u_long secs;
821 int s, ret = 0;
822 u_int8_t i = 255, newaction = 0;
823
824 /*
825 * If a packet falls in the forest and there's nobody around to
826 * hear, does it make a sound?
827 */
828 if (ifp->if_bpf == NULL && sc->sc_sync_ifp == NULL) {
829 /* Don't leave any stale pfsync packets hanging around. */
830 if (sc->sc_mbuf != NULL) {
831 m_freem(sc->sc_mbuf);
832 sc->sc_mbuf = NULL;
833 sc->sc_statep.s = NULL;
834 }
835 return (0);
836 }
837
838 if (action >= PFSYNC_ACT_MAX)
839 return (EINVAL);
840
841 s = splnet();
842 if (sc->sc_mbuf == NULL) {
843 if ((sc->sc_mbuf = pfsync_get_mbuf(sc, action,
844 (void *)&sc->sc_statep.s)) == NULL) {
845 splx(s);
846 return (ENOMEM);
847 }
848 h = mtod(sc->sc_mbuf, struct pfsync_header *);
849 } else {
850 h = mtod(sc->sc_mbuf, struct pfsync_header *);
851 if (h->action != action) {
852 pfsync_sendout(sc);
853 if ((sc->sc_mbuf = pfsync_get_mbuf(sc, action,
854 (void *)&sc->sc_statep.s)) == NULL) {
855 splx(s);
856 return (ENOMEM);
857 }
858 h = mtod(sc->sc_mbuf, struct pfsync_header *);
859 } else {
860 /*
861 * If it's an update, look in the packet to see if
862 * we already have an update for the state.
863 */
864 if (action == PFSYNC_ACT_UPD && sc->sc_maxupdates) {
865 struct pfsync_state *usp =
866 (void *)((char *)h + PFSYNC_HDRLEN);
867
868 for (i = 0; i < h->count; i++) {
869 if (!memcmp(usp->id, &st->id,
870 PFSYNC_ID_LEN) &&
871 usp->creatorid == st->creatorid) {
872 sp = usp;
873 sp->updates++;
874 break;
875 }
876 usp++;
877 }
878 }
879 }
880 }
881
882 secs = time.tv_sec;
883
884 st->pfsync_time = mono_time.tv_sec;
885 TAILQ_REMOVE(&state_updates, st, u.s.entry_updates);
886 TAILQ_INSERT_TAIL(&state_updates, st, u.s.entry_updates);
887
888 if (sp == NULL) {
889 /* not a "duplicate" update */
890 i = 255;
891 sp = sc->sc_statep.s++;
892 sc->sc_mbuf->m_pkthdr.len =
893 sc->sc_mbuf->m_len += sizeof(struct pfsync_state);
894 h->count++;
895 bzero(sp, sizeof(*sp));
896
897 bcopy(&st->id, sp->id, sizeof(sp->id));
898 sp->creatorid = st->creatorid;
899
900 strlcpy(sp->ifname, st->u.s.kif->pfik_name, sizeof(sp->ifname));
901 pf_state_host_hton(&st->lan, &sp->lan);
902 pf_state_host_hton(&st->gwy, &sp->gwy);
903 pf_state_host_hton(&st->ext, &sp->ext);
904
905 bcopy(&st->rt_addr, &sp->rt_addr, sizeof(sp->rt_addr));
906
907 sp->creation = htonl(secs - st->creation);
908 sp->packets[0] = htonl(st->packets[0]);
909 sp->packets[1] = htonl(st->packets[1]);
910 sp->bytes[0] = htonl(st->bytes[0]);
911 sp->bytes[1] = htonl(st->bytes[1]);
912 if ((r = st->rule.ptr) == NULL)
913 sp->rule = htonl(-1);
914 else
915 sp->rule = htonl(r->nr);
916 if ((r = st->anchor.ptr) == NULL)
917 sp->anchor = htonl(-1);
918 else
919 sp->anchor = htonl(r->nr);
920 sp->af = st->af;
921 sp->proto = st->proto;
922 sp->direction = st->direction;
923 sp->log = st->log;
924 sp->allow_opts = st->allow_opts;
925 sp->timeout = st->timeout;
926
927 sp->sync_flags = st->sync_flags & PFSTATE_NOSYNC;
928 }
929
930 pf_state_peer_hton(&st->src, &sp->src);
931 pf_state_peer_hton(&st->dst, &sp->dst);
932
933 if (st->expire <= secs)
934 sp->expire = htonl(0);
935 else
936 sp->expire = htonl(st->expire - secs);
937
938 /* do we need to build "compressed" actions for network transfer? */
939 if (sc->sc_sync_ifp && compress) {
940 switch (action) {
941 case PFSYNC_ACT_UPD:
942 newaction = PFSYNC_ACT_UPD_C;
943 break;
944 case PFSYNC_ACT_DEL:
945 newaction = PFSYNC_ACT_DEL_C;
946 break;
947 default:
948 /* by default we just send the uncompressed states */
949 break;
950 }
951 }
952
953 if (newaction) {
954 if (sc->sc_mbuf_net == NULL) {
955 if ((sc->sc_mbuf_net = pfsync_get_mbuf(sc, newaction,
956 (void *)&sc->sc_statep_net.s)) == NULL) {
957 splx(s);
958 return (ENOMEM);
959 }
960 }
961 h_net = mtod(sc->sc_mbuf_net, struct pfsync_header *);
962
963 switch (newaction) {
964 case PFSYNC_ACT_UPD_C:
965 if (i != 255) {
966 up = (void *)((char *)h_net +
967 PFSYNC_HDRLEN + (i * sizeof(*up)));
968 up->updates++;
969 } else {
970 h_net->count++;
971 sc->sc_mbuf_net->m_pkthdr.len =
972 sc->sc_mbuf_net->m_len += sizeof(*up);
973 up = sc->sc_statep_net.u++;
974
975 bzero(up, sizeof(*up));
976 bcopy(&st->id, up->id, sizeof(up->id));
977 up->creatorid = st->creatorid;
978 }
979 up->timeout = st->timeout;
980 up->expire = sp->expire;
981 up->src = sp->src;
982 up->dst = sp->dst;
983 break;
984 case PFSYNC_ACT_DEL_C:
985 sc->sc_mbuf_net->m_pkthdr.len =
986 sc->sc_mbuf_net->m_len += sizeof(*dp);
987 dp = sc->sc_statep_net.d++;
988 h_net->count++;
989
990 bzero(dp, sizeof(*dp));
991 bcopy(&st->id, dp->id, sizeof(dp->id));
992 dp->creatorid = st->creatorid;
993 break;
994 }
995 }
996
997 if (h->count == sc->sc_maxcount ||
998 (sc->sc_maxupdates && (sp->updates >= sc->sc_maxupdates)))
999 ret = pfsync_sendout(sc);
1000
1001 splx(s);
1002 return (ret);
1003 }
1004
1005 /* This must be called in splnet() */
1006 int
1007 pfsync_request_update(struct pfsync_state_upd *up, struct in_addr *src)
1008 {
1009 struct ifnet *ifp = &pfsyncif.sc_if;
1010 struct pfsync_header *h;
1011 struct pfsync_softc *sc = ifp->if_softc;
1012 struct pfsync_state_upd_req *rup;
1013 int s, ret;
1014
1015 if (sc->sc_mbuf == NULL) {
1016 if ((sc->sc_mbuf = pfsync_get_mbuf(sc, PFSYNC_ACT_UREQ,
1017 (void *)&sc->sc_statep.s)) == NULL) {
1018 splx(s);
1019 return (ENOMEM);
1020 }
1021 h = mtod(sc->sc_mbuf, struct pfsync_header *);
1022 } else {
1023 h = mtod(sc->sc_mbuf, struct pfsync_header *);
1024 if (h->action != PFSYNC_ACT_UREQ) {
1025 pfsync_sendout(sc);
1026 if ((sc->sc_mbuf = pfsync_get_mbuf(sc, PFSYNC_ACT_UREQ,
1027 (void *)&sc->sc_statep.s)) == NULL) {
1028 splx(s);
1029 return (ENOMEM);
1030 }
1031 h = mtod(sc->sc_mbuf, struct pfsync_header *);
1032 }
1033 }
1034
1035 if (src != NULL)
1036 sc->sc_sendaddr = *src;
1037 sc->sc_mbuf->m_pkthdr.len = sc->sc_mbuf->m_len += sizeof(*rup);
1038 h->count++;
1039 rup = sc->sc_statep.r++;
1040 bzero(rup, sizeof(*rup));
1041 if (up != NULL) {
1042 bcopy(up->id, rup->id, sizeof(rup->id));
1043 rup->creatorid = up->creatorid;
1044 }
1045
1046 if (h->count == sc->sc_maxcount)
1047 ret = pfsync_sendout(sc);
1048
1049 return (ret);
1050 }
1051
1052 int
1053 pfsync_clear_states(u_int32_t creatorid, char *ifname)
1054 {
1055 struct ifnet *ifp = &pfsyncif.sc_if;
1056 struct pfsync_softc *sc = ifp->if_softc;
1057 struct pfsync_state_clr *cp;
1058 int s, ret;
1059
1060 s = splnet();
1061 if (sc->sc_mbuf != NULL)
1062 pfsync_sendout(sc);
1063 if ((sc->sc_mbuf = pfsync_get_mbuf(sc, PFSYNC_ACT_CLR,
1064 (void *)&sc->sc_statep.c)) == NULL) {
1065 splx(s);
1066 return (ENOMEM);
1067 }
1068 sc->sc_mbuf->m_pkthdr.len = sc->sc_mbuf->m_len += sizeof(*cp);
1069 cp = sc->sc_statep.c;
1070 cp->creatorid = creatorid;
1071 if (ifname != NULL)
1072 strlcpy(cp->ifname, ifname, IFNAMSIZ);
1073
1074 ret = (pfsync_sendout(sc));
1075 splx(s);
1076 return (ret);
1077 }
1078
/*
 * Flush timeout handler: send whatever packet is pending.
 * v is the pfsync softc registered with timeout_set().
 */
void
pfsync_timeout(void *v)
{
	int spl = splnet();

	pfsync_sendout((struct pfsync_softc *)v);
	splx(spl);
}
1089
1090 void
1091 pfsync_send_bus(struct pfsync_softc *sc, u_int8_t status)
1092 {
1093 struct pfsync_state_bus *bus;
1094
1095 if (sc->sc_mbuf != NULL)
1096 pfsync_sendout(sc);
1097
1098 if (pfsync_sync_ok &&
1099 (sc->sc_mbuf = pfsync_get_mbuf(sc, PFSYNC_ACT_BUS,
1100 (void *)&sc->sc_statep.b)) != NULL) {
1101 sc->sc_mbuf->m_pkthdr.len = sc->sc_mbuf->m_len += sizeof(*bus);
1102 bus = sc->sc_statep.b;
1103 bus->creatorid = pf_status.hostid;
1104 bus->status = status;
1105 bus->endtime = htonl(mono_time.tv_sec - sc->sc_ureq_received);
1106 pfsync_sendout(sc);
1107 }
1108 }
1109
1110 void
1111 pfsync_bulk_update(void *v)
1112 {
1113 struct pfsync_softc *sc = v;
1114 int s, i = 0;
1115 struct pf_state *state;
1116
1117 s = splnet();
1118 if (sc->sc_mbuf != NULL)
1119 pfsync_sendout(sc);
1120
1121 /*
1122 * Grab at most PFSYNC_BULKPACKETS worth of states which have not
1123 * been sent since the latest request was made.
1124 */
1125 while ((state = TAILQ_FIRST(&state_updates)) != NULL &&
1126 ++i < (sc->sc_maxcount * PFSYNC_BULKPACKETS)) {
1127 if (state->pfsync_time > sc->sc_ureq_received) {
1128 /* we're done */
1129 pfsync_send_bus(sc, PFSYNC_BUS_END);
1130 sc->sc_ureq_received = 0;
1131 timeout_del(&sc->sc_bulk_tmo);
1132 if (pf_status.debug >= PF_DEBUG_MISC)
1133 printf("pfsync: bulk update complete\n");
1134 break;
1135 } else {
1136 /* send an update and move to end of list */
1137 if (!state->sync_flags)
1138 pfsync_pack_state(PFSYNC_ACT_UPD, state, 0);
1139 state->pfsync_time = mono_time.tv_sec;
1140 TAILQ_REMOVE(&state_updates, state, u.s.entry_updates);
1141 TAILQ_INSERT_TAIL(&state_updates, state,
1142 u.s.entry_updates);
1143
1144 /* look again for more in a bit */
1145 timeout_add(&sc->sc_bulk_tmo, 1);
1146 }
1147 }
1148 if (sc->sc_mbuf != NULL)
1149 pfsync_sendout(sc);
1150 splx(s);
1151 }
1152
1153 void
1154 pfsync_bulkfail(void *v)
1155 {
1156 struct pfsync_softc *sc = v;
1157
1158 if (sc->sc_bulk_tries++ < PFSYNC_MAX_BULKTRIES) {
1159 /* Try again in a bit */
1160 timeout_add(&sc->sc_bulkfail_tmo, 5 * hz);
1161 pfsync_request_update(NULL, NULL);
1162 pfsync_sendout(sc);
1163 } else {
1164 /* Pretend like the transfer was ok */
1165 sc->sc_ureq_sent = 0;
1166 sc->sc_bulk_tries = 0;
1167 pfsync_sync_ok = 1;
1168 if (pf_status.debug >= PF_DEBUG_MISC)
1169 printf("pfsync: failed to receive "
1170 "bulk update status\n");
1171 timeout_del(&sc->sc_bulkfail_tmo);
1172 }
1173 }
1174
1175 int
1176 pfsync_sendout(sc)
1177 struct pfsync_softc *sc;
1178 {
1179 struct ifnet *ifp = &sc->sc_if;
1180 struct mbuf *m;
1181
1182 timeout_del(&sc->sc_tmo);
1183
1184 if (sc->sc_mbuf == NULL)
1185 return (0);
1186 m = sc->sc_mbuf;
1187 sc->sc_mbuf = NULL;
1188 sc->sc_statep.s = NULL;
1189
1190 #if NBPFILTER > 0
1191 if (ifp->if_bpf)
1192 bpf_mtap(ifp->if_bpf, m);
1193 #endif
1194
1195 if (sc->sc_mbuf_net) {
1196 m_freem(m);
1197 m = sc->sc_mbuf_net;
1198 sc->sc_mbuf_net = NULL;
1199 sc->sc_statep_net.s = NULL;
1200 }
1201
1202 if (sc->sc_sync_ifp) {
1203 struct ip *ip;
1204 struct ifaddr *ifa;
1205 struct sockaddr sa;
1206
1207 M_PREPEND(m, sizeof(struct ip), M_DONTWAIT);
1208 if (m == NULL) {
1209 pfsyncstats.pfsyncs_onomem++;
1210 return (0);
1211 }
1212 ip = mtod(m, struct ip *);
1213 ip->ip_v = IPVERSION;
1214 ip->ip_hl = sizeof(*ip) >> 2;
1215 ip->ip_tos = IPTOS_LOWDELAY;
1216 ip->ip_len = htons(m->m_pkthdr.len);
1217 ip->ip_id = htons(ip_randomid());
1218 ip->ip_off = htons(IP_DF);
1219 ip->ip_ttl = PFSYNC_DFLTTL;
1220 ip->ip_p = IPPROTO_PFSYNC;
1221 ip->ip_sum = 0;
1222
1223 bzero(&sa, sizeof(sa));
1224 sa.sa_family = AF_INET;
1225 ifa = ifaof_ifpforaddr(&sa, sc->sc_sync_ifp);
1226 if (ifa == NULL)
1227 return (0);
1228 ip->ip_src.s_addr = ifatoia(ifa)->ia_addr.sin_addr.s_addr;
1229
1230 if (sc->sc_sendaddr.s_addr == INADDR_PFSYNC_GROUP)
1231 m->m_flags |= M_MCAST;
1232 ip->ip_dst = sc->sc_sendaddr;
1233 sc->sc_sendaddr.s_addr = INADDR_PFSYNC_GROUP;
1234
1235 pfsyncstats.pfsyncs_opackets++;
1236
1237 if (ip_output(m, NULL, NULL, IP_RAWOUTPUT, &sc->sc_imo, NULL))
1238 pfsyncstats.pfsyncs_oerrors++;
1239 } else
1240 m_freem(m);
1241
1242 return (0);
1243 }
1244