npf_alg_icmp.c revision 1.12 1 /* $NetBSD: npf_alg_icmp.c,v 1.12 2012/09/10 21:42:53 rmind Exp $ */
2
3 /*-
4 * Copyright (c) 2010 The NetBSD Foundation, Inc.
5 * All rights reserved.
6 *
7 * This material is based upon work partially supported by The
8 * NetBSD Foundation under a contract with Mindaugas Rasiukevicius.
9 *
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
12 * are met:
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
18 *
19 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 * POSSIBILITY OF SUCH DAMAGE.
30 */
31
32 /*
33 * NPF ALG for ICMP and traceroute translations.
34 */
35
36 #include <sys/cdefs.h>
37 __KERNEL_RCSID(0, "$NetBSD: npf_alg_icmp.c,v 1.12 2012/09/10 21:42:53 rmind Exp $");
38
39 #include <sys/param.h>
40 #include <sys/module.h>
41 #include <sys/pool.h>
42
43 #include <netinet/in_systm.h>
44 #include <netinet/in.h>
45 #include <netinet/ip.h>
46 #include <netinet/tcp.h>
47 #include <netinet/udp.h>
48 #include <netinet/ip_icmp.h>
49 #include <netinet/icmp6.h>
50 #include <net/pfil.h>
51
52 #include "npf_impl.h"
53
/*
 * Kernel module declaration for this ALG: class MODULE_CLASS_MISC, name
 * npf_alg_icmp.
 * NOTE(review): the trailing "npf" string is presumably the list of modules
 * this one requires, as described in module(9) -- confirm.
 */
54 MODULE(MODULE_CLASS_MISC, npf_alg_icmp, "npf");
55
/*
 * Traceroute detection criteria.
 *
 * The IANA-assigned base port is 33434.  Since it is common practice to
 * increase the destination port with every probe, the whole inclusive
 * [33434-33484] interval is monitored.  In addition, only packets whose
 * TTL does not exceed TR_MAX_TTL are considered.
 */
enum {
	TR_BASE_PORT	= 33434,	/* lowest destination port monitored */
	TR_PORT_RANGE	= 33484,	/* highest destination port monitored */
	TR_MAX_TTL	= 50		/* largest TTL still considered */
};
66
67 static npf_alg_t * alg_icmp __read_mostly;
68
69 static bool npfa_icmp_match(npf_cache_t *, nbuf_t *, void *);
70 static bool npfa_icmp_natin(npf_cache_t *, nbuf_t *, void *);
71 static bool npfa_icmp_session(npf_cache_t *, nbuf_t *, void *);
72
73 /*
74 * npf_alg_icmp_{init,fini,modcmd}: ICMP ALG initialization, destruction
75 * and module interface.
76 */
77
78 static int
79 npf_alg_icmp_init(void)
80 {
81
82 alg_icmp = npf_alg_register(npfa_icmp_match, NULL,
83 npfa_icmp_natin, npfa_icmp_session);
84 KASSERT(alg_icmp != NULL);
85 return 0;
86 }
87
88 static int
89 npf_alg_icmp_fini(void)
90 {
91
92 KASSERT(alg_icmp != NULL);
93 return npf_alg_unregister(alg_icmp);
94 }
95
96 static int
97 npf_alg_icmp_modcmd(modcmd_t cmd, void *arg)
98 {
99
100 switch (cmd) {
101 case MODULE_CMD_INIT:
102 return npf_alg_icmp_init();
103 case MODULE_CMD_FINI:
104 return npf_alg_icmp_fini();
105 case MODULE_CMD_AUTOUNLOAD:
106 return EBUSY;
107 default:
108 return ENOTTY;
109 }
110 return 0;
111 }
112
113 /*
114 * npfa_icmp_match: ALG matching inspector - determines ALG case and
115 * associates ALG with NAT entry.
116 */
117 static bool
118 npfa_icmp_match(npf_cache_t *npc, nbuf_t *nbuf, void *ntptr)
119 {
120 const int proto = npf_cache_ipproto(npc);
121 struct ip *ip = &npc->npc_ip.v4;
122 in_port_t dport;
123
124 KASSERT(npf_iscached(npc, NPC_IP46));
125 KASSERT(npf_iscached(npc, NPC_LAYER4));
126
127 /* Check for low TTL. */
128 if (ip->ip_ttl > TR_MAX_TTL) {
129 return false;
130 }
131
132 if (proto == IPPROTO_TCP) {
133 struct tcphdr *th = &npc->npc_l4.tcp;
134 dport = ntohs(th->th_dport);
135 } else if (proto == IPPROTO_UDP) {
136 struct udphdr *uh = &npc->npc_l4.udp;
137 dport = ntohs(uh->uh_dport);
138 } else {
139 return false;
140 }
141
142 /* Handle TCP/UDP traceroute - check for port range. */
143 if (dport < TR_BASE_PORT || dport > TR_PORT_RANGE) {
144 return false;
145 }
146
147 /* Associate ALG with translation entry. */
148 npf_nat_t *nt = ntptr;
149 npf_nat_setalg(nt, alg_icmp, 0);
150 return true;
151 }
152
153 /*
154 * npf_icmp_uniqid: retrieve unique identifiers - either ICMP query ID
155 * or TCP/UDP ports of the original packet, which is embedded.
156 */
157 static bool
158 npf_icmp_uniqid(const int npcinf, const int type,
159 npf_cache_t *npc, nbuf_t *nbuf, void *n_ptr)
160 {
161 struct icmp *ic;
162 struct icmp6_hdr *ic6;
163 u_int offby;
164
165 if (npcinf & NPC_IP4) {
166 /* Per RFC 792. */
167 switch (type) {
168 case ICMP_UNREACH:
169 case ICMP_SOURCEQUENCH:
170 case ICMP_REDIRECT:
171 case ICMP_TIMXCEED:
172 case ICMP_PARAMPROB:
173 /* Should contain original IP header. */
174 offby = offsetof(struct icmp, icmp_ip);
175 if ((n_ptr = nbuf_advance(&nbuf, n_ptr, offby)) == NULL) {
176 return false;
177 }
178 /* Fetch into the cache. */
179 if (!npf_fetch_ip(npc, nbuf, n_ptr)) {
180 return false;
181 }
182 switch (npf_cache_ipproto(npc)) {
183 case IPPROTO_TCP:
184 return npf_fetch_tcp(npc, nbuf, n_ptr);
185 case IPPROTO_UDP:
186 return npf_fetch_udp(npc, nbuf, n_ptr);
187 default:
188 return false;
189 }
190 return true;
191
192 case ICMP_ECHOREPLY:
193 case ICMP_ECHO:
194 case ICMP_TSTAMP:
195 case ICMP_TSTAMPREPLY:
196 case ICMP_IREQ:
197 case ICMP_IREQREPLY:
198 /* Should contain ICMP query ID. */
199 ic = &npc->npc_l4.icmp;
200 offby = offsetof(struct icmp, icmp_id);
201 if (nbuf_advfetch(&nbuf, &n_ptr, offby,
202 sizeof(uint16_t), &ic->icmp_id)) {
203 return false;
204 }
205 npc->npc_info |= NPC_ICMP_ID;
206 return true;
207 default:
208 break;
209 }
210 /* No unique IDs. */
211 return false;
212 }
213 if (npcinf & NPC_IP6) {
214 switch (type) {
215 /* Per RFC 4443. */
216 case ICMP6_DST_UNREACH:
217 case ICMP6_PACKET_TOO_BIG:
218 case ICMP6_TIME_EXCEEDED:
219 case ICMP6_PARAM_PROB:
220 /* Should contain original IP header. */
221 offby = sizeof(struct icmp6_hdr);
222 if ((n_ptr = nbuf_advance(&nbuf, n_ptr, offby)) == NULL) {
223 return false;
224 }
225 /* Fetch into the cache. */
226 if (!npf_fetch_ip(npc, nbuf, n_ptr)) {
227 return false;
228 }
229 switch (npf_cache_ipproto(npc)) {
230 case IPPROTO_TCP:
231 return npf_fetch_tcp(npc, nbuf, n_ptr);
232 case IPPROTO_UDP:
233 return npf_fetch_udp(npc, nbuf, n_ptr);
234 default:
235 return false;
236 }
237 return true;
238
239 case ICMP6_ECHO_REQUEST:
240 case ICMP6_ECHO_REPLY:
241 /* Should contain ICMP query ID. */
242 ic6 = &npc->npc_l4.icmp6;
243 offby = offsetof(struct icmp6_hdr, icmp6_id);
244 if (nbuf_advfetch(&nbuf, &n_ptr, offby,
245 sizeof(uint16_t), &ic6->icmp6_id)) {
246 return false;
247 }
248 npc->npc_info |= NPC_ICMP_ID;
249 return true;
250 default:
251 break;
252 }
253 /* No unique IDs. */
254 return false;
255 }
256 /* Whatever protocol that may have been ... */
257 return false;
258 }
259
260 static void
261 npfa_srcdst_invert(npf_cache_t *npc)
262 {
263 const int proto = npf_cache_ipproto(npc);
264 npf_addr_t *tmp_ip;
265
266 if (proto == IPPROTO_TCP) {
267 struct tcphdr *th = &npc->npc_l4.tcp;
268 in_port_t tmp_sport = th->th_sport;
269 th->th_sport = th->th_dport;
270 th->th_dport = tmp_sport;
271
272 } else if (proto == IPPROTO_UDP) {
273 struct udphdr *uh = &npc->npc_l4.udp;
274 in_port_t tmp_sport = uh->uh_sport;
275 uh->uh_sport = uh->uh_dport;
276 uh->uh_dport = tmp_sport;
277 }
278 tmp_ip = npc->npc_srcip;
279 npc->npc_srcip = npc->npc_dstip;
280 npc->npc_dstip = tmp_ip;
281 }
282
283 /*
284 * npfa_icmp_session: ALG session inspector, returns unique identifiers.
285 */
286 static bool
287 npfa_icmp_session(npf_cache_t *npc, nbuf_t *nbuf, void *keyptr)
288 {
289 npf_cache_t *key = keyptr;
290 KASSERT(key->npc_info == 0);
291
292 /* IP + ICMP? Get unique identifiers from ICMP packet. */
293 if (!npf_iscached(npc, NPC_IP4)) {
294 return false;
295 }
296 if (npf_cache_ipproto(npc) != IPPROTO_ICMP) {
297 return false;
298 }
299 KASSERT(npf_iscached(npc, NPC_ICMP));
300
301 /* Advance to ICMP header. */
302 void *n_ptr = nbuf_dataptr(nbuf);
303 const u_int hlen = npf_cache_hlen(npc);
304
305 if ((n_ptr = nbuf_advance(&nbuf, n_ptr, hlen)) == NULL) {
306 return false;
307 }
308
309 /* Fetch relevant data into the separate ("key") cache. */
310 struct icmp *ic = &npc->npc_l4.icmp;
311 if (!npf_icmp_uniqid(npc->npc_info & NPC_IP46, ic->icmp_type,
312 key, nbuf, n_ptr)) {
313 return false;
314 }
315
316 if (npf_iscached(key, NPC_ICMP_ID)) {
317 struct icmp *keyic = &key->npc_l4.icmp;
318
319 /* Copy ICMP ID to the cache and flag it. */
320 npc->npc_info |= NPC_ICMP_ID;
321 ic->icmp_id = keyic->icmp_id;
322
323 /* Note: return False, since key is the original cache. */
324 return false;
325 }
326
327 /*
328 * Embedded IP packet is the original of "forwards" stream.
329 * We should imitate the "backwards" stream for inspection.
330 */
331 KASSERT(npf_iscached(key, NPC_IP46));
332 KASSERT(npf_iscached(key, NPC_LAYER4));
333 npfa_srcdst_invert(key);
334 key->npc_alen = npc->npc_alen;
335
336 return true;
337 }
338
339 /*
340 * npfa_icmp_natin: ALG inbound translation inspector, rewrite IP address
341 * in the IP header, which is embedded in ICMP packet.
342 */
343 static bool
344 npfa_icmp_natin(npf_cache_t *npc, nbuf_t *nbuf, void *ntptr)
345 {
346 npf_cache_t enpc = { .npc_info = 0 };
347
348 /* XXX: Duplicated work (done at session inspection). */
349 if (!npfa_icmp_session(npc, nbuf, &enpc)) {
350 return false;
351 }
352 /* XXX: Restore inversion (inefficient). */
353 KASSERT(npf_iscached(&enpc, NPC_IP46));
354 KASSERT(npf_iscached(&enpc, NPC_LAYER4));
355 npfa_srcdst_invert(&enpc);
356
357 /*
358 * Save ICMP and embedded IP with TCP/UDP header checksums, retrieve
359 * the original address and port, and calculate ICMP checksum for
360 * embedded packet changes, while data is not rewritten in the cache.
361 */
362 const int proto = npf_cache_ipproto(&enpc);
363 const struct ip *eip = &enpc.npc_ip.v4;
364 const struct icmp * const ic = &npc->npc_l4.icmp;
365 uint16_t cksum = ic->icmp_cksum, ecksum = eip->ip_sum, l4cksum;
366 npf_nat_t *nt = ntptr;
367 npf_addr_t *addr;
368 in_port_t port;
369
370 npf_nat_getorig(nt, &addr, &port);
371
372 if (proto == IPPROTO_TCP) {
373 struct tcphdr *th = &enpc.npc_l4.tcp;
374 cksum = npf_fixup16_cksum(cksum, th->th_sport, port);
375 l4cksum = th->th_sum;
376 } else {
377 struct udphdr *uh = &enpc.npc_l4.udp;
378 cksum = npf_fixup16_cksum(cksum, uh->uh_sport, port);
379 l4cksum = uh->uh_sum;
380 }
381 cksum = npf_addr_cksum(cksum, enpc.npc_alen, enpc.npc_srcip, addr);
382
383 /*
384 * Save the original pointers to the main IP header and then advance
385 * to the embedded IP header after ICMP header.
386 */
387 void *n_ptr = nbuf_dataptr(nbuf), *cnbuf = nbuf, *cnptr = n_ptr;
388 u_int offby = npf_cache_hlen(npc) + offsetof(struct icmp, icmp_ip);
389
390 if ((n_ptr = nbuf_advance(&nbuf, n_ptr, offby)) == NULL) {
391 return false;
392 }
393
394 /*
395 * Rewrite source IP address and port of the embedded IP header,
396 * which represents original packet - therefore passing PFIL_OUT.
397 * Note: checksums are first, since it uses values from the cache.
398 */
399 if (!npf_rwrcksum(&enpc, nbuf, n_ptr, PFIL_OUT, addr, port)) {
400 return false;
401 }
402 if (!npf_rwrip(&enpc, nbuf, n_ptr, PFIL_OUT, addr)) {
403 return false;
404 }
405 if (!npf_rwrport(&enpc, nbuf, n_ptr, PFIL_OUT, port)) {
406 return false;
407 }
408
409 /*
410 * Finish calculation of the ICMP checksum. Update for embedded IP
411 * and TCP/UDP checksum changes. Finally, rewrite ICMP checksum.
412 */
413 if (proto == IPPROTO_TCP) {
414 struct tcphdr *th = &enpc.npc_l4.tcp;
415 cksum = npf_fixup16_cksum(cksum, l4cksum, th->th_sum);
416 } else if (l4cksum) {
417 struct udphdr *uh = &enpc.npc_l4.udp;
418 cksum = npf_fixup16_cksum(cksum, l4cksum, uh->uh_sum);
419 }
420 cksum = npf_fixup16_cksum(cksum, ecksum, eip->ip_sum);
421
422 offby = npf_cache_hlen(npc) + offsetof(struct icmp, icmp_cksum);
423 if (nbuf_advstore(&cnbuf, &cnptr, offby, sizeof(uint16_t), &cksum)) {
424 return false;
425 }
426 return true;
427 }
428