npf_alg_icmp.c revision 1.11 1 /* $NetBSD: npf_alg_icmp.c,v 1.11 2012/07/19 21:52:29 spz Exp $ */
2
3 /*-
4 * Copyright (c) 2010 The NetBSD Foundation, Inc.
5 * All rights reserved.
6 *
7 * This material is based upon work partially supported by The
8 * NetBSD Foundation under a contract with Mindaugas Rasiukevicius.
9 *
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
12 * are met:
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
18 *
19 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 * POSSIBILITY OF SUCH DAMAGE.
30 */
31
32 /*
33 * NPF ALG for ICMP and traceroute translations.
34 */
35
36 #include <sys/cdefs.h>
37 __KERNEL_RCSID(0, "$NetBSD: npf_alg_icmp.c,v 1.11 2012/07/19 21:52:29 spz Exp $");
38
39 #include <sys/param.h>
40 #include <sys/module.h>
41 #include <sys/pool.h>
42
43 #include <netinet/in_systm.h>
44 #include <netinet/in.h>
45 #include <netinet/ip.h>
46 #include <netinet/tcp.h>
47 #include <netinet/udp.h>
48 #include <netinet/ip_icmp.h>
49 #include <netinet/icmp6.h>
50 #include <net/pfil.h>
51
52 #include "npf_impl.h"
53
54 MODULE(MODULE_CLASS_MISC, npf_alg_icmp, "npf");
55
56 /*
57 * Traceroute criteria.
58 *
59 * IANA assigned base port: 33434. However, common practice is to increase
60 * the port, thus monitor [33434-33484] range. Additional filter is TTL < 50.
61 */
62
63 #define TR_BASE_PORT 33434
64 #define TR_PORT_RANGE 33484
65 #define TR_MAX_TTL 50
66
67 static npf_alg_t * alg_icmp __read_mostly;
68
69 static bool npfa_icmp_match(npf_cache_t *, nbuf_t *, void *);
70 static bool npfa_icmp_natin(npf_cache_t *, nbuf_t *, void *);
71 static bool npfa_icmp_session(npf_cache_t *, nbuf_t *, void *);
72
73 /*
74 * npf_alg_icmp_{init,fini,modcmd}: ICMP ALG initialization, destruction
75 * and module interface.
76 */
77
78 static int
79 npf_alg_icmp_init(void)
80 {
81
82 alg_icmp = npf_alg_register(npfa_icmp_match, NULL,
83 npfa_icmp_natin, npfa_icmp_session);
84 KASSERT(alg_icmp != NULL);
85 return 0;
86 }
87
88 static int
89 npf_alg_icmp_fini(void)
90 {
91
92 KASSERT(alg_icmp != NULL);
93 return npf_alg_unregister(alg_icmp);
94 }
95
96 static int
97 npf_alg_icmp_modcmd(modcmd_t cmd, void *arg)
98 {
99
100 switch (cmd) {
101 case MODULE_CMD_INIT:
102 return npf_alg_icmp_init();
103 case MODULE_CMD_FINI:
104 return npf_alg_icmp_fini();
105 case MODULE_CMD_AUTOUNLOAD:
106 return EBUSY;
107 default:
108 return ENOTTY;
109 }
110 return 0;
111 }
112
113 /*
114 * npfa_icmp_match: ALG matching inspector - determines ALG case and
115 * associates ALG with NAT entry.
116 */
117 static bool
118 npfa_icmp_match(npf_cache_t *npc, nbuf_t *nbuf, void *ntptr)
119 {
120 const int proto = npf_cache_ipproto(npc);
121 struct ip *ip = &npc->npc_ip.v4;
122 in_port_t dport;
123
124 KASSERT(npf_iscached(npc, NPC_IP46));
125 KASSERT(npf_iscached(npc, NPC_LAYER4));
126
127 /* Check for low TTL. */
128 if (ip->ip_ttl > TR_MAX_TTL) {
129 return false;
130 }
131
132 if (proto == IPPROTO_TCP) {
133 struct tcphdr *th = &npc->npc_l4.tcp;
134 dport = ntohs(th->th_dport);
135 } else if (proto == IPPROTO_UDP) {
136 struct udphdr *uh = &npc->npc_l4.udp;
137 dport = ntohs(uh->uh_dport);
138 } else {
139 return false;
140 }
141
142 /* Handle TCP/UDP traceroute - check for port range. */
143 if (dport < TR_BASE_PORT || dport > TR_PORT_RANGE) {
144 return false;
145 }
146
147 /* Associate ALG with translation entry. */
148 npf_nat_t *nt = ntptr;
149 npf_nat_setalg(nt, alg_icmp, 0);
150 return true;
151 }
152
153 /*
154 * npf_icmp_uniqid: retrieve unique identifiers - either ICMP query ID
155 * or TCP/UDP ports of the original packet, which is embedded.
156 */
157 static bool
158 npf_icmp_uniqid(const int type, npf_cache_t *npc, nbuf_t *nbuf, void *n_ptr)
159 {
160 struct icmp *ic;
161 struct icmp6_hdr *ic6;
162 u_int offby;
163
164 if (npf_iscached(npc, NPC_IP4)) {
165 /* Per RFC 792. */
166 switch (type) {
167 case ICMP_UNREACH:
168 case ICMP_SOURCEQUENCH:
169 case ICMP_REDIRECT:
170 case ICMP_TIMXCEED:
171 case ICMP_PARAMPROB:
172 /* Should contain original IP header. */
173 offby = offsetof(struct icmp, icmp_ip);
174 if ((n_ptr = nbuf_advance(&nbuf, n_ptr, offby)) == NULL) {
175 return false;
176 }
177 /* Fetch into the cache. */
178 if (!npf_fetch_ip(npc, nbuf, n_ptr)) {
179 return false;
180 }
181 switch (npf_cache_ipproto(npc)) {
182 case IPPROTO_TCP:
183 return npf_fetch_tcp(npc, nbuf, n_ptr);
184 case IPPROTO_UDP:
185 return npf_fetch_udp(npc, nbuf, n_ptr);
186 default:
187 return false;
188 }
189 return true;
190
191 case ICMP_ECHOREPLY:
192 case ICMP_ECHO:
193 case ICMP_TSTAMP:
194 case ICMP_TSTAMPREPLY:
195 case ICMP_IREQ:
196 case ICMP_IREQREPLY:
197 /* Should contain ICMP query ID. */
198 ic = &npc->npc_l4.icmp;
199 offby = offsetof(struct icmp, icmp_id);
200 if (nbuf_advfetch(&nbuf, &n_ptr, offby,
201 sizeof(uint16_t), &ic->icmp_id)) {
202 return false;
203 }
204 npc->npc_info |= NPC_ICMP_ID;
205 return true;
206 default:
207 break;
208 }
209 /* No unique IDs. */
210 return false;
211 }
212 if (npf_iscached(npc, NPC_IP6)) {
213 switch (type) {
214 /* Per RFC 4443. */
215 case ICMP6_DST_UNREACH:
216 case ICMP6_PACKET_TOO_BIG:
217 case ICMP6_TIME_EXCEEDED:
218 case ICMP6_PARAM_PROB:
219 /* Should contain original IP header. */
220 offby = sizeof(struct icmp6_hdr);
221 if ((n_ptr = nbuf_advance(&nbuf, n_ptr, offby)) == NULL) {
222 return false;
223 }
224 /* Fetch into the cache. */
225 if (!npf_fetch_ip(npc, nbuf, n_ptr)) {
226 return false;
227 }
228 switch (npf_cache_ipproto(npc)) {
229 case IPPROTO_TCP:
230 return npf_fetch_tcp(npc, nbuf, n_ptr);
231 case IPPROTO_UDP:
232 return npf_fetch_udp(npc, nbuf, n_ptr);
233 default:
234 return false;
235 }
236 return true;
237
238 case ICMP6_ECHO_REQUEST:
239 case ICMP6_ECHO_REPLY:
240 /* Should contain ICMP query ID. */
241 ic6 = &npc->npc_l4.icmp6;
242 offby = offsetof(struct icmp6_hdr, icmp6_id);
243 if (nbuf_advfetch(&nbuf, &n_ptr, offby,
244 sizeof(uint16_t), &ic6->icmp6_id)) {
245 return false;
246 }
247 npc->npc_info |= NPC_ICMP_ID;
248 return true;
249 default:
250 break;
251 }
252 /* No unique IDs. */
253 return false;
254 }
255 /* Whatever protocol that may have been ... */
256 return false;
257 }
258
259 static void
260 npfa_srcdst_invert(npf_cache_t *npc)
261 {
262 const int proto = npf_cache_ipproto(npc);
263 npf_addr_t *tmp_ip;
264
265 if (proto == IPPROTO_TCP) {
266 struct tcphdr *th = &npc->npc_l4.tcp;
267 in_port_t tmp_sport = th->th_sport;
268 th->th_sport = th->th_dport;
269 th->th_dport = tmp_sport;
270
271 } else if (proto == IPPROTO_UDP) {
272 struct udphdr *uh = &npc->npc_l4.udp;
273 in_port_t tmp_sport = uh->uh_sport;
274 uh->uh_sport = uh->uh_dport;
275 uh->uh_dport = tmp_sport;
276 }
277 tmp_ip = npc->npc_srcip;
278 npc->npc_srcip = npc->npc_dstip;
279 npc->npc_dstip = tmp_ip;
280 }
281
282 /*
283 * npfa_icmp_session: ALG session inspector, returns unique identifiers.
284 */
285 static bool
286 npfa_icmp_session(npf_cache_t *npc, nbuf_t *nbuf, void *keyptr)
287 {
288 npf_cache_t *key = keyptr;
289 KASSERT(key->npc_info == 0);
290
291 /* IP + ICMP? Get unique identifiers from ICMP packet. */
292 if (!npf_iscached(npc, NPC_IP4)) {
293 return false;
294 }
295 if (npf_cache_ipproto(npc) != IPPROTO_ICMP) {
296 return false;
297 }
298 KASSERT(npf_iscached(npc, NPC_ICMP));
299
300 /* Advance to ICMP header. */
301 void *n_ptr = nbuf_dataptr(nbuf);
302 const u_int hlen = npf_cache_hlen(npc);
303
304 if ((n_ptr = nbuf_advance(&nbuf, n_ptr, hlen)) == NULL) {
305 return false;
306 }
307
308 /* Fetch relevant data into the separate ("key") cache. */
309 struct icmp *ic = &npc->npc_l4.icmp;
310 if (!npf_icmp_uniqid(ic->icmp_type, key, nbuf, n_ptr)) {
311 return false;
312 }
313
314 if (npf_iscached(key, NPC_ICMP_ID)) {
315 struct icmp *keyic = &key->npc_l4.icmp;
316
317 /* Copy ICMP ID to the cache and flag it. */
318 npc->npc_info |= NPC_ICMP_ID;
319 ic->icmp_id = keyic->icmp_id;
320
321 /* Note: return False, since key is the original cache. */
322 return false;
323 }
324
325 /*
326 * Embedded IP packet is the original of "forwards" stream.
327 * We should imitate the "backwards" stream for inspection.
328 */
329 KASSERT(npf_iscached(key, NPC_IP46));
330 KASSERT(npf_iscached(key, NPC_LAYER4));
331 npfa_srcdst_invert(key);
332 key->npc_alen = npc->npc_alen;
333
334 return true;
335 }
336
337 /*
338 * npfa_icmp_natin: ALG inbound translation inspector, rewrite IP address
339 * in the IP header, which is embedded in ICMP packet.
340 */
341 static bool
342 npfa_icmp_natin(npf_cache_t *npc, nbuf_t *nbuf, void *ntptr)
343 {
344 npf_cache_t enpc = { .npc_info = 0 };
345
346 /* XXX: Duplicated work (done at session inspection). */
347 if (!npfa_icmp_session(npc, nbuf, &enpc)) {
348 return false;
349 }
350 /* XXX: Restore inversion (inefficient). */
351 KASSERT(npf_iscached(&enpc, NPC_IP46));
352 KASSERT(npf_iscached(&enpc, NPC_LAYER4));
353 npfa_srcdst_invert(&enpc);
354
355 /*
356 * Save ICMP and embedded IP with TCP/UDP header checksums, retrieve
357 * the original address and port, and calculate ICMP checksum for
358 * embedded packet changes, while data is not rewritten in the cache.
359 */
360 const int proto = npf_cache_ipproto(&enpc);
361 const struct ip *eip = &enpc.npc_ip.v4;
362 const struct icmp * const ic = &npc->npc_l4.icmp;
363 uint16_t cksum = ic->icmp_cksum, ecksum = eip->ip_sum, l4cksum;
364 npf_nat_t *nt = ntptr;
365 npf_addr_t *addr;
366 in_port_t port;
367
368 npf_nat_getorig(nt, &addr, &port);
369
370 if (proto == IPPROTO_TCP) {
371 struct tcphdr *th = &enpc.npc_l4.tcp;
372 cksum = npf_fixup16_cksum(cksum, th->th_sport, port);
373 l4cksum = th->th_sum;
374 } else {
375 struct udphdr *uh = &enpc.npc_l4.udp;
376 cksum = npf_fixup16_cksum(cksum, uh->uh_sport, port);
377 l4cksum = uh->uh_sum;
378 }
379 cksum = npf_addr_cksum(cksum, enpc.npc_alen, enpc.npc_srcip, addr);
380
381 /*
382 * Save the original pointers to the main IP header and then advance
383 * to the embedded IP header after ICMP header.
384 */
385 void *n_ptr = nbuf_dataptr(nbuf), *cnbuf = nbuf, *cnptr = n_ptr;
386 u_int offby = npf_cache_hlen(npc) + offsetof(struct icmp, icmp_ip);
387
388 if ((n_ptr = nbuf_advance(&nbuf, n_ptr, offby)) == NULL) {
389 return false;
390 }
391
392 /*
393 * Rewrite source IP address and port of the embedded IP header,
394 * which represents original packet - therefore passing PFIL_OUT.
395 * Note: checksums are first, since it uses values from the cache.
396 */
397 if (!npf_rwrcksum(&enpc, nbuf, n_ptr, PFIL_OUT, addr, port)) {
398 return false;
399 }
400 if (!npf_rwrip(&enpc, nbuf, n_ptr, PFIL_OUT, addr)) {
401 return false;
402 }
403 if (!npf_rwrport(&enpc, nbuf, n_ptr, PFIL_OUT, port)) {
404 return false;
405 }
406
407 /*
408 * Finish calculation of the ICMP checksum. Update for embedded IP
409 * and TCP/UDP checksum changes. Finally, rewrite ICMP checksum.
410 */
411 if (proto == IPPROTO_TCP) {
412 struct tcphdr *th = &enpc.npc_l4.tcp;
413 cksum = npf_fixup16_cksum(cksum, l4cksum, th->th_sum);
414 } else if (l4cksum) {
415 struct udphdr *uh = &enpc.npc_l4.udp;
416 cksum = npf_fixup16_cksum(cksum, l4cksum, uh->uh_sum);
417 }
418 cksum = npf_fixup16_cksum(cksum, ecksum, eip->ip_sum);
419
420 offby = npf_cache_hlen(npc) + offsetof(struct icmp, icmp_cksum);
421 if (nbuf_advstore(&cnbuf, &cnptr, offby, sizeof(uint16_t), &cksum)) {
422 return false;
423 }
424 return true;
425 }
426