bpfjit.c revision 1.19 1 1.19 alnsn /* $NetBSD: bpfjit.c,v 1.19 2014/07/01 16:18:55 alnsn Exp $ */
2 1.3 rmind
3 1.1 alnsn /*-
4 1.7 alnsn * Copyright (c) 2011-2014 Alexander Nasonov.
5 1.1 alnsn * All rights reserved.
6 1.1 alnsn *
7 1.1 alnsn * Redistribution and use in source and binary forms, with or without
8 1.1 alnsn * modification, are permitted provided that the following conditions
9 1.1 alnsn * are met:
10 1.1 alnsn *
11 1.1 alnsn * 1. Redistributions of source code must retain the above copyright
12 1.1 alnsn * notice, this list of conditions and the following disclaimer.
13 1.1 alnsn * 2. Redistributions in binary form must reproduce the above copyright
14 1.1 alnsn * notice, this list of conditions and the following disclaimer in
15 1.1 alnsn * the documentation and/or other materials provided with the
16 1.1 alnsn * distribution.
17 1.1 alnsn *
18 1.1 alnsn * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
19 1.1 alnsn * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
20 1.1 alnsn * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
21 1.1 alnsn * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
22 1.1 alnsn * COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
23 1.1 alnsn * INCIDENTAL, SPECIAL, EXEMPLARY OR CONSEQUENTIAL DAMAGES (INCLUDING,
24 1.1 alnsn * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
25 1.1 alnsn * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
26 1.1 alnsn * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
27 1.1 alnsn * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
28 1.1 alnsn * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 1.1 alnsn * SUCH DAMAGE.
30 1.1 alnsn */
31 1.1 alnsn
32 1.2 alnsn #include <sys/cdefs.h>
33 1.2 alnsn #ifdef _KERNEL
34 1.19 alnsn __KERNEL_RCSID(0, "$NetBSD: bpfjit.c,v 1.19 2014/07/01 16:18:55 alnsn Exp $");
35 1.2 alnsn #else
36 1.19 alnsn __RCSID("$NetBSD: bpfjit.c,v 1.19 2014/07/01 16:18:55 alnsn Exp $");
37 1.2 alnsn #endif
38 1.2 alnsn
39 1.3 rmind #include <sys/types.h>
40 1.3 rmind #include <sys/queue.h>
41 1.1 alnsn
42 1.1 alnsn #ifndef _KERNEL
43 1.7 alnsn #include <assert.h>
44 1.7 alnsn #define BJ_ASSERT(c) assert(c)
45 1.7 alnsn #else
46 1.7 alnsn #define BJ_ASSERT(c) KASSERT(c)
47 1.7 alnsn #endif
48 1.7 alnsn
49 1.7 alnsn #ifndef _KERNEL
50 1.3 rmind #include <stdlib.h>
51 1.7 alnsn #define BJ_ALLOC(sz) malloc(sz)
52 1.7 alnsn #define BJ_FREE(p, sz) free(p)
53 1.1 alnsn #else
54 1.3 rmind #include <sys/kmem.h>
55 1.7 alnsn #define BJ_ALLOC(sz) kmem_alloc(sz, KM_SLEEP)
56 1.7 alnsn #define BJ_FREE(p, sz) kmem_free(p, sz)
57 1.1 alnsn #endif
58 1.1 alnsn
59 1.1 alnsn #ifndef _KERNEL
60 1.1 alnsn #include <limits.h>
61 1.1 alnsn #include <stdbool.h>
62 1.1 alnsn #include <stddef.h>
63 1.1 alnsn #include <stdint.h>
64 1.1 alnsn #else
65 1.1 alnsn #include <sys/atomic.h>
66 1.1 alnsn #include <sys/module.h>
67 1.1 alnsn #endif
68 1.1 alnsn
69 1.5 rmind #define __BPF_PRIVATE
70 1.5 rmind #include <net/bpf.h>
71 1.3 rmind #include <net/bpfjit.h>
72 1.1 alnsn #include <sljitLir.h>
73 1.1 alnsn
74 1.7 alnsn #if !defined(_KERNEL) && defined(SLJIT_VERBOSE) && SLJIT_VERBOSE
75 1.7 alnsn #include <stdio.h> /* for stderr */
76 1.7 alnsn #endif
77 1.7 alnsn
/*
 * Registers that carry the arguments of a generated bpfjit_func_t.
 * The register of the first argument is reassigned upon entry to
 * the more frequently used buf pointer (see BJ_BUF below).
 */
#define BJ_CTX_ARG	SLJIT_SAVED_REG1
#define BJ_ARGS		SLJIT_SAVED_REG2

/*
 * Permanent register assignments.
 * BJ_ARGS (SLJIT_SAVED_REG2) is defined with the argument registers
 * above and is not redefined here.
 */
#define BJ_BUF		SLJIT_SAVED_REG1
#define BJ_BUFLEN	SLJIT_SAVED_REG3
#define BJ_AREG		SLJIT_SCRATCH_REG1
#define BJ_TMP1REG	SLJIT_SCRATCH_REG2
#define BJ_TMP2REG	SLJIT_SCRATCH_REG3
#define BJ_XREG		SLJIT_TEMPORARY_EREG1
#define BJ_TMP3REG	SLJIT_TEMPORARY_EREG2

/*
 * EREG registers can't be used for indirect calls, so the BJ_BUF and
 * BJ_BUFLEN registers are borrowed for that purpose.  Their values
 * can be reloaded from BJ_ARGS afterwards (see load_buf_buflen()).
 */
#define BJ_COPF_PTR	SLJIT_SAVED_REG1
#define BJ_COPF_IDX	SLJIT_SAVED_REG3

/* Upper bound on the number of memwords, kernel vs. userland. */
#ifdef _KERNEL
#define MAX_MEMWORDS	BPF_MAX_MEMWORDS
#else
#define MAX_MEMWORDS	BPF_MEMWORDS
#endif

/*
 * Initialization bitmask helpers: one bit per memword, followed by
 * one bit for the A register and one bit for the X register.
 */
#define BJ_INIT_NOBITS	((bpf_memword_init_t)0)
#define BJ_INIT_MBIT(k)	BPF_MEMWORD_INIT(k)
#define BJ_INIT_ABIT	BJ_INIT_MBIT(MAX_MEMWORDS)
#define BJ_INIT_XBIT	BJ_INIT_MBIT(MAX_MEMWORDS + 1)

/*
 * Get a number of memwords and external memwords from a bpf_ctx object.
 * A NULL context has no external memwords; when there are no external
 * memwords the default of BPF_MEMWORDS applies.
 */
#define GET_EXTWORDS(bc) ((bc) ? (bc)->extwords : 0)
#define GET_MEMWORDS(bc) (GET_EXTWORDS(bc) ? GET_EXTWORDS(bc) : BPF_MEMWORDS)

/*
 * Datatype for Array Bounds Check Elimination (ABC) pass.
 * It is 64 bits wide so that UINT32_MAX plus the widest read
 * (4 bytes) is representable without wrapping.
 */
typedef uint64_t bpfjit_abc_length_t;
#define MAX_ABC_LENGTH (UINT32_MAX + UINT64_C(4)) /* max. width is 4 */
127 1.8 alnsn
128 1.7 alnsn struct bpfjit_stack
129 1.7 alnsn {
130 1.13 alnsn bpf_ctx_t *ctx;
131 1.13 alnsn uint32_t *extmem; /* pointer to external memory store */
132 1.7 alnsn #ifdef _KERNEL
133 1.7 alnsn void *tmp;
134 1.7 alnsn #endif
135 1.13 alnsn uint32_t mem[BPF_MEMWORDS]; /* internal memory store */
136 1.7 alnsn };
137 1.7 alnsn
138 1.7 alnsn /*
139 1.7 alnsn * Data for BPF_JMP instruction.
140 1.7 alnsn * Forward declaration for struct bpfjit_jump.
141 1.1 alnsn */
142 1.7 alnsn struct bpfjit_jump_data;
143 1.1 alnsn
144 1.1 alnsn /*
145 1.7 alnsn * Node of bjumps list.
146 1.1 alnsn */
147 1.3 rmind struct bpfjit_jump {
148 1.7 alnsn struct sljit_jump *sjump;
149 1.7 alnsn SLIST_ENTRY(bpfjit_jump) entries;
150 1.7 alnsn struct bpfjit_jump_data *jdata;
151 1.1 alnsn };
152 1.1 alnsn
153 1.1 alnsn /*
154 1.1 alnsn * Data for BPF_JMP instruction.
155 1.1 alnsn */
156 1.3 rmind struct bpfjit_jump_data {
157 1.1 alnsn /*
158 1.7 alnsn * These entries make up bjumps list:
159 1.7 alnsn * jtf[0] - when coming from jt path,
160 1.7 alnsn * jtf[1] - when coming from jf path.
161 1.1 alnsn */
162 1.7 alnsn struct bpfjit_jump jtf[2];
163 1.7 alnsn /*
164 1.7 alnsn * Length calculated by Array Bounds Check Elimination (ABC) pass.
165 1.7 alnsn */
166 1.8 alnsn bpfjit_abc_length_t abc_length;
167 1.7 alnsn /*
168 1.7 alnsn * Length checked by the last out-of-bounds check.
169 1.7 alnsn */
170 1.8 alnsn bpfjit_abc_length_t checked_length;
171 1.1 alnsn };
172 1.1 alnsn
173 1.1 alnsn /*
174 1.1 alnsn * Data for "read from packet" instructions.
175 1.1 alnsn * See also read_pkt_insn() function below.
176 1.1 alnsn */
177 1.3 rmind struct bpfjit_read_pkt_data {
178 1.1 alnsn /*
179 1.7 alnsn * Length calculated by Array Bounds Check Elimination (ABC) pass.
180 1.7 alnsn */
181 1.8 alnsn bpfjit_abc_length_t abc_length;
182 1.7 alnsn /*
183 1.7 alnsn * If positive, emit "if (buflen < check_length) return 0"
184 1.7 alnsn * out-of-bounds check.
185 1.9 alnsn * Values greater than UINT32_MAX generate unconditional "return 0".
186 1.1 alnsn */
187 1.8 alnsn bpfjit_abc_length_t check_length;
188 1.1 alnsn };
189 1.1 alnsn
190 1.1 alnsn /*
191 1.1 alnsn * Additional (optimization-related) data for bpf_insn.
192 1.1 alnsn */
193 1.3 rmind struct bpfjit_insn_data {
194 1.1 alnsn /* List of jumps to this insn. */
195 1.7 alnsn SLIST_HEAD(, bpfjit_jump) bjumps;
196 1.1 alnsn
197 1.1 alnsn union {
198 1.7 alnsn struct bpfjit_jump_data jdata;
199 1.7 alnsn struct bpfjit_read_pkt_data rdata;
200 1.7 alnsn } u;
201 1.1 alnsn
202 1.13 alnsn bpf_memword_init_t invalid;
203 1.7 alnsn bool unreachable;
204 1.1 alnsn };
205 1.1 alnsn
#ifdef _KERNEL

/* Readers that emit_xcall() emits calls to. */
uint32_t m_xword(const struct mbuf *, uint32_t, int *);
uint32_t m_xhalf(const struct mbuf *, uint32_t, int *);
uint32_t m_xbyte(const struct mbuf *, uint32_t, int *);

MODULE(MODULE_CLASS_MISC, bpfjit, "sljit")

/*
 * Module command handler.
 *
 * MODULE_CMD_INIT installs the bpfjit entry points into
 * bpfjit_module_ops and returns 0.  MODULE_CMD_FINI is refused with
 * EOPNOTSUPP.  Every other command yields ENOTTY.
 */
static int
bpfjit_modcmd(modcmd_t cmd, void *arg)
{

	if (cmd == MODULE_CMD_INIT) {
		/*
		 * bj_free_code is stored first, with a producer barrier
		 * before bj_generate_code is stored.
		 */
		bpfjit_module_ops.bj_free_code = &bpfjit_free_code;
		membar_producer();
		bpfjit_module_ops.bj_generate_code = &bpfjit_generate_code;
		membar_producer();
		return 0;
	}

	return (cmd == MODULE_CMD_FINI) ? EOPNOTSUPP : ENOTTY;
}
#endif
234 1.1 alnsn
235 1.1 alnsn static uint32_t
236 1.7 alnsn read_width(const struct bpf_insn *pc)
237 1.1 alnsn {
238 1.1 alnsn
239 1.1 alnsn switch (BPF_SIZE(pc->code)) {
240 1.1 alnsn case BPF_W:
241 1.1 alnsn return 4;
242 1.1 alnsn case BPF_H:
243 1.1 alnsn return 2;
244 1.1 alnsn case BPF_B:
245 1.1 alnsn return 1;
246 1.1 alnsn default:
247 1.7 alnsn BJ_ASSERT(false);
248 1.1 alnsn return 0;
249 1.1 alnsn }
250 1.1 alnsn }
251 1.1 alnsn
252 1.13 alnsn /*
253 1.13 alnsn * Copy buf and buflen members of bpf_args from BJ_ARGS
254 1.13 alnsn * pointer to BJ_BUF and BJ_BUFLEN registers.
255 1.13 alnsn */
256 1.13 alnsn static int
257 1.13 alnsn load_buf_buflen(struct sljit_compiler *compiler)
258 1.13 alnsn {
259 1.13 alnsn int status;
260 1.13 alnsn
261 1.13 alnsn status = sljit_emit_op1(compiler,
262 1.13 alnsn SLJIT_MOV_P,
263 1.13 alnsn BJ_BUF, 0,
264 1.13 alnsn SLJIT_MEM1(BJ_ARGS),
265 1.13 alnsn offsetof(struct bpf_args, pkt));
266 1.13 alnsn if (status != SLJIT_SUCCESS)
267 1.13 alnsn return status;
268 1.13 alnsn
269 1.13 alnsn status = sljit_emit_op1(compiler,
270 1.13 alnsn SLJIT_MOV,
271 1.13 alnsn BJ_BUFLEN, 0,
272 1.13 alnsn SLJIT_MEM1(BJ_ARGS),
273 1.13 alnsn offsetof(struct bpf_args, buflen));
274 1.13 alnsn
275 1.13 alnsn return status;
276 1.13 alnsn }
277 1.13 alnsn
/*
 * Double the capacity of a dynamically allocated array of jumps.
 *
 * jumps - in/out: pointer to the array; replaced by the new array
 *         on success, left untouched on failure.
 * size  - in/out: capacity of the array in elements; updated on
 *         success only.
 *
 * A capacity of zero grows to a single element (doubling zero would
 * never make room, and a zero-sized allocation request is not
 * portable).  An array with zero capacity is assumed to own no
 * storage, so nothing is copied or freed in that case.
 *
 * Returns false if the new size would overflow or if the allocation
 * fails, true otherwise.
 */
static bool
grow_jumps(struct sljit_jump ***jumps, size_t *size)
{
	const size_t elemsz = sizeof(struct sljit_jump *);
	const size_t old_size = *size;
	const size_t new_size = (old_size != 0) ? 2 * old_size : 1;
	struct sljit_jump **newptr;

	/* Reject wrap-around of the element count or of the byte count. */
	if (new_size < old_size || new_size > SIZE_MAX / elemsz)
		return false;

	newptr = BJ_ALLOC(new_size * elemsz);
	if (newptr == NULL)
		return false;

	if (old_size != 0) {
		memcpy(newptr, *jumps, old_size * elemsz);
		BJ_FREE(*jumps, old_size * elemsz);
	}

	*jumps = newptr;
	*size = new_size;
	return true;
}
300 1.7 alnsn
/*
 * Append a jump to a growable array.
 *
 * jumps    - in/out: the array (may be reallocated by grow_jumps()).
 * size     - in/out: number of elements in use.
 * max_size - in/out: capacity of the array.
 *
 * Returns false, leaving the array unchanged, when the array is
 * full and cannot be grown.
 */
static bool
append_jump(struct sljit_jump *jump, struct sljit_jump ***jumps,
    size_t *size, size_t *max_size)
{
	const bool full = (*size == *max_size);

	if (full) {
		if (!grow_jumps(jumps, max_size))
			return false;
	}

	(*jumps)[*size] = jump;
	*size += 1;
	return true;
}
311 1.1 alnsn
312 1.1 alnsn /*
313 1.1 alnsn * Generate code for BPF_LD+BPF_B+BPF_ABS A <- P[k:1].
314 1.1 alnsn */
315 1.1 alnsn static int
316 1.19 alnsn emit_read8(struct sljit_compiler *compiler, uint32_t k)
317 1.1 alnsn {
318 1.1 alnsn
319 1.1 alnsn return sljit_emit_op1(compiler,
320 1.1 alnsn SLJIT_MOV_UB,
321 1.7 alnsn BJ_AREG, 0,
322 1.7 alnsn SLJIT_MEM1(BJ_BUF), k);
323 1.1 alnsn }
324 1.1 alnsn
325 1.1 alnsn /*
326 1.1 alnsn * Generate code for BPF_LD+BPF_H+BPF_ABS A <- P[k:2].
327 1.1 alnsn */
328 1.1 alnsn static int
329 1.19 alnsn emit_read16(struct sljit_compiler *compiler, uint32_t k)
330 1.1 alnsn {
331 1.1 alnsn int status;
332 1.1 alnsn
333 1.1 alnsn /* tmp1 = buf[k]; */
334 1.1 alnsn status = sljit_emit_op1(compiler,
335 1.1 alnsn SLJIT_MOV_UB,
336 1.7 alnsn BJ_TMP1REG, 0,
337 1.7 alnsn SLJIT_MEM1(BJ_BUF), k);
338 1.1 alnsn if (status != SLJIT_SUCCESS)
339 1.1 alnsn return status;
340 1.1 alnsn
341 1.1 alnsn /* A = buf[k+1]; */
342 1.1 alnsn status = sljit_emit_op1(compiler,
343 1.1 alnsn SLJIT_MOV_UB,
344 1.7 alnsn BJ_AREG, 0,
345 1.7 alnsn SLJIT_MEM1(BJ_BUF), k+1);
346 1.1 alnsn if (status != SLJIT_SUCCESS)
347 1.1 alnsn return status;
348 1.1 alnsn
349 1.1 alnsn /* tmp1 = tmp1 << 8; */
350 1.1 alnsn status = sljit_emit_op2(compiler,
351 1.1 alnsn SLJIT_SHL,
352 1.7 alnsn BJ_TMP1REG, 0,
353 1.7 alnsn BJ_TMP1REG, 0,
354 1.1 alnsn SLJIT_IMM, 8);
355 1.1 alnsn if (status != SLJIT_SUCCESS)
356 1.1 alnsn return status;
357 1.1 alnsn
358 1.1 alnsn /* A = A + tmp1; */
359 1.1 alnsn status = sljit_emit_op2(compiler,
360 1.1 alnsn SLJIT_ADD,
361 1.7 alnsn BJ_AREG, 0,
362 1.7 alnsn BJ_AREG, 0,
363 1.7 alnsn BJ_TMP1REG, 0);
364 1.1 alnsn return status;
365 1.1 alnsn }
366 1.1 alnsn
367 1.1 alnsn /*
368 1.1 alnsn * Generate code for BPF_LD+BPF_W+BPF_ABS A <- P[k:4].
369 1.1 alnsn */
370 1.1 alnsn static int
371 1.19 alnsn emit_read32(struct sljit_compiler *compiler, uint32_t k)
372 1.1 alnsn {
373 1.1 alnsn int status;
374 1.1 alnsn
375 1.1 alnsn /* tmp1 = buf[k]; */
376 1.1 alnsn status = sljit_emit_op1(compiler,
377 1.1 alnsn SLJIT_MOV_UB,
378 1.7 alnsn BJ_TMP1REG, 0,
379 1.7 alnsn SLJIT_MEM1(BJ_BUF), k);
380 1.1 alnsn if (status != SLJIT_SUCCESS)
381 1.1 alnsn return status;
382 1.1 alnsn
383 1.1 alnsn /* tmp2 = buf[k+1]; */
384 1.1 alnsn status = sljit_emit_op1(compiler,
385 1.1 alnsn SLJIT_MOV_UB,
386 1.7 alnsn BJ_TMP2REG, 0,
387 1.7 alnsn SLJIT_MEM1(BJ_BUF), k+1);
388 1.1 alnsn if (status != SLJIT_SUCCESS)
389 1.1 alnsn return status;
390 1.1 alnsn
391 1.1 alnsn /* A = buf[k+3]; */
392 1.1 alnsn status = sljit_emit_op1(compiler,
393 1.1 alnsn SLJIT_MOV_UB,
394 1.7 alnsn BJ_AREG, 0,
395 1.7 alnsn SLJIT_MEM1(BJ_BUF), k+3);
396 1.1 alnsn if (status != SLJIT_SUCCESS)
397 1.1 alnsn return status;
398 1.1 alnsn
399 1.1 alnsn /* tmp1 = tmp1 << 24; */
400 1.1 alnsn status = sljit_emit_op2(compiler,
401 1.1 alnsn SLJIT_SHL,
402 1.7 alnsn BJ_TMP1REG, 0,
403 1.7 alnsn BJ_TMP1REG, 0,
404 1.1 alnsn SLJIT_IMM, 24);
405 1.1 alnsn if (status != SLJIT_SUCCESS)
406 1.1 alnsn return status;
407 1.1 alnsn
408 1.1 alnsn /* A = A + tmp1; */
409 1.1 alnsn status = sljit_emit_op2(compiler,
410 1.1 alnsn SLJIT_ADD,
411 1.7 alnsn BJ_AREG, 0,
412 1.7 alnsn BJ_AREG, 0,
413 1.7 alnsn BJ_TMP1REG, 0);
414 1.1 alnsn if (status != SLJIT_SUCCESS)
415 1.1 alnsn return status;
416 1.1 alnsn
417 1.1 alnsn /* tmp1 = buf[k+2]; */
418 1.1 alnsn status = sljit_emit_op1(compiler,
419 1.1 alnsn SLJIT_MOV_UB,
420 1.7 alnsn BJ_TMP1REG, 0,
421 1.7 alnsn SLJIT_MEM1(BJ_BUF), k+2);
422 1.1 alnsn if (status != SLJIT_SUCCESS)
423 1.1 alnsn return status;
424 1.1 alnsn
425 1.1 alnsn /* tmp2 = tmp2 << 16; */
426 1.1 alnsn status = sljit_emit_op2(compiler,
427 1.1 alnsn SLJIT_SHL,
428 1.7 alnsn BJ_TMP2REG, 0,
429 1.7 alnsn BJ_TMP2REG, 0,
430 1.1 alnsn SLJIT_IMM, 16);
431 1.1 alnsn if (status != SLJIT_SUCCESS)
432 1.1 alnsn return status;
433 1.1 alnsn
434 1.1 alnsn /* A = A + tmp2; */
435 1.1 alnsn status = sljit_emit_op2(compiler,
436 1.1 alnsn SLJIT_ADD,
437 1.7 alnsn BJ_AREG, 0,
438 1.7 alnsn BJ_AREG, 0,
439 1.7 alnsn BJ_TMP2REG, 0);
440 1.1 alnsn if (status != SLJIT_SUCCESS)
441 1.1 alnsn return status;
442 1.1 alnsn
443 1.1 alnsn /* tmp1 = tmp1 << 8; */
444 1.1 alnsn status = sljit_emit_op2(compiler,
445 1.1 alnsn SLJIT_SHL,
446 1.7 alnsn BJ_TMP1REG, 0,
447 1.7 alnsn BJ_TMP1REG, 0,
448 1.1 alnsn SLJIT_IMM, 8);
449 1.1 alnsn if (status != SLJIT_SUCCESS)
450 1.1 alnsn return status;
451 1.1 alnsn
452 1.1 alnsn /* A = A + tmp1; */
453 1.1 alnsn status = sljit_emit_op2(compiler,
454 1.1 alnsn SLJIT_ADD,
455 1.7 alnsn BJ_AREG, 0,
456 1.7 alnsn BJ_AREG, 0,
457 1.7 alnsn BJ_TMP1REG, 0);
458 1.1 alnsn return status;
459 1.1 alnsn }
460 1.1 alnsn
#ifdef _KERNEL
/*
 * Generate m_xword/m_xhalf/m_xbyte call.
 *
 * pc is one of:
 * BPF_LD+BPF_W+BPF_ABS    A <- P[k:4]
 * BPF_LD+BPF_H+BPF_ABS    A <- P[k:2]
 * BPF_LD+BPF_B+BPF_ABS    A <- P[k:1]
 * BPF_LD+BPF_W+BPF_IND    A <- P[X+k:4]
 * BPF_LD+BPF_H+BPF_IND    A <- P[X+k:2]
 * BPF_LD+BPF_B+BPF_IND    A <- P[X+k:1]
 * BPF_LDX+BPF_B+BPF_MSH   X <- 4*(P[k:1]&0xf)
 *
 * The dst variable should be
 *  - BJ_AREG when emitting code for BPF_LD instructions,
 *  - BJ_XREG or any of BJ_TMP[1-3]REG registers when emitting
 *    code for BPF_MSH instruction.
 *
 * compiler  - sljit compiler the code is emitted to.
 * dst, dstw - sljit destination operand that receives fn's result.
 * ret0_jump - out: jump taken by the generated code when fn reports
 *             an error; the caller must direct it to "return 0".
 *             Only written when all preceding emits succeeded.
 * fn        - function to call as fn(buf, k, &err).
 *
 * Returns SLJIT_SUCCESS, the status of the first failed emit, or
 * SLJIT_ERR_ALLOC_FAILED if the compare-and-jump can't be created.
 */
static int
emit_xcall(struct sljit_compiler *compiler, const struct bpf_insn *pc,
    int dst, sljit_sw dstw, struct sljit_jump **ret0_jump,
    uint32_t (*fn)(const struct mbuf *, uint32_t, int *))
{
#if BJ_XREG == SLJIT_RETURN_REG   || \
    BJ_XREG == SLJIT_SCRATCH_REG1 || \
    BJ_XREG == SLJIT_SCRATCH_REG2 || \
    BJ_XREG == SLJIT_SCRATCH_REG3
#error "Not supported assignment of registers."
#endif
	int status;

	/*
	 * The third argument of fn is an address on stack.
	 */
	const int arg3_offset = offsetof(struct bpfjit_stack, tmp);

	/* BPF_LDX must not change A, so A is parked in tmp3 meanwhile. */
	const bool preserve_a = (BPF_CLASS(pc->code) == BPF_LDX);

	if (preserve_a) {
		/* save A */
		status = sljit_emit_op1(compiler,
		    SLJIT_MOV,
		    BJ_TMP3REG, 0,
		    BJ_AREG, 0);
		if (status != SLJIT_SUCCESS)
			return status;
	}

	/*
	 * Prepare registers for fn(buf, k, &err) call.
	 */
	status = sljit_emit_op1(compiler,
	    SLJIT_MOV,
	    SLJIT_SCRATCH_REG1, 0,
	    BJ_BUF, 0);
	if (status != SLJIT_SUCCESS)
		return status;

	if (BPF_CLASS(pc->code) == BPF_LD && BPF_MODE(pc->code) == BPF_IND) {
		/* second argument is X + k */
		status = sljit_emit_op2(compiler,
		    SLJIT_ADD,
		    SLJIT_SCRATCH_REG2, 0,
		    BJ_XREG, 0,
		    SLJIT_IMM, (uint32_t)pc->k);
	} else {
		/* second argument is k */
		status = sljit_emit_op1(compiler,
		    SLJIT_MOV,
		    SLJIT_SCRATCH_REG2, 0,
		    SLJIT_IMM, (uint32_t)pc->k);
	}

	if (status != SLJIT_SUCCESS)
		return status;

	status = sljit_get_local_base(compiler,
	    SLJIT_SCRATCH_REG3, 0, arg3_offset);
	if (status != SLJIT_SUCCESS)
		return status;

	/* fn(buf, k, &err); */
	status = sljit_emit_ijump(compiler,
	    SLJIT_CALL3,
	    SLJIT_IMM, SLJIT_FUNC_OFFSET(fn));
	/* Don't let a later emit overwrite a failure of the call itself. */
	if (status != SLJIT_SUCCESS)
		return status;

	if (dst != SLJIT_RETURN_REG) {
		/* move return value to dst */
		status = sljit_emit_op1(compiler,
		    SLJIT_MOV,
		    dst, dstw,
		    SLJIT_RETURN_REG, 0);
		if (status != SLJIT_SUCCESS)
			return status;
	}

	if (preserve_a) {
		/* restore A */
		status = sljit_emit_op1(compiler,
		    SLJIT_MOV,
		    BJ_AREG, 0,
		    BJ_TMP3REG, 0);
		if (status != SLJIT_SUCCESS)
			return status;
	}

	/* scratch3 = err;  (the value fn stored in the stack slot) */
	status = sljit_emit_op1(compiler,
	    SLJIT_MOV_UI,
	    SLJIT_SCRATCH_REG3, 0,
	    SLJIT_MEM1(SLJIT_LOCALS_REG), arg3_offset);
	if (status != SLJIT_SUCCESS)
		return status;

	/* if (scratch3 != 0) return 0; */
	*ret0_jump = sljit_emit_cmp(compiler,
	    SLJIT_C_NOT_EQUAL,
	    SLJIT_SCRATCH_REG3, 0,
	    SLJIT_IMM, 0);
	if (*ret0_jump == NULL)
		return SLJIT_ERR_ALLOC_FAILED;

	return status;
}
#endif
582 1.1 alnsn
583 1.1 alnsn /*
584 1.13 alnsn * Emit code for BPF_COP and BPF_COPX instructions.
585 1.13 alnsn */
586 1.13 alnsn static int
587 1.19 alnsn emit_cop(struct sljit_compiler *compiler, const bpf_ctx_t *bc,
588 1.13 alnsn const struct bpf_insn *pc, struct sljit_jump **ret0_jump)
589 1.13 alnsn {
590 1.13 alnsn #if BJ_XREG == SLJIT_RETURN_REG || \
591 1.13 alnsn BJ_XREG == SLJIT_SCRATCH_REG1 || \
592 1.13 alnsn BJ_XREG == SLJIT_SCRATCH_REG2 || \
593 1.13 alnsn BJ_XREG == SLJIT_SCRATCH_REG3 || \
594 1.13 alnsn BJ_COPF_PTR == BJ_ARGS || \
595 1.13 alnsn BJ_COPF_IDX == BJ_ARGS
596 1.13 alnsn #error "Not supported assignment of registers."
597 1.13 alnsn #endif
598 1.13 alnsn
599 1.13 alnsn struct sljit_jump *jump;
600 1.13 alnsn int status;
601 1.13 alnsn
602 1.13 alnsn jump = NULL;
603 1.13 alnsn
604 1.13 alnsn BJ_ASSERT(bc != NULL && bc->copfuncs != NULL);
605 1.13 alnsn
606 1.13 alnsn if (BPF_MISCOP(pc->code) == BPF_COPX) {
607 1.13 alnsn /* if (X >= bc->nfuncs) return 0; */
608 1.13 alnsn jump = sljit_emit_cmp(compiler,
609 1.13 alnsn SLJIT_C_GREATER_EQUAL,
610 1.13 alnsn BJ_XREG, 0,
611 1.13 alnsn SLJIT_IMM, bc->nfuncs);
612 1.13 alnsn if (jump == NULL)
613 1.13 alnsn return SLJIT_ERR_ALLOC_FAILED;
614 1.13 alnsn }
615 1.13 alnsn
616 1.13 alnsn if (jump != NULL)
617 1.13 alnsn *ret0_jump = jump;
618 1.13 alnsn
619 1.13 alnsn /*
620 1.13 alnsn * Copy bpf_copfunc_t arguments to registers.
621 1.13 alnsn */
622 1.13 alnsn #if BJ_AREG != SLJIT_SCRATCH_REG3
623 1.13 alnsn status = sljit_emit_op1(compiler,
624 1.13 alnsn SLJIT_MOV_UI,
625 1.13 alnsn SLJIT_SCRATCH_REG3, 0,
626 1.13 alnsn BJ_AREG, 0);
627 1.13 alnsn if (status != SLJIT_SUCCESS)
628 1.13 alnsn return status;
629 1.13 alnsn #endif
630 1.13 alnsn
631 1.13 alnsn status = sljit_emit_op1(compiler,
632 1.13 alnsn SLJIT_MOV_P,
633 1.13 alnsn SLJIT_SCRATCH_REG1, 0,
634 1.13 alnsn SLJIT_MEM1(SLJIT_LOCALS_REG),
635 1.13 alnsn offsetof(struct bpfjit_stack, ctx));
636 1.13 alnsn if (status != SLJIT_SUCCESS)
637 1.13 alnsn return status;
638 1.13 alnsn
639 1.13 alnsn status = sljit_emit_op1(compiler,
640 1.13 alnsn SLJIT_MOV_P,
641 1.13 alnsn SLJIT_SCRATCH_REG2, 0,
642 1.13 alnsn BJ_ARGS, 0);
643 1.13 alnsn if (status != SLJIT_SUCCESS)
644 1.13 alnsn return status;
645 1.13 alnsn
646 1.13 alnsn if (BPF_MISCOP(pc->code) == BPF_COP) {
647 1.13 alnsn status = sljit_emit_ijump(compiler,
648 1.13 alnsn SLJIT_CALL3,
649 1.13 alnsn SLJIT_IMM, SLJIT_FUNC_OFFSET(bc->copfuncs[pc->k]));
650 1.13 alnsn if (status != SLJIT_SUCCESS)
651 1.13 alnsn return status;
652 1.13 alnsn } else if (BPF_MISCOP(pc->code) == BPF_COPX) {
653 1.13 alnsn /* load ctx->copfuncs */
654 1.13 alnsn status = sljit_emit_op1(compiler,
655 1.13 alnsn SLJIT_MOV_P,
656 1.13 alnsn BJ_COPF_PTR, 0,
657 1.13 alnsn SLJIT_MEM1(SLJIT_SCRATCH_REG1),
658 1.13 alnsn offsetof(struct bpf_ctx, copfuncs));
659 1.13 alnsn if (status != SLJIT_SUCCESS)
660 1.13 alnsn return status;
661 1.13 alnsn
662 1.13 alnsn /*
663 1.13 alnsn * Load X to a register that can be used for
664 1.13 alnsn * memory addressing.
665 1.13 alnsn */
666 1.13 alnsn status = sljit_emit_op1(compiler,
667 1.13 alnsn SLJIT_MOV_P,
668 1.13 alnsn BJ_COPF_IDX, 0,
669 1.13 alnsn BJ_XREG, 0);
670 1.13 alnsn if (status != SLJIT_SUCCESS)
671 1.13 alnsn return status;
672 1.13 alnsn
673 1.13 alnsn status = sljit_emit_ijump(compiler,
674 1.13 alnsn SLJIT_CALL3,
675 1.13 alnsn SLJIT_MEM2(BJ_COPF_PTR, BJ_COPF_IDX),
676 1.13 alnsn SLJIT_WORD_SHIFT);
677 1.13 alnsn if (status != SLJIT_SUCCESS)
678 1.13 alnsn return status;
679 1.13 alnsn
680 1.13 alnsn status = load_buf_buflen(compiler);
681 1.13 alnsn if (status != SLJIT_SUCCESS)
682 1.13 alnsn return status;
683 1.13 alnsn }
684 1.13 alnsn
685 1.13 alnsn #if BJ_AREG != SLJIT_RETURN_REG
686 1.13 alnsn status = sljit_emit_op1(compiler,
687 1.13 alnsn SLJIT_MOV,
688 1.13 alnsn BJ_AREG, 0,
689 1.13 alnsn SLJIT_RETURN_REG, 0);
690 1.13 alnsn if (status != SLJIT_SUCCESS)
691 1.13 alnsn return status;
692 1.13 alnsn #endif
693 1.13 alnsn
694 1.13 alnsn return status;
695 1.13 alnsn }
696 1.13 alnsn
697 1.13 alnsn /*
698 1.1 alnsn * Generate code for
699 1.1 alnsn * BPF_LD+BPF_W+BPF_ABS A <- P[k:4]
700 1.1 alnsn * BPF_LD+BPF_H+BPF_ABS A <- P[k:2]
701 1.1 alnsn * BPF_LD+BPF_B+BPF_ABS A <- P[k:1]
702 1.1 alnsn * BPF_LD+BPF_W+BPF_IND A <- P[X+k:4]
703 1.1 alnsn * BPF_LD+BPF_H+BPF_IND A <- P[X+k:2]
704 1.1 alnsn * BPF_LD+BPF_B+BPF_IND A <- P[X+k:1]
705 1.1 alnsn */
706 1.1 alnsn static int
707 1.19 alnsn emit_pkt_read(struct sljit_compiler *compiler,
708 1.7 alnsn const struct bpf_insn *pc, struct sljit_jump *to_mchain_jump,
709 1.7 alnsn struct sljit_jump ***ret0, size_t *ret0_size, size_t *ret0_maxsize)
710 1.1 alnsn {
711 1.6 pooka int status = 0; /* XXX gcc 4.1 */
712 1.1 alnsn uint32_t width;
713 1.1 alnsn struct sljit_jump *jump;
714 1.1 alnsn #ifdef _KERNEL
715 1.1 alnsn struct sljit_label *label;
716 1.1 alnsn struct sljit_jump *over_mchain_jump;
717 1.1 alnsn const bool check_zero_buflen = (to_mchain_jump != NULL);
718 1.1 alnsn #endif
719 1.1 alnsn const uint32_t k = pc->k;
720 1.1 alnsn
721 1.1 alnsn #ifdef _KERNEL
722 1.1 alnsn if (to_mchain_jump == NULL) {
723 1.1 alnsn to_mchain_jump = sljit_emit_cmp(compiler,
724 1.1 alnsn SLJIT_C_EQUAL,
725 1.7 alnsn BJ_BUFLEN, 0,
726 1.1 alnsn SLJIT_IMM, 0);
727 1.1 alnsn if (to_mchain_jump == NULL)
728 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
729 1.1 alnsn }
730 1.1 alnsn #endif
731 1.1 alnsn
732 1.1 alnsn width = read_width(pc);
733 1.1 alnsn
734 1.1 alnsn if (BPF_MODE(pc->code) == BPF_IND) {
735 1.1 alnsn /* tmp1 = buflen - (pc->k + width); */
736 1.1 alnsn status = sljit_emit_op2(compiler,
737 1.1 alnsn SLJIT_SUB,
738 1.7 alnsn BJ_TMP1REG, 0,
739 1.7 alnsn BJ_BUFLEN, 0,
740 1.1 alnsn SLJIT_IMM, k + width);
741 1.1 alnsn if (status != SLJIT_SUCCESS)
742 1.1 alnsn return status;
743 1.1 alnsn
744 1.1 alnsn /* buf += X; */
745 1.1 alnsn status = sljit_emit_op2(compiler,
746 1.1 alnsn SLJIT_ADD,
747 1.7 alnsn BJ_BUF, 0,
748 1.7 alnsn BJ_BUF, 0,
749 1.7 alnsn BJ_XREG, 0);
750 1.1 alnsn if (status != SLJIT_SUCCESS)
751 1.1 alnsn return status;
752 1.1 alnsn
753 1.1 alnsn /* if (tmp1 < X) return 0; */
754 1.1 alnsn jump = sljit_emit_cmp(compiler,
755 1.1 alnsn SLJIT_C_LESS,
756 1.7 alnsn BJ_TMP1REG, 0,
757 1.7 alnsn BJ_XREG, 0);
758 1.1 alnsn if (jump == NULL)
759 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
760 1.7 alnsn if (!append_jump(jump, ret0, ret0_size, ret0_maxsize))
761 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
762 1.1 alnsn }
763 1.1 alnsn
764 1.1 alnsn switch (width) {
765 1.1 alnsn case 4:
766 1.1 alnsn status = emit_read32(compiler, k);
767 1.1 alnsn break;
768 1.1 alnsn case 2:
769 1.1 alnsn status = emit_read16(compiler, k);
770 1.1 alnsn break;
771 1.1 alnsn case 1:
772 1.1 alnsn status = emit_read8(compiler, k);
773 1.1 alnsn break;
774 1.1 alnsn }
775 1.1 alnsn
776 1.1 alnsn if (status != SLJIT_SUCCESS)
777 1.1 alnsn return status;
778 1.1 alnsn
779 1.1 alnsn if (BPF_MODE(pc->code) == BPF_IND) {
780 1.1 alnsn /* buf -= X; */
781 1.1 alnsn status = sljit_emit_op2(compiler,
782 1.1 alnsn SLJIT_SUB,
783 1.7 alnsn BJ_BUF, 0,
784 1.7 alnsn BJ_BUF, 0,
785 1.7 alnsn BJ_XREG, 0);
786 1.1 alnsn if (status != SLJIT_SUCCESS)
787 1.1 alnsn return status;
788 1.1 alnsn }
789 1.1 alnsn
790 1.1 alnsn #ifdef _KERNEL
791 1.1 alnsn over_mchain_jump = sljit_emit_jump(compiler, SLJIT_JUMP);
792 1.1 alnsn if (over_mchain_jump == NULL)
793 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
794 1.1 alnsn
795 1.1 alnsn /* entry point to mchain handler */
796 1.1 alnsn label = sljit_emit_label(compiler);
797 1.1 alnsn if (label == NULL)
798 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
799 1.1 alnsn sljit_set_label(to_mchain_jump, label);
800 1.1 alnsn
801 1.1 alnsn if (check_zero_buflen) {
802 1.1 alnsn /* if (buflen != 0) return 0; */
803 1.1 alnsn jump = sljit_emit_cmp(compiler,
804 1.1 alnsn SLJIT_C_NOT_EQUAL,
805 1.7 alnsn BJ_BUFLEN, 0,
806 1.1 alnsn SLJIT_IMM, 0);
807 1.1 alnsn if (jump == NULL)
808 1.1 alnsn return SLJIT_ERR_ALLOC_FAILED;
809 1.7 alnsn if (!append_jump(jump, ret0, ret0_size, ret0_maxsize))
810 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
811 1.1 alnsn }
812 1.1 alnsn
813 1.1 alnsn switch (width) {
814 1.1 alnsn case 4:
815 1.7 alnsn status = emit_xcall(compiler, pc, BJ_AREG, 0, &jump, &m_xword);
816 1.1 alnsn break;
817 1.1 alnsn case 2:
818 1.7 alnsn status = emit_xcall(compiler, pc, BJ_AREG, 0, &jump, &m_xhalf);
819 1.1 alnsn break;
820 1.1 alnsn case 1:
821 1.7 alnsn status = emit_xcall(compiler, pc, BJ_AREG, 0, &jump, &m_xbyte);
822 1.1 alnsn break;
823 1.1 alnsn }
824 1.1 alnsn
825 1.1 alnsn if (status != SLJIT_SUCCESS)
826 1.1 alnsn return status;
827 1.1 alnsn
828 1.7 alnsn if (!append_jump(jump, ret0, ret0_size, ret0_maxsize))
829 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
830 1.1 alnsn
831 1.1 alnsn label = sljit_emit_label(compiler);
832 1.1 alnsn if (label == NULL)
833 1.1 alnsn return SLJIT_ERR_ALLOC_FAILED;
834 1.1 alnsn sljit_set_label(over_mchain_jump, label);
835 1.1 alnsn #endif
836 1.1 alnsn
837 1.1 alnsn return status;
838 1.1 alnsn }
839 1.1 alnsn
840 1.13 alnsn static int
841 1.19 alnsn emit_memload(struct sljit_compiler *compiler,
842 1.13 alnsn sljit_si dst, uint32_t k, size_t extwords)
843 1.13 alnsn {
844 1.13 alnsn int status;
845 1.13 alnsn sljit_si src;
846 1.13 alnsn sljit_sw srcw;
847 1.13 alnsn
848 1.13 alnsn srcw = k * sizeof(uint32_t);
849 1.13 alnsn
850 1.13 alnsn if (extwords == 0) {
851 1.13 alnsn src = SLJIT_MEM1(SLJIT_LOCALS_REG);
852 1.13 alnsn srcw += offsetof(struct bpfjit_stack, mem);
853 1.13 alnsn } else {
854 1.13 alnsn /* copy extmem pointer to the tmp1 register */
855 1.13 alnsn status = sljit_emit_op1(compiler,
856 1.16 alnsn SLJIT_MOV_P,
857 1.13 alnsn BJ_TMP1REG, 0,
858 1.13 alnsn SLJIT_MEM1(SLJIT_LOCALS_REG),
859 1.13 alnsn offsetof(struct bpfjit_stack, extmem));
860 1.13 alnsn if (status != SLJIT_SUCCESS)
861 1.13 alnsn return status;
862 1.13 alnsn src = SLJIT_MEM1(BJ_TMP1REG);
863 1.13 alnsn }
864 1.13 alnsn
865 1.13 alnsn return sljit_emit_op1(compiler, SLJIT_MOV_UI, dst, 0, src, srcw);
866 1.13 alnsn }
867 1.13 alnsn
868 1.13 alnsn static int
869 1.19 alnsn emit_memstore(struct sljit_compiler *compiler,
870 1.13 alnsn sljit_si src, uint32_t k, size_t extwords)
871 1.13 alnsn {
872 1.13 alnsn int status;
873 1.13 alnsn sljit_si dst;
874 1.13 alnsn sljit_sw dstw;
875 1.13 alnsn
876 1.13 alnsn dstw = k * sizeof(uint32_t);
877 1.13 alnsn
878 1.13 alnsn if (extwords == 0) {
879 1.13 alnsn dst = SLJIT_MEM1(SLJIT_LOCALS_REG);
880 1.13 alnsn dstw += offsetof(struct bpfjit_stack, mem);
881 1.13 alnsn } else {
882 1.13 alnsn /* copy extmem pointer to the tmp1 register */
883 1.13 alnsn status = sljit_emit_op1(compiler,
884 1.16 alnsn SLJIT_MOV_P,
885 1.13 alnsn BJ_TMP1REG, 0,
886 1.13 alnsn SLJIT_MEM1(SLJIT_LOCALS_REG),
887 1.13 alnsn offsetof(struct bpfjit_stack, extmem));
888 1.13 alnsn if (status != SLJIT_SUCCESS)
889 1.13 alnsn return status;
890 1.13 alnsn dst = SLJIT_MEM1(BJ_TMP1REG);
891 1.13 alnsn }
892 1.13 alnsn
893 1.13 alnsn return sljit_emit_op1(compiler, SLJIT_MOV_UI, dst, dstw, src, 0);
894 1.13 alnsn }
895 1.13 alnsn
896 1.1 alnsn /*
897 1.1 alnsn * Generate code for BPF_LDX+BPF_B+BPF_MSH X <- 4*(P[k:1]&0xf).
898 1.1 alnsn */
899 1.1 alnsn static int
900 1.19 alnsn emit_msh(struct sljit_compiler *compiler,
901 1.7 alnsn const struct bpf_insn *pc, struct sljit_jump *to_mchain_jump,
902 1.7 alnsn struct sljit_jump ***ret0, size_t *ret0_size, size_t *ret0_maxsize)
903 1.1 alnsn {
904 1.1 alnsn int status;
905 1.1 alnsn #ifdef _KERNEL
906 1.1 alnsn struct sljit_label *label;
907 1.1 alnsn struct sljit_jump *jump, *over_mchain_jump;
908 1.1 alnsn const bool check_zero_buflen = (to_mchain_jump != NULL);
909 1.1 alnsn #endif
910 1.1 alnsn const uint32_t k = pc->k;
911 1.1 alnsn
912 1.1 alnsn #ifdef _KERNEL
913 1.1 alnsn if (to_mchain_jump == NULL) {
914 1.1 alnsn to_mchain_jump = sljit_emit_cmp(compiler,
915 1.1 alnsn SLJIT_C_EQUAL,
916 1.7 alnsn BJ_BUFLEN, 0,
917 1.1 alnsn SLJIT_IMM, 0);
918 1.1 alnsn if (to_mchain_jump == NULL)
919 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
920 1.1 alnsn }
921 1.1 alnsn #endif
922 1.1 alnsn
923 1.1 alnsn /* tmp1 = buf[k] */
924 1.1 alnsn status = sljit_emit_op1(compiler,
925 1.1 alnsn SLJIT_MOV_UB,
926 1.7 alnsn BJ_TMP1REG, 0,
927 1.7 alnsn SLJIT_MEM1(BJ_BUF), k);
928 1.1 alnsn if (status != SLJIT_SUCCESS)
929 1.1 alnsn return status;
930 1.1 alnsn
931 1.1 alnsn /* tmp1 &= 0xf */
932 1.1 alnsn status = sljit_emit_op2(compiler,
933 1.1 alnsn SLJIT_AND,
934 1.7 alnsn BJ_TMP1REG, 0,
935 1.7 alnsn BJ_TMP1REG, 0,
936 1.1 alnsn SLJIT_IMM, 0xf);
937 1.1 alnsn if (status != SLJIT_SUCCESS)
938 1.1 alnsn return status;
939 1.1 alnsn
940 1.1 alnsn /* tmp1 = tmp1 << 2 */
941 1.1 alnsn status = sljit_emit_op2(compiler,
942 1.1 alnsn SLJIT_SHL,
943 1.7 alnsn BJ_XREG, 0,
944 1.7 alnsn BJ_TMP1REG, 0,
945 1.1 alnsn SLJIT_IMM, 2);
946 1.1 alnsn if (status != SLJIT_SUCCESS)
947 1.1 alnsn return status;
948 1.1 alnsn
949 1.1 alnsn #ifdef _KERNEL
950 1.1 alnsn over_mchain_jump = sljit_emit_jump(compiler, SLJIT_JUMP);
951 1.1 alnsn if (over_mchain_jump == NULL)
952 1.1 alnsn return SLJIT_ERR_ALLOC_FAILED;
953 1.1 alnsn
954 1.1 alnsn /* entry point to mchain handler */
955 1.1 alnsn label = sljit_emit_label(compiler);
956 1.1 alnsn if (label == NULL)
957 1.1 alnsn return SLJIT_ERR_ALLOC_FAILED;
958 1.1 alnsn sljit_set_label(to_mchain_jump, label);
959 1.1 alnsn
960 1.1 alnsn if (check_zero_buflen) {
961 1.1 alnsn /* if (buflen != 0) return 0; */
962 1.1 alnsn jump = sljit_emit_cmp(compiler,
963 1.1 alnsn SLJIT_C_NOT_EQUAL,
964 1.7 alnsn BJ_BUFLEN, 0,
965 1.1 alnsn SLJIT_IMM, 0);
966 1.1 alnsn if (jump == NULL)
967 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
968 1.7 alnsn if (!append_jump(jump, ret0, ret0_size, ret0_maxsize))
969 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
970 1.1 alnsn }
971 1.1 alnsn
972 1.7 alnsn status = emit_xcall(compiler, pc, BJ_TMP1REG, 0, &jump, &m_xbyte);
973 1.1 alnsn if (status != SLJIT_SUCCESS)
974 1.1 alnsn return status;
975 1.7 alnsn
976 1.7 alnsn if (!append_jump(jump, ret0, ret0_size, ret0_maxsize))
977 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
978 1.1 alnsn
979 1.1 alnsn /* tmp1 &= 0xf */
980 1.1 alnsn status = sljit_emit_op2(compiler,
981 1.1 alnsn SLJIT_AND,
982 1.7 alnsn BJ_TMP1REG, 0,
983 1.7 alnsn BJ_TMP1REG, 0,
984 1.1 alnsn SLJIT_IMM, 0xf);
985 1.1 alnsn if (status != SLJIT_SUCCESS)
986 1.1 alnsn return status;
987 1.1 alnsn
988 1.1 alnsn /* tmp1 = tmp1 << 2 */
989 1.1 alnsn status = sljit_emit_op2(compiler,
990 1.1 alnsn SLJIT_SHL,
991 1.7 alnsn BJ_XREG, 0,
992 1.7 alnsn BJ_TMP1REG, 0,
993 1.1 alnsn SLJIT_IMM, 2);
994 1.1 alnsn if (status != SLJIT_SUCCESS)
995 1.1 alnsn return status;
996 1.1 alnsn
997 1.1 alnsn
998 1.1 alnsn label = sljit_emit_label(compiler);
999 1.1 alnsn if (label == NULL)
1000 1.1 alnsn return SLJIT_ERR_ALLOC_FAILED;
1001 1.1 alnsn sljit_set_label(over_mchain_jump, label);
1002 1.1 alnsn #endif
1003 1.1 alnsn
1004 1.1 alnsn return status;
1005 1.1 alnsn }
1006 1.1 alnsn
1007 1.1 alnsn static int
1008 1.19 alnsn emit_pow2_division(struct sljit_compiler *compiler, uint32_t k)
1009 1.1 alnsn {
1010 1.1 alnsn int shift = 0;
1011 1.1 alnsn int status = SLJIT_SUCCESS;
1012 1.1 alnsn
1013 1.1 alnsn while (k > 1) {
1014 1.1 alnsn k >>= 1;
1015 1.1 alnsn shift++;
1016 1.1 alnsn }
1017 1.1 alnsn
1018 1.7 alnsn BJ_ASSERT(k == 1 && shift < 32);
1019 1.1 alnsn
1020 1.1 alnsn if (shift != 0) {
1021 1.1 alnsn status = sljit_emit_op2(compiler,
1022 1.1 alnsn SLJIT_LSHR|SLJIT_INT_OP,
1023 1.7 alnsn BJ_AREG, 0,
1024 1.7 alnsn BJ_AREG, 0,
1025 1.1 alnsn SLJIT_IMM, shift);
1026 1.1 alnsn }
1027 1.1 alnsn
1028 1.1 alnsn return status;
1029 1.1 alnsn }
1030 1.1 alnsn
1031 1.1 alnsn #if !defined(BPFJIT_USE_UDIV)
1032 1.1 alnsn static sljit_uw
1033 1.1 alnsn divide(sljit_uw x, sljit_uw y)
1034 1.1 alnsn {
1035 1.1 alnsn
1036 1.1 alnsn return (uint32_t)x / (uint32_t)y;
1037 1.1 alnsn }
1038 1.1 alnsn #endif
1039 1.1 alnsn
1040 1.1 alnsn /*
1041 1.1 alnsn * Generate A = A / div.
1042 1.7 alnsn * divt,divw are either SLJIT_IMM,pc->k or BJ_XREG,0.
1043 1.1 alnsn */
1044 1.1 alnsn static int
1045 1.19 alnsn emit_division(struct sljit_compiler *compiler, int divt, sljit_sw divw)
1046 1.1 alnsn {
1047 1.1 alnsn int status;
1048 1.1 alnsn
1049 1.7 alnsn #if BJ_XREG == SLJIT_RETURN_REG || \
1050 1.12 alnsn BJ_XREG == SLJIT_SCRATCH_REG1 || \
1051 1.12 alnsn BJ_XREG == SLJIT_SCRATCH_REG2 || \
1052 1.12 alnsn BJ_AREG == SLJIT_SCRATCH_REG2
1053 1.1 alnsn #error "Not supported assignment of registers."
1054 1.1 alnsn #endif
1055 1.1 alnsn
1056 1.12 alnsn #if BJ_AREG != SLJIT_SCRATCH_REG1
1057 1.1 alnsn status = sljit_emit_op1(compiler,
1058 1.1 alnsn SLJIT_MOV,
1059 1.12 alnsn SLJIT_SCRATCH_REG1, 0,
1060 1.7 alnsn BJ_AREG, 0);
1061 1.1 alnsn if (status != SLJIT_SUCCESS)
1062 1.1 alnsn return status;
1063 1.1 alnsn #endif
1064 1.1 alnsn
1065 1.1 alnsn status = sljit_emit_op1(compiler,
1066 1.1 alnsn SLJIT_MOV,
1067 1.12 alnsn SLJIT_SCRATCH_REG2, 0,
1068 1.1 alnsn divt, divw);
1069 1.1 alnsn if (status != SLJIT_SUCCESS)
1070 1.1 alnsn return status;
1071 1.1 alnsn
1072 1.1 alnsn #if defined(BPFJIT_USE_UDIV)
1073 1.1 alnsn status = sljit_emit_op0(compiler, SLJIT_UDIV|SLJIT_INT_OP);
1074 1.1 alnsn
1075 1.12 alnsn #if BJ_AREG != SLJIT_SCRATCH_REG1
1076 1.1 alnsn status = sljit_emit_op1(compiler,
1077 1.1 alnsn SLJIT_MOV,
1078 1.7 alnsn BJ_AREG, 0,
1079 1.12 alnsn SLJIT_SCRATCH_REG1, 0);
1080 1.1 alnsn if (status != SLJIT_SUCCESS)
1081 1.1 alnsn return status;
1082 1.1 alnsn #endif
1083 1.1 alnsn #else
1084 1.1 alnsn status = sljit_emit_ijump(compiler,
1085 1.1 alnsn SLJIT_CALL2,
1086 1.1 alnsn SLJIT_IMM, SLJIT_FUNC_OFFSET(divide));
1087 1.1 alnsn
1088 1.7 alnsn #if BJ_AREG != SLJIT_RETURN_REG
1089 1.1 alnsn status = sljit_emit_op1(compiler,
1090 1.1 alnsn SLJIT_MOV,
1091 1.7 alnsn BJ_AREG, 0,
1092 1.1 alnsn SLJIT_RETURN_REG, 0);
1093 1.1 alnsn if (status != SLJIT_SUCCESS)
1094 1.1 alnsn return status;
1095 1.1 alnsn #endif
1096 1.1 alnsn #endif
1097 1.1 alnsn
1098 1.1 alnsn return status;
1099 1.1 alnsn }
1100 1.1 alnsn
1101 1.1 alnsn /*
1102 1.1 alnsn * Return true if pc is a "read from packet" instruction.
1103 1.1 alnsn * If length is not NULL and return value is true, *length will
1104 1.1 alnsn * be set to a safe length required to read a packet.
1105 1.1 alnsn */
1106 1.1 alnsn static bool
1107 1.8 alnsn read_pkt_insn(const struct bpf_insn *pc, bpfjit_abc_length_t *length)
1108 1.1 alnsn {
1109 1.1 alnsn bool rv;
1110 1.8 alnsn bpfjit_abc_length_t width;
1111 1.1 alnsn
1112 1.1 alnsn switch (BPF_CLASS(pc->code)) {
1113 1.1 alnsn default:
1114 1.1 alnsn rv = false;
1115 1.1 alnsn break;
1116 1.1 alnsn
1117 1.1 alnsn case BPF_LD:
1118 1.1 alnsn rv = BPF_MODE(pc->code) == BPF_ABS ||
1119 1.1 alnsn BPF_MODE(pc->code) == BPF_IND;
1120 1.1 alnsn if (rv)
1121 1.1 alnsn width = read_width(pc);
1122 1.1 alnsn break;
1123 1.1 alnsn
1124 1.1 alnsn case BPF_LDX:
1125 1.1 alnsn rv = pc->code == (BPF_LDX|BPF_B|BPF_MSH);
1126 1.1 alnsn width = 1;
1127 1.1 alnsn break;
1128 1.1 alnsn }
1129 1.1 alnsn
1130 1.1 alnsn if (rv && length != NULL) {
1131 1.9 alnsn /*
1132 1.9 alnsn * Values greater than UINT32_MAX will generate
1133 1.9 alnsn * unconditional "return 0".
1134 1.9 alnsn */
1135 1.9 alnsn *length = (uint32_t)pc->k + width;
1136 1.1 alnsn }
1137 1.1 alnsn
1138 1.1 alnsn return rv;
1139 1.1 alnsn }
1140 1.1 alnsn
1141 1.1 alnsn static void
1142 1.7 alnsn optimize_init(struct bpfjit_insn_data *insn_dat, size_t insn_count)
1143 1.1 alnsn {
1144 1.7 alnsn size_t i;
1145 1.1 alnsn
1146 1.7 alnsn for (i = 0; i < insn_count; i++) {
1147 1.7 alnsn SLIST_INIT(&insn_dat[i].bjumps);
1148 1.7 alnsn insn_dat[i].invalid = BJ_INIT_NOBITS;
1149 1.1 alnsn }
1150 1.1 alnsn }
1151 1.1 alnsn
1152 1.1 alnsn /*
1153 1.1 alnsn * The function divides instructions into blocks. Destination of a jump
1154 1.1 alnsn * instruction starts a new block. BPF_RET and BPF_JMP instructions
1155 1.1 alnsn * terminate a block. Blocks are linear, that is, there are no jumps out
1156 1.1 alnsn * from the middle of a block and there are no jumps in to the middle of
1157 1.1 alnsn * a block.
1158 1.7 alnsn *
1159 1.7 alnsn * The function also sets bits in *initmask for memwords that
1160 1.7 alnsn * need to be initialized to zero. Note that this set should be empty
1161 1.7 alnsn * for any valid kernel filter program.
1162 1.1 alnsn */
1163 1.7 alnsn static bool
1164 1.19 alnsn optimize_pass1(const bpf_ctx_t *bc, const struct bpf_insn *insns,
1165 1.19 alnsn struct bpfjit_insn_data *insn_dat, size_t insn_count,
1166 1.13 alnsn bpf_memword_init_t *initmask, int *nscratches, int *ncopfuncs)
1167 1.1 alnsn {
1168 1.7 alnsn struct bpfjit_jump *jtf;
1169 1.1 alnsn size_t i;
1170 1.7 alnsn uint32_t jt, jf;
1171 1.10 alnsn bpfjit_abc_length_t length;
1172 1.13 alnsn bpf_memword_init_t invalid; /* borrowed from bpf_filter() */
1173 1.1 alnsn bool unreachable;
1174 1.1 alnsn
1175 1.19 alnsn const size_t memwords = GET_MEMWORDS(bc);
1176 1.13 alnsn
1177 1.13 alnsn *ncopfuncs = 0;
1178 1.7 alnsn *nscratches = 2;
1179 1.7 alnsn *initmask = BJ_INIT_NOBITS;
1180 1.1 alnsn
1181 1.1 alnsn unreachable = false;
1182 1.7 alnsn invalid = ~BJ_INIT_NOBITS;
1183 1.1 alnsn
1184 1.1 alnsn for (i = 0; i < insn_count; i++) {
1185 1.7 alnsn if (!SLIST_EMPTY(&insn_dat[i].bjumps))
1186 1.1 alnsn unreachable = false;
1187 1.7 alnsn insn_dat[i].unreachable = unreachable;
1188 1.1 alnsn
1189 1.1 alnsn if (unreachable)
1190 1.1 alnsn continue;
1191 1.1 alnsn
1192 1.7 alnsn invalid |= insn_dat[i].invalid;
1193 1.1 alnsn
1194 1.10 alnsn if (read_pkt_insn(&insns[i], &length) && length > UINT32_MAX)
1195 1.10 alnsn unreachable = true;
1196 1.10 alnsn
1197 1.1 alnsn switch (BPF_CLASS(insns[i].code)) {
1198 1.1 alnsn case BPF_RET:
1199 1.7 alnsn if (BPF_RVAL(insns[i].code) == BPF_A)
1200 1.7 alnsn *initmask |= invalid & BJ_INIT_ABIT;
1201 1.7 alnsn
1202 1.1 alnsn unreachable = true;
1203 1.1 alnsn continue;
1204 1.1 alnsn
1205 1.7 alnsn case BPF_LD:
1206 1.7 alnsn if (BPF_MODE(insns[i].code) == BPF_IND ||
1207 1.7 alnsn BPF_MODE(insns[i].code) == BPF_ABS) {
1208 1.7 alnsn if (BPF_MODE(insns[i].code) == BPF_IND &&
1209 1.7 alnsn *nscratches < 4) {
1210 1.7 alnsn /* uses BJ_XREG */
1211 1.7 alnsn *nscratches = 4;
1212 1.7 alnsn }
1213 1.7 alnsn if (*nscratches < 3 &&
1214 1.7 alnsn read_width(&insns[i]) == 4) {
1215 1.7 alnsn /* uses BJ_TMP2REG */
1216 1.7 alnsn *nscratches = 3;
1217 1.7 alnsn }
1218 1.7 alnsn }
1219 1.7 alnsn
1220 1.7 alnsn if (BPF_MODE(insns[i].code) == BPF_IND)
1221 1.7 alnsn *initmask |= invalid & BJ_INIT_XBIT;
1222 1.7 alnsn
1223 1.7 alnsn if (BPF_MODE(insns[i].code) == BPF_MEM &&
1224 1.13 alnsn (uint32_t)insns[i].k < memwords) {
1225 1.7 alnsn *initmask |= invalid & BJ_INIT_MBIT(insns[i].k);
1226 1.7 alnsn }
1227 1.7 alnsn
1228 1.7 alnsn invalid &= ~BJ_INIT_ABIT;
1229 1.7 alnsn continue;
1230 1.7 alnsn
1231 1.7 alnsn case BPF_LDX:
1232 1.7 alnsn #if defined(_KERNEL)
1233 1.7 alnsn /* uses BJ_TMP3REG */
1234 1.7 alnsn *nscratches = 5;
1235 1.7 alnsn #endif
1236 1.7 alnsn /* uses BJ_XREG */
1237 1.7 alnsn if (*nscratches < 4)
1238 1.7 alnsn *nscratches = 4;
1239 1.7 alnsn
1240 1.7 alnsn if (BPF_MODE(insns[i].code) == BPF_MEM &&
1241 1.13 alnsn (uint32_t)insns[i].k < memwords) {
1242 1.7 alnsn *initmask |= invalid & BJ_INIT_MBIT(insns[i].k);
1243 1.7 alnsn }
1244 1.7 alnsn
1245 1.7 alnsn invalid &= ~BJ_INIT_XBIT;
1246 1.7 alnsn continue;
1247 1.7 alnsn
1248 1.7 alnsn case BPF_ST:
1249 1.7 alnsn *initmask |= invalid & BJ_INIT_ABIT;
1250 1.7 alnsn
1251 1.13 alnsn if ((uint32_t)insns[i].k < memwords)
1252 1.7 alnsn invalid &= ~BJ_INIT_MBIT(insns[i].k);
1253 1.7 alnsn
1254 1.7 alnsn continue;
1255 1.7 alnsn
1256 1.7 alnsn case BPF_STX:
1257 1.7 alnsn /* uses BJ_XREG */
1258 1.7 alnsn if (*nscratches < 4)
1259 1.7 alnsn *nscratches = 4;
1260 1.7 alnsn
1261 1.7 alnsn *initmask |= invalid & BJ_INIT_XBIT;
1262 1.7 alnsn
1263 1.13 alnsn if ((uint32_t)insns[i].k < memwords)
1264 1.7 alnsn invalid &= ~BJ_INIT_MBIT(insns[i].k);
1265 1.7 alnsn
1266 1.7 alnsn continue;
1267 1.7 alnsn
1268 1.7 alnsn case BPF_ALU:
1269 1.7 alnsn *initmask |= invalid & BJ_INIT_ABIT;
1270 1.7 alnsn
1271 1.7 alnsn if (insns[i].code != (BPF_ALU|BPF_NEG) &&
1272 1.7 alnsn BPF_SRC(insns[i].code) == BPF_X) {
1273 1.7 alnsn *initmask |= invalid & BJ_INIT_XBIT;
1274 1.7 alnsn /* uses BJ_XREG */
1275 1.7 alnsn if (*nscratches < 4)
1276 1.7 alnsn *nscratches = 4;
1277 1.7 alnsn
1278 1.7 alnsn }
1279 1.7 alnsn
1280 1.7 alnsn invalid &= ~BJ_INIT_ABIT;
1281 1.7 alnsn continue;
1282 1.7 alnsn
1283 1.7 alnsn case BPF_MISC:
1284 1.7 alnsn switch (BPF_MISCOP(insns[i].code)) {
1285 1.7 alnsn case BPF_TAX: // X <- A
1286 1.7 alnsn /* uses BJ_XREG */
1287 1.7 alnsn if (*nscratches < 4)
1288 1.7 alnsn *nscratches = 4;
1289 1.7 alnsn
1290 1.7 alnsn *initmask |= invalid & BJ_INIT_ABIT;
1291 1.7 alnsn invalid &= ~BJ_INIT_XBIT;
1292 1.7 alnsn continue;
1293 1.7 alnsn
1294 1.7 alnsn case BPF_TXA: // A <- X
1295 1.7 alnsn /* uses BJ_XREG */
1296 1.7 alnsn if (*nscratches < 4)
1297 1.7 alnsn *nscratches = 4;
1298 1.7 alnsn
1299 1.7 alnsn *initmask |= invalid & BJ_INIT_XBIT;
1300 1.7 alnsn invalid &= ~BJ_INIT_ABIT;
1301 1.7 alnsn continue;
1302 1.13 alnsn
1303 1.13 alnsn case BPF_COPX:
1304 1.13 alnsn /* uses BJ_XREG */
1305 1.13 alnsn if (*nscratches < 4)
1306 1.13 alnsn *nscratches = 4;
1307 1.13 alnsn /* FALLTHROUGH */
1308 1.13 alnsn
1309 1.13 alnsn case BPF_COP:
1310 1.13 alnsn /* calls copfunc with three arguments */
1311 1.13 alnsn if (*nscratches < 3)
1312 1.13 alnsn *nscratches = 3;
1313 1.13 alnsn
1314 1.13 alnsn (*ncopfuncs)++;
1315 1.13 alnsn *initmask |= invalid & BJ_INIT_ABIT;
1316 1.13 alnsn invalid &= ~BJ_INIT_ABIT;
1317 1.13 alnsn continue;
1318 1.7 alnsn }
1319 1.7 alnsn
1320 1.7 alnsn continue;
1321 1.7 alnsn
1322 1.1 alnsn case BPF_JMP:
1323 1.7 alnsn /* Initialize abc_length for ABC pass. */
1324 1.8 alnsn insn_dat[i].u.jdata.abc_length = MAX_ABC_LENGTH;
1325 1.7 alnsn
1326 1.7 alnsn if (BPF_OP(insns[i].code) == BPF_JA) {
1327 1.1 alnsn jt = jf = insns[i].k;
1328 1.1 alnsn } else {
1329 1.1 alnsn jt = insns[i].jt;
1330 1.1 alnsn jf = insns[i].jf;
1331 1.1 alnsn }
1332 1.1 alnsn
1333 1.1 alnsn if (jt >= insn_count - (i + 1) ||
1334 1.1 alnsn jf >= insn_count - (i + 1)) {
1335 1.7 alnsn return false;
1336 1.1 alnsn }
1337 1.1 alnsn
1338 1.1 alnsn if (jt > 0 && jf > 0)
1339 1.1 alnsn unreachable = true;
1340 1.1 alnsn
1341 1.7 alnsn jt += i + 1;
1342 1.7 alnsn jf += i + 1;
1343 1.7 alnsn
1344 1.7 alnsn jtf = insn_dat[i].u.jdata.jtf;
1345 1.1 alnsn
1346 1.7 alnsn jtf[0].sjump = NULL;
1347 1.7 alnsn jtf[0].jdata = &insn_dat[i].u.jdata;
1348 1.7 alnsn SLIST_INSERT_HEAD(&insn_dat[jt].bjumps,
1349 1.7 alnsn &jtf[0], entries);
1350 1.1 alnsn
1351 1.1 alnsn if (jf != jt) {
1352 1.7 alnsn jtf[1].sjump = NULL;
1353 1.7 alnsn jtf[1].jdata = &insn_dat[i].u.jdata;
1354 1.7 alnsn SLIST_INSERT_HEAD(&insn_dat[jf].bjumps,
1355 1.7 alnsn &jtf[1], entries);
1356 1.1 alnsn }
1357 1.1 alnsn
1358 1.7 alnsn insn_dat[jf].invalid |= invalid;
1359 1.7 alnsn insn_dat[jt].invalid |= invalid;
1360 1.7 alnsn invalid = 0;
1361 1.7 alnsn
1362 1.1 alnsn continue;
1363 1.1 alnsn }
1364 1.1 alnsn }
1365 1.1 alnsn
1366 1.7 alnsn return true;
1367 1.1 alnsn }
1368 1.1 alnsn
1369 1.1 alnsn /*
1370 1.7 alnsn * Array Bounds Check Elimination (ABC) pass.
1371 1.1 alnsn */
1372 1.7 alnsn static void
1373 1.19 alnsn optimize_pass2(const bpf_ctx_t *bc, const struct bpf_insn *insns,
1374 1.19 alnsn struct bpfjit_insn_data *insn_dat, size_t insn_count)
1375 1.7 alnsn {
1376 1.7 alnsn struct bpfjit_jump *jmp;
1377 1.7 alnsn const struct bpf_insn *pc;
1378 1.7 alnsn struct bpfjit_insn_data *pd;
1379 1.7 alnsn size_t i;
1380 1.8 alnsn bpfjit_abc_length_t length, abc_length = 0;
1381 1.7 alnsn
1382 1.19 alnsn const size_t extwords = GET_EXTWORDS(bc);
1383 1.19 alnsn
1384 1.7 alnsn for (i = insn_count; i != 0; i--) {
1385 1.7 alnsn pc = &insns[i-1];
1386 1.7 alnsn pd = &insn_dat[i-1];
1387 1.7 alnsn
1388 1.7 alnsn if (pd->unreachable)
1389 1.7 alnsn continue;
1390 1.7 alnsn
1391 1.7 alnsn switch (BPF_CLASS(pc->code)) {
1392 1.7 alnsn case BPF_RET:
1393 1.11 alnsn /*
1394 1.11 alnsn * It's quite common for bpf programs to
1395 1.11 alnsn * check packet bytes in increasing order
1396 1.11 alnsn * and return zero if bytes don't match
1397 1.11 alnsn * specified critetion. Such programs disable
1398 1.11 alnsn * ABC optimization completely because for
1399 1.11 alnsn * every jump there is a branch with no read
1400 1.11 alnsn * instruction.
1401 1.13 alnsn * With no side effects, BPF_STMT(BPF_RET+BPF_K, 0)
1402 1.13 alnsn * is indistinguishable from out-of-bound load.
1403 1.11 alnsn * Therefore, abc_length can be set to
1404 1.11 alnsn * MAX_ABC_LENGTH and enable ABC for many
1405 1.11 alnsn * bpf programs.
1406 1.13 alnsn * If this optimization encounters any
1407 1.11 alnsn * instruction with a side effect, it will
1408 1.11 alnsn * reset abc_length.
1409 1.11 alnsn */
1410 1.11 alnsn if (BPF_RVAL(pc->code) == BPF_K && pc->k == 0)
1411 1.11 alnsn abc_length = MAX_ABC_LENGTH;
1412 1.11 alnsn else
1413 1.11 alnsn abc_length = 0;
1414 1.7 alnsn break;
1415 1.7 alnsn
1416 1.13 alnsn case BPF_MISC:
1417 1.13 alnsn if (BPF_MISCOP(pc->code) == BPF_COP ||
1418 1.13 alnsn BPF_MISCOP(pc->code) == BPF_COPX) {
1419 1.13 alnsn /* COP instructions can have side effects. */
1420 1.13 alnsn abc_length = 0;
1421 1.13 alnsn }
1422 1.13 alnsn break;
1423 1.13 alnsn
1424 1.13 alnsn case BPF_ST:
1425 1.13 alnsn case BPF_STX:
1426 1.13 alnsn if (extwords != 0) {
1427 1.13 alnsn /* Write to memory is visible after a call. */
1428 1.13 alnsn abc_length = 0;
1429 1.13 alnsn }
1430 1.13 alnsn break;
1431 1.13 alnsn
1432 1.7 alnsn case BPF_JMP:
1433 1.7 alnsn abc_length = pd->u.jdata.abc_length;
1434 1.7 alnsn break;
1435 1.7 alnsn
1436 1.7 alnsn default:
1437 1.7 alnsn if (read_pkt_insn(pc, &length)) {
1438 1.7 alnsn if (abc_length < length)
1439 1.7 alnsn abc_length = length;
1440 1.7 alnsn pd->u.rdata.abc_length = abc_length;
1441 1.7 alnsn }
1442 1.7 alnsn break;
1443 1.7 alnsn }
1444 1.7 alnsn
1445 1.7 alnsn SLIST_FOREACH(jmp, &pd->bjumps, entries) {
1446 1.7 alnsn if (jmp->jdata->abc_length > abc_length)
1447 1.7 alnsn jmp->jdata->abc_length = abc_length;
1448 1.7 alnsn }
1449 1.7 alnsn }
1450 1.7 alnsn }
1451 1.7 alnsn
1452 1.7 alnsn static void
1453 1.7 alnsn optimize_pass3(const struct bpf_insn *insns,
1454 1.7 alnsn struct bpfjit_insn_data *insn_dat, size_t insn_count)
1455 1.1 alnsn {
1456 1.7 alnsn struct bpfjit_jump *jmp;
1457 1.1 alnsn size_t i;
1458 1.8 alnsn bpfjit_abc_length_t checked_length = 0;
1459 1.1 alnsn
1460 1.1 alnsn for (i = 0; i < insn_count; i++) {
1461 1.7 alnsn if (insn_dat[i].unreachable)
1462 1.7 alnsn continue;
1463 1.1 alnsn
1464 1.7 alnsn SLIST_FOREACH(jmp, &insn_dat[i].bjumps, entries) {
1465 1.7 alnsn if (jmp->jdata->checked_length < checked_length)
1466 1.7 alnsn checked_length = jmp->jdata->checked_length;
1467 1.1 alnsn }
1468 1.1 alnsn
1469 1.7 alnsn if (BPF_CLASS(insns[i].code) == BPF_JMP) {
1470 1.7 alnsn insn_dat[i].u.jdata.checked_length = checked_length;
1471 1.8 alnsn } else if (read_pkt_insn(&insns[i], NULL)) {
1472 1.7 alnsn struct bpfjit_read_pkt_data *rdata =
1473 1.7 alnsn &insn_dat[i].u.rdata;
1474 1.7 alnsn rdata->check_length = 0;
1475 1.7 alnsn if (checked_length < rdata->abc_length) {
1476 1.7 alnsn checked_length = rdata->abc_length;
1477 1.7 alnsn rdata->check_length = checked_length;
1478 1.7 alnsn }
1479 1.1 alnsn }
1480 1.7 alnsn }
1481 1.7 alnsn }
1482 1.1 alnsn
1483 1.7 alnsn static bool
1484 1.19 alnsn optimize(const bpf_ctx_t *bc, const struct bpf_insn *insns,
1485 1.7 alnsn struct bpfjit_insn_data *insn_dat, size_t insn_count,
1486 1.13 alnsn bpf_memword_init_t *initmask, int *nscratches, int *ncopfuncs)
1487 1.7 alnsn {
1488 1.1 alnsn
1489 1.7 alnsn optimize_init(insn_dat, insn_count);
1490 1.7 alnsn
1491 1.19 alnsn if (!optimize_pass1(bc, insns, insn_dat, insn_count,
1492 1.19 alnsn initmask, nscratches, ncopfuncs)) {
1493 1.7 alnsn return false;
1494 1.1 alnsn }
1495 1.1 alnsn
1496 1.19 alnsn optimize_pass2(bc, insns, insn_dat, insn_count);
1497 1.7 alnsn optimize_pass3(insns, insn_dat, insn_count);
1498 1.7 alnsn
1499 1.7 alnsn return true;
1500 1.1 alnsn }
1501 1.1 alnsn
1502 1.1 alnsn /*
1503 1.1 alnsn * Convert BPF_ALU operations except BPF_NEG and BPF_DIV to sljit operation.
1504 1.1 alnsn */
1505 1.1 alnsn static int
1506 1.7 alnsn bpf_alu_to_sljit_op(const struct bpf_insn *pc)
1507 1.1 alnsn {
1508 1.1 alnsn
1509 1.1 alnsn /*
1510 1.1 alnsn * Note: all supported 64bit arches have 32bit multiply
1511 1.1 alnsn * instruction so SLJIT_INT_OP doesn't have any overhead.
1512 1.1 alnsn */
1513 1.1 alnsn switch (BPF_OP(pc->code)) {
1514 1.1 alnsn case BPF_ADD: return SLJIT_ADD;
1515 1.1 alnsn case BPF_SUB: return SLJIT_SUB;
1516 1.1 alnsn case BPF_MUL: return SLJIT_MUL|SLJIT_INT_OP;
1517 1.1 alnsn case BPF_OR: return SLJIT_OR;
1518 1.1 alnsn case BPF_AND: return SLJIT_AND;
1519 1.1 alnsn case BPF_LSH: return SLJIT_SHL;
1520 1.1 alnsn case BPF_RSH: return SLJIT_LSHR|SLJIT_INT_OP;
1521 1.1 alnsn default:
1522 1.7 alnsn BJ_ASSERT(false);
1523 1.1 alnsn return 0;
1524 1.1 alnsn }
1525 1.1 alnsn }
1526 1.1 alnsn
1527 1.1 alnsn /*
1528 1.1 alnsn * Convert BPF_JMP operations except BPF_JA to sljit condition.
1529 1.1 alnsn */
1530 1.1 alnsn static int
1531 1.7 alnsn bpf_jmp_to_sljit_cond(const struct bpf_insn *pc, bool negate)
1532 1.1 alnsn {
1533 1.1 alnsn /*
1534 1.1 alnsn * Note: all supported 64bit arches have 32bit comparison
1535 1.1 alnsn * instructions so SLJIT_INT_OP doesn't have any overhead.
1536 1.1 alnsn */
1537 1.1 alnsn int rv = SLJIT_INT_OP;
1538 1.1 alnsn
1539 1.1 alnsn switch (BPF_OP(pc->code)) {
1540 1.1 alnsn case BPF_JGT:
1541 1.1 alnsn rv |= negate ? SLJIT_C_LESS_EQUAL : SLJIT_C_GREATER;
1542 1.1 alnsn break;
1543 1.1 alnsn case BPF_JGE:
1544 1.1 alnsn rv |= negate ? SLJIT_C_LESS : SLJIT_C_GREATER_EQUAL;
1545 1.1 alnsn break;
1546 1.1 alnsn case BPF_JEQ:
1547 1.1 alnsn rv |= negate ? SLJIT_C_NOT_EQUAL : SLJIT_C_EQUAL;
1548 1.1 alnsn break;
1549 1.1 alnsn case BPF_JSET:
1550 1.1 alnsn rv |= negate ? SLJIT_C_EQUAL : SLJIT_C_NOT_EQUAL;
1551 1.1 alnsn break;
1552 1.1 alnsn default:
1553 1.7 alnsn BJ_ASSERT(false);
1554 1.1 alnsn }
1555 1.1 alnsn
1556 1.1 alnsn return rv;
1557 1.1 alnsn }
1558 1.1 alnsn
1559 1.1 alnsn /*
1560 1.1 alnsn * Convert BPF_K and BPF_X to sljit register.
1561 1.1 alnsn */
1562 1.1 alnsn static int
1563 1.7 alnsn kx_to_reg(const struct bpf_insn *pc)
1564 1.1 alnsn {
1565 1.1 alnsn
1566 1.1 alnsn switch (BPF_SRC(pc->code)) {
1567 1.1 alnsn case BPF_K: return SLJIT_IMM;
1568 1.7 alnsn case BPF_X: return BJ_XREG;
1569 1.1 alnsn default:
1570 1.7 alnsn BJ_ASSERT(false);
1571 1.1 alnsn return 0;
1572 1.1 alnsn }
1573 1.1 alnsn }
1574 1.1 alnsn
1575 1.12 alnsn static sljit_sw
1576 1.7 alnsn kx_to_reg_arg(const struct bpf_insn *pc)
1577 1.1 alnsn {
1578 1.1 alnsn
1579 1.1 alnsn switch (BPF_SRC(pc->code)) {
1580 1.1 alnsn case BPF_K: return (uint32_t)pc->k; /* SLJIT_IMM, pc->k, */
1581 1.7 alnsn case BPF_X: return 0; /* BJ_XREG, 0, */
1582 1.1 alnsn default:
1583 1.7 alnsn BJ_ASSERT(false);
1584 1.1 alnsn return 0;
1585 1.1 alnsn }
1586 1.1 alnsn }
1587 1.1 alnsn
1588 1.19 alnsn static bool
1589 1.19 alnsn generate_insn_code(struct sljit_compiler *compiler, const bpf_ctx_t *bc,
1590 1.19 alnsn const struct bpf_insn *insns, struct bpfjit_insn_data *insn_dat,
1591 1.19 alnsn size_t insn_count)
1592 1.1 alnsn {
1593 1.1 alnsn /* a list of jumps to out-of-bound return from a generated function */
1594 1.1 alnsn struct sljit_jump **ret0;
1595 1.7 alnsn size_t ret0_size, ret0_maxsize;
1596 1.1 alnsn
1597 1.19 alnsn struct sljit_jump *jump;
1598 1.19 alnsn struct sljit_label *label;
1599 1.7 alnsn const struct bpf_insn *pc;
1600 1.1 alnsn struct bpfjit_jump *bjump, *jtf;
1601 1.1 alnsn struct sljit_jump *to_mchain_jump;
1602 1.1 alnsn
1603 1.19 alnsn size_t i;
1604 1.19 alnsn int status;
1605 1.19 alnsn int branching, negate;
1606 1.19 alnsn unsigned int rval, mode, src;
1607 1.1 alnsn uint32_t jt, jf;
1608 1.1 alnsn
1609 1.19 alnsn bool unconditional_ret;
1610 1.19 alnsn bool rv;
1611 1.19 alnsn
1612 1.19 alnsn const size_t extwords = GET_EXTWORDS(bc);
1613 1.19 alnsn const size_t memwords = GET_MEMWORDS(bc);
1614 1.13 alnsn
1615 1.13 alnsn ret0 = NULL;
1616 1.19 alnsn rv = false;
1617 1.7 alnsn
1618 1.1 alnsn ret0_size = 0;
1619 1.7 alnsn ret0_maxsize = 64;
1620 1.7 alnsn ret0 = BJ_ALLOC(ret0_maxsize * sizeof(ret0[0]));
1621 1.7 alnsn if (ret0 == NULL)
1622 1.1 alnsn goto fail;
1623 1.1 alnsn
1624 1.1 alnsn for (i = 0; i < insn_count; i++) {
1625 1.7 alnsn if (insn_dat[i].unreachable)
1626 1.1 alnsn continue;
1627 1.1 alnsn
1628 1.1 alnsn /*
1629 1.1 alnsn * Resolve jumps to the current insn.
1630 1.1 alnsn */
1631 1.1 alnsn label = NULL;
1632 1.7 alnsn SLIST_FOREACH(bjump, &insn_dat[i].bjumps, entries) {
1633 1.7 alnsn if (bjump->sjump != NULL) {
1634 1.1 alnsn if (label == NULL)
1635 1.1 alnsn label = sljit_emit_label(compiler);
1636 1.1 alnsn if (label == NULL)
1637 1.1 alnsn goto fail;
1638 1.7 alnsn sljit_set_label(bjump->sjump, label);
1639 1.1 alnsn }
1640 1.1 alnsn }
1641 1.1 alnsn
1642 1.9 alnsn to_mchain_jump = NULL;
1643 1.9 alnsn unconditional_ret = false;
1644 1.9 alnsn
1645 1.9 alnsn if (read_pkt_insn(&insns[i], NULL)) {
1646 1.9 alnsn if (insn_dat[i].u.rdata.check_length > UINT32_MAX) {
1647 1.9 alnsn /* Jump to "return 0" unconditionally. */
1648 1.9 alnsn unconditional_ret = true;
1649 1.9 alnsn jump = sljit_emit_jump(compiler, SLJIT_JUMP);
1650 1.9 alnsn if (jump == NULL)
1651 1.9 alnsn goto fail;
1652 1.9 alnsn if (!append_jump(jump, &ret0,
1653 1.9 alnsn &ret0_size, &ret0_maxsize))
1654 1.9 alnsn goto fail;
1655 1.9 alnsn } else if (insn_dat[i].u.rdata.check_length > 0) {
1656 1.9 alnsn /* if (buflen < check_length) return 0; */
1657 1.9 alnsn jump = sljit_emit_cmp(compiler,
1658 1.9 alnsn SLJIT_C_LESS,
1659 1.9 alnsn BJ_BUFLEN, 0,
1660 1.9 alnsn SLJIT_IMM,
1661 1.9 alnsn insn_dat[i].u.rdata.check_length);
1662 1.9 alnsn if (jump == NULL)
1663 1.9 alnsn goto fail;
1664 1.1 alnsn #ifdef _KERNEL
1665 1.9 alnsn to_mchain_jump = jump;
1666 1.1 alnsn #else
1667 1.9 alnsn if (!append_jump(jump, &ret0,
1668 1.9 alnsn &ret0_size, &ret0_maxsize))
1669 1.9 alnsn goto fail;
1670 1.1 alnsn #endif
1671 1.9 alnsn }
1672 1.1 alnsn }
1673 1.1 alnsn
1674 1.1 alnsn pc = &insns[i];
1675 1.1 alnsn switch (BPF_CLASS(pc->code)) {
1676 1.1 alnsn
1677 1.1 alnsn default:
1678 1.1 alnsn goto fail;
1679 1.1 alnsn
1680 1.1 alnsn case BPF_LD:
1681 1.1 alnsn /* BPF_LD+BPF_IMM A <- k */
1682 1.1 alnsn if (pc->code == (BPF_LD|BPF_IMM)) {
1683 1.1 alnsn status = sljit_emit_op1(compiler,
1684 1.1 alnsn SLJIT_MOV,
1685 1.7 alnsn BJ_AREG, 0,
1686 1.1 alnsn SLJIT_IMM, (uint32_t)pc->k);
1687 1.1 alnsn if (status != SLJIT_SUCCESS)
1688 1.1 alnsn goto fail;
1689 1.1 alnsn
1690 1.1 alnsn continue;
1691 1.1 alnsn }
1692 1.1 alnsn
1693 1.1 alnsn /* BPF_LD+BPF_MEM A <- M[k] */
1694 1.1 alnsn if (pc->code == (BPF_LD|BPF_MEM)) {
1695 1.13 alnsn if ((uint32_t)pc->k >= memwords)
1696 1.1 alnsn goto fail;
1697 1.13 alnsn status = emit_memload(compiler,
1698 1.13 alnsn BJ_AREG, pc->k, extwords);
1699 1.1 alnsn if (status != SLJIT_SUCCESS)
1700 1.1 alnsn goto fail;
1701 1.1 alnsn
1702 1.1 alnsn continue;
1703 1.1 alnsn }
1704 1.1 alnsn
1705 1.1 alnsn /* BPF_LD+BPF_W+BPF_LEN A <- len */
1706 1.1 alnsn if (pc->code == (BPF_LD|BPF_W|BPF_LEN)) {
1707 1.1 alnsn status = sljit_emit_op1(compiler,
1708 1.1 alnsn SLJIT_MOV,
1709 1.7 alnsn BJ_AREG, 0,
1710 1.13 alnsn SLJIT_MEM1(BJ_ARGS),
1711 1.13 alnsn offsetof(struct bpf_args, wirelen));
1712 1.1 alnsn if (status != SLJIT_SUCCESS)
1713 1.1 alnsn goto fail;
1714 1.1 alnsn
1715 1.1 alnsn continue;
1716 1.1 alnsn }
1717 1.1 alnsn
1718 1.1 alnsn mode = BPF_MODE(pc->code);
1719 1.1 alnsn if (mode != BPF_ABS && mode != BPF_IND)
1720 1.1 alnsn goto fail;
1721 1.1 alnsn
1722 1.9 alnsn if (unconditional_ret)
1723 1.9 alnsn continue;
1724 1.9 alnsn
1725 1.1 alnsn status = emit_pkt_read(compiler, pc,
1726 1.7 alnsn to_mchain_jump, &ret0, &ret0_size, &ret0_maxsize);
1727 1.1 alnsn if (status != SLJIT_SUCCESS)
1728 1.1 alnsn goto fail;
1729 1.1 alnsn
1730 1.1 alnsn continue;
1731 1.1 alnsn
1732 1.1 alnsn case BPF_LDX:
1733 1.1 alnsn mode = BPF_MODE(pc->code);
1734 1.1 alnsn
1735 1.1 alnsn /* BPF_LDX+BPF_W+BPF_IMM X <- k */
1736 1.1 alnsn if (mode == BPF_IMM) {
1737 1.1 alnsn if (BPF_SIZE(pc->code) != BPF_W)
1738 1.1 alnsn goto fail;
1739 1.1 alnsn status = sljit_emit_op1(compiler,
1740 1.1 alnsn SLJIT_MOV,
1741 1.7 alnsn BJ_XREG, 0,
1742 1.1 alnsn SLJIT_IMM, (uint32_t)pc->k);
1743 1.1 alnsn if (status != SLJIT_SUCCESS)
1744 1.1 alnsn goto fail;
1745 1.1 alnsn
1746 1.1 alnsn continue;
1747 1.1 alnsn }
1748 1.1 alnsn
1749 1.1 alnsn /* BPF_LDX+BPF_W+BPF_LEN X <- len */
1750 1.1 alnsn if (mode == BPF_LEN) {
1751 1.1 alnsn if (BPF_SIZE(pc->code) != BPF_W)
1752 1.1 alnsn goto fail;
1753 1.1 alnsn status = sljit_emit_op1(compiler,
1754 1.1 alnsn SLJIT_MOV,
1755 1.7 alnsn BJ_XREG, 0,
1756 1.13 alnsn SLJIT_MEM1(BJ_ARGS),
1757 1.13 alnsn offsetof(struct bpf_args, wirelen));
1758 1.1 alnsn if (status != SLJIT_SUCCESS)
1759 1.1 alnsn goto fail;
1760 1.1 alnsn
1761 1.1 alnsn continue;
1762 1.1 alnsn }
1763 1.1 alnsn
1764 1.1 alnsn /* BPF_LDX+BPF_W+BPF_MEM X <- M[k] */
1765 1.1 alnsn if (mode == BPF_MEM) {
1766 1.1 alnsn if (BPF_SIZE(pc->code) != BPF_W)
1767 1.1 alnsn goto fail;
1768 1.13 alnsn if ((uint32_t)pc->k >= memwords)
1769 1.1 alnsn goto fail;
1770 1.13 alnsn status = emit_memload(compiler,
1771 1.13 alnsn BJ_XREG, pc->k, extwords);
1772 1.1 alnsn if (status != SLJIT_SUCCESS)
1773 1.1 alnsn goto fail;
1774 1.1 alnsn
1775 1.1 alnsn continue;
1776 1.1 alnsn }
1777 1.1 alnsn
1778 1.1 alnsn /* BPF_LDX+BPF_B+BPF_MSH X <- 4*(P[k:1]&0xf) */
1779 1.1 alnsn if (mode != BPF_MSH || BPF_SIZE(pc->code) != BPF_B)
1780 1.1 alnsn goto fail;
1781 1.1 alnsn
1782 1.9 alnsn if (unconditional_ret)
1783 1.9 alnsn continue;
1784 1.9 alnsn
1785 1.1 alnsn status = emit_msh(compiler, pc,
1786 1.7 alnsn to_mchain_jump, &ret0, &ret0_size, &ret0_maxsize);
1787 1.1 alnsn if (status != SLJIT_SUCCESS)
1788 1.1 alnsn goto fail;
1789 1.1 alnsn
1790 1.1 alnsn continue;
1791 1.1 alnsn
1792 1.1 alnsn case BPF_ST:
1793 1.8 alnsn if (pc->code != BPF_ST ||
1794 1.13 alnsn (uint32_t)pc->k >= memwords) {
1795 1.1 alnsn goto fail;
1796 1.8 alnsn }
1797 1.1 alnsn
1798 1.13 alnsn status = emit_memstore(compiler,
1799 1.13 alnsn BJ_AREG, pc->k, extwords);
1800 1.1 alnsn if (status != SLJIT_SUCCESS)
1801 1.1 alnsn goto fail;
1802 1.1 alnsn
1803 1.1 alnsn continue;
1804 1.1 alnsn
1805 1.1 alnsn case BPF_STX:
1806 1.8 alnsn if (pc->code != BPF_STX ||
1807 1.13 alnsn (uint32_t)pc->k >= memwords) {
1808 1.1 alnsn goto fail;
1809 1.8 alnsn }
1810 1.1 alnsn
1811 1.13 alnsn status = emit_memstore(compiler,
1812 1.13 alnsn BJ_XREG, pc->k, extwords);
1813 1.1 alnsn if (status != SLJIT_SUCCESS)
1814 1.1 alnsn goto fail;
1815 1.1 alnsn
1816 1.1 alnsn continue;
1817 1.1 alnsn
1818 1.1 alnsn case BPF_ALU:
1819 1.1 alnsn if (pc->code == (BPF_ALU|BPF_NEG)) {
1820 1.1 alnsn status = sljit_emit_op1(compiler,
1821 1.1 alnsn SLJIT_NEG,
1822 1.7 alnsn BJ_AREG, 0,
1823 1.7 alnsn BJ_AREG, 0);
1824 1.1 alnsn if (status != SLJIT_SUCCESS)
1825 1.1 alnsn goto fail;
1826 1.1 alnsn
1827 1.1 alnsn continue;
1828 1.1 alnsn }
1829 1.1 alnsn
1830 1.1 alnsn if (BPF_OP(pc->code) != BPF_DIV) {
1831 1.1 alnsn status = sljit_emit_op2(compiler,
1832 1.1 alnsn bpf_alu_to_sljit_op(pc),
1833 1.7 alnsn BJ_AREG, 0,
1834 1.7 alnsn BJ_AREG, 0,
1835 1.1 alnsn kx_to_reg(pc), kx_to_reg_arg(pc));
1836 1.1 alnsn if (status != SLJIT_SUCCESS)
1837 1.1 alnsn goto fail;
1838 1.1 alnsn
1839 1.1 alnsn continue;
1840 1.1 alnsn }
1841 1.1 alnsn
1842 1.1 alnsn /* BPF_DIV */
1843 1.1 alnsn
1844 1.1 alnsn src = BPF_SRC(pc->code);
1845 1.1 alnsn if (src != BPF_X && src != BPF_K)
1846 1.1 alnsn goto fail;
1847 1.1 alnsn
1848 1.1 alnsn /* division by zero? */
1849 1.1 alnsn if (src == BPF_X) {
1850 1.1 alnsn jump = sljit_emit_cmp(compiler,
1851 1.1 alnsn SLJIT_C_EQUAL|SLJIT_INT_OP,
1852 1.8 alnsn BJ_XREG, 0,
1853 1.1 alnsn SLJIT_IMM, 0);
1854 1.1 alnsn if (jump == NULL)
1855 1.1 alnsn goto fail;
1856 1.7 alnsn if (!append_jump(jump, &ret0,
1857 1.7 alnsn &ret0_size, &ret0_maxsize))
1858 1.7 alnsn goto fail;
1859 1.1 alnsn } else if (pc->k == 0) {
1860 1.1 alnsn jump = sljit_emit_jump(compiler, SLJIT_JUMP);
1861 1.1 alnsn if (jump == NULL)
1862 1.1 alnsn goto fail;
1863 1.7 alnsn if (!append_jump(jump, &ret0,
1864 1.7 alnsn &ret0_size, &ret0_maxsize))
1865 1.7 alnsn goto fail;
1866 1.1 alnsn }
1867 1.1 alnsn
1868 1.1 alnsn if (src == BPF_X) {
1869 1.7 alnsn status = emit_division(compiler, BJ_XREG, 0);
1870 1.1 alnsn if (status != SLJIT_SUCCESS)
1871 1.1 alnsn goto fail;
1872 1.1 alnsn } else if (pc->k != 0) {
1873 1.1 alnsn if (pc->k & (pc->k - 1)) {
1874 1.1 alnsn status = emit_division(compiler,
1875 1.1 alnsn SLJIT_IMM, (uint32_t)pc->k);
1876 1.1 alnsn } else {
1877 1.7 alnsn status = emit_pow2_division(compiler,
1878 1.1 alnsn (uint32_t)pc->k);
1879 1.1 alnsn }
1880 1.1 alnsn if (status != SLJIT_SUCCESS)
1881 1.1 alnsn goto fail;
1882 1.1 alnsn }
1883 1.1 alnsn
1884 1.1 alnsn continue;
1885 1.1 alnsn
1886 1.1 alnsn case BPF_JMP:
1887 1.7 alnsn if (BPF_OP(pc->code) == BPF_JA) {
1888 1.1 alnsn jt = jf = pc->k;
1889 1.1 alnsn } else {
1890 1.1 alnsn jt = pc->jt;
1891 1.1 alnsn jf = pc->jf;
1892 1.1 alnsn }
1893 1.1 alnsn
1894 1.1 alnsn negate = (jt == 0) ? 1 : 0;
1895 1.1 alnsn branching = (jt == jf) ? 0 : 1;
1896 1.7 alnsn jtf = insn_dat[i].u.jdata.jtf;
1897 1.1 alnsn
1898 1.1 alnsn if (branching) {
1899 1.1 alnsn if (BPF_OP(pc->code) != BPF_JSET) {
1900 1.1 alnsn jump = sljit_emit_cmp(compiler,
1901 1.1 alnsn bpf_jmp_to_sljit_cond(pc, negate),
1902 1.7 alnsn BJ_AREG, 0,
1903 1.1 alnsn kx_to_reg(pc), kx_to_reg_arg(pc));
1904 1.1 alnsn } else {
1905 1.1 alnsn status = sljit_emit_op2(compiler,
1906 1.1 alnsn SLJIT_AND,
1907 1.7 alnsn BJ_TMP1REG, 0,
1908 1.7 alnsn BJ_AREG, 0,
1909 1.1 alnsn kx_to_reg(pc), kx_to_reg_arg(pc));
1910 1.1 alnsn if (status != SLJIT_SUCCESS)
1911 1.1 alnsn goto fail;
1912 1.1 alnsn
1913 1.1 alnsn jump = sljit_emit_cmp(compiler,
1914 1.1 alnsn bpf_jmp_to_sljit_cond(pc, negate),
1915 1.7 alnsn BJ_TMP1REG, 0,
1916 1.1 alnsn SLJIT_IMM, 0);
1917 1.1 alnsn }
1918 1.1 alnsn
1919 1.1 alnsn if (jump == NULL)
1920 1.1 alnsn goto fail;
1921 1.1 alnsn
1922 1.7 alnsn BJ_ASSERT(jtf[negate].sjump == NULL);
1923 1.7 alnsn jtf[negate].sjump = jump;
1924 1.1 alnsn }
1925 1.1 alnsn
1926 1.1 alnsn if (!branching || (jt != 0 && jf != 0)) {
1927 1.1 alnsn jump = sljit_emit_jump(compiler, SLJIT_JUMP);
1928 1.1 alnsn if (jump == NULL)
1929 1.1 alnsn goto fail;
1930 1.1 alnsn
1931 1.7 alnsn BJ_ASSERT(jtf[branching].sjump == NULL);
1932 1.7 alnsn jtf[branching].sjump = jump;
1933 1.1 alnsn }
1934 1.1 alnsn
1935 1.1 alnsn continue;
1936 1.1 alnsn
1937 1.1 alnsn case BPF_RET:
1938 1.1 alnsn rval = BPF_RVAL(pc->code);
1939 1.1 alnsn if (rval == BPF_X)
1940 1.1 alnsn goto fail;
1941 1.1 alnsn
1942 1.1 alnsn /* BPF_RET+BPF_K accept k bytes */
1943 1.1 alnsn if (rval == BPF_K) {
1944 1.7 alnsn status = sljit_emit_return(compiler,
1945 1.7 alnsn SLJIT_MOV_UI,
1946 1.1 alnsn SLJIT_IMM, (uint32_t)pc->k);
1947 1.1 alnsn if (status != SLJIT_SUCCESS)
1948 1.1 alnsn goto fail;
1949 1.1 alnsn }
1950 1.1 alnsn
1951 1.1 alnsn /* BPF_RET+BPF_A accept A bytes */
1952 1.1 alnsn if (rval == BPF_A) {
1953 1.7 alnsn status = sljit_emit_return(compiler,
1954 1.7 alnsn SLJIT_MOV_UI,
1955 1.7 alnsn BJ_AREG, 0);
1956 1.1 alnsn if (status != SLJIT_SUCCESS)
1957 1.1 alnsn goto fail;
1958 1.1 alnsn }
1959 1.1 alnsn
1960 1.1 alnsn continue;
1961 1.1 alnsn
1962 1.1 alnsn case BPF_MISC:
1963 1.7 alnsn switch (BPF_MISCOP(pc->code)) {
1964 1.7 alnsn case BPF_TAX:
1965 1.1 alnsn status = sljit_emit_op1(compiler,
1966 1.1 alnsn SLJIT_MOV_UI,
1967 1.7 alnsn BJ_XREG, 0,
1968 1.7 alnsn BJ_AREG, 0);
1969 1.1 alnsn if (status != SLJIT_SUCCESS)
1970 1.1 alnsn goto fail;
1971 1.1 alnsn
1972 1.1 alnsn continue;
1973 1.1 alnsn
1974 1.7 alnsn case BPF_TXA:
1975 1.1 alnsn status = sljit_emit_op1(compiler,
1976 1.1 alnsn SLJIT_MOV,
1977 1.7 alnsn BJ_AREG, 0,
1978 1.7 alnsn BJ_XREG, 0);
1979 1.1 alnsn if (status != SLJIT_SUCCESS)
1980 1.1 alnsn goto fail;
1981 1.1 alnsn
1982 1.1 alnsn continue;
1983 1.13 alnsn
1984 1.13 alnsn case BPF_COP:
1985 1.13 alnsn case BPF_COPX:
1986 1.13 alnsn if (bc == NULL || bc->copfuncs == NULL)
1987 1.13 alnsn goto fail;
1988 1.13 alnsn if (BPF_MISCOP(pc->code) == BPF_COP &&
1989 1.13 alnsn (uint32_t)pc->k >= bc->nfuncs) {
1990 1.13 alnsn goto fail;
1991 1.13 alnsn }
1992 1.13 alnsn
1993 1.13 alnsn jump = NULL;
1994 1.13 alnsn status = emit_cop(compiler, bc, pc, &jump);
1995 1.13 alnsn if (status != SLJIT_SUCCESS)
1996 1.13 alnsn goto fail;
1997 1.13 alnsn
1998 1.13 alnsn if (jump != NULL && !append_jump(jump,
1999 1.13 alnsn &ret0, &ret0_size, &ret0_maxsize))
2000 1.13 alnsn goto fail;
2001 1.13 alnsn
2002 1.13 alnsn continue;
2003 1.1 alnsn }
2004 1.1 alnsn
2005 1.1 alnsn goto fail;
2006 1.1 alnsn } /* switch */
2007 1.1 alnsn } /* main loop */
2008 1.1 alnsn
2009 1.7 alnsn BJ_ASSERT(ret0_size <= ret0_maxsize);
2010 1.1 alnsn
2011 1.7 alnsn if (ret0_size > 0) {
2012 1.1 alnsn label = sljit_emit_label(compiler);
2013 1.1 alnsn if (label == NULL)
2014 1.1 alnsn goto fail;
2015 1.7 alnsn for (i = 0; i < ret0_size; i++)
2016 1.7 alnsn sljit_set_label(ret0[i], label);
2017 1.1 alnsn }
2018 1.1 alnsn
2019 1.19 alnsn rv = true;
2020 1.19 alnsn
2021 1.19 alnsn fail:
2022 1.19 alnsn if (ret0 != NULL)
2023 1.19 alnsn BJ_FREE(ret0, ret0_maxsize * sizeof(ret0[0]));
2024 1.19 alnsn
2025 1.19 alnsn return rv;
2026 1.19 alnsn }
2027 1.19 alnsn
2028 1.19 alnsn bpfjit_func_t
2029 1.19 alnsn bpfjit_generate_code(const bpf_ctx_t *bc,
2030 1.19 alnsn const struct bpf_insn *insns, size_t insn_count)
2031 1.19 alnsn {
2032 1.19 alnsn void *rv;
2033 1.19 alnsn struct sljit_compiler *compiler;
2034 1.19 alnsn
2035 1.19 alnsn size_t i;
2036 1.19 alnsn int status;
2037 1.19 alnsn
2038 1.19 alnsn /* optimization related */
2039 1.19 alnsn bpf_memword_init_t initmask;
2040 1.19 alnsn int nscratches, ncopfuncs;
2041 1.19 alnsn
2042 1.19 alnsn /* memory store location for initial zero initialization */
2043 1.19 alnsn sljit_si mem_reg;
2044 1.19 alnsn sljit_sw mem_off;
2045 1.19 alnsn
2046 1.19 alnsn struct bpfjit_insn_data *insn_dat;
2047 1.19 alnsn
2048 1.19 alnsn const size_t extwords = GET_EXTWORDS(bc);
2049 1.19 alnsn const size_t memwords = GET_MEMWORDS(bc);
2050 1.19 alnsn const bpf_memword_init_t preinited = extwords ? bc->preinited : 0;
2051 1.19 alnsn
2052 1.19 alnsn rv = NULL;
2053 1.19 alnsn compiler = NULL;
2054 1.19 alnsn insn_dat = NULL;
2055 1.19 alnsn
2056 1.19 alnsn if (memwords > MAX_MEMWORDS)
2057 1.19 alnsn goto fail;
2058 1.19 alnsn
2059 1.19 alnsn if (insn_count == 0 || insn_count > SIZE_MAX / sizeof(insn_dat[0]))
2060 1.19 alnsn goto fail;
2061 1.19 alnsn
2062 1.19 alnsn insn_dat = BJ_ALLOC(insn_count * sizeof(insn_dat[0]));
2063 1.19 alnsn if (insn_dat == NULL)
2064 1.19 alnsn goto fail;
2065 1.19 alnsn
2066 1.19 alnsn if (!optimize(bc, insns, insn_dat, insn_count,
2067 1.19 alnsn &initmask, &nscratches, &ncopfuncs)) {
2068 1.19 alnsn goto fail;
2069 1.19 alnsn }
2070 1.19 alnsn
2071 1.19 alnsn compiler = sljit_create_compiler();
2072 1.19 alnsn if (compiler == NULL)
2073 1.19 alnsn goto fail;
2074 1.19 alnsn
2075 1.19 alnsn #if !defined(_KERNEL) && defined(SLJIT_VERBOSE) && SLJIT_VERBOSE
2076 1.19 alnsn sljit_compiler_verbose(compiler, stderr);
2077 1.19 alnsn #endif
2078 1.19 alnsn
2079 1.19 alnsn status = sljit_emit_enter(compiler,
2080 1.19 alnsn 2, nscratches, 3, sizeof(struct bpfjit_stack));
2081 1.19 alnsn if (status != SLJIT_SUCCESS)
2082 1.19 alnsn goto fail;
2083 1.19 alnsn
2084 1.19 alnsn if (ncopfuncs > 0) {
2085 1.19 alnsn /* save ctx argument */
2086 1.19 alnsn status = sljit_emit_op1(compiler,
2087 1.19 alnsn SLJIT_MOV_P,
2088 1.19 alnsn SLJIT_MEM1(SLJIT_LOCALS_REG),
2089 1.19 alnsn offsetof(struct bpfjit_stack, ctx),
2090 1.19 alnsn BJ_CTX_ARG, 0);
2091 1.19 alnsn if (status != SLJIT_SUCCESS)
2092 1.19 alnsn goto fail;
2093 1.19 alnsn }
2094 1.19 alnsn
2095 1.19 alnsn if (extwords == 0) {
2096 1.19 alnsn mem_reg = SLJIT_MEM1(SLJIT_LOCALS_REG);
2097 1.19 alnsn mem_off = offsetof(struct bpfjit_stack, mem);
2098 1.19 alnsn } else {
2099 1.19 alnsn /* copy "mem" argument from bpf_args to bpfjit_stack */
2100 1.19 alnsn status = sljit_emit_op1(compiler,
2101 1.19 alnsn SLJIT_MOV_P,
2102 1.19 alnsn BJ_TMP1REG, 0,
2103 1.19 alnsn SLJIT_MEM1(BJ_ARGS), offsetof(struct bpf_args, mem));
2104 1.19 alnsn if (status != SLJIT_SUCCESS)
2105 1.19 alnsn goto fail;
2106 1.19 alnsn
2107 1.19 alnsn status = sljit_emit_op1(compiler,
2108 1.19 alnsn SLJIT_MOV_P,
2109 1.19 alnsn SLJIT_MEM1(SLJIT_LOCALS_REG),
2110 1.19 alnsn offsetof(struct bpfjit_stack, extmem),
2111 1.19 alnsn BJ_TMP1REG, 0);
2112 1.19 alnsn if (status != SLJIT_SUCCESS)
2113 1.19 alnsn goto fail;
2114 1.19 alnsn
2115 1.19 alnsn mem_reg = SLJIT_MEM1(BJ_TMP1REG);
2116 1.19 alnsn mem_off = 0;
2117 1.19 alnsn }
2118 1.19 alnsn
2119 1.19 alnsn /*
2120 1.19 alnsn * Exclude pre-initialised external memory words but keep
2121 1.19 alnsn * initialization statuses of A and X registers in case
2122 1.19 alnsn * bc->preinited wrongly sets those two bits.
2123 1.19 alnsn */
2124 1.19 alnsn initmask &= ~preinited | BJ_INIT_ABIT | BJ_INIT_XBIT;
2125 1.19 alnsn
2126 1.19 alnsn #if defined(_KERNEL)
2127 1.19 alnsn /* bpf_filter() checks initialization of memwords. */
2128 1.19 alnsn BJ_ASSERT((initmask & (BJ_INIT_MBIT(memwords) - 1)) == 0);
2129 1.19 alnsn #endif
2130 1.19 alnsn for (i = 0; i < memwords; i++) {
2131 1.19 alnsn if (initmask & BJ_INIT_MBIT(i)) {
2132 1.19 alnsn /* M[i] = 0; */
2133 1.19 alnsn status = sljit_emit_op1(compiler,
2134 1.19 alnsn SLJIT_MOV_UI,
2135 1.19 alnsn mem_reg, mem_off + i * sizeof(uint32_t),
2136 1.19 alnsn SLJIT_IMM, 0);
2137 1.19 alnsn if (status != SLJIT_SUCCESS)
2138 1.19 alnsn goto fail;
2139 1.19 alnsn }
2140 1.19 alnsn }
2141 1.19 alnsn
2142 1.19 alnsn if (initmask & BJ_INIT_ABIT) {
2143 1.19 alnsn /* A = 0; */
2144 1.19 alnsn status = sljit_emit_op1(compiler,
2145 1.19 alnsn SLJIT_MOV,
2146 1.19 alnsn BJ_AREG, 0,
2147 1.19 alnsn SLJIT_IMM, 0);
2148 1.19 alnsn if (status != SLJIT_SUCCESS)
2149 1.19 alnsn goto fail;
2150 1.19 alnsn }
2151 1.19 alnsn
2152 1.19 alnsn if (initmask & BJ_INIT_XBIT) {
2153 1.19 alnsn /* X = 0; */
2154 1.19 alnsn status = sljit_emit_op1(compiler,
2155 1.19 alnsn SLJIT_MOV,
2156 1.19 alnsn BJ_XREG, 0,
2157 1.19 alnsn SLJIT_IMM, 0);
2158 1.19 alnsn if (status != SLJIT_SUCCESS)
2159 1.19 alnsn goto fail;
2160 1.19 alnsn }
2161 1.19 alnsn
2162 1.19 alnsn status = load_buf_buflen(compiler);
2163 1.19 alnsn if (status != SLJIT_SUCCESS)
2164 1.19 alnsn goto fail;
2165 1.19 alnsn
2166 1.19 alnsn if (!generate_insn_code(compiler, bc, insns, insn_dat, insn_count))
2167 1.19 alnsn goto fail;
2168 1.19 alnsn
2169 1.1 alnsn status = sljit_emit_return(compiler,
2170 1.1 alnsn SLJIT_MOV_UI,
2171 1.7 alnsn SLJIT_IMM, 0);
2172 1.1 alnsn if (status != SLJIT_SUCCESS)
2173 1.1 alnsn goto fail;
2174 1.1 alnsn
2175 1.1 alnsn rv = sljit_generate_code(compiler);
2176 1.1 alnsn
2177 1.1 alnsn fail:
2178 1.1 alnsn if (compiler != NULL)
2179 1.1 alnsn sljit_free_compiler(compiler);
2180 1.1 alnsn
2181 1.1 alnsn if (insn_dat != NULL)
2182 1.7 alnsn BJ_FREE(insn_dat, insn_count * sizeof(insn_dat[0]));
2183 1.1 alnsn
2184 1.4 rmind return (bpfjit_func_t)rv;
2185 1.1 alnsn }
2186 1.1 alnsn
2187 1.1 alnsn void
2188 1.4 rmind bpfjit_free_code(bpfjit_func_t code)
2189 1.1 alnsn {
2190 1.7 alnsn
2191 1.1 alnsn sljit_free_code((void *)code);
2192 1.1 alnsn }
2193