bpfjit.c revision 1.30 1 1.30 alnsn /* $NetBSD: bpfjit.c,v 1.30 2014/07/22 08:29:51 alnsn Exp $ */
2 1.3 rmind
3 1.1 alnsn /*-
4 1.7 alnsn * Copyright (c) 2011-2014 Alexander Nasonov.
5 1.1 alnsn * All rights reserved.
6 1.1 alnsn *
7 1.1 alnsn * Redistribution and use in source and binary forms, with or without
8 1.1 alnsn * modification, are permitted provided that the following conditions
9 1.1 alnsn * are met:
10 1.1 alnsn *
11 1.1 alnsn * 1. Redistributions of source code must retain the above copyright
12 1.1 alnsn * notice, this list of conditions and the following disclaimer.
13 1.1 alnsn * 2. Redistributions in binary form must reproduce the above copyright
14 1.1 alnsn * notice, this list of conditions and the following disclaimer in
15 1.1 alnsn * the documentation and/or other materials provided with the
16 1.1 alnsn * distribution.
17 1.1 alnsn *
18 1.1 alnsn * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
19 1.1 alnsn * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
20 1.1 alnsn * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
21 1.1 alnsn * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
22 1.1 alnsn * COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
23 1.1 alnsn * INCIDENTAL, SPECIAL, EXEMPLARY OR CONSEQUENTIAL DAMAGES (INCLUDING,
24 1.1 alnsn * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
25 1.1 alnsn * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
26 1.1 alnsn * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
27 1.1 alnsn * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
28 1.1 alnsn * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 1.1 alnsn * SUCH DAMAGE.
30 1.1 alnsn */
31 1.1 alnsn
32 1.2 alnsn #include <sys/cdefs.h>
33 1.2 alnsn #ifdef _KERNEL
34 1.30 alnsn __KERNEL_RCSID(0, "$NetBSD: bpfjit.c,v 1.30 2014/07/22 08:29:51 alnsn Exp $");
35 1.2 alnsn #else
36 1.30 alnsn __RCSID("$NetBSD: bpfjit.c,v 1.30 2014/07/22 08:29:51 alnsn Exp $");
37 1.2 alnsn #endif
38 1.2 alnsn
39 1.3 rmind #include <sys/types.h>
40 1.3 rmind #include <sys/queue.h>
41 1.1 alnsn
42 1.1 alnsn #ifndef _KERNEL
43 1.7 alnsn #include <assert.h>
44 1.7 alnsn #define BJ_ASSERT(c) assert(c)
45 1.7 alnsn #else
46 1.7 alnsn #define BJ_ASSERT(c) KASSERT(c)
47 1.7 alnsn #endif
48 1.7 alnsn
49 1.7 alnsn #ifndef _KERNEL
50 1.3 rmind #include <stdlib.h>
51 1.7 alnsn #define BJ_ALLOC(sz) malloc(sz)
52 1.7 alnsn #define BJ_FREE(p, sz) free(p)
53 1.1 alnsn #else
54 1.3 rmind #include <sys/kmem.h>
55 1.7 alnsn #define BJ_ALLOC(sz) kmem_alloc(sz, KM_SLEEP)
56 1.7 alnsn #define BJ_FREE(p, sz) kmem_free(p, sz)
57 1.1 alnsn #endif
58 1.1 alnsn
59 1.1 alnsn #ifndef _KERNEL
60 1.1 alnsn #include <limits.h>
61 1.1 alnsn #include <stdbool.h>
62 1.1 alnsn #include <stddef.h>
63 1.1 alnsn #include <stdint.h>
64 1.1 alnsn #else
65 1.1 alnsn #include <sys/atomic.h>
66 1.1 alnsn #include <sys/module.h>
67 1.1 alnsn #endif
68 1.1 alnsn
69 1.5 rmind #define __BPF_PRIVATE
70 1.5 rmind #include <net/bpf.h>
71 1.3 rmind #include <net/bpfjit.h>
72 1.1 alnsn #include <sljitLir.h>
73 1.1 alnsn
74 1.7 alnsn #if !defined(_KERNEL) && defined(SLJIT_VERBOSE) && SLJIT_VERBOSE
75 1.7 alnsn #include <stdio.h> /* for stderr */
76 1.7 alnsn #endif
77 1.7 alnsn
/*
 * Registers holding the arguments of a generated bpfjit_func_t.
 * The register of the first argument (BJ_CTX_ARG) is reassigned upon
 * entry to the more frequently used buf pointer (BJ_BUF below).
 */
#define BJ_CTX_ARG	SLJIT_SAVED_REG1
#define BJ_ARGS		SLJIT_SAVED_REG2

/*
 * Permanent register assignments.
 * BJ_BUF shares SLJIT_SAVED_REG1 with BJ_CTX_ARG; BJ_ARGS (defined
 * above) keeps SLJIT_SAVED_REG2 for the whole function.
 */
#define BJ_BUF		SLJIT_SAVED_REG1
#define BJ_BUFLEN	SLJIT_SAVED_REG3
#define BJ_XREG		SLJIT_SAVED_EREG1
#define BJ_ASAVE	SLJIT_SAVED_EREG2
#define BJ_AREG		SLJIT_SCRATCH_REG1
#define BJ_TMP1REG	SLJIT_SCRATCH_REG2
#define BJ_TMP2REG	SLJIT_SCRATCH_REG3
#define BJ_TMP3REG	SLJIT_TEMPORARY_EREG1
98 1.7 alnsn
/*
 * Upper bound on the number of memwords: BPF_MAX_MEMWORDS in the
 * kernel, BPF_MEMWORDS elsewhere.
 */
#ifdef _KERNEL
#define MAX_MEMWORDS	BPF_MAX_MEMWORDS
#else
#define MAX_MEMWORDS	BPF_MEMWORDS
#endif

/*
 * Bits of bpf_memword_init_t.  Bit k stands for memword k; the two
 * bits right after the last possible memword are named ABIT and XBIT
 * (presumably tracking the A and X registers -- confirm against users).
 */
#define BJ_INIT_NOBITS	((bpf_memword_init_t)0)
#define BJ_INIT_MBIT(k)	BPF_MEMWORD_INIT(k)
#define BJ_INIT_ABIT	BJ_INIT_MBIT(MAX_MEMWORDS)
#define BJ_INIT_XBIT	BJ_INIT_MBIT(MAX_MEMWORDS + 1)
109 1.1 alnsn
/*
 * Number of external memwords and of memwords for a bpf_ctx object.
 * GET_EXTWORDS yields 0 for a NULL context; GET_MEMWORDS falls back to
 * BPF_MEMWORDS when there are no external memwords.
 * Note that both macros evaluate their argument more than once.
 */
#define GET_EXTWORDS(bc) ((bc) ? (bc)->extwords : 0)
#define GET_MEMWORDS(bc) (GET_EXTWORDS(bc) ? GET_EXTWORDS(bc) : BPF_MEMWORDS)
115 1.19 alnsn
/*
 * Optimization hints: a bitmask describing which features
 * a filter program uses.
 */
typedef unsigned int bpfjit_hint_t;
#define BJ_HINT_ABS	0x01	/* packet read at absolute offset */
#define BJ_HINT_IND	0x02	/* packet read at variable offset */
#define BJ_HINT_MSH	0x04	/* BPF_MSH instruction */
#define BJ_HINT_COP	0x08	/* BPF_COP or BPF_COPX instruction */
#define BJ_HINT_COPX	0x10	/* BPF_COPX instruction */
#define BJ_HINT_XREG	0x20	/* BJ_XREG is needed */
#define BJ_HINT_LDX	0x40	/* BPF_LDX instruction */
/* Any kind of packet read. */
#define BJ_HINT_PKT	(BJ_HINT_ABS|BJ_HINT_IND|BJ_HINT_MSH)
128 1.20 alnsn
/*
 * Length type used by the Array Bounds Check Elimination (ABC) pass.
 * It is 64 bits wide so that MAX_ABC_LENGTH, which exceeds UINT32_MAX
 * by the maximum read width (4), is representable.
 */
typedef uint64_t bpfjit_abc_length_t;
#define MAX_ABC_LENGTH (UINT32_MAX + UINT64_C(4)) /* max. width is 4 */
134 1.8 alnsn
135 1.7 alnsn struct bpfjit_stack
136 1.7 alnsn {
137 1.13 alnsn bpf_ctx_t *ctx;
138 1.13 alnsn uint32_t *extmem; /* pointer to external memory store */
139 1.7 alnsn #ifdef _KERNEL
140 1.21 alnsn int err; /* 3rd argument for m_xword/m_xhalf/m_xbyte function call */
141 1.7 alnsn #endif
142 1.13 alnsn uint32_t mem[BPF_MEMWORDS]; /* internal memory store */
143 1.7 alnsn };
144 1.7 alnsn
145 1.7 alnsn /*
146 1.7 alnsn * Data for BPF_JMP instruction.
147 1.7 alnsn * Forward declaration for struct bpfjit_jump.
148 1.1 alnsn */
149 1.7 alnsn struct bpfjit_jump_data;
150 1.1 alnsn
151 1.1 alnsn /*
152 1.7 alnsn * Node of bjumps list.
153 1.1 alnsn */
154 1.3 rmind struct bpfjit_jump {
155 1.7 alnsn struct sljit_jump *sjump;
156 1.7 alnsn SLIST_ENTRY(bpfjit_jump) entries;
157 1.7 alnsn struct bpfjit_jump_data *jdata;
158 1.1 alnsn };
159 1.1 alnsn
160 1.1 alnsn /*
161 1.1 alnsn * Data for BPF_JMP instruction.
162 1.1 alnsn */
163 1.3 rmind struct bpfjit_jump_data {
164 1.1 alnsn /*
165 1.7 alnsn * These entries make up bjumps list:
166 1.7 alnsn * jtf[0] - when coming from jt path,
167 1.7 alnsn * jtf[1] - when coming from jf path.
168 1.1 alnsn */
169 1.7 alnsn struct bpfjit_jump jtf[2];
170 1.7 alnsn /*
171 1.7 alnsn * Length calculated by Array Bounds Check Elimination (ABC) pass.
172 1.7 alnsn */
173 1.8 alnsn bpfjit_abc_length_t abc_length;
174 1.7 alnsn /*
175 1.7 alnsn * Length checked by the last out-of-bounds check.
176 1.7 alnsn */
177 1.8 alnsn bpfjit_abc_length_t checked_length;
178 1.1 alnsn };
179 1.1 alnsn
180 1.1 alnsn /*
181 1.1 alnsn * Data for "read from packet" instructions.
182 1.1 alnsn * See also read_pkt_insn() function below.
183 1.1 alnsn */
184 1.3 rmind struct bpfjit_read_pkt_data {
185 1.1 alnsn /*
186 1.7 alnsn * Length calculated by Array Bounds Check Elimination (ABC) pass.
187 1.7 alnsn */
188 1.8 alnsn bpfjit_abc_length_t abc_length;
189 1.7 alnsn /*
190 1.7 alnsn * If positive, emit "if (buflen < check_length) return 0"
191 1.7 alnsn * out-of-bounds check.
192 1.9 alnsn * Values greater than UINT32_MAX generate unconditional "return 0".
193 1.1 alnsn */
194 1.8 alnsn bpfjit_abc_length_t check_length;
195 1.1 alnsn };
196 1.1 alnsn
197 1.1 alnsn /*
198 1.1 alnsn * Additional (optimization-related) data for bpf_insn.
199 1.1 alnsn */
200 1.3 rmind struct bpfjit_insn_data {
201 1.1 alnsn /* List of jumps to this insn. */
202 1.7 alnsn SLIST_HEAD(, bpfjit_jump) bjumps;
203 1.1 alnsn
204 1.1 alnsn union {
205 1.7 alnsn struct bpfjit_jump_data jdata;
206 1.7 alnsn struct bpfjit_read_pkt_data rdata;
207 1.7 alnsn } u;
208 1.1 alnsn
209 1.13 alnsn bpf_memword_init_t invalid;
210 1.7 alnsn bool unreachable;
211 1.1 alnsn };
212 1.1 alnsn
213 1.1 alnsn #ifdef _KERNEL
214 1.1 alnsn
215 1.1 alnsn uint32_t m_xword(const struct mbuf *, uint32_t, int *);
216 1.1 alnsn uint32_t m_xhalf(const struct mbuf *, uint32_t, int *);
217 1.1 alnsn uint32_t m_xbyte(const struct mbuf *, uint32_t, int *);
218 1.1 alnsn
219 1.1 alnsn MODULE(MODULE_CLASS_MISC, bpfjit, "sljit")
220 1.1 alnsn
221 1.1 alnsn static int
222 1.1 alnsn bpfjit_modcmd(modcmd_t cmd, void *arg)
223 1.1 alnsn {
224 1.1 alnsn
225 1.1 alnsn switch (cmd) {
226 1.1 alnsn case MODULE_CMD_INIT:
227 1.1 alnsn bpfjit_module_ops.bj_free_code = &bpfjit_free_code;
228 1.1 alnsn membar_producer();
229 1.1 alnsn bpfjit_module_ops.bj_generate_code = &bpfjit_generate_code;
230 1.1 alnsn membar_producer();
231 1.1 alnsn return 0;
232 1.1 alnsn
233 1.1 alnsn case MODULE_CMD_FINI:
234 1.1 alnsn return EOPNOTSUPP;
235 1.1 alnsn
236 1.1 alnsn default:
237 1.1 alnsn return ENOTTY;
238 1.1 alnsn }
239 1.1 alnsn }
240 1.1 alnsn #endif
241 1.1 alnsn
242 1.20 alnsn /*
243 1.21 alnsn * Return a number of scratch registers to pass
244 1.20 alnsn * to sljit_emit_enter() function.
245 1.20 alnsn */
246 1.20 alnsn static sljit_si
247 1.20 alnsn nscratches(bpfjit_hint_t hints)
248 1.20 alnsn {
249 1.20 alnsn sljit_si rv = 2;
250 1.20 alnsn
251 1.22 alnsn #ifdef _KERNEL
252 1.24 alnsn if (hints & BJ_HINT_PKT)
253 1.24 alnsn rv = 3; /* xcall with three arguments */
254 1.22 alnsn #endif
255 1.22 alnsn
256 1.27 alnsn if (hints & BJ_HINT_IND)
257 1.20 alnsn rv = 3; /* uses BJ_TMP2REG */
258 1.20 alnsn
259 1.20 alnsn if (hints & BJ_HINT_COP)
260 1.20 alnsn rv = 3; /* calls copfunc with three arguments */
261 1.20 alnsn
262 1.29 alnsn if (hints & BJ_HINT_COPX)
263 1.29 alnsn rv = 4; /* uses BJ_TMP3REG */
264 1.29 alnsn
265 1.29 alnsn return rv;
266 1.29 alnsn }
267 1.29 alnsn
268 1.29 alnsn /*
269 1.29 alnsn * Return a number of saved registers to pass
270 1.29 alnsn * to sljit_emit_enter() function.
271 1.29 alnsn */
272 1.29 alnsn static sljit_si
273 1.29 alnsn nsaveds(bpfjit_hint_t hints)
274 1.29 alnsn {
275 1.29 alnsn sljit_si rv = 3;
276 1.29 alnsn
277 1.20 alnsn if (hints & BJ_HINT_XREG)
278 1.20 alnsn rv = 4; /* uses BJ_XREG */
279 1.20 alnsn
280 1.20 alnsn #ifdef _KERNEL
281 1.20 alnsn if (hints & BJ_HINT_LDX)
282 1.29 alnsn rv = 5; /* uses BJ_ASAVE */
283 1.20 alnsn #endif
284 1.20 alnsn
285 1.20 alnsn return rv;
286 1.20 alnsn }
287 1.20 alnsn
288 1.1 alnsn static uint32_t
289 1.7 alnsn read_width(const struct bpf_insn *pc)
290 1.1 alnsn {
291 1.1 alnsn
292 1.1 alnsn switch (BPF_SIZE(pc->code)) {
293 1.1 alnsn case BPF_W:
294 1.1 alnsn return 4;
295 1.1 alnsn case BPF_H:
296 1.1 alnsn return 2;
297 1.1 alnsn case BPF_B:
298 1.1 alnsn return 1;
299 1.1 alnsn default:
300 1.7 alnsn BJ_ASSERT(false);
301 1.1 alnsn return 0;
302 1.1 alnsn }
303 1.1 alnsn }
304 1.1 alnsn
305 1.13 alnsn /*
306 1.13 alnsn * Copy buf and buflen members of bpf_args from BJ_ARGS
307 1.13 alnsn * pointer to BJ_BUF and BJ_BUFLEN registers.
308 1.13 alnsn */
309 1.13 alnsn static int
310 1.13 alnsn load_buf_buflen(struct sljit_compiler *compiler)
311 1.13 alnsn {
312 1.13 alnsn int status;
313 1.13 alnsn
314 1.13 alnsn status = sljit_emit_op1(compiler,
315 1.13 alnsn SLJIT_MOV_P,
316 1.13 alnsn BJ_BUF, 0,
317 1.13 alnsn SLJIT_MEM1(BJ_ARGS),
318 1.13 alnsn offsetof(struct bpf_args, pkt));
319 1.13 alnsn if (status != SLJIT_SUCCESS)
320 1.13 alnsn return status;
321 1.13 alnsn
322 1.13 alnsn status = sljit_emit_op1(compiler,
323 1.21 alnsn SLJIT_MOV, /* size_t source */
324 1.13 alnsn BJ_BUFLEN, 0,
325 1.13 alnsn SLJIT_MEM1(BJ_ARGS),
326 1.13 alnsn offsetof(struct bpf_args, buflen));
327 1.13 alnsn
328 1.13 alnsn return status;
329 1.13 alnsn }
330 1.13 alnsn
/*
 * Grow the array of jump pointers at *jumps, whose capacity
 * (in elements) is *size.
 *
 * The capacity is doubled; an empty array (capacity 0) grows to one
 * element, because doubling zero would report success without making
 * room for the element the caller is about to store.
 *
 * On success the old contents are copied into the new storage, the
 * old storage is released, *jumps and *size are updated and true is
 * returned.  On arithmetic overflow or allocation failure, false is
 * returned and *jumps and *size are left untouched.
 *
 * An array with capacity 0 is assumed to own no storage: nothing is
 * copied from or freed for it.
 */
static bool
grow_jumps(struct sljit_jump ***jumps, size_t *size)
{
	struct sljit_jump **newptr;
	const size_t elemsz = sizeof(struct sljit_jump *);
	const size_t old_size = *size;
	size_t new_size;

	if (old_size == 0)
		new_size = 1;
	else if (old_size > SIZE_MAX / 2)
		return false;	/* 2 * old_size would overflow */
	else
		new_size = 2 * old_size;

	/* The byte count passed to the allocator must not overflow. */
	if (new_size > SIZE_MAX / elemsz)
		return false;

	newptr = BJ_ALLOC(new_size * elemsz);
	if (newptr == NULL)
		return false;

	if (old_size != 0) {
		memcpy(newptr, *jumps, old_size * elemsz);
		BJ_FREE(*jumps, old_size * elemsz);
	}

	*jumps = newptr;
	*size = new_size;
	return true;
}
353 1.7 alnsn
/*
 * Append jump to the array at *jumps, which holds *size elements
 * and has room for *max_size.  The array is grown with grow_jumps()
 * when it is full.
 *
 * Returns false, leaving the array unchanged, if growing fails.
 */
static bool
append_jump(struct sljit_jump *jump, struct sljit_jump ***jumps,
    size_t *size, size_t *max_size)
{
	if (*size == *max_size) {
		if (!grow_jumps(jumps, max_size))
			return false;
	}

	(*jumps)[*size] = jump;
	*size += 1;
	return true;
}
364 1.1 alnsn
365 1.1 alnsn /*
366 1.24 alnsn * Emit code for BPF_LD+BPF_B+BPF_ABS A <- P[k:1].
367 1.1 alnsn */
368 1.1 alnsn static int
369 1.27 alnsn emit_read8(struct sljit_compiler *compiler, sljit_si src, uint32_t k)
370 1.1 alnsn {
371 1.1 alnsn
372 1.1 alnsn return sljit_emit_op1(compiler,
373 1.1 alnsn SLJIT_MOV_UB,
374 1.7 alnsn BJ_AREG, 0,
375 1.27 alnsn SLJIT_MEM1(src), k);
376 1.1 alnsn }
377 1.1 alnsn
378 1.1 alnsn /*
379 1.24 alnsn * Emit code for BPF_LD+BPF_H+BPF_ABS A <- P[k:2].
380 1.1 alnsn */
381 1.1 alnsn static int
382 1.27 alnsn emit_read16(struct sljit_compiler *compiler, sljit_si src, uint32_t k)
383 1.1 alnsn {
384 1.1 alnsn int status;
385 1.1 alnsn
386 1.27 alnsn BJ_ASSERT(k <= UINT32_MAX - 1);
387 1.27 alnsn
388 1.27 alnsn /* A = buf[k]; */
389 1.1 alnsn status = sljit_emit_op1(compiler,
390 1.1 alnsn SLJIT_MOV_UB,
391 1.27 alnsn BJ_AREG, 0,
392 1.27 alnsn SLJIT_MEM1(src), k);
393 1.1 alnsn if (status != SLJIT_SUCCESS)
394 1.1 alnsn return status;
395 1.1 alnsn
396 1.27 alnsn /* tmp1 = buf[k+1]; */
397 1.1 alnsn status = sljit_emit_op1(compiler,
398 1.1 alnsn SLJIT_MOV_UB,
399 1.27 alnsn BJ_TMP1REG, 0,
400 1.27 alnsn SLJIT_MEM1(src), k+1);
401 1.1 alnsn if (status != SLJIT_SUCCESS)
402 1.1 alnsn return status;
403 1.1 alnsn
404 1.27 alnsn /* A = A << 8; */
405 1.1 alnsn status = sljit_emit_op2(compiler,
406 1.1 alnsn SLJIT_SHL,
407 1.27 alnsn BJ_AREG, 0,
408 1.27 alnsn BJ_AREG, 0,
409 1.1 alnsn SLJIT_IMM, 8);
410 1.1 alnsn if (status != SLJIT_SUCCESS)
411 1.1 alnsn return status;
412 1.1 alnsn
413 1.1 alnsn /* A = A + tmp1; */
414 1.1 alnsn status = sljit_emit_op2(compiler,
415 1.1 alnsn SLJIT_ADD,
416 1.7 alnsn BJ_AREG, 0,
417 1.7 alnsn BJ_AREG, 0,
418 1.7 alnsn BJ_TMP1REG, 0);
419 1.1 alnsn return status;
420 1.1 alnsn }
421 1.1 alnsn
422 1.1 alnsn /*
423 1.24 alnsn * Emit code for BPF_LD+BPF_W+BPF_ABS A <- P[k:4].
424 1.1 alnsn */
425 1.1 alnsn static int
426 1.27 alnsn emit_read32(struct sljit_compiler *compiler, sljit_si src, uint32_t k)
427 1.1 alnsn {
428 1.1 alnsn int status;
429 1.1 alnsn
430 1.27 alnsn BJ_ASSERT(k <= UINT32_MAX - 3);
431 1.1 alnsn
432 1.27 alnsn /* A = buf[k]; */
433 1.1 alnsn status = sljit_emit_op1(compiler,
434 1.1 alnsn SLJIT_MOV_UB,
435 1.27 alnsn BJ_AREG, 0,
436 1.27 alnsn SLJIT_MEM1(src), k);
437 1.1 alnsn if (status != SLJIT_SUCCESS)
438 1.1 alnsn return status;
439 1.1 alnsn
440 1.27 alnsn /* tmp1 = buf[k+1]; */
441 1.1 alnsn status = sljit_emit_op1(compiler,
442 1.1 alnsn SLJIT_MOV_UB,
443 1.27 alnsn BJ_TMP1REG, 0,
444 1.27 alnsn SLJIT_MEM1(src), k+1);
445 1.1 alnsn if (status != SLJIT_SUCCESS)
446 1.1 alnsn return status;
447 1.1 alnsn
448 1.27 alnsn /* A = A << 8; */
449 1.1 alnsn status = sljit_emit_op2(compiler,
450 1.1 alnsn SLJIT_SHL,
451 1.27 alnsn BJ_AREG, 0,
452 1.27 alnsn BJ_AREG, 0,
453 1.27 alnsn SLJIT_IMM, 8);
454 1.1 alnsn if (status != SLJIT_SUCCESS)
455 1.1 alnsn return status;
456 1.1 alnsn
457 1.1 alnsn /* A = A + tmp1; */
458 1.1 alnsn status = sljit_emit_op2(compiler,
459 1.1 alnsn SLJIT_ADD,
460 1.7 alnsn BJ_AREG, 0,
461 1.7 alnsn BJ_AREG, 0,
462 1.7 alnsn BJ_TMP1REG, 0);
463 1.1 alnsn if (status != SLJIT_SUCCESS)
464 1.1 alnsn return status;
465 1.1 alnsn
466 1.1 alnsn /* tmp1 = buf[k+2]; */
467 1.1 alnsn status = sljit_emit_op1(compiler,
468 1.1 alnsn SLJIT_MOV_UB,
469 1.7 alnsn BJ_TMP1REG, 0,
470 1.27 alnsn SLJIT_MEM1(src), k+2);
471 1.1 alnsn if (status != SLJIT_SUCCESS)
472 1.1 alnsn return status;
473 1.1 alnsn
474 1.27 alnsn /* A = A << 8; */
475 1.1 alnsn status = sljit_emit_op2(compiler,
476 1.1 alnsn SLJIT_SHL,
477 1.27 alnsn BJ_AREG, 0,
478 1.27 alnsn BJ_AREG, 0,
479 1.27 alnsn SLJIT_IMM, 8);
480 1.1 alnsn if (status != SLJIT_SUCCESS)
481 1.1 alnsn return status;
482 1.1 alnsn
483 1.27 alnsn /* A = A + tmp1; */
484 1.1 alnsn status = sljit_emit_op2(compiler,
485 1.1 alnsn SLJIT_ADD,
486 1.7 alnsn BJ_AREG, 0,
487 1.7 alnsn BJ_AREG, 0,
488 1.27 alnsn BJ_TMP1REG, 0);
489 1.27 alnsn if (status != SLJIT_SUCCESS)
490 1.27 alnsn return status;
491 1.27 alnsn
492 1.27 alnsn /* tmp1 = buf[k+3]; */
493 1.27 alnsn status = sljit_emit_op1(compiler,
494 1.27 alnsn SLJIT_MOV_UB,
495 1.27 alnsn BJ_TMP1REG, 0,
496 1.27 alnsn SLJIT_MEM1(src), k+3);
497 1.1 alnsn if (status != SLJIT_SUCCESS)
498 1.1 alnsn return status;
499 1.1 alnsn
500 1.27 alnsn /* A = A << 8; */
501 1.1 alnsn status = sljit_emit_op2(compiler,
502 1.1 alnsn SLJIT_SHL,
503 1.27 alnsn BJ_AREG, 0,
504 1.27 alnsn BJ_AREG, 0,
505 1.1 alnsn SLJIT_IMM, 8);
506 1.1 alnsn if (status != SLJIT_SUCCESS)
507 1.1 alnsn return status;
508 1.1 alnsn
509 1.1 alnsn /* A = A + tmp1; */
510 1.1 alnsn status = sljit_emit_op2(compiler,
511 1.1 alnsn SLJIT_ADD,
512 1.7 alnsn BJ_AREG, 0,
513 1.7 alnsn BJ_AREG, 0,
514 1.7 alnsn BJ_TMP1REG, 0);
515 1.1 alnsn return status;
516 1.1 alnsn }
517 1.1 alnsn
#ifdef _KERNEL
/*
 * Emit code for a call to fn, which is one of m_xword, m_xhalf
 * or m_xbyte, on behalf of the instruction at pc:
 *
 * BPF_LD+BPF_W+BPF_ABS    A <- P[k:4]
 * BPF_LD+BPF_H+BPF_ABS    A <- P[k:2]
 * BPF_LD+BPF_B+BPF_ABS    A <- P[k:1]
 * BPF_LD+BPF_W+BPF_IND    A <- P[X+k:4]
 * BPF_LD+BPF_H+BPF_IND    A <- P[X+k:2]
 * BPF_LD+BPF_B+BPF_IND    A <- P[X+k:1]
 * BPF_LDX+BPF_B+BPF_MSH   X <- 4*(P[k:1]&0xf)
 *
 * The result of the call is moved to the dst register, which must
 * not be BJ_ASAVE.  Jumps that must land on the "return 0" path are
 * appended to the ret0 array (*ret0_size elements used out of
 * *ret0_maxsize).
 *
 * Returns SLJIT_SUCCESS, the status of a failed emit call, or
 * SLJIT_ERR_ALLOC_FAILED when a jump cannot be created or recorded.
 */
static int
emit_xcall(struct sljit_compiler *compiler, const struct bpf_insn *pc,
    int dst, struct sljit_jump ***ret0, size_t *ret0_size, size_t *ret0_maxsize,
    uint32_t (*fn)(const struct mbuf *, uint32_t, int *))
{
	const bool is_ldx = (BPF_CLASS(pc->code) == BPF_LDX);
	const bool is_ld_ind = (BPF_CLASS(pc->code) == BPF_LD &&
	    BPF_MODE(pc->code) == BPF_IND);
	struct sljit_jump *guard;
	int rc;

	BJ_ASSERT(dst != BJ_ASAVE);

	if (is_ldx) {
		/*
		 * Save A: its register (SLJIT_SCRATCH_REG1) is
		 * overwritten with the first call argument below.
		 */
		rc = sljit_emit_op1(compiler, SLJIT_MOV,
		    BJ_ASAVE, 0, BJ_AREG, 0);
		if (rc != SLJIT_SUCCESS)
			return rc;
	}

	/*
	 * Set up the registers for the fn(mbuf, k, &err) call.
	 * First argument: the mbuf pointer held in BJ_BUF.
	 */
	rc = sljit_emit_op1(compiler, SLJIT_MOV,
	    SLJIT_SCRATCH_REG1, 0, BJ_BUF, 0);
	if (rc != SLJIT_SUCCESS)
		return rc;

	/* Second argument: the offset. */
	if (is_ld_ind) {
		/* if (X > UINT32_MAX - pc->k) return 0; */
		guard = sljit_emit_cmp(compiler, SLJIT_C_GREATER,
		    BJ_XREG, 0, SLJIT_IMM, UINT32_MAX - pc->k);
		if (guard == NULL ||
		    !append_jump(guard, ret0, ret0_size, ret0_maxsize))
			return SLJIT_ERR_ALLOC_FAILED;

		/* k = X + pc->k; */
		rc = sljit_emit_op2(compiler, SLJIT_ADD,
		    SLJIT_SCRATCH_REG2, 0,
		    BJ_XREG, 0, SLJIT_IMM, (uint32_t)pc->k);
	} else {
		/* k = pc->k */
		rc = sljit_emit_op1(compiler, SLJIT_MOV,
		    SLJIT_SCRATCH_REG2, 0, SLJIT_IMM, (uint32_t)pc->k);
	}
	if (rc != SLJIT_SUCCESS)
		return rc;

	/* Third argument: address of the err slot on the stack. */
	rc = sljit_get_local_base(compiler,
	    SLJIT_SCRATCH_REG3, 0, offsetof(struct bpfjit_stack, err));
	if (rc != SLJIT_SUCCESS)
		return rc;

	/* fn(buf, k, &err); */
	rc = sljit_emit_ijump(compiler, SLJIT_CALL3,
	    SLJIT_IMM, SLJIT_FUNC_OFFSET(fn));
	if (rc != SLJIT_SUCCESS)
		return rc;

	if (dst != SLJIT_RETURN_REG) {
		/* move return value to dst */
		rc = sljit_emit_op1(compiler, SLJIT_MOV,
		    dst, 0, SLJIT_RETURN_REG, 0);
		if (rc != SLJIT_SUCCESS)
			return rc;
	}

	/* if (*err != 0) return 0; */
	guard = sljit_emit_cmp(compiler, SLJIT_C_NOT_EQUAL|SLJIT_INT_OP,
	    SLJIT_MEM1(SLJIT_LOCALS_REG), offsetof(struct bpfjit_stack, err),
	    SLJIT_IMM, 0);
	if (guard == NULL)
		return SLJIT_ERR_ALLOC_FAILED;
	if (!append_jump(guard, ret0, ret0_size, ret0_maxsize))
		return SLJIT_ERR_ALLOC_FAILED;

	if (is_ldx) {
		/* restore A */
		rc = sljit_emit_op1(compiler, SLJIT_MOV,
		    BJ_AREG, 0, BJ_ASAVE, 0);
		if (rc != SLJIT_SUCCESS)
			return rc;
	}

	return SLJIT_SUCCESS;
}
#endif
640 1.1 alnsn
641 1.1 alnsn /*
642 1.13 alnsn * Emit code for BPF_COP and BPF_COPX instructions.
643 1.13 alnsn */
644 1.13 alnsn static int
645 1.28 alnsn emit_cop(struct sljit_compiler *compiler,
646 1.28 alnsn const bpf_ctx_t *bc, const struct bpf_insn *pc,
647 1.28 alnsn struct sljit_jump ***ret0, size_t *ret0_size, size_t *ret0_maxsize)
648 1.13 alnsn {
649 1.29 alnsn #if BJ_TMP3REG == SLJIT_SCRATCH_REG1 || \
650 1.28 alnsn BJ_TMP3REG == SLJIT_SCRATCH_REG2 || \
651 1.28 alnsn BJ_TMP3REG == SLJIT_SCRATCH_REG3
652 1.13 alnsn #error "Not supported assignment of registers."
653 1.13 alnsn #endif
654 1.13 alnsn
655 1.13 alnsn struct sljit_jump *jump;
656 1.28 alnsn sljit_si call_reg;
657 1.28 alnsn sljit_sw call_off;
658 1.13 alnsn int status;
659 1.13 alnsn
660 1.13 alnsn BJ_ASSERT(bc != NULL && bc->copfuncs != NULL);
661 1.13 alnsn
662 1.28 alnsn if (BPF_MISCOP(pc->code) == BPF_COP) {
663 1.28 alnsn call_reg = SLJIT_IMM;
664 1.28 alnsn call_off = SLJIT_FUNC_OFFSET(bc->copfuncs[pc->k]);
665 1.28 alnsn } else {
666 1.13 alnsn /* if (X >= bc->nfuncs) return 0; */
667 1.13 alnsn jump = sljit_emit_cmp(compiler,
668 1.13 alnsn SLJIT_C_GREATER_EQUAL,
669 1.13 alnsn BJ_XREG, 0,
670 1.13 alnsn SLJIT_IMM, bc->nfuncs);
671 1.13 alnsn if (jump == NULL)
672 1.13 alnsn return SLJIT_ERR_ALLOC_FAILED;
673 1.28 alnsn if (!append_jump(jump, ret0, ret0_size, ret0_maxsize))
674 1.28 alnsn return SLJIT_ERR_ALLOC_FAILED;
675 1.28 alnsn
676 1.28 alnsn /* tmp1 = ctx; */
677 1.28 alnsn status = sljit_emit_op1(compiler,
678 1.28 alnsn SLJIT_MOV_P,
679 1.28 alnsn BJ_TMP1REG, 0,
680 1.28 alnsn SLJIT_MEM1(SLJIT_LOCALS_REG),
681 1.28 alnsn offsetof(struct bpfjit_stack, ctx));
682 1.28 alnsn if (status != SLJIT_SUCCESS)
683 1.28 alnsn return status;
684 1.28 alnsn
685 1.28 alnsn /* tmp1 = ctx->copfuncs; */
686 1.28 alnsn status = sljit_emit_op1(compiler,
687 1.28 alnsn SLJIT_MOV_P,
688 1.28 alnsn BJ_TMP1REG, 0,
689 1.28 alnsn SLJIT_MEM1(BJ_TMP1REG),
690 1.28 alnsn offsetof(struct bpf_ctx, copfuncs));
691 1.28 alnsn if (status != SLJIT_SUCCESS)
692 1.28 alnsn return status;
693 1.28 alnsn
694 1.28 alnsn /* tmp2 = X; */
695 1.28 alnsn status = sljit_emit_op1(compiler,
696 1.28 alnsn SLJIT_MOV,
697 1.28 alnsn BJ_TMP2REG, 0,
698 1.28 alnsn BJ_XREG, 0);
699 1.28 alnsn if (status != SLJIT_SUCCESS)
700 1.28 alnsn return status;
701 1.28 alnsn
702 1.28 alnsn /* tmp3 = ctx->copfuncs[tmp2]; */
703 1.28 alnsn call_reg = BJ_TMP3REG;
704 1.28 alnsn call_off = 0;
705 1.28 alnsn status = sljit_emit_op1(compiler,
706 1.28 alnsn SLJIT_MOV_P,
707 1.28 alnsn call_reg, call_off,
708 1.28 alnsn SLJIT_MEM2(BJ_TMP1REG, BJ_TMP2REG),
709 1.28 alnsn SLJIT_WORD_SHIFT);
710 1.28 alnsn if (status != SLJIT_SUCCESS)
711 1.28 alnsn return status;
712 1.13 alnsn }
713 1.13 alnsn
714 1.13 alnsn /*
715 1.13 alnsn * Copy bpf_copfunc_t arguments to registers.
716 1.13 alnsn */
717 1.13 alnsn #if BJ_AREG != SLJIT_SCRATCH_REG3
718 1.13 alnsn status = sljit_emit_op1(compiler,
719 1.13 alnsn SLJIT_MOV_UI,
720 1.13 alnsn SLJIT_SCRATCH_REG3, 0,
721 1.13 alnsn BJ_AREG, 0);
722 1.13 alnsn if (status != SLJIT_SUCCESS)
723 1.13 alnsn return status;
724 1.13 alnsn #endif
725 1.13 alnsn
726 1.13 alnsn status = sljit_emit_op1(compiler,
727 1.13 alnsn SLJIT_MOV_P,
728 1.13 alnsn SLJIT_SCRATCH_REG1, 0,
729 1.13 alnsn SLJIT_MEM1(SLJIT_LOCALS_REG),
730 1.13 alnsn offsetof(struct bpfjit_stack, ctx));
731 1.13 alnsn if (status != SLJIT_SUCCESS)
732 1.13 alnsn return status;
733 1.13 alnsn
734 1.13 alnsn status = sljit_emit_op1(compiler,
735 1.13 alnsn SLJIT_MOV_P,
736 1.13 alnsn SLJIT_SCRATCH_REG2, 0,
737 1.13 alnsn BJ_ARGS, 0);
738 1.13 alnsn if (status != SLJIT_SUCCESS)
739 1.13 alnsn return status;
740 1.13 alnsn
741 1.28 alnsn status = sljit_emit_ijump(compiler,
742 1.28 alnsn SLJIT_CALL3, call_reg, call_off);
743 1.28 alnsn if (status != SLJIT_SUCCESS)
744 1.28 alnsn return status;
745 1.13 alnsn
746 1.13 alnsn #if BJ_AREG != SLJIT_RETURN_REG
747 1.13 alnsn status = sljit_emit_op1(compiler,
748 1.13 alnsn SLJIT_MOV,
749 1.13 alnsn BJ_AREG, 0,
750 1.13 alnsn SLJIT_RETURN_REG, 0);
751 1.13 alnsn if (status != SLJIT_SUCCESS)
752 1.13 alnsn return status;
753 1.13 alnsn #endif
754 1.13 alnsn
755 1.24 alnsn return SLJIT_SUCCESS;
756 1.13 alnsn }
757 1.13 alnsn
758 1.13 alnsn /*
759 1.1 alnsn * Generate code for
760 1.1 alnsn * BPF_LD+BPF_W+BPF_ABS A <- P[k:4]
761 1.1 alnsn * BPF_LD+BPF_H+BPF_ABS A <- P[k:2]
762 1.1 alnsn * BPF_LD+BPF_B+BPF_ABS A <- P[k:1]
763 1.1 alnsn * BPF_LD+BPF_W+BPF_IND A <- P[X+k:4]
764 1.1 alnsn * BPF_LD+BPF_H+BPF_IND A <- P[X+k:2]
765 1.1 alnsn * BPF_LD+BPF_B+BPF_IND A <- P[X+k:1]
766 1.1 alnsn */
767 1.1 alnsn static int
768 1.19 alnsn emit_pkt_read(struct sljit_compiler *compiler,
769 1.7 alnsn const struct bpf_insn *pc, struct sljit_jump *to_mchain_jump,
770 1.7 alnsn struct sljit_jump ***ret0, size_t *ret0_size, size_t *ret0_maxsize)
771 1.1 alnsn {
772 1.25 alnsn int status = SLJIT_ERR_ALLOC_FAILED;
773 1.1 alnsn uint32_t width;
774 1.27 alnsn sljit_si ld_reg;
775 1.1 alnsn struct sljit_jump *jump;
776 1.1 alnsn #ifdef _KERNEL
777 1.1 alnsn struct sljit_label *label;
778 1.1 alnsn struct sljit_jump *over_mchain_jump;
779 1.1 alnsn const bool check_zero_buflen = (to_mchain_jump != NULL);
780 1.1 alnsn #endif
781 1.1 alnsn const uint32_t k = pc->k;
782 1.1 alnsn
783 1.1 alnsn #ifdef _KERNEL
784 1.1 alnsn if (to_mchain_jump == NULL) {
785 1.1 alnsn to_mchain_jump = sljit_emit_cmp(compiler,
786 1.1 alnsn SLJIT_C_EQUAL,
787 1.7 alnsn BJ_BUFLEN, 0,
788 1.1 alnsn SLJIT_IMM, 0);
789 1.1 alnsn if (to_mchain_jump == NULL)
790 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
791 1.1 alnsn }
792 1.1 alnsn #endif
793 1.1 alnsn
794 1.27 alnsn ld_reg = BJ_BUF;
795 1.1 alnsn width = read_width(pc);
796 1.1 alnsn
797 1.1 alnsn if (BPF_MODE(pc->code) == BPF_IND) {
798 1.1 alnsn /* tmp1 = buflen - (pc->k + width); */
799 1.1 alnsn status = sljit_emit_op2(compiler,
800 1.1 alnsn SLJIT_SUB,
801 1.7 alnsn BJ_TMP1REG, 0,
802 1.7 alnsn BJ_BUFLEN, 0,
803 1.1 alnsn SLJIT_IMM, k + width);
804 1.1 alnsn if (status != SLJIT_SUCCESS)
805 1.1 alnsn return status;
806 1.1 alnsn
807 1.27 alnsn /* ld_reg = buf + X; */
808 1.27 alnsn ld_reg = BJ_TMP2REG;
809 1.1 alnsn status = sljit_emit_op2(compiler,
810 1.1 alnsn SLJIT_ADD,
811 1.27 alnsn ld_reg, 0,
812 1.7 alnsn BJ_BUF, 0,
813 1.7 alnsn BJ_XREG, 0);
814 1.1 alnsn if (status != SLJIT_SUCCESS)
815 1.1 alnsn return status;
816 1.1 alnsn
817 1.1 alnsn /* if (tmp1 < X) return 0; */
818 1.1 alnsn jump = sljit_emit_cmp(compiler,
819 1.1 alnsn SLJIT_C_LESS,
820 1.7 alnsn BJ_TMP1REG, 0,
821 1.7 alnsn BJ_XREG, 0);
822 1.1 alnsn if (jump == NULL)
823 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
824 1.7 alnsn if (!append_jump(jump, ret0, ret0_size, ret0_maxsize))
825 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
826 1.1 alnsn }
827 1.1 alnsn
828 1.1 alnsn switch (width) {
829 1.1 alnsn case 4:
830 1.27 alnsn status = emit_read32(compiler, ld_reg, k);
831 1.1 alnsn break;
832 1.1 alnsn case 2:
833 1.27 alnsn status = emit_read16(compiler, ld_reg, k);
834 1.1 alnsn break;
835 1.1 alnsn case 1:
836 1.27 alnsn status = emit_read8(compiler, ld_reg, k);
837 1.1 alnsn break;
838 1.1 alnsn }
839 1.1 alnsn
840 1.1 alnsn if (status != SLJIT_SUCCESS)
841 1.1 alnsn return status;
842 1.1 alnsn
843 1.1 alnsn #ifdef _KERNEL
844 1.1 alnsn over_mchain_jump = sljit_emit_jump(compiler, SLJIT_JUMP);
845 1.1 alnsn if (over_mchain_jump == NULL)
846 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
847 1.1 alnsn
848 1.1 alnsn /* entry point to mchain handler */
849 1.1 alnsn label = sljit_emit_label(compiler);
850 1.1 alnsn if (label == NULL)
851 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
852 1.1 alnsn sljit_set_label(to_mchain_jump, label);
853 1.1 alnsn
854 1.1 alnsn if (check_zero_buflen) {
855 1.1 alnsn /* if (buflen != 0) return 0; */
856 1.1 alnsn jump = sljit_emit_cmp(compiler,
857 1.1 alnsn SLJIT_C_NOT_EQUAL,
858 1.7 alnsn BJ_BUFLEN, 0,
859 1.1 alnsn SLJIT_IMM, 0);
860 1.1 alnsn if (jump == NULL)
861 1.1 alnsn return SLJIT_ERR_ALLOC_FAILED;
862 1.7 alnsn if (!append_jump(jump, ret0, ret0_size, ret0_maxsize))
863 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
864 1.1 alnsn }
865 1.1 alnsn
866 1.1 alnsn switch (width) {
867 1.1 alnsn case 4:
868 1.23 alnsn status = emit_xcall(compiler, pc, BJ_AREG,
869 1.23 alnsn ret0, ret0_size, ret0_maxsize, &m_xword);
870 1.1 alnsn break;
871 1.1 alnsn case 2:
872 1.23 alnsn status = emit_xcall(compiler, pc, BJ_AREG,
873 1.23 alnsn ret0, ret0_size, ret0_maxsize, &m_xhalf);
874 1.1 alnsn break;
875 1.1 alnsn case 1:
876 1.23 alnsn status = emit_xcall(compiler, pc, BJ_AREG,
877 1.23 alnsn ret0, ret0_size, ret0_maxsize, &m_xbyte);
878 1.1 alnsn break;
879 1.1 alnsn }
880 1.1 alnsn
881 1.1 alnsn if (status != SLJIT_SUCCESS)
882 1.1 alnsn return status;
883 1.1 alnsn
884 1.1 alnsn label = sljit_emit_label(compiler);
885 1.1 alnsn if (label == NULL)
886 1.1 alnsn return SLJIT_ERR_ALLOC_FAILED;
887 1.1 alnsn sljit_set_label(over_mchain_jump, label);
888 1.1 alnsn #endif
889 1.1 alnsn
890 1.24 alnsn return SLJIT_SUCCESS;
891 1.1 alnsn }
892 1.1 alnsn
893 1.13 alnsn static int
894 1.19 alnsn emit_memload(struct sljit_compiler *compiler,
895 1.13 alnsn sljit_si dst, uint32_t k, size_t extwords)
896 1.13 alnsn {
897 1.13 alnsn int status;
898 1.13 alnsn sljit_si src;
899 1.13 alnsn sljit_sw srcw;
900 1.13 alnsn
901 1.13 alnsn srcw = k * sizeof(uint32_t);
902 1.13 alnsn
903 1.13 alnsn if (extwords == 0) {
904 1.13 alnsn src = SLJIT_MEM1(SLJIT_LOCALS_REG);
905 1.13 alnsn srcw += offsetof(struct bpfjit_stack, mem);
906 1.13 alnsn } else {
907 1.13 alnsn /* copy extmem pointer to the tmp1 register */
908 1.13 alnsn status = sljit_emit_op1(compiler,
909 1.16 alnsn SLJIT_MOV_P,
910 1.13 alnsn BJ_TMP1REG, 0,
911 1.13 alnsn SLJIT_MEM1(SLJIT_LOCALS_REG),
912 1.13 alnsn offsetof(struct bpfjit_stack, extmem));
913 1.13 alnsn if (status != SLJIT_SUCCESS)
914 1.13 alnsn return status;
915 1.13 alnsn src = SLJIT_MEM1(BJ_TMP1REG);
916 1.13 alnsn }
917 1.13 alnsn
918 1.13 alnsn return sljit_emit_op1(compiler, SLJIT_MOV_UI, dst, 0, src, srcw);
919 1.13 alnsn }
920 1.13 alnsn
921 1.13 alnsn static int
922 1.19 alnsn emit_memstore(struct sljit_compiler *compiler,
923 1.13 alnsn sljit_si src, uint32_t k, size_t extwords)
924 1.13 alnsn {
925 1.13 alnsn int status;
926 1.13 alnsn sljit_si dst;
927 1.13 alnsn sljit_sw dstw;
928 1.13 alnsn
929 1.13 alnsn dstw = k * sizeof(uint32_t);
930 1.13 alnsn
931 1.13 alnsn if (extwords == 0) {
932 1.13 alnsn dst = SLJIT_MEM1(SLJIT_LOCALS_REG);
933 1.13 alnsn dstw += offsetof(struct bpfjit_stack, mem);
934 1.13 alnsn } else {
935 1.13 alnsn /* copy extmem pointer to the tmp1 register */
936 1.13 alnsn status = sljit_emit_op1(compiler,
937 1.16 alnsn SLJIT_MOV_P,
938 1.13 alnsn BJ_TMP1REG, 0,
939 1.13 alnsn SLJIT_MEM1(SLJIT_LOCALS_REG),
940 1.13 alnsn offsetof(struct bpfjit_stack, extmem));
941 1.13 alnsn if (status != SLJIT_SUCCESS)
942 1.13 alnsn return status;
943 1.13 alnsn dst = SLJIT_MEM1(BJ_TMP1REG);
944 1.13 alnsn }
945 1.13 alnsn
946 1.13 alnsn return sljit_emit_op1(compiler, SLJIT_MOV_UI, dst, dstw, src, 0);
947 1.13 alnsn }
948 1.13 alnsn
949 1.1 alnsn /*
950 1.24 alnsn * Emit code for BPF_LDX+BPF_B+BPF_MSH X <- 4*(P[k:1]&0xf).
951 1.1 alnsn */
952 1.1 alnsn static int
953 1.19 alnsn emit_msh(struct sljit_compiler *compiler,
954 1.7 alnsn const struct bpf_insn *pc, struct sljit_jump *to_mchain_jump,
955 1.7 alnsn struct sljit_jump ***ret0, size_t *ret0_size, size_t *ret0_maxsize)
956 1.1 alnsn {
957 1.1 alnsn int status;
958 1.1 alnsn #ifdef _KERNEL
959 1.1 alnsn struct sljit_label *label;
960 1.1 alnsn struct sljit_jump *jump, *over_mchain_jump;
961 1.1 alnsn const bool check_zero_buflen = (to_mchain_jump != NULL);
962 1.1 alnsn #endif
963 1.1 alnsn const uint32_t k = pc->k;
964 1.1 alnsn
965 1.1 alnsn #ifdef _KERNEL
966 1.1 alnsn if (to_mchain_jump == NULL) {
967 1.1 alnsn to_mchain_jump = sljit_emit_cmp(compiler,
968 1.1 alnsn SLJIT_C_EQUAL,
969 1.7 alnsn BJ_BUFLEN, 0,
970 1.1 alnsn SLJIT_IMM, 0);
971 1.1 alnsn if (to_mchain_jump == NULL)
972 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
973 1.1 alnsn }
974 1.1 alnsn #endif
975 1.1 alnsn
976 1.1 alnsn /* tmp1 = buf[k] */
977 1.1 alnsn status = sljit_emit_op1(compiler,
978 1.1 alnsn SLJIT_MOV_UB,
979 1.7 alnsn BJ_TMP1REG, 0,
980 1.7 alnsn SLJIT_MEM1(BJ_BUF), k);
981 1.1 alnsn if (status != SLJIT_SUCCESS)
982 1.1 alnsn return status;
983 1.1 alnsn
984 1.1 alnsn #ifdef _KERNEL
985 1.1 alnsn over_mchain_jump = sljit_emit_jump(compiler, SLJIT_JUMP);
986 1.1 alnsn if (over_mchain_jump == NULL)
987 1.1 alnsn return SLJIT_ERR_ALLOC_FAILED;
988 1.1 alnsn
989 1.1 alnsn /* entry point to mchain handler */
990 1.1 alnsn label = sljit_emit_label(compiler);
991 1.1 alnsn if (label == NULL)
992 1.1 alnsn return SLJIT_ERR_ALLOC_FAILED;
993 1.1 alnsn sljit_set_label(to_mchain_jump, label);
994 1.1 alnsn
995 1.1 alnsn if (check_zero_buflen) {
996 1.1 alnsn /* if (buflen != 0) return 0; */
997 1.1 alnsn jump = sljit_emit_cmp(compiler,
998 1.1 alnsn SLJIT_C_NOT_EQUAL,
999 1.7 alnsn BJ_BUFLEN, 0,
1000 1.1 alnsn SLJIT_IMM, 0);
1001 1.1 alnsn if (jump == NULL)
1002 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
1003 1.7 alnsn if (!append_jump(jump, ret0, ret0_size, ret0_maxsize))
1004 1.7 alnsn return SLJIT_ERR_ALLOC_FAILED;
1005 1.1 alnsn }
1006 1.1 alnsn
1007 1.23 alnsn status = emit_xcall(compiler, pc, BJ_TMP1REG,
1008 1.23 alnsn ret0, ret0_size, ret0_maxsize, &m_xbyte);
1009 1.1 alnsn if (status != SLJIT_SUCCESS)
1010 1.1 alnsn return status;
1011 1.7 alnsn
1012 1.30 alnsn label = sljit_emit_label(compiler);
1013 1.30 alnsn if (label == NULL)
1014 1.30 alnsn return SLJIT_ERR_ALLOC_FAILED;
1015 1.30 alnsn sljit_set_label(over_mchain_jump, label);
1016 1.30 alnsn #endif
1017 1.30 alnsn
1018 1.1 alnsn /* tmp1 &= 0xf */
1019 1.1 alnsn status = sljit_emit_op2(compiler,
1020 1.1 alnsn SLJIT_AND,
1021 1.7 alnsn BJ_TMP1REG, 0,
1022 1.7 alnsn BJ_TMP1REG, 0,
1023 1.1 alnsn SLJIT_IMM, 0xf);
1024 1.1 alnsn if (status != SLJIT_SUCCESS)
1025 1.1 alnsn return status;
1026 1.1 alnsn
1027 1.30 alnsn /* X = tmp1 << 2 */
1028 1.1 alnsn status = sljit_emit_op2(compiler,
1029 1.1 alnsn SLJIT_SHL,
1030 1.7 alnsn BJ_XREG, 0,
1031 1.7 alnsn BJ_TMP1REG, 0,
1032 1.1 alnsn SLJIT_IMM, 2);
1033 1.1 alnsn if (status != SLJIT_SUCCESS)
1034 1.1 alnsn return status;
1035 1.1 alnsn
1036 1.24 alnsn return SLJIT_SUCCESS;
1037 1.1 alnsn }
1038 1.1 alnsn
1039 1.1 alnsn static int
1040 1.19 alnsn emit_pow2_division(struct sljit_compiler *compiler, uint32_t k)
1041 1.1 alnsn {
1042 1.1 alnsn int shift = 0;
1043 1.1 alnsn int status = SLJIT_SUCCESS;
1044 1.1 alnsn
1045 1.1 alnsn while (k > 1) {
1046 1.1 alnsn k >>= 1;
1047 1.1 alnsn shift++;
1048 1.1 alnsn }
1049 1.1 alnsn
1050 1.7 alnsn BJ_ASSERT(k == 1 && shift < 32);
1051 1.1 alnsn
1052 1.1 alnsn if (shift != 0) {
1053 1.1 alnsn status = sljit_emit_op2(compiler,
1054 1.1 alnsn SLJIT_LSHR|SLJIT_INT_OP,
1055 1.7 alnsn BJ_AREG, 0,
1056 1.7 alnsn BJ_AREG, 0,
1057 1.1 alnsn SLJIT_IMM, shift);
1058 1.1 alnsn }
1059 1.1 alnsn
1060 1.1 alnsn return status;
1061 1.1 alnsn }
1062 1.1 alnsn
1063 1.1 alnsn #if !defined(BPFJIT_USE_UDIV)
1064 1.1 alnsn static sljit_uw
1065 1.1 alnsn divide(sljit_uw x, sljit_uw y)
1066 1.1 alnsn {
1067 1.1 alnsn
1068 1.1 alnsn return (uint32_t)x / (uint32_t)y;
1069 1.1 alnsn }
1070 1.1 alnsn #endif
1071 1.1 alnsn
1072 1.1 alnsn /*
1073 1.24 alnsn * Emit code for A = A / div.
1074 1.7 alnsn * divt,divw are either SLJIT_IMM,pc->k or BJ_XREG,0.
1075 1.1 alnsn */
1076 1.1 alnsn static int
1077 1.19 alnsn emit_division(struct sljit_compiler *compiler, int divt, sljit_sw divw)
1078 1.1 alnsn {
1079 1.1 alnsn int status;
1080 1.1 alnsn
1081 1.12 alnsn #if BJ_AREG != SLJIT_SCRATCH_REG1
1082 1.1 alnsn status = sljit_emit_op1(compiler,
1083 1.1 alnsn SLJIT_MOV,
1084 1.12 alnsn SLJIT_SCRATCH_REG1, 0,
1085 1.7 alnsn BJ_AREG, 0);
1086 1.1 alnsn if (status != SLJIT_SUCCESS)
1087 1.1 alnsn return status;
1088 1.1 alnsn #endif
1089 1.1 alnsn
1090 1.1 alnsn status = sljit_emit_op1(compiler,
1091 1.1 alnsn SLJIT_MOV,
1092 1.12 alnsn SLJIT_SCRATCH_REG2, 0,
1093 1.1 alnsn divt, divw);
1094 1.1 alnsn if (status != SLJIT_SUCCESS)
1095 1.1 alnsn return status;
1096 1.1 alnsn
1097 1.1 alnsn #if defined(BPFJIT_USE_UDIV)
1098 1.1 alnsn status = sljit_emit_op0(compiler, SLJIT_UDIV|SLJIT_INT_OP);
1099 1.1 alnsn
1100 1.12 alnsn #if BJ_AREG != SLJIT_SCRATCH_REG1
1101 1.1 alnsn status = sljit_emit_op1(compiler,
1102 1.1 alnsn SLJIT_MOV,
1103 1.7 alnsn BJ_AREG, 0,
1104 1.12 alnsn SLJIT_SCRATCH_REG1, 0);
1105 1.1 alnsn if (status != SLJIT_SUCCESS)
1106 1.1 alnsn return status;
1107 1.1 alnsn #endif
1108 1.1 alnsn #else
1109 1.1 alnsn status = sljit_emit_ijump(compiler,
1110 1.1 alnsn SLJIT_CALL2,
1111 1.1 alnsn SLJIT_IMM, SLJIT_FUNC_OFFSET(divide));
1112 1.1 alnsn
1113 1.7 alnsn #if BJ_AREG != SLJIT_RETURN_REG
1114 1.1 alnsn status = sljit_emit_op1(compiler,
1115 1.1 alnsn SLJIT_MOV,
1116 1.7 alnsn BJ_AREG, 0,
1117 1.1 alnsn SLJIT_RETURN_REG, 0);
1118 1.1 alnsn if (status != SLJIT_SUCCESS)
1119 1.1 alnsn return status;
1120 1.1 alnsn #endif
1121 1.1 alnsn #endif
1122 1.1 alnsn
1123 1.1 alnsn return status;
1124 1.1 alnsn }
1125 1.1 alnsn
1126 1.1 alnsn /*
1127 1.1 alnsn * Return true if pc is a "read from packet" instruction.
1128 1.1 alnsn * If length is not NULL and return value is true, *length will
1129 1.1 alnsn * be set to a safe length required to read a packet.
1130 1.1 alnsn */
1131 1.1 alnsn static bool
1132 1.8 alnsn read_pkt_insn(const struct bpf_insn *pc, bpfjit_abc_length_t *length)
1133 1.1 alnsn {
1134 1.1 alnsn bool rv;
1135 1.8 alnsn bpfjit_abc_length_t width;
1136 1.1 alnsn
1137 1.1 alnsn switch (BPF_CLASS(pc->code)) {
1138 1.1 alnsn default:
1139 1.1 alnsn rv = false;
1140 1.1 alnsn break;
1141 1.1 alnsn
1142 1.1 alnsn case BPF_LD:
1143 1.1 alnsn rv = BPF_MODE(pc->code) == BPF_ABS ||
1144 1.1 alnsn BPF_MODE(pc->code) == BPF_IND;
1145 1.1 alnsn if (rv)
1146 1.1 alnsn width = read_width(pc);
1147 1.1 alnsn break;
1148 1.1 alnsn
1149 1.1 alnsn case BPF_LDX:
1150 1.1 alnsn rv = pc->code == (BPF_LDX|BPF_B|BPF_MSH);
1151 1.1 alnsn width = 1;
1152 1.1 alnsn break;
1153 1.1 alnsn }
1154 1.1 alnsn
1155 1.1 alnsn if (rv && length != NULL) {
1156 1.9 alnsn /*
1157 1.9 alnsn * Values greater than UINT32_MAX will generate
1158 1.9 alnsn * unconditional "return 0".
1159 1.9 alnsn */
1160 1.9 alnsn *length = (uint32_t)pc->k + width;
1161 1.1 alnsn }
1162 1.1 alnsn
1163 1.1 alnsn return rv;
1164 1.1 alnsn }
1165 1.1 alnsn
1166 1.1 alnsn static void
1167 1.7 alnsn optimize_init(struct bpfjit_insn_data *insn_dat, size_t insn_count)
1168 1.1 alnsn {
1169 1.7 alnsn size_t i;
1170 1.1 alnsn
1171 1.7 alnsn for (i = 0; i < insn_count; i++) {
1172 1.7 alnsn SLIST_INIT(&insn_dat[i].bjumps);
1173 1.7 alnsn insn_dat[i].invalid = BJ_INIT_NOBITS;
1174 1.1 alnsn }
1175 1.1 alnsn }
1176 1.1 alnsn
1177 1.1 alnsn /*
1178 1.1 alnsn * The function divides instructions into blocks. Destination of a jump
1179 1.1 alnsn * instruction starts a new block. BPF_RET and BPF_JMP instructions
1180 1.1 alnsn * terminate a block. Blocks are linear, that is, there are no jumps out
1181 1.1 alnsn * from the middle of a block and there are no jumps in to the middle of
1182 1.1 alnsn * a block.
1183 1.7 alnsn *
1184 1.7 alnsn * The function also sets bits in *initmask for memwords that
1185 1.7 alnsn * need to be initialized to zero. Note that this set should be empty
1186 1.7 alnsn * for any valid kernel filter program.
1187 1.1 alnsn */
1188 1.7 alnsn static bool
1189 1.19 alnsn optimize_pass1(const bpf_ctx_t *bc, const struct bpf_insn *insns,
1190 1.19 alnsn struct bpfjit_insn_data *insn_dat, size_t insn_count,
1191 1.20 alnsn bpf_memword_init_t *initmask, bpfjit_hint_t *hints)
1192 1.1 alnsn {
1193 1.7 alnsn struct bpfjit_jump *jtf;
1194 1.1 alnsn size_t i;
1195 1.7 alnsn uint32_t jt, jf;
1196 1.10 alnsn bpfjit_abc_length_t length;
1197 1.13 alnsn bpf_memword_init_t invalid; /* borrowed from bpf_filter() */
1198 1.1 alnsn bool unreachable;
1199 1.1 alnsn
1200 1.19 alnsn const size_t memwords = GET_MEMWORDS(bc);
1201 1.13 alnsn
1202 1.20 alnsn *hints = 0;
1203 1.7 alnsn *initmask = BJ_INIT_NOBITS;
1204 1.1 alnsn
1205 1.1 alnsn unreachable = false;
1206 1.7 alnsn invalid = ~BJ_INIT_NOBITS;
1207 1.1 alnsn
1208 1.1 alnsn for (i = 0; i < insn_count; i++) {
1209 1.7 alnsn if (!SLIST_EMPTY(&insn_dat[i].bjumps))
1210 1.1 alnsn unreachable = false;
1211 1.7 alnsn insn_dat[i].unreachable = unreachable;
1212 1.1 alnsn
1213 1.1 alnsn if (unreachable)
1214 1.1 alnsn continue;
1215 1.1 alnsn
1216 1.7 alnsn invalid |= insn_dat[i].invalid;
1217 1.1 alnsn
1218 1.10 alnsn if (read_pkt_insn(&insns[i], &length) && length > UINT32_MAX)
1219 1.10 alnsn unreachable = true;
1220 1.10 alnsn
1221 1.1 alnsn switch (BPF_CLASS(insns[i].code)) {
1222 1.1 alnsn case BPF_RET:
1223 1.7 alnsn if (BPF_RVAL(insns[i].code) == BPF_A)
1224 1.7 alnsn *initmask |= invalid & BJ_INIT_ABIT;
1225 1.7 alnsn
1226 1.1 alnsn unreachable = true;
1227 1.1 alnsn continue;
1228 1.1 alnsn
1229 1.7 alnsn case BPF_LD:
1230 1.27 alnsn if (BPF_MODE(insns[i].code) == BPF_ABS)
1231 1.27 alnsn *hints |= BJ_HINT_ABS;
1232 1.7 alnsn
1233 1.20 alnsn if (BPF_MODE(insns[i].code) == BPF_IND) {
1234 1.27 alnsn *hints |= BJ_HINT_IND | BJ_HINT_XREG;
1235 1.7 alnsn *initmask |= invalid & BJ_INIT_XBIT;
1236 1.20 alnsn }
1237 1.7 alnsn
1238 1.7 alnsn if (BPF_MODE(insns[i].code) == BPF_MEM &&
1239 1.13 alnsn (uint32_t)insns[i].k < memwords) {
1240 1.7 alnsn *initmask |= invalid & BJ_INIT_MBIT(insns[i].k);
1241 1.7 alnsn }
1242 1.7 alnsn
1243 1.7 alnsn invalid &= ~BJ_INIT_ABIT;
1244 1.7 alnsn continue;
1245 1.7 alnsn
1246 1.7 alnsn case BPF_LDX:
1247 1.20 alnsn *hints |= BJ_HINT_XREG | BJ_HINT_LDX;
1248 1.7 alnsn
1249 1.7 alnsn if (BPF_MODE(insns[i].code) == BPF_MEM &&
1250 1.13 alnsn (uint32_t)insns[i].k < memwords) {
1251 1.7 alnsn *initmask |= invalid & BJ_INIT_MBIT(insns[i].k);
1252 1.7 alnsn }
1253 1.7 alnsn
1254 1.29 alnsn if (BPF_MODE(insns[i].code) == BPF_MSH &&
1255 1.29 alnsn BPF_SIZE(insns[i].code) == BPF_B) {
1256 1.29 alnsn *hints |= BJ_HINT_MSH;
1257 1.29 alnsn }
1258 1.29 alnsn
1259 1.7 alnsn invalid &= ~BJ_INIT_XBIT;
1260 1.7 alnsn continue;
1261 1.7 alnsn
1262 1.7 alnsn case BPF_ST:
1263 1.7 alnsn *initmask |= invalid & BJ_INIT_ABIT;
1264 1.7 alnsn
1265 1.13 alnsn if ((uint32_t)insns[i].k < memwords)
1266 1.7 alnsn invalid &= ~BJ_INIT_MBIT(insns[i].k);
1267 1.7 alnsn
1268 1.7 alnsn continue;
1269 1.7 alnsn
1270 1.7 alnsn case BPF_STX:
1271 1.20 alnsn *hints |= BJ_HINT_XREG;
1272 1.7 alnsn *initmask |= invalid & BJ_INIT_XBIT;
1273 1.7 alnsn
1274 1.13 alnsn if ((uint32_t)insns[i].k < memwords)
1275 1.7 alnsn invalid &= ~BJ_INIT_MBIT(insns[i].k);
1276 1.7 alnsn
1277 1.7 alnsn continue;
1278 1.7 alnsn
1279 1.7 alnsn case BPF_ALU:
1280 1.7 alnsn *initmask |= invalid & BJ_INIT_ABIT;
1281 1.7 alnsn
1282 1.7 alnsn if (insns[i].code != (BPF_ALU|BPF_NEG) &&
1283 1.7 alnsn BPF_SRC(insns[i].code) == BPF_X) {
1284 1.20 alnsn *hints |= BJ_HINT_XREG;
1285 1.7 alnsn *initmask |= invalid & BJ_INIT_XBIT;
1286 1.7 alnsn }
1287 1.7 alnsn
1288 1.7 alnsn invalid &= ~BJ_INIT_ABIT;
1289 1.7 alnsn continue;
1290 1.7 alnsn
1291 1.7 alnsn case BPF_MISC:
1292 1.7 alnsn switch (BPF_MISCOP(insns[i].code)) {
1293 1.7 alnsn case BPF_TAX: // X <- A
1294 1.20 alnsn *hints |= BJ_HINT_XREG;
1295 1.7 alnsn *initmask |= invalid & BJ_INIT_ABIT;
1296 1.7 alnsn invalid &= ~BJ_INIT_XBIT;
1297 1.7 alnsn continue;
1298 1.7 alnsn
1299 1.7 alnsn case BPF_TXA: // A <- X
1300 1.20 alnsn *hints |= BJ_HINT_XREG;
1301 1.7 alnsn *initmask |= invalid & BJ_INIT_XBIT;
1302 1.7 alnsn invalid &= ~BJ_INIT_ABIT;
1303 1.7 alnsn continue;
1304 1.13 alnsn
1305 1.13 alnsn case BPF_COPX:
1306 1.28 alnsn *hints |= BJ_HINT_XREG | BJ_HINT_COPX;
1307 1.13 alnsn /* FALLTHROUGH */
1308 1.13 alnsn
1309 1.13 alnsn case BPF_COP:
1310 1.20 alnsn *hints |= BJ_HINT_COP;
1311 1.13 alnsn *initmask |= invalid & BJ_INIT_ABIT;
1312 1.13 alnsn invalid &= ~BJ_INIT_ABIT;
1313 1.13 alnsn continue;
1314 1.7 alnsn }
1315 1.7 alnsn
1316 1.7 alnsn continue;
1317 1.7 alnsn
1318 1.1 alnsn case BPF_JMP:
1319 1.7 alnsn /* Initialize abc_length for ABC pass. */
1320 1.8 alnsn insn_dat[i].u.jdata.abc_length = MAX_ABC_LENGTH;
1321 1.7 alnsn
1322 1.7 alnsn if (BPF_OP(insns[i].code) == BPF_JA) {
1323 1.1 alnsn jt = jf = insns[i].k;
1324 1.1 alnsn } else {
1325 1.1 alnsn jt = insns[i].jt;
1326 1.1 alnsn jf = insns[i].jf;
1327 1.1 alnsn }
1328 1.1 alnsn
1329 1.1 alnsn if (jt >= insn_count - (i + 1) ||
1330 1.1 alnsn jf >= insn_count - (i + 1)) {
1331 1.7 alnsn return false;
1332 1.1 alnsn }
1333 1.1 alnsn
1334 1.1 alnsn if (jt > 0 && jf > 0)
1335 1.1 alnsn unreachable = true;
1336 1.1 alnsn
1337 1.7 alnsn jt += i + 1;
1338 1.7 alnsn jf += i + 1;
1339 1.7 alnsn
1340 1.7 alnsn jtf = insn_dat[i].u.jdata.jtf;
1341 1.1 alnsn
1342 1.7 alnsn jtf[0].jdata = &insn_dat[i].u.jdata;
1343 1.7 alnsn SLIST_INSERT_HEAD(&insn_dat[jt].bjumps,
1344 1.7 alnsn &jtf[0], entries);
1345 1.1 alnsn
1346 1.1 alnsn if (jf != jt) {
1347 1.7 alnsn jtf[1].jdata = &insn_dat[i].u.jdata;
1348 1.7 alnsn SLIST_INSERT_HEAD(&insn_dat[jf].bjumps,
1349 1.7 alnsn &jtf[1], entries);
1350 1.1 alnsn }
1351 1.1 alnsn
1352 1.7 alnsn insn_dat[jf].invalid |= invalid;
1353 1.7 alnsn insn_dat[jt].invalid |= invalid;
1354 1.7 alnsn invalid = 0;
1355 1.7 alnsn
1356 1.1 alnsn continue;
1357 1.1 alnsn }
1358 1.1 alnsn }
1359 1.1 alnsn
1360 1.7 alnsn return true;
1361 1.1 alnsn }
1362 1.1 alnsn
1363 1.1 alnsn /*
1364 1.7 alnsn * Array Bounds Check Elimination (ABC) pass.
1365 1.1 alnsn */
1366 1.7 alnsn static void
1367 1.19 alnsn optimize_pass2(const bpf_ctx_t *bc, const struct bpf_insn *insns,
1368 1.19 alnsn struct bpfjit_insn_data *insn_dat, size_t insn_count)
1369 1.7 alnsn {
1370 1.7 alnsn struct bpfjit_jump *jmp;
1371 1.7 alnsn const struct bpf_insn *pc;
1372 1.7 alnsn struct bpfjit_insn_data *pd;
1373 1.7 alnsn size_t i;
1374 1.8 alnsn bpfjit_abc_length_t length, abc_length = 0;
1375 1.7 alnsn
1376 1.19 alnsn const size_t extwords = GET_EXTWORDS(bc);
1377 1.19 alnsn
1378 1.7 alnsn for (i = insn_count; i != 0; i--) {
1379 1.7 alnsn pc = &insns[i-1];
1380 1.7 alnsn pd = &insn_dat[i-1];
1381 1.7 alnsn
1382 1.7 alnsn if (pd->unreachable)
1383 1.7 alnsn continue;
1384 1.7 alnsn
1385 1.7 alnsn switch (BPF_CLASS(pc->code)) {
1386 1.7 alnsn case BPF_RET:
1387 1.11 alnsn /*
1388 1.11 alnsn * It's quite common for bpf programs to
1389 1.11 alnsn * check packet bytes in increasing order
1390 1.11 alnsn * and return zero if bytes don't match
1391 1.11 alnsn * specified critetion. Such programs disable
1392 1.11 alnsn * ABC optimization completely because for
1393 1.11 alnsn * every jump there is a branch with no read
1394 1.11 alnsn * instruction.
1395 1.13 alnsn * With no side effects, BPF_STMT(BPF_RET+BPF_K, 0)
1396 1.13 alnsn * is indistinguishable from out-of-bound load.
1397 1.11 alnsn * Therefore, abc_length can be set to
1398 1.11 alnsn * MAX_ABC_LENGTH and enable ABC for many
1399 1.11 alnsn * bpf programs.
1400 1.13 alnsn * If this optimization encounters any
1401 1.11 alnsn * instruction with a side effect, it will
1402 1.11 alnsn * reset abc_length.
1403 1.11 alnsn */
1404 1.11 alnsn if (BPF_RVAL(pc->code) == BPF_K && pc->k == 0)
1405 1.11 alnsn abc_length = MAX_ABC_LENGTH;
1406 1.11 alnsn else
1407 1.11 alnsn abc_length = 0;
1408 1.7 alnsn break;
1409 1.7 alnsn
1410 1.13 alnsn case BPF_MISC:
1411 1.13 alnsn if (BPF_MISCOP(pc->code) == BPF_COP ||
1412 1.13 alnsn BPF_MISCOP(pc->code) == BPF_COPX) {
1413 1.13 alnsn /* COP instructions can have side effects. */
1414 1.13 alnsn abc_length = 0;
1415 1.13 alnsn }
1416 1.13 alnsn break;
1417 1.13 alnsn
1418 1.13 alnsn case BPF_ST:
1419 1.13 alnsn case BPF_STX:
1420 1.13 alnsn if (extwords != 0) {
1421 1.13 alnsn /* Write to memory is visible after a call. */
1422 1.13 alnsn abc_length = 0;
1423 1.13 alnsn }
1424 1.13 alnsn break;
1425 1.13 alnsn
1426 1.7 alnsn case BPF_JMP:
1427 1.7 alnsn abc_length = pd->u.jdata.abc_length;
1428 1.7 alnsn break;
1429 1.7 alnsn
1430 1.7 alnsn default:
1431 1.7 alnsn if (read_pkt_insn(pc, &length)) {
1432 1.7 alnsn if (abc_length < length)
1433 1.7 alnsn abc_length = length;
1434 1.7 alnsn pd->u.rdata.abc_length = abc_length;
1435 1.7 alnsn }
1436 1.7 alnsn break;
1437 1.7 alnsn }
1438 1.7 alnsn
1439 1.7 alnsn SLIST_FOREACH(jmp, &pd->bjumps, entries) {
1440 1.7 alnsn if (jmp->jdata->abc_length > abc_length)
1441 1.7 alnsn jmp->jdata->abc_length = abc_length;
1442 1.7 alnsn }
1443 1.7 alnsn }
1444 1.7 alnsn }
1445 1.7 alnsn
1446 1.7 alnsn static void
1447 1.7 alnsn optimize_pass3(const struct bpf_insn *insns,
1448 1.7 alnsn struct bpfjit_insn_data *insn_dat, size_t insn_count)
1449 1.1 alnsn {
1450 1.7 alnsn struct bpfjit_jump *jmp;
1451 1.1 alnsn size_t i;
1452 1.8 alnsn bpfjit_abc_length_t checked_length = 0;
1453 1.1 alnsn
1454 1.1 alnsn for (i = 0; i < insn_count; i++) {
1455 1.7 alnsn if (insn_dat[i].unreachable)
1456 1.7 alnsn continue;
1457 1.1 alnsn
1458 1.7 alnsn SLIST_FOREACH(jmp, &insn_dat[i].bjumps, entries) {
1459 1.7 alnsn if (jmp->jdata->checked_length < checked_length)
1460 1.7 alnsn checked_length = jmp->jdata->checked_length;
1461 1.1 alnsn }
1462 1.1 alnsn
1463 1.7 alnsn if (BPF_CLASS(insns[i].code) == BPF_JMP) {
1464 1.7 alnsn insn_dat[i].u.jdata.checked_length = checked_length;
1465 1.8 alnsn } else if (read_pkt_insn(&insns[i], NULL)) {
1466 1.7 alnsn struct bpfjit_read_pkt_data *rdata =
1467 1.7 alnsn &insn_dat[i].u.rdata;
1468 1.7 alnsn rdata->check_length = 0;
1469 1.7 alnsn if (checked_length < rdata->abc_length) {
1470 1.7 alnsn checked_length = rdata->abc_length;
1471 1.7 alnsn rdata->check_length = checked_length;
1472 1.7 alnsn }
1473 1.1 alnsn }
1474 1.7 alnsn }
1475 1.7 alnsn }
1476 1.1 alnsn
1477 1.7 alnsn static bool
1478 1.19 alnsn optimize(const bpf_ctx_t *bc, const struct bpf_insn *insns,
1479 1.7 alnsn struct bpfjit_insn_data *insn_dat, size_t insn_count,
1480 1.20 alnsn bpf_memword_init_t *initmask, bpfjit_hint_t *hints)
1481 1.7 alnsn {
1482 1.1 alnsn
1483 1.7 alnsn optimize_init(insn_dat, insn_count);
1484 1.7 alnsn
1485 1.20 alnsn if (!optimize_pass1(bc, insns, insn_dat, insn_count, initmask, hints))
1486 1.7 alnsn return false;
1487 1.1 alnsn
1488 1.19 alnsn optimize_pass2(bc, insns, insn_dat, insn_count);
1489 1.7 alnsn optimize_pass3(insns, insn_dat, insn_count);
1490 1.7 alnsn
1491 1.7 alnsn return true;
1492 1.1 alnsn }
1493 1.1 alnsn
1494 1.1 alnsn /*
1495 1.1 alnsn * Convert BPF_ALU operations except BPF_NEG and BPF_DIV to sljit operation.
1496 1.1 alnsn */
1497 1.1 alnsn static int
1498 1.7 alnsn bpf_alu_to_sljit_op(const struct bpf_insn *pc)
1499 1.1 alnsn {
1500 1.1 alnsn
1501 1.1 alnsn /*
1502 1.1 alnsn * Note: all supported 64bit arches have 32bit multiply
1503 1.1 alnsn * instruction so SLJIT_INT_OP doesn't have any overhead.
1504 1.1 alnsn */
1505 1.1 alnsn switch (BPF_OP(pc->code)) {
1506 1.1 alnsn case BPF_ADD: return SLJIT_ADD;
1507 1.1 alnsn case BPF_SUB: return SLJIT_SUB;
1508 1.1 alnsn case BPF_MUL: return SLJIT_MUL|SLJIT_INT_OP;
1509 1.1 alnsn case BPF_OR: return SLJIT_OR;
1510 1.1 alnsn case BPF_AND: return SLJIT_AND;
1511 1.1 alnsn case BPF_LSH: return SLJIT_SHL;
1512 1.1 alnsn case BPF_RSH: return SLJIT_LSHR|SLJIT_INT_OP;
1513 1.1 alnsn default:
1514 1.7 alnsn BJ_ASSERT(false);
1515 1.1 alnsn return 0;
1516 1.1 alnsn }
1517 1.1 alnsn }
1518 1.1 alnsn
1519 1.1 alnsn /*
1520 1.1 alnsn * Convert BPF_JMP operations except BPF_JA to sljit condition.
1521 1.1 alnsn */
1522 1.1 alnsn static int
1523 1.7 alnsn bpf_jmp_to_sljit_cond(const struct bpf_insn *pc, bool negate)
1524 1.1 alnsn {
1525 1.1 alnsn /*
1526 1.1 alnsn * Note: all supported 64bit arches have 32bit comparison
1527 1.1 alnsn * instructions so SLJIT_INT_OP doesn't have any overhead.
1528 1.1 alnsn */
1529 1.1 alnsn int rv = SLJIT_INT_OP;
1530 1.1 alnsn
1531 1.1 alnsn switch (BPF_OP(pc->code)) {
1532 1.1 alnsn case BPF_JGT:
1533 1.1 alnsn rv |= negate ? SLJIT_C_LESS_EQUAL : SLJIT_C_GREATER;
1534 1.1 alnsn break;
1535 1.1 alnsn case BPF_JGE:
1536 1.1 alnsn rv |= negate ? SLJIT_C_LESS : SLJIT_C_GREATER_EQUAL;
1537 1.1 alnsn break;
1538 1.1 alnsn case BPF_JEQ:
1539 1.1 alnsn rv |= negate ? SLJIT_C_NOT_EQUAL : SLJIT_C_EQUAL;
1540 1.1 alnsn break;
1541 1.1 alnsn case BPF_JSET:
1542 1.1 alnsn rv |= negate ? SLJIT_C_EQUAL : SLJIT_C_NOT_EQUAL;
1543 1.1 alnsn break;
1544 1.1 alnsn default:
1545 1.7 alnsn BJ_ASSERT(false);
1546 1.1 alnsn }
1547 1.1 alnsn
1548 1.1 alnsn return rv;
1549 1.1 alnsn }
1550 1.1 alnsn
1551 1.1 alnsn /*
1552 1.1 alnsn * Convert BPF_K and BPF_X to sljit register.
1553 1.1 alnsn */
1554 1.1 alnsn static int
1555 1.7 alnsn kx_to_reg(const struct bpf_insn *pc)
1556 1.1 alnsn {
1557 1.1 alnsn
1558 1.1 alnsn switch (BPF_SRC(pc->code)) {
1559 1.1 alnsn case BPF_K: return SLJIT_IMM;
1560 1.7 alnsn case BPF_X: return BJ_XREG;
1561 1.1 alnsn default:
1562 1.7 alnsn BJ_ASSERT(false);
1563 1.1 alnsn return 0;
1564 1.1 alnsn }
1565 1.1 alnsn }
1566 1.1 alnsn
1567 1.12 alnsn static sljit_sw
1568 1.7 alnsn kx_to_reg_arg(const struct bpf_insn *pc)
1569 1.1 alnsn {
1570 1.1 alnsn
1571 1.1 alnsn switch (BPF_SRC(pc->code)) {
1572 1.1 alnsn case BPF_K: return (uint32_t)pc->k; /* SLJIT_IMM, pc->k, */
1573 1.7 alnsn case BPF_X: return 0; /* BJ_XREG, 0, */
1574 1.1 alnsn default:
1575 1.7 alnsn BJ_ASSERT(false);
1576 1.1 alnsn return 0;
1577 1.1 alnsn }
1578 1.1 alnsn }
1579 1.1 alnsn
1580 1.19 alnsn static bool
1581 1.19 alnsn generate_insn_code(struct sljit_compiler *compiler, const bpf_ctx_t *bc,
1582 1.19 alnsn const struct bpf_insn *insns, struct bpfjit_insn_data *insn_dat,
1583 1.19 alnsn size_t insn_count)
1584 1.1 alnsn {
1585 1.1 alnsn /* a list of jumps to out-of-bound return from a generated function */
1586 1.1 alnsn struct sljit_jump **ret0;
1587 1.7 alnsn size_t ret0_size, ret0_maxsize;
1588 1.1 alnsn
1589 1.19 alnsn struct sljit_jump *jump;
1590 1.19 alnsn struct sljit_label *label;
1591 1.7 alnsn const struct bpf_insn *pc;
1592 1.1 alnsn struct bpfjit_jump *bjump, *jtf;
1593 1.1 alnsn struct sljit_jump *to_mchain_jump;
1594 1.1 alnsn
1595 1.19 alnsn size_t i;
1596 1.19 alnsn int status;
1597 1.19 alnsn int branching, negate;
1598 1.19 alnsn unsigned int rval, mode, src;
1599 1.1 alnsn uint32_t jt, jf;
1600 1.1 alnsn
1601 1.19 alnsn bool unconditional_ret;
1602 1.19 alnsn bool rv;
1603 1.19 alnsn
1604 1.19 alnsn const size_t extwords = GET_EXTWORDS(bc);
1605 1.19 alnsn const size_t memwords = GET_MEMWORDS(bc);
1606 1.13 alnsn
1607 1.13 alnsn ret0 = NULL;
1608 1.19 alnsn rv = false;
1609 1.7 alnsn
1610 1.1 alnsn ret0_size = 0;
1611 1.7 alnsn ret0_maxsize = 64;
1612 1.7 alnsn ret0 = BJ_ALLOC(ret0_maxsize * sizeof(ret0[0]));
1613 1.7 alnsn if (ret0 == NULL)
1614 1.1 alnsn goto fail;
1615 1.1 alnsn
1616 1.24 alnsn /* reset sjump members of jdata */
1617 1.24 alnsn for (i = 0; i < insn_count; i++) {
1618 1.24 alnsn if (insn_dat[i].unreachable ||
1619 1.24 alnsn BPF_CLASS(insns[i].code) != BPF_JMP) {
1620 1.24 alnsn continue;
1621 1.24 alnsn }
1622 1.24 alnsn
1623 1.24 alnsn jtf = insn_dat[i].u.jdata.jtf;
1624 1.24 alnsn jtf[0].sjump = jtf[1].sjump = NULL;
1625 1.24 alnsn }
1626 1.24 alnsn
1627 1.24 alnsn /* main loop */
1628 1.1 alnsn for (i = 0; i < insn_count; i++) {
1629 1.7 alnsn if (insn_dat[i].unreachable)
1630 1.1 alnsn continue;
1631 1.1 alnsn
1632 1.1 alnsn /*
1633 1.1 alnsn * Resolve jumps to the current insn.
1634 1.1 alnsn */
1635 1.1 alnsn label = NULL;
1636 1.7 alnsn SLIST_FOREACH(bjump, &insn_dat[i].bjumps, entries) {
1637 1.7 alnsn if (bjump->sjump != NULL) {
1638 1.1 alnsn if (label == NULL)
1639 1.1 alnsn label = sljit_emit_label(compiler);
1640 1.1 alnsn if (label == NULL)
1641 1.1 alnsn goto fail;
1642 1.7 alnsn sljit_set_label(bjump->sjump, label);
1643 1.1 alnsn }
1644 1.1 alnsn }
1645 1.1 alnsn
1646 1.9 alnsn to_mchain_jump = NULL;
1647 1.9 alnsn unconditional_ret = false;
1648 1.9 alnsn
1649 1.9 alnsn if (read_pkt_insn(&insns[i], NULL)) {
1650 1.9 alnsn if (insn_dat[i].u.rdata.check_length > UINT32_MAX) {
1651 1.9 alnsn /* Jump to "return 0" unconditionally. */
1652 1.9 alnsn unconditional_ret = true;
1653 1.9 alnsn jump = sljit_emit_jump(compiler, SLJIT_JUMP);
1654 1.9 alnsn if (jump == NULL)
1655 1.9 alnsn goto fail;
1656 1.9 alnsn if (!append_jump(jump, &ret0,
1657 1.9 alnsn &ret0_size, &ret0_maxsize))
1658 1.9 alnsn goto fail;
1659 1.9 alnsn } else if (insn_dat[i].u.rdata.check_length > 0) {
1660 1.9 alnsn /* if (buflen < check_length) return 0; */
1661 1.9 alnsn jump = sljit_emit_cmp(compiler,
1662 1.9 alnsn SLJIT_C_LESS,
1663 1.9 alnsn BJ_BUFLEN, 0,
1664 1.9 alnsn SLJIT_IMM,
1665 1.9 alnsn insn_dat[i].u.rdata.check_length);
1666 1.9 alnsn if (jump == NULL)
1667 1.9 alnsn goto fail;
1668 1.1 alnsn #ifdef _KERNEL
1669 1.9 alnsn to_mchain_jump = jump;
1670 1.1 alnsn #else
1671 1.9 alnsn if (!append_jump(jump, &ret0,
1672 1.9 alnsn &ret0_size, &ret0_maxsize))
1673 1.9 alnsn goto fail;
1674 1.1 alnsn #endif
1675 1.9 alnsn }
1676 1.1 alnsn }
1677 1.1 alnsn
1678 1.1 alnsn pc = &insns[i];
1679 1.1 alnsn switch (BPF_CLASS(pc->code)) {
1680 1.1 alnsn
1681 1.1 alnsn default:
1682 1.1 alnsn goto fail;
1683 1.1 alnsn
1684 1.1 alnsn case BPF_LD:
1685 1.1 alnsn /* BPF_LD+BPF_IMM A <- k */
1686 1.1 alnsn if (pc->code == (BPF_LD|BPF_IMM)) {
1687 1.1 alnsn status = sljit_emit_op1(compiler,
1688 1.1 alnsn SLJIT_MOV,
1689 1.7 alnsn BJ_AREG, 0,
1690 1.1 alnsn SLJIT_IMM, (uint32_t)pc->k);
1691 1.1 alnsn if (status != SLJIT_SUCCESS)
1692 1.1 alnsn goto fail;
1693 1.1 alnsn
1694 1.1 alnsn continue;
1695 1.1 alnsn }
1696 1.1 alnsn
1697 1.1 alnsn /* BPF_LD+BPF_MEM A <- M[k] */
1698 1.1 alnsn if (pc->code == (BPF_LD|BPF_MEM)) {
1699 1.13 alnsn if ((uint32_t)pc->k >= memwords)
1700 1.1 alnsn goto fail;
1701 1.13 alnsn status = emit_memload(compiler,
1702 1.13 alnsn BJ_AREG, pc->k, extwords);
1703 1.1 alnsn if (status != SLJIT_SUCCESS)
1704 1.1 alnsn goto fail;
1705 1.1 alnsn
1706 1.1 alnsn continue;
1707 1.1 alnsn }
1708 1.1 alnsn
1709 1.1 alnsn /* BPF_LD+BPF_W+BPF_LEN A <- len */
1710 1.1 alnsn if (pc->code == (BPF_LD|BPF_W|BPF_LEN)) {
1711 1.1 alnsn status = sljit_emit_op1(compiler,
1712 1.21 alnsn SLJIT_MOV, /* size_t source */
1713 1.7 alnsn BJ_AREG, 0,
1714 1.13 alnsn SLJIT_MEM1(BJ_ARGS),
1715 1.13 alnsn offsetof(struct bpf_args, wirelen));
1716 1.1 alnsn if (status != SLJIT_SUCCESS)
1717 1.1 alnsn goto fail;
1718 1.1 alnsn
1719 1.1 alnsn continue;
1720 1.1 alnsn }
1721 1.1 alnsn
1722 1.1 alnsn mode = BPF_MODE(pc->code);
1723 1.1 alnsn if (mode != BPF_ABS && mode != BPF_IND)
1724 1.1 alnsn goto fail;
1725 1.1 alnsn
1726 1.9 alnsn if (unconditional_ret)
1727 1.9 alnsn continue;
1728 1.9 alnsn
1729 1.1 alnsn status = emit_pkt_read(compiler, pc,
1730 1.7 alnsn to_mchain_jump, &ret0, &ret0_size, &ret0_maxsize);
1731 1.1 alnsn if (status != SLJIT_SUCCESS)
1732 1.1 alnsn goto fail;
1733 1.1 alnsn
1734 1.1 alnsn continue;
1735 1.1 alnsn
1736 1.1 alnsn case BPF_LDX:
1737 1.1 alnsn mode = BPF_MODE(pc->code);
1738 1.1 alnsn
1739 1.1 alnsn /* BPF_LDX+BPF_W+BPF_IMM X <- k */
1740 1.1 alnsn if (mode == BPF_IMM) {
1741 1.1 alnsn if (BPF_SIZE(pc->code) != BPF_W)
1742 1.1 alnsn goto fail;
1743 1.1 alnsn status = sljit_emit_op1(compiler,
1744 1.1 alnsn SLJIT_MOV,
1745 1.7 alnsn BJ_XREG, 0,
1746 1.1 alnsn SLJIT_IMM, (uint32_t)pc->k);
1747 1.1 alnsn if (status != SLJIT_SUCCESS)
1748 1.1 alnsn goto fail;
1749 1.1 alnsn
1750 1.1 alnsn continue;
1751 1.1 alnsn }
1752 1.1 alnsn
1753 1.1 alnsn /* BPF_LDX+BPF_W+BPF_LEN X <- len */
1754 1.1 alnsn if (mode == BPF_LEN) {
1755 1.1 alnsn if (BPF_SIZE(pc->code) != BPF_W)
1756 1.1 alnsn goto fail;
1757 1.1 alnsn status = sljit_emit_op1(compiler,
1758 1.21 alnsn SLJIT_MOV, /* size_t source */
1759 1.7 alnsn BJ_XREG, 0,
1760 1.13 alnsn SLJIT_MEM1(BJ_ARGS),
1761 1.13 alnsn offsetof(struct bpf_args, wirelen));
1762 1.1 alnsn if (status != SLJIT_SUCCESS)
1763 1.1 alnsn goto fail;
1764 1.1 alnsn
1765 1.1 alnsn continue;
1766 1.1 alnsn }
1767 1.1 alnsn
1768 1.1 alnsn /* BPF_LDX+BPF_W+BPF_MEM X <- M[k] */
1769 1.1 alnsn if (mode == BPF_MEM) {
1770 1.1 alnsn if (BPF_SIZE(pc->code) != BPF_W)
1771 1.1 alnsn goto fail;
1772 1.13 alnsn if ((uint32_t)pc->k >= memwords)
1773 1.1 alnsn goto fail;
1774 1.13 alnsn status = emit_memload(compiler,
1775 1.13 alnsn BJ_XREG, pc->k, extwords);
1776 1.1 alnsn if (status != SLJIT_SUCCESS)
1777 1.1 alnsn goto fail;
1778 1.1 alnsn
1779 1.1 alnsn continue;
1780 1.1 alnsn }
1781 1.1 alnsn
1782 1.1 alnsn /* BPF_LDX+BPF_B+BPF_MSH X <- 4*(P[k:1]&0xf) */
1783 1.1 alnsn if (mode != BPF_MSH || BPF_SIZE(pc->code) != BPF_B)
1784 1.1 alnsn goto fail;
1785 1.1 alnsn
1786 1.9 alnsn if (unconditional_ret)
1787 1.9 alnsn continue;
1788 1.9 alnsn
1789 1.1 alnsn status = emit_msh(compiler, pc,
1790 1.7 alnsn to_mchain_jump, &ret0, &ret0_size, &ret0_maxsize);
1791 1.1 alnsn if (status != SLJIT_SUCCESS)
1792 1.1 alnsn goto fail;
1793 1.1 alnsn
1794 1.1 alnsn continue;
1795 1.1 alnsn
1796 1.1 alnsn case BPF_ST:
1797 1.8 alnsn if (pc->code != BPF_ST ||
1798 1.13 alnsn (uint32_t)pc->k >= memwords) {
1799 1.1 alnsn goto fail;
1800 1.8 alnsn }
1801 1.1 alnsn
1802 1.13 alnsn status = emit_memstore(compiler,
1803 1.13 alnsn BJ_AREG, pc->k, extwords);
1804 1.1 alnsn if (status != SLJIT_SUCCESS)
1805 1.1 alnsn goto fail;
1806 1.1 alnsn
1807 1.1 alnsn continue;
1808 1.1 alnsn
1809 1.1 alnsn case BPF_STX:
1810 1.8 alnsn if (pc->code != BPF_STX ||
1811 1.13 alnsn (uint32_t)pc->k >= memwords) {
1812 1.1 alnsn goto fail;
1813 1.8 alnsn }
1814 1.1 alnsn
1815 1.13 alnsn status = emit_memstore(compiler,
1816 1.13 alnsn BJ_XREG, pc->k, extwords);
1817 1.1 alnsn if (status != SLJIT_SUCCESS)
1818 1.1 alnsn goto fail;
1819 1.1 alnsn
1820 1.1 alnsn continue;
1821 1.1 alnsn
1822 1.1 alnsn case BPF_ALU:
1823 1.1 alnsn if (pc->code == (BPF_ALU|BPF_NEG)) {
1824 1.1 alnsn status = sljit_emit_op1(compiler,
1825 1.1 alnsn SLJIT_NEG,
1826 1.7 alnsn BJ_AREG, 0,
1827 1.7 alnsn BJ_AREG, 0);
1828 1.1 alnsn if (status != SLJIT_SUCCESS)
1829 1.1 alnsn goto fail;
1830 1.1 alnsn
1831 1.1 alnsn continue;
1832 1.1 alnsn }
1833 1.1 alnsn
1834 1.1 alnsn if (BPF_OP(pc->code) != BPF_DIV) {
1835 1.1 alnsn status = sljit_emit_op2(compiler,
1836 1.1 alnsn bpf_alu_to_sljit_op(pc),
1837 1.7 alnsn BJ_AREG, 0,
1838 1.7 alnsn BJ_AREG, 0,
1839 1.1 alnsn kx_to_reg(pc), kx_to_reg_arg(pc));
1840 1.1 alnsn if (status != SLJIT_SUCCESS)
1841 1.1 alnsn goto fail;
1842 1.1 alnsn
1843 1.1 alnsn continue;
1844 1.1 alnsn }
1845 1.1 alnsn
1846 1.1 alnsn /* BPF_DIV */
1847 1.1 alnsn
1848 1.1 alnsn src = BPF_SRC(pc->code);
1849 1.1 alnsn if (src != BPF_X && src != BPF_K)
1850 1.1 alnsn goto fail;
1851 1.1 alnsn
1852 1.1 alnsn /* division by zero? */
1853 1.1 alnsn if (src == BPF_X) {
1854 1.1 alnsn jump = sljit_emit_cmp(compiler,
1855 1.1 alnsn SLJIT_C_EQUAL|SLJIT_INT_OP,
1856 1.8 alnsn BJ_XREG, 0,
1857 1.1 alnsn SLJIT_IMM, 0);
1858 1.1 alnsn if (jump == NULL)
1859 1.1 alnsn goto fail;
1860 1.7 alnsn if (!append_jump(jump, &ret0,
1861 1.7 alnsn &ret0_size, &ret0_maxsize))
1862 1.7 alnsn goto fail;
1863 1.1 alnsn } else if (pc->k == 0) {
1864 1.1 alnsn jump = sljit_emit_jump(compiler, SLJIT_JUMP);
1865 1.1 alnsn if (jump == NULL)
1866 1.1 alnsn goto fail;
1867 1.7 alnsn if (!append_jump(jump, &ret0,
1868 1.7 alnsn &ret0_size, &ret0_maxsize))
1869 1.7 alnsn goto fail;
1870 1.1 alnsn }
1871 1.1 alnsn
1872 1.1 alnsn if (src == BPF_X) {
1873 1.7 alnsn status = emit_division(compiler, BJ_XREG, 0);
1874 1.1 alnsn if (status != SLJIT_SUCCESS)
1875 1.1 alnsn goto fail;
1876 1.1 alnsn } else if (pc->k != 0) {
1877 1.1 alnsn if (pc->k & (pc->k - 1)) {
1878 1.1 alnsn status = emit_division(compiler,
1879 1.1 alnsn SLJIT_IMM, (uint32_t)pc->k);
1880 1.1 alnsn } else {
1881 1.7 alnsn status = emit_pow2_division(compiler,
1882 1.1 alnsn (uint32_t)pc->k);
1883 1.1 alnsn }
1884 1.1 alnsn if (status != SLJIT_SUCCESS)
1885 1.1 alnsn goto fail;
1886 1.1 alnsn }
1887 1.1 alnsn
1888 1.1 alnsn continue;
1889 1.1 alnsn
1890 1.1 alnsn case BPF_JMP:
1891 1.7 alnsn if (BPF_OP(pc->code) == BPF_JA) {
1892 1.1 alnsn jt = jf = pc->k;
1893 1.1 alnsn } else {
1894 1.1 alnsn jt = pc->jt;
1895 1.1 alnsn jf = pc->jf;
1896 1.1 alnsn }
1897 1.1 alnsn
1898 1.1 alnsn negate = (jt == 0) ? 1 : 0;
1899 1.1 alnsn branching = (jt == jf) ? 0 : 1;
1900 1.7 alnsn jtf = insn_dat[i].u.jdata.jtf;
1901 1.1 alnsn
1902 1.1 alnsn if (branching) {
1903 1.1 alnsn if (BPF_OP(pc->code) != BPF_JSET) {
1904 1.1 alnsn jump = sljit_emit_cmp(compiler,
1905 1.1 alnsn bpf_jmp_to_sljit_cond(pc, negate),
1906 1.7 alnsn BJ_AREG, 0,
1907 1.1 alnsn kx_to_reg(pc), kx_to_reg_arg(pc));
1908 1.1 alnsn } else {
1909 1.1 alnsn status = sljit_emit_op2(compiler,
1910 1.1 alnsn SLJIT_AND,
1911 1.7 alnsn BJ_TMP1REG, 0,
1912 1.7 alnsn BJ_AREG, 0,
1913 1.1 alnsn kx_to_reg(pc), kx_to_reg_arg(pc));
1914 1.1 alnsn if (status != SLJIT_SUCCESS)
1915 1.1 alnsn goto fail;
1916 1.1 alnsn
1917 1.1 alnsn jump = sljit_emit_cmp(compiler,
1918 1.1 alnsn bpf_jmp_to_sljit_cond(pc, negate),
1919 1.7 alnsn BJ_TMP1REG, 0,
1920 1.1 alnsn SLJIT_IMM, 0);
1921 1.1 alnsn }
1922 1.1 alnsn
1923 1.1 alnsn if (jump == NULL)
1924 1.1 alnsn goto fail;
1925 1.1 alnsn
1926 1.7 alnsn BJ_ASSERT(jtf[negate].sjump == NULL);
1927 1.7 alnsn jtf[negate].sjump = jump;
1928 1.1 alnsn }
1929 1.1 alnsn
1930 1.1 alnsn if (!branching || (jt != 0 && jf != 0)) {
1931 1.1 alnsn jump = sljit_emit_jump(compiler, SLJIT_JUMP);
1932 1.1 alnsn if (jump == NULL)
1933 1.1 alnsn goto fail;
1934 1.1 alnsn
1935 1.7 alnsn BJ_ASSERT(jtf[branching].sjump == NULL);
1936 1.7 alnsn jtf[branching].sjump = jump;
1937 1.1 alnsn }
1938 1.1 alnsn
1939 1.1 alnsn continue;
1940 1.1 alnsn
1941 1.1 alnsn case BPF_RET:
1942 1.1 alnsn rval = BPF_RVAL(pc->code);
1943 1.1 alnsn if (rval == BPF_X)
1944 1.1 alnsn goto fail;
1945 1.1 alnsn
1946 1.1 alnsn /* BPF_RET+BPF_K accept k bytes */
1947 1.1 alnsn if (rval == BPF_K) {
1948 1.7 alnsn status = sljit_emit_return(compiler,
1949 1.7 alnsn SLJIT_MOV_UI,
1950 1.1 alnsn SLJIT_IMM, (uint32_t)pc->k);
1951 1.1 alnsn if (status != SLJIT_SUCCESS)
1952 1.1 alnsn goto fail;
1953 1.1 alnsn }
1954 1.1 alnsn
1955 1.1 alnsn /* BPF_RET+BPF_A accept A bytes */
1956 1.1 alnsn if (rval == BPF_A) {
1957 1.7 alnsn status = sljit_emit_return(compiler,
1958 1.7 alnsn SLJIT_MOV_UI,
1959 1.7 alnsn BJ_AREG, 0);
1960 1.1 alnsn if (status != SLJIT_SUCCESS)
1961 1.1 alnsn goto fail;
1962 1.1 alnsn }
1963 1.1 alnsn
1964 1.1 alnsn continue;
1965 1.1 alnsn
1966 1.1 alnsn case BPF_MISC:
1967 1.7 alnsn switch (BPF_MISCOP(pc->code)) {
1968 1.7 alnsn case BPF_TAX:
1969 1.1 alnsn status = sljit_emit_op1(compiler,
1970 1.1 alnsn SLJIT_MOV_UI,
1971 1.7 alnsn BJ_XREG, 0,
1972 1.7 alnsn BJ_AREG, 0);
1973 1.1 alnsn if (status != SLJIT_SUCCESS)
1974 1.1 alnsn goto fail;
1975 1.1 alnsn
1976 1.1 alnsn continue;
1977 1.1 alnsn
1978 1.7 alnsn case BPF_TXA:
1979 1.1 alnsn status = sljit_emit_op1(compiler,
1980 1.1 alnsn SLJIT_MOV,
1981 1.7 alnsn BJ_AREG, 0,
1982 1.7 alnsn BJ_XREG, 0);
1983 1.1 alnsn if (status != SLJIT_SUCCESS)
1984 1.1 alnsn goto fail;
1985 1.1 alnsn
1986 1.1 alnsn continue;
1987 1.13 alnsn
1988 1.13 alnsn case BPF_COP:
1989 1.13 alnsn case BPF_COPX:
1990 1.13 alnsn if (bc == NULL || bc->copfuncs == NULL)
1991 1.13 alnsn goto fail;
1992 1.13 alnsn if (BPF_MISCOP(pc->code) == BPF_COP &&
1993 1.13 alnsn (uint32_t)pc->k >= bc->nfuncs) {
1994 1.13 alnsn goto fail;
1995 1.13 alnsn }
1996 1.13 alnsn
1997 1.28 alnsn status = emit_cop(compiler, bc, pc,
1998 1.28 alnsn &ret0, &ret0_size, &ret0_maxsize);
1999 1.13 alnsn if (status != SLJIT_SUCCESS)
2000 1.13 alnsn goto fail;
2001 1.13 alnsn
2002 1.13 alnsn continue;
2003 1.1 alnsn }
2004 1.1 alnsn
2005 1.1 alnsn goto fail;
2006 1.1 alnsn } /* switch */
2007 1.1 alnsn } /* main loop */
2008 1.1 alnsn
2009 1.7 alnsn BJ_ASSERT(ret0_size <= ret0_maxsize);
2010 1.1 alnsn
2011 1.7 alnsn if (ret0_size > 0) {
2012 1.1 alnsn label = sljit_emit_label(compiler);
2013 1.1 alnsn if (label == NULL)
2014 1.1 alnsn goto fail;
2015 1.7 alnsn for (i = 0; i < ret0_size; i++)
2016 1.7 alnsn sljit_set_label(ret0[i], label);
2017 1.1 alnsn }
2018 1.1 alnsn
2019 1.23 alnsn status = sljit_emit_return(compiler,
2020 1.23 alnsn SLJIT_MOV_UI,
2021 1.23 alnsn SLJIT_IMM, 0);
2022 1.23 alnsn if (status != SLJIT_SUCCESS)
2023 1.23 alnsn goto fail;
2024 1.23 alnsn
2025 1.19 alnsn rv = true;
2026 1.19 alnsn
2027 1.19 alnsn fail:
2028 1.19 alnsn if (ret0 != NULL)
2029 1.19 alnsn BJ_FREE(ret0, ret0_maxsize * sizeof(ret0[0]));
2030 1.19 alnsn
2031 1.19 alnsn return rv;
2032 1.19 alnsn }
2033 1.19 alnsn
2034 1.19 alnsn bpfjit_func_t
2035 1.19 alnsn bpfjit_generate_code(const bpf_ctx_t *bc,
2036 1.19 alnsn const struct bpf_insn *insns, size_t insn_count)
2037 1.19 alnsn {
2038 1.19 alnsn void *rv;
2039 1.19 alnsn struct sljit_compiler *compiler;
2040 1.19 alnsn
2041 1.19 alnsn size_t i;
2042 1.19 alnsn int status;
2043 1.19 alnsn
2044 1.19 alnsn /* optimization related */
2045 1.19 alnsn bpf_memword_init_t initmask;
2046 1.20 alnsn bpfjit_hint_t hints;
2047 1.19 alnsn
2048 1.19 alnsn /* memory store location for initial zero initialization */
2049 1.19 alnsn sljit_si mem_reg;
2050 1.19 alnsn sljit_sw mem_off;
2051 1.19 alnsn
2052 1.19 alnsn struct bpfjit_insn_data *insn_dat;
2053 1.19 alnsn
2054 1.19 alnsn const size_t extwords = GET_EXTWORDS(bc);
2055 1.19 alnsn const size_t memwords = GET_MEMWORDS(bc);
2056 1.19 alnsn const bpf_memword_init_t preinited = extwords ? bc->preinited : 0;
2057 1.19 alnsn
2058 1.19 alnsn rv = NULL;
2059 1.19 alnsn compiler = NULL;
2060 1.19 alnsn insn_dat = NULL;
2061 1.19 alnsn
2062 1.19 alnsn if (memwords > MAX_MEMWORDS)
2063 1.19 alnsn goto fail;
2064 1.19 alnsn
2065 1.19 alnsn if (insn_count == 0 || insn_count > SIZE_MAX / sizeof(insn_dat[0]))
2066 1.19 alnsn goto fail;
2067 1.19 alnsn
2068 1.19 alnsn insn_dat = BJ_ALLOC(insn_count * sizeof(insn_dat[0]));
2069 1.19 alnsn if (insn_dat == NULL)
2070 1.19 alnsn goto fail;
2071 1.19 alnsn
2072 1.20 alnsn if (!optimize(bc, insns, insn_dat, insn_count, &initmask, &hints))
2073 1.19 alnsn goto fail;
2074 1.19 alnsn
2075 1.19 alnsn compiler = sljit_create_compiler();
2076 1.19 alnsn if (compiler == NULL)
2077 1.19 alnsn goto fail;
2078 1.19 alnsn
2079 1.19 alnsn #if !defined(_KERNEL) && defined(SLJIT_VERBOSE) && SLJIT_VERBOSE
2080 1.19 alnsn sljit_compiler_verbose(compiler, stderr);
2081 1.19 alnsn #endif
2082 1.19 alnsn
2083 1.30 alnsn status = sljit_emit_enter(compiler,
2084 1.30 alnsn 2, nscratches(hints), nsaveds(hints), sizeof(struct bpfjit_stack));
2085 1.19 alnsn if (status != SLJIT_SUCCESS)
2086 1.19 alnsn goto fail;
2087 1.19 alnsn
2088 1.20 alnsn if (hints & BJ_HINT_COP) {
2089 1.19 alnsn /* save ctx argument */
2090 1.19 alnsn status = sljit_emit_op1(compiler,
2091 1.19 alnsn SLJIT_MOV_P,
2092 1.19 alnsn SLJIT_MEM1(SLJIT_LOCALS_REG),
2093 1.19 alnsn offsetof(struct bpfjit_stack, ctx),
2094 1.19 alnsn BJ_CTX_ARG, 0);
2095 1.19 alnsn if (status != SLJIT_SUCCESS)
2096 1.19 alnsn goto fail;
2097 1.19 alnsn }
2098 1.19 alnsn
2099 1.19 alnsn if (extwords == 0) {
2100 1.19 alnsn mem_reg = SLJIT_MEM1(SLJIT_LOCALS_REG);
2101 1.19 alnsn mem_off = offsetof(struct bpfjit_stack, mem);
2102 1.19 alnsn } else {
2103 1.19 alnsn /* copy "mem" argument from bpf_args to bpfjit_stack */
2104 1.19 alnsn status = sljit_emit_op1(compiler,
2105 1.19 alnsn SLJIT_MOV_P,
2106 1.19 alnsn BJ_TMP1REG, 0,
2107 1.19 alnsn SLJIT_MEM1(BJ_ARGS), offsetof(struct bpf_args, mem));
2108 1.19 alnsn if (status != SLJIT_SUCCESS)
2109 1.19 alnsn goto fail;
2110 1.19 alnsn
2111 1.19 alnsn status = sljit_emit_op1(compiler,
2112 1.19 alnsn SLJIT_MOV_P,
2113 1.19 alnsn SLJIT_MEM1(SLJIT_LOCALS_REG),
2114 1.19 alnsn offsetof(struct bpfjit_stack, extmem),
2115 1.19 alnsn BJ_TMP1REG, 0);
2116 1.19 alnsn if (status != SLJIT_SUCCESS)
2117 1.19 alnsn goto fail;
2118 1.19 alnsn
2119 1.19 alnsn mem_reg = SLJIT_MEM1(BJ_TMP1REG);
2120 1.19 alnsn mem_off = 0;
2121 1.19 alnsn }
2122 1.19 alnsn
2123 1.19 alnsn /*
2124 1.19 alnsn * Exclude pre-initialised external memory words but keep
2125 1.19 alnsn * initialization statuses of A and X registers in case
2126 1.19 alnsn * bc->preinited wrongly sets those two bits.
2127 1.19 alnsn */
2128 1.19 alnsn initmask &= ~preinited | BJ_INIT_ABIT | BJ_INIT_XBIT;
2129 1.19 alnsn
2130 1.19 alnsn #if defined(_KERNEL)
2131 1.19 alnsn /* bpf_filter() checks initialization of memwords. */
2132 1.19 alnsn BJ_ASSERT((initmask & (BJ_INIT_MBIT(memwords) - 1)) == 0);
2133 1.19 alnsn #endif
2134 1.19 alnsn for (i = 0; i < memwords; i++) {
2135 1.19 alnsn if (initmask & BJ_INIT_MBIT(i)) {
2136 1.19 alnsn /* M[i] = 0; */
2137 1.19 alnsn status = sljit_emit_op1(compiler,
2138 1.19 alnsn SLJIT_MOV_UI,
2139 1.19 alnsn mem_reg, mem_off + i * sizeof(uint32_t),
2140 1.19 alnsn SLJIT_IMM, 0);
2141 1.19 alnsn if (status != SLJIT_SUCCESS)
2142 1.19 alnsn goto fail;
2143 1.19 alnsn }
2144 1.19 alnsn }
2145 1.19 alnsn
2146 1.19 alnsn if (initmask & BJ_INIT_ABIT) {
2147 1.19 alnsn /* A = 0; */
2148 1.19 alnsn status = sljit_emit_op1(compiler,
2149 1.19 alnsn SLJIT_MOV,
2150 1.19 alnsn BJ_AREG, 0,
2151 1.19 alnsn SLJIT_IMM, 0);
2152 1.19 alnsn if (status != SLJIT_SUCCESS)
2153 1.19 alnsn goto fail;
2154 1.19 alnsn }
2155 1.19 alnsn
2156 1.19 alnsn if (initmask & BJ_INIT_XBIT) {
2157 1.19 alnsn /* X = 0; */
2158 1.19 alnsn status = sljit_emit_op1(compiler,
2159 1.19 alnsn SLJIT_MOV,
2160 1.19 alnsn BJ_XREG, 0,
2161 1.19 alnsn SLJIT_IMM, 0);
2162 1.19 alnsn if (status != SLJIT_SUCCESS)
2163 1.19 alnsn goto fail;
2164 1.19 alnsn }
2165 1.19 alnsn
2166 1.19 alnsn status = load_buf_buflen(compiler);
2167 1.19 alnsn if (status != SLJIT_SUCCESS)
2168 1.19 alnsn goto fail;
2169 1.19 alnsn
2170 1.19 alnsn if (!generate_insn_code(compiler, bc, insns, insn_dat, insn_count))
2171 1.19 alnsn goto fail;
2172 1.19 alnsn
2173 1.1 alnsn rv = sljit_generate_code(compiler);
2174 1.1 alnsn
2175 1.1 alnsn fail:
2176 1.1 alnsn if (compiler != NULL)
2177 1.1 alnsn sljit_free_compiler(compiler);
2178 1.1 alnsn
2179 1.1 alnsn if (insn_dat != NULL)
2180 1.7 alnsn BJ_FREE(insn_dat, insn_count * sizeof(insn_dat[0]));
2181 1.1 alnsn
2182 1.4 rmind return (bpfjit_func_t)rv;
2183 1.1 alnsn }
2184 1.1 alnsn
2185 1.1 alnsn void
2186 1.4 rmind bpfjit_free_code(bpfjit_func_t code)
2187 1.1 alnsn {
2188 1.7 alnsn
2189 1.1 alnsn sljit_free_code((void *)code);
2190 1.1 alnsn }
2191