emul.c revision 1.201 1 1.201 riastrad /* $NetBSD: emul.c,v 1.201 2023/10/15 11:11:37 riastradh Exp $ */
2 1.1 pooka
3 1.1 pooka /*
4 1.150 pooka * Copyright (c) 2007-2011 Antti Kantee. All Rights Reserved.
5 1.1 pooka *
6 1.1 pooka * Redistribution and use in source and binary forms, with or without
7 1.1 pooka * modification, are permitted provided that the following conditions
8 1.1 pooka * are met:
9 1.1 pooka * 1. Redistributions of source code must retain the above copyright
10 1.1 pooka * notice, this list of conditions and the following disclaimer.
11 1.1 pooka * 2. Redistributions in binary form must reproduce the above copyright
12 1.1 pooka * notice, this list of conditions and the following disclaimer in the
13 1.1 pooka * documentation and/or other materials provided with the distribution.
14 1.1 pooka *
15 1.1 pooka * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
16 1.1 pooka * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
17 1.1 pooka * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18 1.1 pooka * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19 1.1 pooka * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20 1.1 pooka * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
21 1.1 pooka * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22 1.1 pooka * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23 1.1 pooka * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24 1.1 pooka * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25 1.1 pooka * SUCH DAMAGE.
26 1.1 pooka */
27 1.1 pooka
28 1.61 pooka #include <sys/cdefs.h>
29 1.201 riastrad __KERNEL_RCSID(0, "$NetBSD: emul.c,v 1.201 2023/10/15 11:11:37 riastradh Exp $");
30 1.9 pooka
31 1.1 pooka #include <sys/param.h>
32 1.176 pooka #include <sys/cprng.h>
33 1.176 pooka #include <sys/filedesc.h>
34 1.181 hannken #include <sys/fstrans.h>
35 1.1 pooka #include <sys/kauth.h>
36 1.66 pooka #include <sys/module.h>
37 1.67 pooka #include <sys/reboot.h>
38 1.154 pooka #include <sys/syscall.h>
39 1.185 ozaki #include <sys/pserialize.h>
40 1.178 ozaki #ifdef LOCKDEBUG
41 1.178 ozaki #include <sys/sleepq.h>
42 1.178 ozaki #endif
43 1.201 riastrad #include <sys/syncobj.h>
44 1.67 pooka
45 1.67 pooka #include <dev/cons.h>
46 1.1 pooka
47 1.179 pooka #include <rump-sys/kern.h>
48 1.179 pooka
49 1.44 pooka #include <rump/rumpuser.h>
50 1.44 pooka
51 1.165 pooka void (*rump_vfs_fini)(void) = (void *)nullop;
52 1.165 pooka
53 1.149 pooka /*
54 1.149 pooka * physmem is largely unused (except for nmbcluster calculations),
55 1.149 pooka * so pick a default value which suits ZFS. if an application wants
56 1.149 pooka * a very small memory footprint, it can still adjust this before
57 1.149 pooka * calling rump_init()
58 1.149 pooka */
59 1.149 pooka #define PHYSMEM 512*256
60 1.180 cherry psize_t physmem = PHYSMEM;
61 1.197 skrll size_t nkmempages = PHYSMEM/2; /* from le chapeau */
62 1.149 pooka #undef PHYSMEM
63 1.149 pooka
64 1.1 pooka struct vnode *rootvp;
65 1.124 pooka dev_t rootdev = NODEV;
66 1.149 pooka
67 1.19 pooka const int schedppq = 1;
68 1.66 pooka int cold = 1;
69 1.195 thorpej int shutting_down;
70 1.95 pooka int boothowto = AB_SILENT;
71 1.67 pooka struct tty *constty;
72 1.1 pooka
/*
 * Block device switch: a static 255-entry table, the pointer through
 * which it is accessed, and the matching sys_/max_ counts.
 */
const struct bdevsw *bdevsw0[255];
const struct bdevsw **bdevsw = bdevsw0;
const int sys_bdevsws = 255;
int max_bdevsws = 255;

/*
 * Character device switch: same layout as the block device switch.
 */
const struct cdevsw *cdevsw0[255];
const struct cdevsw **cdevsw = cdevsw0;
const int sys_cdevsws = 255;
int max_cdevsws = 255;
82 1.64 pooka
83 1.76 pooka int mem_no = 2;
84 1.76 pooka
85 1.151 chs device_t booted_device;
86 1.151 chs device_t booted_wedge;
87 1.200 manu daddr_t booted_startblk;
88 1.200 manu uint64_t booted_nblks;
89 1.92 pooka int booted_partition;
90 1.183 christos const char *booted_method;
91 1.92 pooka
92 1.120 pooka /* XXX: unused */
93 1.76 pooka kmutex_t tty_lock;
94 1.120 pooka krwlock_t exec_lock;
95 1.64 pooka
/*
 * sparc does not have a compile-time constant page size, so pretend
 * that pages are 4k: shift 12, size 1 << 12, offset mask size - 1.
 */
#ifdef __sparc__
int pgshift = 12;
int nbpg = 1 << 12;
int pgofset = (1 << 12) - 1;
#endif
102 1.109 pooka
/*
 * On sun3 VM_MAX_ADDRESS is a const variable, so provide kernbase.
 * XXX: should this be moved into rump.c and initialised there for
 * both sun3 and sun3x?
 */
#ifdef sun3
const vaddr_t kernbase = KERNBASE3;
#endif
108 1.140 pooka
109 1.117 pooka struct loadavg averunnable = {
110 1.117 pooka { 0 * FSCALE,
111 1.117 pooka 1 * FSCALE,
112 1.117 pooka 11 * FSCALE, },
113 1.117 pooka FSCALE,
114 1.117 pooka };
115 1.117 pooka
116 1.174 pgoyette /*
117 1.174 pgoyette * Include the autogenerated list of auto-loadable syscalls
118 1.174 pgoyette */
119 1.174 pgoyette #include <kern/syscalls_autoload.c>
120 1.174 pgoyette
121 1.126 pooka struct emul emul_netbsd = {
122 1.126 pooka .e_name = "netbsd-rump",
123 1.126 pooka .e_sysent = rump_sysent,
124 1.186 pgoyette .e_nomodbits = rump_sysent_nomodbits,
125 1.154 pooka #ifndef __HAVE_MINIMAL_EMUL
126 1.154 pooka .e_nsysent = SYS_NSYSENT,
127 1.154 pooka #endif
128 1.128 pooka .e_vm_default_addr = uvm_default_mapaddr,
129 1.138 pooka #ifdef __HAVE_SYSCALL_INTERN
130 1.138 pooka .e_syscall_intern = syscall_intern,
131 1.138 pooka #endif
132 1.174 pgoyette .e_sc_autoload = netbsd_syscalls_autoload,
133 1.126 pooka };
134 1.126 pooka
135 1.164 pooka /* not used, but need the symbols for pointer comparisons */
136 1.164 pooka syncobj_t mutex_syncobj, rw_syncobj;
137 1.164 pooka
138 1.20 pooka int
139 1.20 pooka kpause(const char *wmesg, bool intr, int timeo, kmutex_t *mtx)
140 1.20 pooka {
141 1.20 pooka extern int hz;
142 1.166 justin int rv __diagused;
143 1.78 pooka uint64_t sec, nsec;
144 1.127 pooka
145 1.20 pooka if (mtx)
146 1.20 pooka mutex_exit(mtx);
147 1.40 pooka
148 1.78 pooka sec = timeo / hz;
149 1.78 pooka nsec = (timeo % hz) * (1000000000 / hz);
150 1.158 pooka rv = rumpuser_clock_sleep(RUMPUSER_CLOCK_RELWALL, sec, nsec);
151 1.156 pooka KASSERT(rv == 0);
152 1.156 pooka
153 1.20 pooka if (mtx)
154 1.20 pooka mutex_enter(mtx);
155 1.20 pooka
156 1.20 pooka return 0;
157 1.20 pooka }
158 1.27 pooka
159 1.34 yamt vaddr_t
160 1.155 para calc_cache_size(vsize_t vasz, int pct, int va_pct)
161 1.34 yamt {
162 1.34 yamt paddr_t t;
163 1.34 yamt
164 1.34 yamt t = (paddr_t)physmem * pct / 100 * PAGE_SIZE;
165 1.34 yamt if ((vaddr_t)t != t) {
166 1.34 yamt panic("%s: needs tweak", __func__);
167 1.34 yamt }
168 1.34 yamt return t;
169 1.34 yamt }
170 1.35 martin
/* Parenthesized so the cast binds as one operand wherever it is used. */
#define	RETURN_ADDRESS	((uintptr_t)__builtin_return_address(0))

/*
 * assert_sleepable: panic if the caller is not allowed to sleep.
 *
 * The only condition checked is pserialize_not_in_read_section(): if
 * it returns false we panic and report the caller's return address.
 * Every other context is treated as sleepable, although we should
 * improve this.
 */
void
assert_sleepable(void)
{

	if (pserialize_not_in_read_section())
		return;

	panic("%s: %s caller=%p", __func__, "pserialize",
	    (void *)RETURN_ADDRESS);
}
189 1.43 pooka
/*
 * module_init_md: machine-dependent module initialisation.
 *
 * Does nothing for now.  However, we should load the librump symbol
 * table here.
 */
void
module_init_md(void)
{

	return;
}
199 1.67 pooka
200 1.167 pooka /*
201 1.167 pooka * Try to emulate all the MD definitions of DELAY() / delay().
202 1.167 pooka * Would be nice to fix the #defines in MD headers, but this quicker.
203 1.168 pooka *
204 1.168 pooka * XXX: we'd need a rumpuser_clock_sleep_nowrap() here. Since we
205 1.168 pooka * don't have it in the current hypercall revision, busyloop.
206 1.168 pooka * Note that rather than calibrate a loop delay and work with that,
207 1.168 pooka * get call gettime (which does not block) in a loop to make sure
208 1.168 pooka * we didn't get virtual ghosttime. That might be slightly inaccurate
209 1.168 pooka * for very small delays ...
210 1.168 pooka *
211 1.168 pooka * The other option would be to run a thread in the hypervisor which
212 1.168 pooka * sleeps for us and we can wait for it using rumpuser_cv_wait_nowrap()
213 1.168 pooka * Probably too fussy. Better just wait for hypercall rev 18 ;)
214 1.167 pooka */
215 1.69 pooka static void
216 1.69 pooka rump_delay(unsigned int us)
217 1.67 pooka {
218 1.168 pooka struct timespec target, tmp;
219 1.168 pooka uint64_t sec, sec_ini, sec_now;
220 1.168 pooka long nsec, nsec_ini, nsec_now;
221 1.168 pooka int loops;
222 1.168 pooka
223 1.168 pooka rumpuser_clock_gettime(RUMPUSER_CLOCK_ABSMONO, &sec_ini, &nsec_ini);
224 1.67 pooka
225 1.167 pooka #ifdef __mac68k__
226 1.167 pooka sec = us / 1000;
227 1.167 pooka nsec = (us % 1000) * 1000000;
228 1.167 pooka #else
229 1.78 pooka sec = us / 1000000;
230 1.78 pooka nsec = (us % 1000000) * 1000;
231 1.167 pooka #endif
232 1.67 pooka
233 1.168 pooka target.tv_sec = sec_ini;
234 1.168 pooka tmp.tv_sec = sec;
235 1.168 pooka target.tv_nsec = nsec_ini;
236 1.168 pooka tmp.tv_nsec = nsec;
237 1.168 pooka timespecadd(&target, &tmp, &target);
238 1.168 pooka
239 1.78 pooka if (__predict_false(sec != 0))
240 1.67 pooka printf("WARNING: over 1s delay\n");
241 1.67 pooka
242 1.168 pooka for (loops = 0; loops < 1000*1000*100; loops++) {
243 1.168 pooka struct timespec cur;
244 1.168 pooka
245 1.168 pooka rumpuser_clock_gettime(RUMPUSER_CLOCK_ABSMONO,
246 1.168 pooka &sec_now, &nsec_now);
247 1.168 pooka cur.tv_sec = sec_now;
248 1.168 pooka cur.tv_nsec = nsec_now;
249 1.168 pooka if (timespeccmp(&cur, &target, >=)) {
250 1.168 pooka return;
251 1.168 pooka }
252 1.168 pooka }
253 1.168 pooka printf("WARNING: DELAY ESCAPED\n");
254 1.67 pooka }
255 1.69 pooka void (*delay_func)(unsigned int) = rump_delay;
256 1.167 pooka __strong_alias(delay,rump_delay);
257 1.167 pooka __strong_alias(_delay,rump_delay);
258 1.67 pooka
259 1.191 kre /* Weak alias for getcwd_common to be used unless librumpvfs is present. */
260 1.191 kre
261 1.191 kre int rump_getcwd_common(struct vnode *, struct vnode *, char **, char *,
262 1.191 kre int, int, struct lwp *);
263 1.191 kre int
264 1.191 kre rump_getcwd_common(struct vnode *lvp, struct vnode *rvp, char **bpp, char *bufp,
265 1.191 kre int limit, int flags, struct lwp *l)
266 1.191 kre {
267 1.191 kre
268 1.191 kre return ENOENT;
269 1.191 kre }
270 1.191 kre __weak_alias(getcwd_common,rump_getcwd_common);
271 1.191 kre
272 1.192 bad /* Weak alias for vnode_to_path to be used unless librumpvfs is present. */
273 1.192 bad
274 1.192 bad int rump_vnode_to_path(char *, size_t, struct vnode *, struct lwp *,
275 1.192 bad struct proc *);
276 1.192 bad int
277 1.192 bad rump_vnode_to_path(char *path, size_t len, struct vnode *vp, struct lwp *curl,
278 1.192 bad struct proc *p)
279 1.192 bad {
280 1.192 bad
281 1.192 bad return ENOENT; /* pretend getcwd_common() failed. */
282 1.192 bad }
283 1.192 bad __weak_alias(vnode_to_path,rump_vnode_to_path);
284 1.192 bad
285 1.192 bad
286 1.181 hannken /* Weak aliases for fstrans to be used unless librumpvfs is present. */
287 1.181 hannken
288 1.182 hannken void rump_fstrans_start(struct mount *);
289 1.182 hannken void
290 1.182 hannken rump_fstrans_start(struct mount *mp)
291 1.182 hannken {
292 1.182 hannken
293 1.182 hannken }
294 1.182 hannken __weak_alias(fstrans_start,rump_fstrans_start);
295 1.182 hannken
296 1.182 hannken int rump_fstrans_start_nowait(struct mount *);
297 1.181 hannken int
298 1.182 hannken rump_fstrans_start_nowait(struct mount *mp)
299 1.181 hannken {
300 1.181 hannken
301 1.181 hannken return 0;
302 1.181 hannken }
303 1.182 hannken __weak_alias(fstrans_start_nowait,rump_fstrans_start_nowait);
304 1.181 hannken
305 1.187 hannken void rump_fstrans_start_lazy(struct mount *);
306 1.187 hannken void
307 1.187 hannken rump_fstrans_start_lazy(struct mount *mp)
308 1.187 hannken {
309 1.187 hannken
310 1.187 hannken }
311 1.187 hannken __weak_alias(fstrans_start_lazy,rump_fstrans_start_lazy);
312 1.187 hannken
313 1.187 hannken
314 1.181 hannken void rump_fstrans_done(struct mount *);
315 1.181 hannken void
316 1.181 hannken rump_fstrans_done(struct mount *mp)
317 1.181 hannken {
318 1.181 hannken
319 1.181 hannken }
320 1.181 hannken __weak_alias(fstrans_done,rump_fstrans_done);
321 1.181 hannken
322 1.190 hannken
323 1.190 hannken void rump_fstrans_lwp_dtor(struct lwp *);
324 1.190 hannken void
325 1.190 hannken rump_fstrans_lwp_dtor(struct lwp *l)
326 1.190 hannken {
327 1.190 hannken
328 1.190 hannken }
329 1.190 hannken __weak_alias(fstrans_lwp_dtor,rump_fstrans_lwp_dtor);
330 1.190 hannken
331 1.198 riastrad static int
332 1.198 riastrad rump_filt_fsattach(struct knote *kn)
333 1.198 riastrad {
334 1.198 riastrad
335 1.198 riastrad return EOPNOTSUPP;
336 1.198 riastrad }
337 1.198 riastrad
338 1.198 riastrad struct filterops rump_fs_filtops = {
339 1.198 riastrad .f_attach = rump_filt_fsattach,
340 1.198 riastrad };
341 1.198 riastrad __weak_alias(fs_filtops,rump_fs_filtops);
342 1.198 riastrad
/*
 * Stand-in pool cache pointer, weakly aliased to pnbuf_cache.  It is
 * never assigned in this file, so it stays NULL here.
 */
struct pool_cache *rump_pnbuf_cache;
__weak_alias(pnbuf_cache,rump_pnbuf_cache);
345 1.199 riastrad
346 1.142 pooka /*
347 1.142 pooka * Provide weak aliases for tty routines used by printf.
348 1.142 pooka * They will be used unless the rumpkern_tty component is present.
349 1.142 pooka */
350 1.142 pooka
351 1.142 pooka int rump_ttycheckoutq(struct tty *, int);
352 1.105 pooka int
353 1.142 pooka rump_ttycheckoutq(struct tty *tp, int wait)
354 1.67 pooka {
355 1.67 pooka
356 1.67 pooka return 1;
357 1.67 pooka }
358 1.142 pooka __weak_alias(ttycheckoutq,rump_ttycheckoutq);
359 1.67 pooka
360 1.142 pooka int rump_tputchar(int, int, struct tty *);
361 1.142 pooka int
362 1.142 pooka rump_tputchar(int c, int flags, struct tty *tp)
363 1.142 pooka {
364 1.142 pooka
365 1.142 pooka cnputc(c);
366 1.142 pooka return 0;
367 1.142 pooka }
368 1.142 pooka __weak_alias(tputchar,rump_tputchar);
369 1.142 pooka
/*
 * cnputc: console output of a single character, passed straight to
 * the rumpuser_putchar() hypercall.
 */
void
cnputc(int c)
{

	rumpuser_putchar(c);
	return;
}
376 1.67 pooka
/*
 * cnflush: flush console output.  There is nothing to do here, so
 * the flush is trivially done.
 */
void
cnflush(void)
{

	return;
}
383 1.67 pooka
/*
 * resettodr: intentionally empty, because setting clocks is not in
 * the jurisdiction of rump kernels.
 */
void
resettodr(void)
{

	return;
}
390 1.163 pooka
391 1.138 pooka #ifdef __HAVE_SYSCALL_INTERN
392 1.138 pooka void
393 1.138 pooka syscall_intern(struct proc *p)
394 1.138 pooka {
395 1.138 pooka
396 1.160 pooka p->p_emuldata = NULL;
397 1.138 pooka }
398 1.138 pooka #endif
399 1.144 pooka
400 1.148 pooka #ifdef LOCKDEBUG
/*
 * turnstile_print: nothing is printed here; both the object and the
 * print callback are ignored.
 */
void
turnstile_print(volatile void *obj, void (*pr)(const char *, ...))
{

	return;
}
407 1.148 pooka #endif
408 1.165 pooka
409 1.165 pooka void
410 1.165 pooka cpu_reboot(int howto, char *bootstr)
411 1.165 pooka {
412 1.165 pooka int ruhow = 0;
413 1.165 pooka void *finiarg;
414 1.165 pooka
415 1.165 pooka printf("rump kernel halting...\n");
416 1.165 pooka
417 1.165 pooka if (!RUMP_LOCALPROC_P(curproc))
418 1.170 pooka finiarg = RUMP_SPVM2CTL(curproc->p_vmspace);
419 1.165 pooka else
420 1.165 pooka finiarg = NULL;
421 1.165 pooka
422 1.165 pooka /* dump means we really take the dive here */
423 1.165 pooka if ((howto & RB_DUMP) || panicstr) {
424 1.165 pooka ruhow = RUMPUSER_PANIC;
425 1.165 pooka goto out;
426 1.165 pooka }
427 1.165 pooka
428 1.165 pooka /* try to sync */
429 1.165 pooka if (!((howto & RB_NOSYNC) || panicstr)) {
430 1.165 pooka rump_vfs_fini();
431 1.165 pooka }
432 1.165 pooka
433 1.165 pooka doshutdownhooks();
434 1.165 pooka
435 1.165 pooka /* your wish is my command */
436 1.165 pooka if (howto & RB_HALT) {
437 1.172 pooka printf("rump kernel halted (with RB_HALT, not exiting)\n");
438 1.169 pooka rump_sysproxy_fini(finiarg);
439 1.165 pooka for (;;) {
440 1.165 pooka rumpuser_clock_sleep(RUMPUSER_CLOCK_RELWALL, 10, 0);
441 1.165 pooka }
442 1.165 pooka }
443 1.165 pooka
444 1.165 pooka /* this function is __dead, we must exit */
445 1.165 pooka out:
446 1.169 pooka rump_sysproxy_fini(finiarg);
447 1.165 pooka rumpuser_exit(ruhow);
448 1.165 pooka }
449