emul.c revision 1.175 1 1.175 pooka /* $NetBSD: emul.c,v 1.175 2016/01/18 15:53:38 pooka Exp $ */
2 1.1 pooka
3 1.1 pooka /*
4 1.150 pooka * Copyright (c) 2007-2011 Antti Kantee. All Rights Reserved.
5 1.1 pooka *
6 1.1 pooka * Redistribution and use in source and binary forms, with or without
7 1.1 pooka * modification, are permitted provided that the following conditions
8 1.1 pooka * are met:
9 1.1 pooka * 1. Redistributions of source code must retain the above copyright
10 1.1 pooka * notice, this list of conditions and the following disclaimer.
11 1.1 pooka * 2. Redistributions in binary form must reproduce the above copyright
12 1.1 pooka * notice, this list of conditions and the following disclaimer in the
13 1.1 pooka * documentation and/or other materials provided with the distribution.
14 1.1 pooka *
15 1.1 pooka * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
16 1.1 pooka * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
17 1.1 pooka * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18 1.1 pooka * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19 1.1 pooka * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20 1.1 pooka * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
21 1.1 pooka * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22 1.1 pooka * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23 1.1 pooka * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24 1.1 pooka * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25 1.1 pooka * SUCH DAMAGE.
26 1.1 pooka */
27 1.1 pooka
28 1.61 pooka #include <sys/cdefs.h>
29 1.175 pooka __KERNEL_RCSID(0, "$NetBSD: emul.c,v 1.175 2016/01/18 15:53:38 pooka Exp $");
30 1.9 pooka
31 1.1 pooka #include <sys/param.h>
32 1.1 pooka #include <sys/null.h>
33 1.1 pooka #include <sys/vnode.h>
34 1.1 pooka #include <sys/stat.h>
35 1.35 martin #include <sys/select.h>
36 1.1 pooka #include <sys/syslog.h>
37 1.1 pooka #include <sys/namei.h>
38 1.1 pooka #include <sys/kauth.h>
39 1.175 pooka #include <sys/kernel.h>
40 1.1 pooka #include <sys/conf.h>
41 1.1 pooka #include <sys/device.h>
42 1.1 pooka #include <sys/queue.h>
43 1.20 pooka #include <sys/file.h>
44 1.162 pooka #include <sys/filedesc.h>
45 1.15 ad #include <sys/cpu.h>
46 1.17 pooka #include <sys/kmem.h>
47 1.20 pooka #include <sys/poll.h>
48 1.66 pooka #include <sys/timetc.h>
49 1.53 pooka #include <sys/tprintf.h>
50 1.66 pooka #include <sys/module.h>
51 1.67 pooka #include <sys/tty.h>
52 1.67 pooka #include <sys/reboot.h>
53 1.154 pooka #include <sys/syscall.h>
54 1.109 pooka #include <sys/syscallvar.h>
55 1.109 pooka #include <sys/xcall.h>
56 1.148 pooka #include <sys/sleepq.h>
57 1.161 pooka #include <sys/cprng.h>
58 1.67 pooka
59 1.67 pooka #include <dev/cons.h>
60 1.1 pooka
61 1.44 pooka #include <rump/rumpuser.h>
62 1.44 pooka
63 1.8 pooka #include <uvm/uvm_map.h>
64 1.8 pooka
65 1.10 pooka #include "rump_private.h"
66 1.1 pooka
67 1.165 pooka void (*rump_vfs_fini)(void) = (void *)nullop;
68 1.165 pooka
/*
 * physmem is largely unused (except for nmbcluster calculations),
 * so pick a default value which suits ZFS.  If an application wants
 * a very small memory footprint, it can still adjust this before
 * calling rump_init().
 *
 * The macro body is parenthesized so that expressions built on top of
 * it (such as PHYSMEM / 2 below) do not silently depend on operator
 * precedence and associativity.
 */
#define PHYSMEM (512 * 256)
int physmem = PHYSMEM;
int nkmempages = PHYSMEM / 2; /* from le chapeau */
#undef PHYSMEM
79 1.149 pooka
80 1.162 pooka struct lwp lwp0 = {
81 1.162 pooka .l_lid = 1,
82 1.162 pooka .l_proc = &proc0,
83 1.162 pooka .l_fd = &filedesc0,
84 1.162 pooka };
85 1.1 pooka struct vnode *rootvp;
86 1.124 pooka dev_t rootdev = NODEV;
87 1.149 pooka
88 1.19 pooka const int schedppq = 1;
89 1.53 pooka bool mp_online = false;
90 1.175 pooka struct timespec boottime;
91 1.66 pooka int cold = 1;
92 1.95 pooka int boothowto = AB_SILENT;
93 1.67 pooka struct tty *constty;
94 1.1 pooka
/*
 * Static device switch tables.  Each table is followed by its own
 * counters, and the counters are derived from the array itself so
 * that they cannot drift away from the real table size.
 */

/* block devices */
const struct bdevsw *bdevsw0[255];
const struct bdevsw **bdevsw = bdevsw0;
const int sys_bdevsws = sizeof(bdevsw0) / sizeof(bdevsw0[0]);
int max_bdevsws = sizeof(bdevsw0) / sizeof(bdevsw0[0]);

/* character devices */
const struct cdevsw *cdevsw0[255];
const struct cdevsw **cdevsw = cdevsw0;
const int sys_cdevsws = sizeof(cdevsw0) / sizeof(cdevsw0[0]);
int max_cdevsws = sizeof(cdevsw0) / sizeof(cdevsw0[0]);
104 1.64 pooka
105 1.76 pooka int mem_no = 2;
106 1.76 pooka
107 1.151 chs device_t booted_device;
108 1.151 chs device_t booted_wedge;
109 1.92 pooka int booted_partition;
110 1.92 pooka
111 1.120 pooka /* XXX: unused */
112 1.76 pooka kmutex_t tty_lock;
113 1.120 pooka krwlock_t exec_lock;
114 1.64 pooka
115 1.125 pooka struct lwplist alllwp = LIST_HEAD_INITIALIZER(alllwp);
116 1.125 pooka
/* sparc doesn't sport constant page size, pretend we have 4k pages */
#if defined(__sparc__)
int pgshift = 12;
int pgofset = 4096 - 1;
int nbpg = 4096;
#endif

/*
 * On sun3 VM_MAX_ADDRESS is a const variable.
 * XXX: should be moved into rump.c and initialized for sun3 and sun3x?
 */
#if defined(sun3)
const vaddr_t kernbase = KERNBASE3;
#endif
129 1.140 pooka
130 1.117 pooka struct loadavg averunnable = {
131 1.117 pooka { 0 * FSCALE,
132 1.117 pooka 1 * FSCALE,
133 1.117 pooka 11 * FSCALE, },
134 1.117 pooka FSCALE,
135 1.117 pooka };
136 1.117 pooka
137 1.174 pgoyette /*
138 1.174 pgoyette * Include the autogenerated list of auto-loadable syscalls
139 1.174 pgoyette */
140 1.174 pgoyette #include <kern/syscalls_autoload.c>
141 1.174 pgoyette
142 1.126 pooka struct emul emul_netbsd = {
143 1.126 pooka .e_name = "netbsd-rump",
144 1.126 pooka .e_sysent = rump_sysent,
145 1.154 pooka #ifndef __HAVE_MINIMAL_EMUL
146 1.154 pooka .e_nsysent = SYS_NSYSENT,
147 1.154 pooka #endif
148 1.128 pooka .e_vm_default_addr = uvm_default_mapaddr,
149 1.138 pooka #ifdef __HAVE_SYSCALL_INTERN
150 1.138 pooka .e_syscall_intern = syscall_intern,
151 1.138 pooka #endif
152 1.174 pgoyette .e_sc_autoload = netbsd_syscalls_autoload,
153 1.126 pooka };
154 1.126 pooka
155 1.138 pooka u_int nprocs = 1;
156 1.20 pooka
157 1.161 pooka cprng_strong_t *kern_cprng;
158 1.161 pooka
159 1.164 pooka /* not used, but need the symbols for pointer comparisons */
160 1.164 pooka syncobj_t mutex_syncobj, rw_syncobj;
161 1.164 pooka
162 1.20 pooka int
163 1.20 pooka kpause(const char *wmesg, bool intr, int timeo, kmutex_t *mtx)
164 1.20 pooka {
165 1.20 pooka extern int hz;
166 1.166 justin int rv __diagused;
167 1.78 pooka uint64_t sec, nsec;
168 1.127 pooka
169 1.20 pooka if (mtx)
170 1.20 pooka mutex_exit(mtx);
171 1.40 pooka
172 1.78 pooka sec = timeo / hz;
173 1.78 pooka nsec = (timeo % hz) * (1000000000 / hz);
174 1.158 pooka rv = rumpuser_clock_sleep(RUMPUSER_CLOCK_RELWALL, sec, nsec);
175 1.156 pooka KASSERT(rv == 0);
176 1.156 pooka
177 1.20 pooka if (mtx)
178 1.20 pooka mutex_enter(mtx);
179 1.20 pooka
180 1.20 pooka return 0;
181 1.20 pooka }
182 1.27 pooka
183 1.27 pooka void
184 1.32 bjs lwp_unsleep(lwp_t *l, bool cleanup)
185 1.32 bjs {
186 1.32 bjs
187 1.32 bjs KASSERT(mutex_owned(l->l_mutex));
188 1.32 bjs
189 1.104 rmind (*l->l_syncobj->sobj_unsleep)(l, cleanup);
190 1.32 bjs }
191 1.34 yamt
192 1.145 pooka void
193 1.145 pooka lwp_update_creds(struct lwp *l)
194 1.145 pooka {
195 1.145 pooka struct proc *p;
196 1.145 pooka kauth_cred_t oldcred;
197 1.145 pooka
198 1.145 pooka p = l->l_proc;
199 1.145 pooka oldcred = l->l_cred;
200 1.145 pooka l->l_prflag &= ~LPR_CRMOD;
201 1.145 pooka
202 1.145 pooka mutex_enter(p->p_lock);
203 1.145 pooka kauth_cred_hold(p->p_cred);
204 1.145 pooka l->l_cred = p->p_cred;
205 1.145 pooka mutex_exit(p->p_lock);
206 1.145 pooka
207 1.145 pooka if (oldcred != NULL)
208 1.145 pooka kauth_cred_free(oldcred);
209 1.145 pooka }
210 1.145 pooka
211 1.34 yamt vaddr_t
212 1.155 para calc_cache_size(vsize_t vasz, int pct, int va_pct)
213 1.34 yamt {
214 1.34 yamt paddr_t t;
215 1.34 yamt
216 1.34 yamt t = (paddr_t)physmem * pct / 100 * PAGE_SIZE;
217 1.34 yamt if ((vaddr_t)t != t) {
218 1.34 yamt panic("%s: needs tweak", __func__);
219 1.34 yamt }
220 1.34 yamt return t;
221 1.34 yamt }
222 1.35 martin
/*
 * Sleepability check.  Intentionally empty: every context is treated
 * as sleepable for now, although this should be improved.
 */
void
assert_sleepable(void)
{

	/* nothing to verify */
}
229 1.43 pooka
/*
 * Machine-dependent module initialization.  Currently a no-op;
 * ideally the librump symbol table would be loaded here.
 */
void
module_init_md(void)
{

	/* nothing for now */
}
239 1.67 pooka
240 1.167 pooka /*
241 1.167 pooka * Try to emulate all the MD definitions of DELAY() / delay().
242 1.167 pooka * Would be nice to fix the #defines in MD headers, but this quicker.
243 1.168 pooka *
244 1.168 pooka * XXX: we'd need a rumpuser_clock_sleep_nowrap() here. Since we
245 1.168 pooka * don't have it in the current hypercall revision, busyloop.
246 1.168 pooka * Note that rather than calibrate a loop delay and work with that,
247 1.168 pooka * get call gettime (which does not block) in a loop to make sure
248 1.168 pooka * we didn't get virtual ghosttime. That might be slightly inaccurate
249 1.168 pooka * for very small delays ...
250 1.168 pooka *
251 1.168 pooka * The other option would be to run a thread in the hypervisor which
252 1.168 pooka * sleeps for us and we can wait for it using rumpuser_cv_wait_nowrap()
253 1.168 pooka * Probably too fussy. Better just wait for hypercall rev 18 ;)
254 1.167 pooka */
255 1.69 pooka static void
256 1.69 pooka rump_delay(unsigned int us)
257 1.67 pooka {
258 1.168 pooka struct timespec target, tmp;
259 1.168 pooka uint64_t sec, sec_ini, sec_now;
260 1.168 pooka long nsec, nsec_ini, nsec_now;
261 1.168 pooka int loops;
262 1.168 pooka
263 1.168 pooka rumpuser_clock_gettime(RUMPUSER_CLOCK_ABSMONO, &sec_ini, &nsec_ini);
264 1.67 pooka
265 1.167 pooka #ifdef __mac68k__
266 1.167 pooka sec = us / 1000;
267 1.167 pooka nsec = (us % 1000) * 1000000;
268 1.167 pooka #else
269 1.78 pooka sec = us / 1000000;
270 1.78 pooka nsec = (us % 1000000) * 1000;
271 1.167 pooka #endif
272 1.67 pooka
273 1.168 pooka target.tv_sec = sec_ini;
274 1.168 pooka tmp.tv_sec = sec;
275 1.168 pooka target.tv_nsec = nsec_ini;
276 1.168 pooka tmp.tv_nsec = nsec;
277 1.168 pooka timespecadd(&target, &tmp, &target);
278 1.168 pooka
279 1.78 pooka if (__predict_false(sec != 0))
280 1.67 pooka printf("WARNING: over 1s delay\n");
281 1.67 pooka
282 1.168 pooka for (loops = 0; loops < 1000*1000*100; loops++) {
283 1.168 pooka struct timespec cur;
284 1.168 pooka
285 1.168 pooka rumpuser_clock_gettime(RUMPUSER_CLOCK_ABSMONO,
286 1.168 pooka &sec_now, &nsec_now);
287 1.168 pooka cur.tv_sec = sec_now;
288 1.168 pooka cur.tv_nsec = nsec_now;
289 1.168 pooka if (timespeccmp(&cur, &target, >=)) {
290 1.168 pooka return;
291 1.168 pooka }
292 1.168 pooka }
293 1.168 pooka printf("WARNING: DELAY ESCAPED\n");
294 1.67 pooka }
295 1.69 pooka void (*delay_func)(unsigned int) = rump_delay;
296 1.167 pooka __strong_alias(delay,rump_delay);
297 1.167 pooka __strong_alias(_delay,rump_delay);
298 1.67 pooka
299 1.142 pooka /*
300 1.142 pooka * Provide weak aliases for tty routines used by printf.
301 1.142 pooka * They will be used unless the rumpkern_tty component is present.
302 1.142 pooka */
303 1.142 pooka
304 1.142 pooka int rump_ttycheckoutq(struct tty *, int);
305 1.105 pooka int
306 1.142 pooka rump_ttycheckoutq(struct tty *tp, int wait)
307 1.67 pooka {
308 1.67 pooka
309 1.67 pooka return 1;
310 1.67 pooka }
311 1.142 pooka __weak_alias(ttycheckoutq,rump_ttycheckoutq);
312 1.67 pooka
313 1.142 pooka int rump_tputchar(int, int, struct tty *);
314 1.142 pooka int
315 1.142 pooka rump_tputchar(int c, int flags, struct tty *tp)
316 1.142 pooka {
317 1.142 pooka
318 1.142 pooka cnputc(c);
319 1.142 pooka return 0;
320 1.142 pooka }
321 1.142 pooka __weak_alias(tputchar,rump_tputchar);
322 1.142 pooka
/* Console output: pass the character on to the rumpuser putchar hypercall. */
void
cnputc(int c)
{

	rumpuser_putchar(c);
}
329 1.67 pooka
/* Console flush: nothing is done here. */
void
cnflush(void)
{

	/* already done */
}
336 1.67 pooka
/*
 * Intentionally empty: setting clocks is not in the jurisdiction
 * of rump kernels.
 */
void
resettodr(void)
{

	/* no-op */
}
343 1.163 pooka
#if defined(__HAVE_SYSCALL_INTERN)
/*
 * Installed as emul_netbsd's e_syscall_intern hook; it only resets
 * the process' emulation-private data pointer.
 */
void
syscall_intern(struct proc *p)
{

	p->p_emuldata = NULL;
}
#endif
352 1.144 pooka
#if defined(LOCKDEBUG)
/* Empty turnstile_print() for LOCKDEBUG builds; it prints nothing. */
void
turnstile_print(volatile void *obj, void (*pr)(const char *, ...))
{

	/* nothing to print */
}
#endif
361 1.165 pooka
362 1.165 pooka void
363 1.165 pooka cpu_reboot(int howto, char *bootstr)
364 1.165 pooka {
365 1.165 pooka int ruhow = 0;
366 1.165 pooka void *finiarg;
367 1.165 pooka
368 1.165 pooka printf("rump kernel halting...\n");
369 1.165 pooka
370 1.165 pooka if (!RUMP_LOCALPROC_P(curproc))
371 1.170 pooka finiarg = RUMP_SPVM2CTL(curproc->p_vmspace);
372 1.165 pooka else
373 1.165 pooka finiarg = NULL;
374 1.165 pooka
375 1.165 pooka /* dump means we really take the dive here */
376 1.165 pooka if ((howto & RB_DUMP) || panicstr) {
377 1.165 pooka ruhow = RUMPUSER_PANIC;
378 1.165 pooka goto out;
379 1.165 pooka }
380 1.165 pooka
381 1.165 pooka /* try to sync */
382 1.165 pooka if (!((howto & RB_NOSYNC) || panicstr)) {
383 1.165 pooka rump_vfs_fini();
384 1.165 pooka }
385 1.165 pooka
386 1.165 pooka doshutdownhooks();
387 1.165 pooka
388 1.165 pooka /* your wish is my command */
389 1.165 pooka if (howto & RB_HALT) {
390 1.172 pooka printf("rump kernel halted (with RB_HALT, not exiting)\n");
391 1.169 pooka rump_sysproxy_fini(finiarg);
392 1.165 pooka for (;;) {
393 1.165 pooka rumpuser_clock_sleep(RUMPUSER_CLOCK_RELWALL, 10, 0);
394 1.165 pooka }
395 1.165 pooka }
396 1.165 pooka
397 1.165 pooka /* this function is __dead, we must exit */
398 1.165 pooka out:
399 1.169 pooka rump_sysproxy_fini(finiarg);
400 1.165 pooka rumpuser_exit(ruhow);
401 1.165 pooka }
402 1.173 pooka
/* Return the CPU model string; it is a fixed, statically allocated name. */
const char *
cpu_getmodel(void)
{
	static const char model[] = "rumpcore (virtual)";

	return model;
}
409