kern_subr.c revision 1.194 1 1.194 ad /* $NetBSD: kern_subr.c,v 1.194 2008/11/12 14:29:31 ad Exp $ */
2 1.31 thorpej
3 1.31 thorpej /*-
4 1.185 ad * Copyright (c) 1997, 1998, 1999, 2002, 2007, 2008 The NetBSD Foundation, Inc.
5 1.31 thorpej * All rights reserved.
6 1.31 thorpej *
7 1.31 thorpej * This code is derived from software contributed to The NetBSD Foundation
8 1.31 thorpej * by Jason R. Thorpe of the Numerical Aerospace Simulation Facility,
9 1.48 lukem * NASA Ames Research Center, and by Luke Mewburn.
10 1.31 thorpej *
11 1.31 thorpej * Redistribution and use in source and binary forms, with or without
12 1.31 thorpej * modification, are permitted provided that the following conditions
13 1.31 thorpej * are met:
14 1.31 thorpej * 1. Redistributions of source code must retain the above copyright
15 1.31 thorpej * notice, this list of conditions and the following disclaimer.
16 1.31 thorpej * 2. Redistributions in binary form must reproduce the above copyright
17 1.31 thorpej * notice, this list of conditions and the following disclaimer in the
18 1.31 thorpej * documentation and/or other materials provided with the distribution.
19 1.31 thorpej *
20 1.31 thorpej * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
21 1.31 thorpej * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
22 1.31 thorpej * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
23 1.31 thorpej * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
24 1.31 thorpej * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
25 1.31 thorpej * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
26 1.31 thorpej * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
27 1.31 thorpej * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
28 1.31 thorpej * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
29 1.31 thorpej * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
30 1.31 thorpej * POSSIBILITY OF SUCH DAMAGE.
31 1.31 thorpej */
32 1.12 cgd
33 1.9 cgd /*
34 1.10 cgd * Copyright (c) 1982, 1986, 1991, 1993
35 1.10 cgd * The Regents of the University of California. All rights reserved.
36 1.9 cgd * (c) UNIX System Laboratories, Inc.
37 1.9 cgd * All or some portions of this file are derived from material licensed
38 1.9 cgd * to the University of California by American Telephone and Telegraph
39 1.9 cgd * Co. or Unix System Laboratories, Inc. and are reproduced herein with
40 1.9 cgd * the permission of UNIX System Laboratories, Inc.
41 1.9 cgd *
42 1.18 thorpej * Copyright (c) 1992, 1993
43 1.18 thorpej * The Regents of the University of California. All rights reserved.
44 1.18 thorpej *
45 1.18 thorpej * This software was developed by the Computer Systems Engineering group
46 1.18 thorpej * at Lawrence Berkeley Laboratory under DARPA contract BG 91-66 and
47 1.18 thorpej * contributed to Berkeley.
48 1.18 thorpej *
49 1.18 thorpej * All advertising materials mentioning features or use of this software
50 1.18 thorpej * must display the following acknowledgement:
51 1.18 thorpej * This product includes software developed by the University of
52 1.18 thorpej * California, Lawrence Berkeley Laboratory.
53 1.18 thorpej *
54 1.9 cgd * Redistribution and use in source and binary forms, with or without
55 1.9 cgd * modification, are permitted provided that the following conditions
56 1.9 cgd * are met:
57 1.9 cgd * 1. Redistributions of source code must retain the above copyright
58 1.9 cgd * notice, this list of conditions and the following disclaimer.
59 1.9 cgd * 2. Redistributions in binary form must reproduce the above copyright
60 1.9 cgd * notice, this list of conditions and the following disclaimer in the
61 1.9 cgd * documentation and/or other materials provided with the distribution.
62 1.103 agc * 3. Neither the name of the University nor the names of its contributors
63 1.9 cgd * may be used to endorse or promote products derived from this software
64 1.9 cgd * without specific prior written permission.
65 1.9 cgd *
66 1.9 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
67 1.9 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
68 1.9 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
69 1.9 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
70 1.9 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
71 1.9 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
72 1.9 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
73 1.9 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
74 1.9 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
75 1.9 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
76 1.9 cgd * SUCH DAMAGE.
77 1.9 cgd *
78 1.38 fvdl * @(#)kern_subr.c 8.4 (Berkeley) 2/14/95
79 1.9 cgd */
80 1.77 lukem
81 1.77 lukem #include <sys/cdefs.h>
82 1.194 ad __KERNEL_RCSID(0, "$NetBSD: kern_subr.c,v 1.194 2008/11/12 14:29:31 ad Exp $");
83 1.34 mrg
84 1.78 thorpej #include "opt_ddb.h"
85 1.43 jonathan #include "opt_md.h"
86 1.81 christos #include "opt_syscall_debug.h"
87 1.81 christos #include "opt_ktrace.h"
88 1.142 matt #include "opt_ptrace.h"
89 1.144 jmcneill #include "opt_powerhook.h"
90 1.157 manu #include "opt_tftproot.h"
91 1.9 cgd
92 1.9 cgd #include <sys/param.h>
93 1.9 cgd #include <sys/systm.h>
94 1.9 cgd #include <sys/proc.h>
95 1.10 cgd #include <sys/malloc.h>
96 1.18 thorpej #include <sys/mount.h>
97 1.18 thorpej #include <sys/device.h>
98 1.18 thorpej #include <sys/reboot.h>
99 1.18 thorpej #include <sys/conf.h>
100 1.159 dyoung #include <sys/disk.h>
101 1.18 thorpej #include <sys/disklabel.h>
102 1.10 cgd #include <sys/queue.h>
103 1.81 christos #include <sys/ktrace.h>
104 1.128 christos #include <sys/ptrace.h>
105 1.119 reinoud #include <sys/fcntl.h>
106 1.160 christos #include <sys/kauth.h>
107 1.160 christos #include <sys/vnode.h>
108 1.194 ad #include <sys/syscallvar.h>
109 1.194 ad #include <sys/xcall.h>
110 1.194 ad #include <sys/module.h>
111 1.9 cgd
112 1.82 thorpej #include <uvm/uvm_extern.h>
113 1.82 thorpej
114 1.18 thorpej #include <dev/cons.h>
115 1.18 thorpej
116 1.18 thorpej #include <net/if.h>
117 1.18 thorpej
118 1.18 thorpej /* XXX these should eventually move to subr_autoconf.c */
119 1.109 junyoung static struct device *finddevice(const char *);
120 1.109 junyoung static struct device *getdisk(char *, int, int, dev_t *, int);
121 1.109 junyoung static struct device *parsedisk(char *, int, int, dev_t *);
122 1.159 dyoung static const char *getwedgename(const char *, int);
123 1.18 thorpej
124 1.80 christos /*
125 1.80 christos * A generic linear hook.
126 1.80 christos */
127 1.80 christos struct hook_desc {
128 1.80 christos LIST_ENTRY(hook_desc) hk_list;
129 1.109 junyoung void (*hk_fn)(void *);
130 1.80 christos void *hk_arg;
131 1.80 christos };
132 1.80 christos typedef LIST_HEAD(, hook_desc) hook_list_t;
133 1.80 christos
134 1.157 manu #ifdef TFTPROOT
135 1.157 manu int tftproot_dhcpboot(struct device *);
136 1.157 manu #endif
137 1.157 manu
138 1.175 ad dev_t dumpcdev; /* for savecore */
139 1.175 ad
140 1.126 yamt void
141 1.126 yamt uio_setup_sysspace(struct uio *uio)
142 1.126 yamt {
143 1.126 yamt
144 1.126 yamt uio->uio_vmspace = vmspace_kernel();
145 1.126 yamt }
146 1.126 yamt
147 1.11 mycroft int
148 1.117 thorpej uiomove(void *buf, size_t n, struct uio *uio)
149 1.9 cgd {
150 1.126 yamt struct vmspace *vm = uio->uio_vmspace;
151 1.63 augustss struct iovec *iov;
152 1.180 njoly size_t cnt;
153 1.9 cgd int error = 0;
154 1.16 christos char *cp = buf;
155 1.112 yamt
156 1.183 yamt ASSERT_SLEEPABLE();
157 1.68 enami
158 1.68 enami #ifdef DIAGNOSTIC
159 1.9 cgd if (uio->uio_rw != UIO_READ && uio->uio_rw != UIO_WRITE)
160 1.9 cgd panic("uiomove: mode");
161 1.9 cgd #endif
162 1.9 cgd while (n > 0 && uio->uio_resid) {
163 1.9 cgd iov = uio->uio_iov;
164 1.9 cgd cnt = iov->iov_len;
165 1.9 cgd if (cnt == 0) {
166 1.105 yamt KASSERT(uio->uio_iovcnt > 0);
167 1.9 cgd uio->uio_iov++;
168 1.9 cgd uio->uio_iovcnt--;
169 1.9 cgd continue;
170 1.9 cgd }
171 1.9 cgd if (cnt > n)
172 1.9 cgd cnt = n;
173 1.126 yamt if (!VMSPACE_IS_KERNEL_P(vm)) {
174 1.104 yamt if (curcpu()->ci_schedstate.spc_flags &
175 1.67 thorpej SPCF_SHOULDYIELD)
176 1.151 ad preempt();
177 1.126 yamt }
178 1.9 cgd
179 1.126 yamt if (uio->uio_rw == UIO_READ) {
180 1.126 yamt error = copyout_vmspace(vm, cp, iov->iov_base,
181 1.126 yamt cnt);
182 1.126 yamt } else {
183 1.126 yamt error = copyin_vmspace(vm, iov->iov_base, cp,
184 1.126 yamt cnt);
185 1.126 yamt }
186 1.126 yamt if (error) {
187 1.9 cgd break;
188 1.9 cgd }
189 1.155 christos iov->iov_base = (char *)iov->iov_base + cnt;
190 1.9 cgd iov->iov_len -= cnt;
191 1.9 cgd uio->uio_resid -= cnt;
192 1.9 cgd uio->uio_offset += cnt;
193 1.9 cgd cp += cnt;
194 1.85 thorpej KDASSERT(cnt <= n);
195 1.9 cgd n -= cnt;
196 1.9 cgd }
197 1.165 ad
198 1.9 cgd return (error);
199 1.9 cgd }
200 1.9 cgd
201 1.9 cgd /*
202 1.110 itojun * Wrapper for uiomove() that validates the arguments against a known-good
203 1.111 matt * kernel buffer.
204 1.110 itojun */
205 1.110 itojun int
206 1.111 matt uiomove_frombuf(void *buf, size_t buflen, struct uio *uio)
207 1.110 itojun {
208 1.111 matt size_t offset;
209 1.110 itojun
210 1.143 christos if (uio->uio_offset < 0 || /* uio->uio_resid < 0 || */
211 1.110 itojun (offset = uio->uio_offset) != uio->uio_offset)
212 1.110 itojun return (EINVAL);
213 1.111 matt if (offset >= buflen)
214 1.110 itojun return (0);
215 1.111 matt return (uiomove((char *)buf + offset, buflen - offset, uio));
216 1.110 itojun }
217 1.110 itojun
218 1.110 itojun /*
219 1.9 cgd * Give next character to user as result of read.
220 1.9 cgd */
221 1.11 mycroft int
222 1.117 thorpej ureadc(int c, struct uio *uio)
223 1.9 cgd {
224 1.63 augustss struct iovec *iov;
225 1.9 cgd
226 1.11 mycroft if (uio->uio_resid <= 0)
227 1.11 mycroft panic("ureadc: non-positive resid");
228 1.9 cgd again:
229 1.11 mycroft if (uio->uio_iovcnt <= 0)
230 1.11 mycroft panic("ureadc: non-positive iovcnt");
231 1.9 cgd iov = uio->uio_iov;
232 1.11 mycroft if (iov->iov_len <= 0) {
233 1.9 cgd uio->uio_iovcnt--;
234 1.9 cgd uio->uio_iov++;
235 1.9 cgd goto again;
236 1.9 cgd }
237 1.126 yamt if (!VMSPACE_IS_KERNEL_P(uio->uio_vmspace)) {
238 1.9 cgd if (subyte(iov->iov_base, c) < 0)
239 1.9 cgd return (EFAULT);
240 1.126 yamt } else {
241 1.39 kleink *(char *)iov->iov_base = c;
242 1.9 cgd }
243 1.155 christos iov->iov_base = (char *)iov->iov_base + 1;
244 1.9 cgd iov->iov_len--;
245 1.9 cgd uio->uio_resid--;
246 1.9 cgd uio->uio_offset++;
247 1.9 cgd return (0);
248 1.82 thorpej }
249 1.82 thorpej
250 1.82 thorpej /*
251 1.126 yamt * Like copyin(), but operates on an arbitrary vmspace.
252 1.82 thorpej */
253 1.82 thorpej int
254 1.126 yamt copyin_vmspace(struct vmspace *vm, const void *uaddr, void *kaddr, size_t len)
255 1.82 thorpej {
256 1.82 thorpej struct iovec iov;
257 1.82 thorpej struct uio uio;
258 1.82 thorpej int error;
259 1.82 thorpej
260 1.82 thorpej if (len == 0)
261 1.82 thorpej return (0);
262 1.82 thorpej
263 1.126 yamt if (VMSPACE_IS_KERNEL_P(vm)) {
264 1.126 yamt return kcopy(uaddr, kaddr, len);
265 1.126 yamt }
266 1.126 yamt if (__predict_true(vm == curproc->p_vmspace)) {
267 1.118 christos return copyin(uaddr, kaddr, len);
268 1.126 yamt }
269 1.118 christos
270 1.82 thorpej iov.iov_base = kaddr;
271 1.82 thorpej iov.iov_len = len;
272 1.82 thorpej uio.uio_iov = &iov;
273 1.82 thorpej uio.uio_iovcnt = 1;
274 1.191 rmind uio.uio_offset = (off_t)(uintptr_t)uaddr;
275 1.82 thorpej uio.uio_resid = len;
276 1.82 thorpej uio.uio_rw = UIO_READ;
277 1.134 yamt UIO_SETUP_SYSSPACE(&uio);
278 1.126 yamt error = uvm_io(&vm->vm_map, &uio);
279 1.82 thorpej
280 1.82 thorpej return (error);
281 1.82 thorpej }
282 1.82 thorpej
283 1.82 thorpej /*
284 1.126 yamt * Like copyout(), but operates on an arbitrary vmspace.
285 1.82 thorpej */
286 1.82 thorpej int
287 1.126 yamt copyout_vmspace(struct vmspace *vm, const void *kaddr, void *uaddr, size_t len)
288 1.82 thorpej {
289 1.82 thorpej struct iovec iov;
290 1.82 thorpej struct uio uio;
291 1.82 thorpej int error;
292 1.82 thorpej
293 1.82 thorpej if (len == 0)
294 1.82 thorpej return (0);
295 1.82 thorpej
296 1.126 yamt if (VMSPACE_IS_KERNEL_P(vm)) {
297 1.126 yamt return kcopy(kaddr, uaddr, len);
298 1.126 yamt }
299 1.126 yamt if (__predict_true(vm == curproc->p_vmspace)) {
300 1.118 christos return copyout(kaddr, uaddr, len);
301 1.126 yamt }
302 1.118 christos
303 1.116 christos iov.iov_base = __UNCONST(kaddr); /* XXXUNCONST cast away const */
304 1.82 thorpej iov.iov_len = len;
305 1.82 thorpej uio.uio_iov = &iov;
306 1.82 thorpej uio.uio_iovcnt = 1;
307 1.191 rmind uio.uio_offset = (off_t)(uintptr_t)uaddr;
308 1.82 thorpej uio.uio_resid = len;
309 1.82 thorpej uio.uio_rw = UIO_WRITE;
310 1.134 yamt UIO_SETUP_SYSSPACE(&uio);
311 1.126 yamt error = uvm_io(&vm->vm_map, &uio);
312 1.126 yamt
313 1.126 yamt return (error);
314 1.126 yamt }
315 1.126 yamt
/*
 * copyin() variant for an arbitrary process: take a reference on the
 * vmspace of `p', copy through copyin_vmspace(), then drop the
 * reference.  Returns the error from proc_vmspace_getref() if the
 * reference cannot be obtained, otherwise the result of the copy.
 */
int
copyin_proc(struct proc *p, const void *uaddr, void *kaddr, size_t len)
{
	struct vmspace *space;
	int rv;

	rv = proc_vmspace_getref(p, &space);
	if (rv == 0) {
		rv = copyin_vmspace(space, uaddr, kaddr, len);
		uvmspace_free(space);
	}

	return rv;
}
334 1.82 thorpej
/*
 * copyout() variant for an arbitrary process: take a reference on the
 * vmspace of `p', copy through copyout_vmspace(), then drop the
 * reference.  Returns the error from proc_vmspace_getref() if the
 * reference cannot be obtained, otherwise the result of the copy.
 */
int
copyout_proc(struct proc *p, const void *kaddr, void *uaddr, size_t len)
{
	struct vmspace *space;
	int rv;

	rv = proc_vmspace_getref(p, &space);
	if (rv == 0) {
		rv = copyout_vmspace(space, kaddr, uaddr, len);
		uvmspace_free(space);
	}

	return rv;
}
353 1.10 cgd
354 1.10 cgd /*
355 1.119 reinoud * Like copyin(), except it operates on kernel addresses when the FKIOCTL
356 1.119 reinoud * flag is passed in `ioctlflags' from the ioctl call.
357 1.119 reinoud */
358 1.119 reinoud int
359 1.119 reinoud ioctl_copyin(int ioctlflags, const void *src, void *dst, size_t len)
360 1.119 reinoud {
361 1.119 reinoud if (ioctlflags & FKIOCTL)
362 1.119 reinoud return kcopy(src, dst, len);
363 1.119 reinoud return copyin(src, dst, len);
364 1.119 reinoud }
365 1.119 reinoud
366 1.119 reinoud /*
367 1.119 reinoud * Like copyout(), except it operates on kernel addresses when the FKIOCTL
368 1.119 reinoud * flag is passed in `ioctlflags' from the ioctl call.
369 1.119 reinoud */
370 1.119 reinoud int
371 1.119 reinoud ioctl_copyout(int ioctlflags, const void *src, void *dst, size_t len)
372 1.119 reinoud {
373 1.119 reinoud if (ioctlflags & FKIOCTL)
374 1.119 reinoud return kcopy(src, dst, len);
375 1.119 reinoud return copyout(src, dst, len);
376 1.119 reinoud }
377 1.119 reinoud
378 1.80 christos static void *
379 1.117 thorpej hook_establish(hook_list_t *list, void (*fn)(void *), void *arg)
380 1.14 cgd {
381 1.80 christos struct hook_desc *hd;
382 1.14 cgd
383 1.80 christos hd = malloc(sizeof(*hd), M_DEVBUF, M_NOWAIT);
384 1.80 christos if (hd == NULL)
385 1.59 enami return (NULL);
386 1.14 cgd
387 1.80 christos hd->hk_fn = fn;
388 1.80 christos hd->hk_arg = arg;
389 1.80 christos LIST_INSERT_HEAD(list, hd, hk_list);
390 1.14 cgd
391 1.80 christos return (hd);
392 1.14 cgd }
393 1.14 cgd
394 1.80 christos static void
395 1.150 yamt hook_disestablish(hook_list_t *list, void *vhook)
396 1.14 cgd {
397 1.14 cgd #ifdef DIAGNOSTIC
398 1.80 christos struct hook_desc *hd;
399 1.14 cgd
400 1.83 matt LIST_FOREACH(hd, list, hk_list) {
401 1.80 christos if (hd == vhook)
402 1.14 cgd break;
403 1.83 matt }
404 1.83 matt
405 1.80 christos if (hd == NULL)
406 1.83 matt panic("hook_disestablish: hook %p not established", vhook);
407 1.14 cgd #endif
408 1.80 christos LIST_REMOVE((struct hook_desc *)vhook, hk_list);
409 1.80 christos free(vhook, M_DEVBUF);
410 1.80 christos }
411 1.80 christos
412 1.80 christos static void
413 1.117 thorpej hook_destroy(hook_list_t *list)
414 1.80 christos {
415 1.80 christos struct hook_desc *hd;
416 1.80 christos
417 1.87 matt while ((hd = LIST_FIRST(list)) != NULL) {
418 1.80 christos LIST_REMOVE(hd, hk_list);
419 1.80 christos free(hd, M_DEVBUF);
420 1.80 christos }
421 1.80 christos }
422 1.14 cgd
423 1.80 christos static void
424 1.117 thorpej hook_proc_run(hook_list_t *list, struct proc *p)
425 1.80 christos {
426 1.80 christos struct hook_desc *hd;
427 1.80 christos
428 1.178 dyoung LIST_FOREACH(hd, list, hk_list)
429 1.178 dyoung ((void (*)(struct proc *, void *))*hd->hk_fn)(p, hd->hk_arg);
430 1.80 christos }
431 1.80 christos
432 1.80 christos /*
433 1.80 christos * "Shutdown hook" types, functions, and variables.
434 1.80 christos *
435 1.80 christos * Should be invoked immediately before the
436 1.80 christos * system is halted or rebooted, i.e. after file systems unmounted,
437 1.80 christos * after crash dump done, etc.
438 1.80 christos *
439 1.80 christos * Each shutdown hook is removed from the list before it's run, so that
440 1.80 christos * it won't be run again.
441 1.80 christos */
442 1.80 christos
443 1.117 thorpej static hook_list_t shutdownhook_list;
444 1.80 christos
445 1.80 christos void *
446 1.117 thorpej shutdownhook_establish(void (*fn)(void *), void *arg)
447 1.80 christos {
448 1.80 christos return hook_establish(&shutdownhook_list, fn, arg);
449 1.80 christos }
450 1.80 christos
451 1.80 christos void
452 1.117 thorpej shutdownhook_disestablish(void *vhook)
453 1.80 christos {
454 1.89 simonb hook_disestablish(&shutdownhook_list, vhook);
455 1.14 cgd }
456 1.14 cgd
457 1.14 cgd /*
458 1.14 cgd * Run shutdown hooks. Should be invoked immediately before the
459 1.14 cgd * system is halted or rebooted, i.e. after file systems unmounted,
460 1.14 cgd * after crash dump done, etc.
461 1.17 cgd *
462 1.17 cgd * Each shutdown hook is removed from the list before it's run, so that
463 1.17 cgd * it won't be run again.
464 1.14 cgd */
465 1.14 cgd void
466 1.117 thorpej doshutdownhooks(void)
467 1.14 cgd {
468 1.80 christos struct hook_desc *dp;
469 1.14 cgd
470 1.87 matt while ((dp = LIST_FIRST(&shutdownhook_list)) != NULL) {
471 1.80 christos LIST_REMOVE(dp, hk_list);
472 1.80 christos (*dp->hk_fn)(dp->hk_arg);
473 1.17 cgd #if 0
474 1.17 cgd /*
475 1.17 cgd * Don't bother freeing the hook structure,, since we may
476 1.17 cgd * be rebooting because of a memory corruption problem,
477 1.17 cgd * and this might only make things worse. It doesn't
478 1.17 cgd * matter, anyway, since the system is just about to
479 1.17 cgd * reboot.
480 1.17 cgd */
481 1.17 cgd free(dp, M_DEVBUF);
482 1.17 cgd #endif
483 1.52 augustss }
484 1.52 augustss }
485 1.52 augustss
486 1.52 augustss /*
487 1.80 christos * "Mountroot hook" types, functions, and variables.
488 1.80 christos */
489 1.80 christos
490 1.117 thorpej static hook_list_t mountroothook_list;
491 1.80 christos
492 1.80 christos void *
493 1.117 thorpej mountroothook_establish(void (*fn)(struct device *), struct device *dev)
494 1.80 christos {
495 1.109 junyoung return hook_establish(&mountroothook_list, (void (*)(void *))fn, dev);
496 1.80 christos }
497 1.80 christos
498 1.80 christos void
499 1.117 thorpej mountroothook_disestablish(void *vhook)
500 1.80 christos {
501 1.89 simonb hook_disestablish(&mountroothook_list, vhook);
502 1.80 christos }
503 1.80 christos
504 1.80 christos void
505 1.117 thorpej mountroothook_destroy(void)
506 1.80 christos {
507 1.80 christos hook_destroy(&mountroothook_list);
508 1.80 christos }
509 1.80 christos
510 1.80 christos void
511 1.117 thorpej domountroothook(void)
512 1.80 christos {
513 1.80 christos struct hook_desc *hd;
514 1.80 christos
515 1.83 matt LIST_FOREACH(hd, &mountroothook_list, hk_list) {
516 1.80 christos if (hd->hk_arg == (void *)root_device) {
517 1.80 christos (*hd->hk_fn)(hd->hk_arg);
518 1.80 christos return;
519 1.80 christos }
520 1.80 christos }
521 1.80 christos }
522 1.80 christos
523 1.117 thorpej static hook_list_t exechook_list;
524 1.80 christos
525 1.80 christos void *
526 1.117 thorpej exechook_establish(void (*fn)(struct proc *, void *), void *arg)
527 1.80 christos {
528 1.109 junyoung return hook_establish(&exechook_list, (void (*)(void *))fn, arg);
529 1.80 christos }
530 1.80 christos
531 1.80 christos void
532 1.117 thorpej exechook_disestablish(void *vhook)
533 1.80 christos {
534 1.80 christos hook_disestablish(&exechook_list, vhook);
535 1.80 christos }
536 1.80 christos
537 1.80 christos /*
538 1.80 christos * Run exec hooks.
539 1.80 christos */
540 1.80 christos void
541 1.117 thorpej doexechooks(struct proc *p)
542 1.80 christos {
543 1.80 christos hook_proc_run(&exechook_list, p);
544 1.80 christos }
545 1.80 christos
546 1.117 thorpej static hook_list_t exithook_list;
547 1.80 christos
548 1.80 christos void *
549 1.117 thorpej exithook_establish(void (*fn)(struct proc *, void *), void *arg)
550 1.80 christos {
551 1.109 junyoung return hook_establish(&exithook_list, (void (*)(void *))fn, arg);
552 1.80 christos }
553 1.80 christos
554 1.80 christos void
555 1.117 thorpej exithook_disestablish(void *vhook)
556 1.80 christos {
557 1.80 christos hook_disestablish(&exithook_list, vhook);
558 1.80 christos }
559 1.80 christos
560 1.80 christos /*
561 1.80 christos * Run exit hooks.
562 1.80 christos */
563 1.80 christos void
564 1.117 thorpej doexithooks(struct proc *p)
565 1.80 christos {
566 1.80 christos hook_proc_run(&exithook_list, p);
567 1.96 thorpej }
568 1.96 thorpej
569 1.117 thorpej static hook_list_t forkhook_list;
570 1.96 thorpej
571 1.96 thorpej void *
572 1.117 thorpej forkhook_establish(void (*fn)(struct proc *, struct proc *))
573 1.96 thorpej {
574 1.109 junyoung return hook_establish(&forkhook_list, (void (*)(void *))fn, NULL);
575 1.96 thorpej }
576 1.96 thorpej
577 1.96 thorpej void
578 1.117 thorpej forkhook_disestablish(void *vhook)
579 1.96 thorpej {
580 1.96 thorpej hook_disestablish(&forkhook_list, vhook);
581 1.96 thorpej }
582 1.96 thorpej
583 1.96 thorpej /*
584 1.96 thorpej * Run fork hooks.
585 1.96 thorpej */
586 1.96 thorpej void
587 1.117 thorpej doforkhooks(struct proc *p2, struct proc *p1)
588 1.96 thorpej {
589 1.96 thorpej struct hook_desc *hd;
590 1.96 thorpej
591 1.96 thorpej LIST_FOREACH(hd, &forkhook_list, hk_list) {
592 1.109 junyoung ((void (*)(struct proc *, struct proc *))*hd->hk_fn)
593 1.96 thorpej (p2, p1);
594 1.96 thorpej }
595 1.80 christos }
596 1.80 christos
597 1.80 christos /*
598 1.52 augustss * "Power hook" types, functions, and variables.
599 1.71 augustss * The list of power hooks is kept ordered with the last registered hook
600 1.71 augustss * first.
601 1.71 augustss * When running the hooks on power down the hooks are called in reverse
602 1.71 augustss * registration order, when powering up in registration order.
603 1.52 augustss */
604 1.52 augustss struct powerhook_desc {
605 1.71 augustss CIRCLEQ_ENTRY(powerhook_desc) sfd_list;
606 1.109 junyoung void (*sfd_fn)(int, void *);
607 1.52 augustss void *sfd_arg;
608 1.144 jmcneill char sfd_name[16];
609 1.52 augustss };
610 1.52 augustss
611 1.117 thorpej static CIRCLEQ_HEAD(, powerhook_desc) powerhook_list =
612 1.117 thorpej CIRCLEQ_HEAD_INITIALIZER(powerhook_list);
613 1.52 augustss
614 1.52 augustss void *
615 1.145 dogcow powerhook_establish(const char *name, void (*fn)(int, void *), void *arg)
616 1.52 augustss {
617 1.52 augustss struct powerhook_desc *ndp;
618 1.52 augustss
619 1.52 augustss ndp = (struct powerhook_desc *)
620 1.52 augustss malloc(sizeof(*ndp), M_DEVBUF, M_NOWAIT);
621 1.52 augustss if (ndp == NULL)
622 1.59 enami return (NULL);
623 1.52 augustss
624 1.52 augustss ndp->sfd_fn = fn;
625 1.52 augustss ndp->sfd_arg = arg;
626 1.144 jmcneill strlcpy(ndp->sfd_name, name, sizeof(ndp->sfd_name));
627 1.71 augustss CIRCLEQ_INSERT_HEAD(&powerhook_list, ndp, sfd_list);
628 1.52 augustss
629 1.167 jmcneill aprint_error("%s: WARNING: powerhook_establish is deprecated\n", name);
630 1.52 augustss return (ndp);
631 1.52 augustss }
632 1.52 augustss
633 1.52 augustss void
634 1.117 thorpej powerhook_disestablish(void *vhook)
635 1.52 augustss {
636 1.52 augustss #ifdef DIAGNOSTIC
637 1.52 augustss struct powerhook_desc *dp;
638 1.52 augustss
639 1.71 augustss CIRCLEQ_FOREACH(dp, &powerhook_list, sfd_list)
640 1.52 augustss if (dp == vhook)
641 1.71 augustss goto found;
642 1.83 matt panic("powerhook_disestablish: hook %p not established", vhook);
643 1.71 augustss found:
644 1.52 augustss #endif
645 1.52 augustss
646 1.71 augustss CIRCLEQ_REMOVE(&powerhook_list, (struct powerhook_desc *)vhook,
647 1.71 augustss sfd_list);
648 1.52 augustss free(vhook, M_DEVBUF);
649 1.52 augustss }
650 1.52 augustss
651 1.52 augustss /*
652 1.52 augustss * Run power hooks.
653 1.52 augustss */
654 1.52 augustss void
655 1.117 thorpej dopowerhooks(int why)
656 1.52 augustss {
657 1.52 augustss struct powerhook_desc *dp;
658 1.52 augustss
659 1.144 jmcneill #ifdef POWERHOOK_DEBUG
660 1.162 christos const char *why_name;
661 1.163 degroote static const char * pwr_names[] = {PWR_NAMES};
662 1.163 degroote why_name = why < __arraycount(pwr_names) ? pwr_names[why] : "???";
663 1.144 jmcneill #endif
664 1.144 jmcneill
665 1.73 takemura if (why == PWR_RESUME || why == PWR_SOFTRESUME) {
666 1.71 augustss CIRCLEQ_FOREACH_REVERSE(dp, &powerhook_list, sfd_list) {
667 1.144 jmcneill #ifdef POWERHOOK_DEBUG
668 1.162 christos printf("dopowerhooks %s: %s (%p)\n", why_name, dp->sfd_name, dp);
669 1.144 jmcneill #endif
670 1.71 augustss (*dp->sfd_fn)(why, dp->sfd_arg);
671 1.71 augustss }
672 1.71 augustss } else {
673 1.71 augustss CIRCLEQ_FOREACH(dp, &powerhook_list, sfd_list) {
674 1.144 jmcneill #ifdef POWERHOOK_DEBUG
675 1.162 christos printf("dopowerhooks %s: %s (%p)\n", why_name, dp->sfd_name, dp);
676 1.144 jmcneill #endif
677 1.71 augustss (*dp->sfd_fn)(why, dp->sfd_arg);
678 1.71 augustss }
679 1.18 thorpej }
680 1.144 jmcneill
681 1.144 jmcneill #ifdef POWERHOOK_DEBUG
682 1.162 christos printf("dopowerhooks: %s done\n", why_name);
683 1.144 jmcneill #endif
684 1.18 thorpej }
685 1.18 thorpej
686 1.160 christos static int
687 1.160 christos isswap(struct device *dv)
688 1.160 christos {
689 1.160 christos struct dkwedge_info wi;
690 1.160 christos struct vnode *vn;
691 1.160 christos int error;
692 1.160 christos
693 1.160 christos if (device_class(dv) != DV_DISK || !device_is_a(dv, "dk"))
694 1.160 christos return 0;
695 1.160 christos
696 1.160 christos if ((vn = opendisk(dv)) == NULL)
697 1.160 christos return 0;
698 1.160 christos
699 1.166 pooka error = VOP_IOCTL(vn, DIOCGWEDGEINFO, &wi, FREAD, NOCRED);
700 1.166 pooka VOP_CLOSE(vn, FREAD, NOCRED);
701 1.160 christos vput(vn);
702 1.160 christos if (error) {
703 1.160 christos #ifdef DEBUG_WEDGE
704 1.184 cegger printf("%s: Get wedge info returned %d\n", device_xname(dv), error);
705 1.160 christos #endif
706 1.160 christos return 0;
707 1.160 christos }
708 1.160 christos return strcmp(wi.dkw_ptype, DKW_PTYPE_SWAP) == 0;
709 1.160 christos }
710 1.160 christos
711 1.18 thorpej /*
712 1.18 thorpej * Determine the root device and, if instructed to, the root file system.
713 1.18 thorpej */
714 1.18 thorpej
715 1.18 thorpej #include "md.h"
716 1.18 thorpej
#if NMD > 0
/* Autoconfiguration driver record of the md device. */
extern struct cfdriver md_cd;

/*
 * Non-zero when unit 0 of the md device should be used as the boot
 * device; the initial value comes from the MEMORY_DISK_IS_ROOT option.
 */
#if defined(MEMORY_DISK_IS_ROOT)
int md_is_root = 1;
#else
int md_is_root = 0;
#endif /* MEMORY_DISK_IS_ROOT */
#endif /* NMD > 0 */
725 1.108 christos
/*
 * The device and wedge that we booted from.  If booted_wedge is NULL,
 * then we might consult booted_partition.
 */
struct device	*booted_device;
struct device	*booted_wedge;
int		booted_partition;
733 1.113 thorpej
/*
 * True when a device is named with partition letters: it is of disk
 * class and is not a "dk" wedge.  Note that `dv' is evaluated twice.
 * XXX Checking for a wedge by driver name is kinda gross.
 */
#define	DEV_USES_PARTITIONS(dv)						\
	(device_class((dv)) == DV_DISK &&				\
	 !device_is_a((dv), "dk"))
741 1.113 thorpej
742 1.18 thorpej void
743 1.117 thorpej setroot(struct device *bootdv, int bootpartition)
744 1.18 thorpej {
745 1.18 thorpej struct device *dv;
746 1.159 dyoung int len, majdev;
747 1.25 mrg dev_t nrootdev;
748 1.26 thorpej dev_t ndumpdev = NODEV;
749 1.18 thorpej char buf[128];
750 1.18 thorpej const char *rootdevname;
751 1.26 thorpej const char *dumpdevname;
752 1.26 thorpej struct device *rootdv = NULL; /* XXX gcc -Wuninitialized */
753 1.26 thorpej struct device *dumpdv = NULL;
754 1.18 thorpej struct ifnet *ifp;
755 1.18 thorpej const char *deffsname;
756 1.18 thorpej struct vfsops *vops;
757 1.18 thorpej
758 1.157 manu #ifdef TFTPROOT
759 1.157 manu if (tftproot_dhcpboot(bootdv) != 0)
760 1.157 manu boothowto |= RB_ASKNAME;
761 1.157 manu #endif
762 1.157 manu
763 1.187 ad #if NMD > 0
764 1.187 ad if (md_is_root) {
765 1.190 drochner /*
766 1.190 drochner * XXX there should be "root on md0" in the config file,
767 1.190 drochner * but it isn't always
768 1.190 drochner */
769 1.190 drochner bootdv = md_cd.cd_devs[0];
770 1.187 ad bootpartition = 0;
771 1.28 leo }
772 1.18 thorpej #endif
773 1.18 thorpej
774 1.18 thorpej /*
775 1.18 thorpej * If NFS is specified as the file system, and we found
776 1.18 thorpej * a DV_DISK boot device (or no boot device at all), then
777 1.18 thorpej * find a reasonable network interface for "rootspec".
778 1.18 thorpej */
779 1.18 thorpej vops = vfs_getopsbyname("nfs");
780 1.18 thorpej if (vops != NULL && vops->vfs_mountroot == mountroot &&
781 1.18 thorpej rootspec == NULL &&
782 1.124 thorpej (bootdv == NULL || device_class(bootdv) != DV_IFNET)) {
783 1.115 matt IFNET_FOREACH(ifp) {
784 1.18 thorpej if ((ifp->if_flags &
785 1.18 thorpej (IFF_LOOPBACK|IFF_POINTOPOINT)) == 0)
786 1.18 thorpej break;
787 1.83 matt }
788 1.18 thorpej if (ifp == NULL) {
789 1.18 thorpej /*
790 1.18 thorpej * Can't find a suitable interface; ask the
791 1.18 thorpej * user.
792 1.18 thorpej */
793 1.18 thorpej boothowto |= RB_ASKNAME;
794 1.18 thorpej } else {
795 1.18 thorpej /*
796 1.18 thorpej * Have a suitable interface; behave as if
797 1.18 thorpej * the user specified this interface.
798 1.18 thorpej */
799 1.18 thorpej rootspec = (const char *)ifp->if_xname;
800 1.18 thorpej }
801 1.18 thorpej }
802 1.165 ad if (vops != NULL)
803 1.165 ad vfs_delref(vops);
804 1.24 thorpej
805 1.24 thorpej /*
806 1.24 thorpej * If the root is wildcarded and the boot device wasn't determined,
807 1.24 thorpej * ask the user.
808 1.24 thorpej */
809 1.24 thorpej if (rootspec == NULL && bootdv == NULL)
810 1.24 thorpej boothowto |= RB_ASKNAME;
811 1.18 thorpej
812 1.18 thorpej top:
813 1.18 thorpej if (boothowto & RB_ASKNAME) {
814 1.26 thorpej struct device *defdumpdv;
815 1.26 thorpej
816 1.18 thorpej for (;;) {
817 1.18 thorpej printf("root device");
818 1.18 thorpej if (bootdv != NULL) {
819 1.184 cegger printf(" (default %s", device_xname(bootdv));
820 1.113 thorpej if (DEV_USES_PARTITIONS(bootdv))
821 1.18 thorpej printf("%c", bootpartition + 'a');
822 1.18 thorpej printf(")");
823 1.18 thorpej }
824 1.18 thorpej printf(": ");
825 1.64 itojun len = cngetsn(buf, sizeof(buf));
826 1.18 thorpej if (len == 0 && bootdv != NULL) {
827 1.184 cegger strlcpy(buf, device_xname(bootdv), sizeof(buf));
828 1.18 thorpej len = strlen(buf);
829 1.18 thorpej }
830 1.18 thorpej if (len > 0 && buf[len - 1] == '*') {
831 1.18 thorpej buf[--len] = '\0';
832 1.51 thorpej dv = getdisk(buf, len, 1, &nrootdev, 0);
833 1.18 thorpej if (dv != NULL) {
834 1.18 thorpej rootdv = dv;
835 1.25 mrg break;
836 1.18 thorpej }
837 1.18 thorpej }
838 1.51 thorpej dv = getdisk(buf, len, bootpartition, &nrootdev, 0);
839 1.18 thorpej if (dv != NULL) {
840 1.18 thorpej rootdv = dv;
841 1.18 thorpej break;
842 1.18 thorpej }
843 1.18 thorpej }
844 1.18 thorpej
845 1.26 thorpej /*
846 1.26 thorpej * Set up the default dump device. If root is on
847 1.26 thorpej * a network device, there is no default dump
848 1.26 thorpej * device, since we don't support dumps to the
849 1.26 thorpej * network.
850 1.26 thorpej */
851 1.113 thorpej if (DEV_USES_PARTITIONS(rootdv) == 0)
852 1.26 thorpej defdumpdv = NULL;
853 1.26 thorpej else
854 1.26 thorpej defdumpdv = rootdv;
855 1.26 thorpej
856 1.26 thorpej for (;;) {
857 1.26 thorpej printf("dump device");
858 1.26 thorpej if (defdumpdv != NULL) {
859 1.26 thorpej /*
860 1.26 thorpej * Note, we know it's a disk if we get here.
861 1.26 thorpej */
862 1.184 cegger printf(" (default %sb)", device_xname(defdumpdv));
863 1.26 thorpej }
864 1.26 thorpej printf(": ");
865 1.64 itojun len = cngetsn(buf, sizeof(buf));
866 1.26 thorpej if (len == 0) {
867 1.26 thorpej if (defdumpdv != NULL) {
868 1.26 thorpej ndumpdev = MAKEDISKDEV(major(nrootdev),
869 1.26 thorpej DISKUNIT(nrootdev), 1);
870 1.26 thorpej }
871 1.54 enami dumpdv = defdumpdv;
872 1.26 thorpej break;
873 1.26 thorpej }
874 1.26 thorpej if (len == 4 && strcmp(buf, "none") == 0) {
875 1.55 enami dumpdv = NULL;
876 1.54 enami break;
877 1.26 thorpej }
878 1.51 thorpej dv = getdisk(buf, len, 1, &ndumpdev, 1);
879 1.55 enami if (dv != NULL) {
880 1.26 thorpej dumpdv = dv;
881 1.26 thorpej break;
882 1.26 thorpej }
883 1.26 thorpej }
884 1.26 thorpej
885 1.18 thorpej rootdev = nrootdev;
886 1.26 thorpej dumpdev = ndumpdev;
887 1.18 thorpej
888 1.36 thorpej for (vops = LIST_FIRST(&vfs_list); vops != NULL;
889 1.36 thorpej vops = LIST_NEXT(vops, vfs_list)) {
890 1.36 thorpej if (vops->vfs_mountroot != NULL &&
891 1.36 thorpej vops->vfs_mountroot == mountroot)
892 1.38 fvdl break;
893 1.18 thorpej }
894 1.36 thorpej
895 1.36 thorpej if (vops == NULL) {
896 1.18 thorpej mountroot = NULL;
897 1.18 thorpej deffsname = "generic";
898 1.18 thorpej } else
899 1.36 thorpej deffsname = vops->vfs_name;
900 1.36 thorpej
901 1.18 thorpej for (;;) {
902 1.18 thorpej printf("file system (default %s): ", deffsname);
903 1.64 itojun len = cngetsn(buf, sizeof(buf));
904 1.18 thorpej if (len == 0)
905 1.18 thorpej break;
906 1.18 thorpej if (len == 4 && strcmp(buf, "halt") == 0)
907 1.23 gwr cpu_reboot(RB_HALT, NULL);
908 1.76 thorpej else if (len == 6 && strcmp(buf, "reboot") == 0)
909 1.76 thorpej cpu_reboot(0, NULL);
910 1.78 thorpej #if defined(DDB)
911 1.78 thorpej else if (len == 3 && strcmp(buf, "ddb") == 0) {
912 1.78 thorpej console_debugger();
913 1.78 thorpej }
914 1.78 thorpej #endif
915 1.18 thorpej else if (len == 7 && strcmp(buf, "generic") == 0) {
916 1.18 thorpej mountroot = NULL;
917 1.18 thorpej break;
918 1.18 thorpej }
919 1.18 thorpej vops = vfs_getopsbyname(buf);
920 1.18 thorpej if (vops == NULL || vops->vfs_mountroot == NULL) {
921 1.18 thorpej printf("use one of: generic");
922 1.36 thorpej for (vops = LIST_FIRST(&vfs_list);
923 1.36 thorpej vops != NULL;
924 1.36 thorpej vops = LIST_NEXT(vops, vfs_list)) {
925 1.36 thorpej if (vops->vfs_mountroot != NULL)
926 1.36 thorpej printf(" %s", vops->vfs_name);
927 1.36 thorpej }
928 1.78 thorpej #if defined(DDB)
929 1.78 thorpej printf(" ddb");
930 1.78 thorpej #endif
931 1.76 thorpej printf(" halt reboot\n");
932 1.18 thorpej } else {
933 1.18 thorpej mountroot = vops->vfs_mountroot;
934 1.165 ad vfs_delref(vops);
935 1.18 thorpej break;
936 1.18 thorpej }
937 1.18 thorpej }
938 1.18 thorpej
939 1.18 thorpej } else if (rootspec == NULL) {
940 1.18 thorpej /*
941 1.18 thorpej * Wildcarded root; use the boot device.
942 1.18 thorpej */
943 1.26 thorpej rootdv = bootdv;
944 1.26 thorpej
945 1.188 christos if (bootdv)
946 1.188 christos majdev = devsw_name2blk(device_xname(bootdv), NULL, 0);
947 1.188 christos else
948 1.188 christos majdev = -1;
949 1.18 thorpej if (majdev >= 0) {
950 1.18 thorpej /*
951 1.113 thorpej * Root is on a disk. `bootpartition' is root,
952 1.113 thorpej * unless the device does not use partitions.
953 1.18 thorpej */
954 1.113 thorpej if (DEV_USES_PARTITIONS(bootdv))
955 1.135 thorpej rootdev = MAKEDISKDEV(majdev,
956 1.135 thorpej device_unit(bootdv),
957 1.135 thorpej bootpartition);
958 1.113 thorpej else
959 1.135 thorpej rootdev = makedev(majdev, device_unit(bootdv));
960 1.18 thorpej }
961 1.18 thorpej } else {
962 1.18 thorpej
963 1.18 thorpej /*
964 1.25 mrg * `root on <dev> ...'
965 1.18 thorpej */
966 1.18 thorpej
967 1.18 thorpej /*
968 1.18 thorpej * If it's a network interface, we can bail out
969 1.18 thorpej * early.
970 1.18 thorpej */
971 1.56 enami dv = finddevice(rootspec);
972 1.124 thorpej if (dv != NULL && device_class(dv) == DV_IFNET) {
973 1.26 thorpej rootdv = dv;
974 1.26 thorpej goto haveroot;
975 1.18 thorpej }
976 1.18 thorpej
977 1.159 dyoung if (rootdev == NODEV &&
978 1.159 dyoung device_class(dv) == DV_DISK && device_is_a(dv, "dk") &&
979 1.184 cegger (majdev = devsw_name2blk(device_xname(dv), NULL, 0)) >= 0)
980 1.159 dyoung rootdev = makedev(majdev, device_unit(dv));
981 1.159 dyoung
982 1.88 gehenna rootdevname = devsw_blk2name(major(rootdev));
983 1.18 thorpej if (rootdevname == NULL) {
984 1.18 thorpej printf("unknown device major 0x%x\n", rootdev);
985 1.18 thorpej boothowto |= RB_ASKNAME;
986 1.18 thorpej goto top;
987 1.18 thorpej }
988 1.41 perry memset(buf, 0, sizeof(buf));
989 1.110 itojun snprintf(buf, sizeof(buf), "%s%d", rootdevname,
990 1.110 itojun DISKUNIT(rootdev));
991 1.18 thorpej
992 1.56 enami rootdv = finddevice(buf);
993 1.26 thorpej if (rootdv == NULL) {
994 1.18 thorpej printf("device %s (0x%x) not configured\n",
995 1.18 thorpej buf, rootdev);
996 1.18 thorpej boothowto |= RB_ASKNAME;
997 1.18 thorpej goto top;
998 1.18 thorpej }
999 1.26 thorpej }
1000 1.18 thorpej
1001 1.26 thorpej haveroot:
1002 1.18 thorpej
1003 1.18 thorpej root_device = rootdv;
1004 1.18 thorpej
1005 1.124 thorpej switch (device_class(rootdv)) {
1006 1.18 thorpej case DV_IFNET:
1007 1.139 christos case DV_DISK:
1008 1.184 cegger aprint_normal("root on %s", device_xname(rootdv));
1009 1.140 christos if (DEV_USES_PARTITIONS(rootdv))
1010 1.139 christos aprint_normal("%c", DISKPART(rootdev) + 'a');
1011 1.18 thorpej break;
1012 1.18 thorpej
1013 1.18 thorpej default:
1014 1.18 thorpej printf("can't determine root device\n");
1015 1.18 thorpej boothowto |= RB_ASKNAME;
1016 1.18 thorpej goto top;
1017 1.18 thorpej }
1018 1.26 thorpej
1019 1.26 thorpej /*
1020 1.26 thorpej * Now configure the dump device.
1021 1.55 enami *
1022 1.26 thorpej * If we haven't figured out the dump device, do so, with
1023 1.26 thorpej * the following rules:
1024 1.26 thorpej *
1025 1.26 thorpej * (a) We already know dumpdv in the RB_ASKNAME case.
1026 1.26 thorpej *
1027 1.26 thorpej * (b) If dumpspec is set, try to use it. If the device
1028 1.26 thorpej * is not available, punt.
1029 1.26 thorpej *
1030 1.26 thorpej * (c) If dumpspec is not set, the dump device is
1031 1.26 thorpej * wildcarded or unspecified. If the root device
1032 1.26 thorpej * is DV_IFNET, punt. Otherwise, use partition b
1033 1.26 thorpej * of the root device.
1034 1.26 thorpej */
1035 1.26 thorpej
1036 1.55 enami if (boothowto & RB_ASKNAME) { /* (a) */
1037 1.55 enami if (dumpdv == NULL)
1038 1.55 enami goto nodumpdev;
1039 1.55 enami } else if (dumpspec != NULL) { /* (b) */
1040 1.55 enami if (strcmp(dumpspec, "none") == 0 || dumpdev == NODEV) {
1041 1.26 thorpej /*
1042 1.55 enami * Operator doesn't want a dump device.
1043 1.55 enami * Or looks like they tried to pick a network
1044 1.26 thorpej * device. Oops.
1045 1.26 thorpej */
1046 1.26 thorpej goto nodumpdev;
1047 1.26 thorpej }
1048 1.26 thorpej
1049 1.88 gehenna dumpdevname = devsw_blk2name(major(dumpdev));
1050 1.26 thorpej if (dumpdevname == NULL)
1051 1.26 thorpej goto nodumpdev;
1052 1.41 perry memset(buf, 0, sizeof(buf));
1053 1.110 itojun snprintf(buf, sizeof(buf), "%s%d", dumpdevname,
1054 1.110 itojun DISKUNIT(dumpdev));
1055 1.26 thorpej
1056 1.56 enami dumpdv = finddevice(buf);
1057 1.56 enami if (dumpdv == NULL) {
1058 1.26 thorpej /*
1059 1.26 thorpej * Device not configured.
1060 1.26 thorpej */
1061 1.26 thorpej goto nodumpdev;
1062 1.26 thorpej }
1063 1.55 enami } else { /* (c) */
1064 1.160 christos if (DEV_USES_PARTITIONS(rootdv) == 0) {
1065 1.160 christos for (dv = TAILQ_FIRST(&alldevs); dv != NULL;
1066 1.160 christos dv = TAILQ_NEXT(dv, dv_list))
1067 1.160 christos if (isswap(dv))
1068 1.160 christos break;
1069 1.160 christos if (dv == NULL)
1070 1.160 christos goto nodumpdev;
1071 1.160 christos
1072 1.184 cegger majdev = devsw_name2blk(device_xname(dv), NULL, 0);
1073 1.160 christos if (majdev < 0)
1074 1.160 christos goto nodumpdev;
1075 1.160 christos dumpdv = dv;
1076 1.160 christos dumpdev = makedev(majdev, device_unit(dumpdv));
1077 1.160 christos } else {
1078 1.55 enami dumpdv = rootdv;
1079 1.55 enami dumpdev = MAKEDISKDEV(major(rootdev),
1080 1.135 thorpej device_unit(dumpdv), 1);
1081 1.55 enami }
1082 1.26 thorpej }
1083 1.26 thorpej
1084 1.175 ad dumpcdev = devsw_blk2chr(dumpdev);
1085 1.184 cegger aprint_normal(" dumps on %s", device_xname(dumpdv));
1086 1.140 christos if (DEV_USES_PARTITIONS(dumpdv))
1087 1.140 christos aprint_normal("%c", DISKPART(dumpdev) + 'a');
1088 1.140 christos aprint_normal("\n");
1089 1.26 thorpej return;
1090 1.26 thorpej
1091 1.26 thorpej nodumpdev:
1092 1.26 thorpej dumpdev = NODEV;
1093 1.175 ad dumpcdev = NODEV;
1094 1.100 thorpej aprint_normal("\n");
1095 1.18 thorpej }
1096 1.18 thorpej
/*
 * Look up a device by name.
 *
 * A name that getwedgename() recognises (it carries the "wedge:" prefix)
 * is resolved with dkwedge_find_by_wname() using the text after the
 * prefix.  Any other name is handed to device_find_by_xname().  The
 * result of whichever lookup was used is returned unchanged.
 */
static struct device *
finddevice(const char *name)
{
	const char *wedge;

	wedge = getwedgename(name, strlen(name));
	if (wedge == NULL)
		return device_find_by_xname(name);

	return dkwedge_find_by_wname(wedge);
}
1107 1.56 enami
1108 1.56 enami static struct device *
1109 1.117 thorpej getdisk(char *str, int len, int defpart, dev_t *devp, int isdump)
1110 1.18 thorpej {
1111 1.28 leo struct device *dv;
1112 1.18 thorpej
1113 1.51 thorpej if ((dv = parsedisk(str, len, defpart, devp)) == NULL) {
1114 1.18 thorpej printf("use one of:");
1115 1.83 matt TAILQ_FOREACH(dv, &alldevs, dv_list) {
1116 1.113 thorpej if (DEV_USES_PARTITIONS(dv))
1117 1.184 cegger printf(" %s[a-%c]", device_xname(dv),
1118 1.19 cgd 'a' + MAXPARTITIONS - 1);
1119 1.124 thorpej else if (device_class(dv) == DV_DISK)
1120 1.184 cegger printf(" %s", device_xname(dv));
1121 1.124 thorpej if (isdump == 0 && device_class(dv) == DV_IFNET)
1122 1.184 cegger printf(" %s", device_xname(dv));
1123 1.18 thorpej }
1124 1.159 dyoung dkwedge_print_wnames();
1125 1.26 thorpej if (isdump)
1126 1.26 thorpej printf(" none");
1127 1.78 thorpej #if defined(DDB)
1128 1.78 thorpej printf(" ddb");
1129 1.78 thorpej #endif
1130 1.76 thorpej printf(" halt reboot\n");
1131 1.18 thorpej }
1132 1.159 dyoung return dv;
1133 1.159 dyoung }
1134 1.159 dyoung
/*
 * If `name' (of length `namelen') begins with the prefix "wedge:",
 * return a pointer to the first character after the prefix; otherwise
 * return NULL.  The returned pointer aliases `name'; nothing is copied.
 */
static const char *
getwedgename(const char *name, int namelen)
{
	static const char prefix[] = "wedge:";
	const int prefixlen = strlen(prefix);

	if (namelen >= prefixlen && strncmp(name, prefix, prefixlen) == 0)
		return name + prefixlen;

	return NULL;
}
1146 1.18 thorpej
1147 1.18 thorpej static struct device *
1148 1.117 thorpej parsedisk(char *str, int len, int defpart, dev_t *devp)
1149 1.18 thorpej {
1150 1.18 thorpej struct device *dv;
1151 1.159 dyoung const char *wname;
1152 1.18 thorpej char *cp, c;
1153 1.29 drochner int majdev, part;
1154 1.18 thorpej if (len == 0)
1155 1.18 thorpej return (NULL);
1156 1.18 thorpej
1157 1.18 thorpej if (len == 4 && strcmp(str, "halt") == 0)
1158 1.23 gwr cpu_reboot(RB_HALT, NULL);
1159 1.76 thorpej else if (len == 6 && strcmp(str, "reboot") == 0)
1160 1.76 thorpej cpu_reboot(0, NULL);
1161 1.78 thorpej #if defined(DDB)
1162 1.78 thorpej else if (len == 3 && strcmp(str, "ddb") == 0)
1163 1.78 thorpej console_debugger();
1164 1.78 thorpej #endif
1165 1.18 thorpej
1166 1.18 thorpej cp = str + len - 1;
1167 1.18 thorpej c = *cp;
1168 1.159 dyoung
1169 1.159 dyoung if ((wname = getwedgename(str, len)) != NULL) {
1170 1.159 dyoung if ((dv = dkwedge_find_by_wname(wname)) == NULL)
1171 1.159 dyoung return NULL;
1172 1.159 dyoung part = defpart;
1173 1.159 dyoung goto gotdisk;
1174 1.159 dyoung } else if (c >= 'a' && c <= ('a' + MAXPARTITIONS - 1)) {
1175 1.18 thorpej part = c - 'a';
1176 1.18 thorpej *cp = '\0';
1177 1.18 thorpej } else
1178 1.18 thorpej part = defpart;
1179 1.18 thorpej
1180 1.56 enami dv = finddevice(str);
1181 1.56 enami if (dv != NULL) {
1182 1.124 thorpej if (device_class(dv) == DV_DISK) {
1183 1.18 thorpej gotdisk:
1184 1.184 cegger majdev = devsw_name2blk(device_xname(dv), NULL, 0);
1185 1.18 thorpej if (majdev < 0)
1186 1.18 thorpej panic("parsedisk");
1187 1.113 thorpej if (DEV_USES_PARTITIONS(dv))
1188 1.135 thorpej *devp = MAKEDISKDEV(majdev, device_unit(dv),
1189 1.135 thorpej part);
1190 1.113 thorpej else
1191 1.135 thorpej *devp = makedev(majdev, device_unit(dv));
1192 1.18 thorpej }
1193 1.18 thorpej
1194 1.124 thorpej if (device_class(dv) == DV_IFNET)
1195 1.18 thorpej *devp = NODEV;
1196 1.18 thorpej }
1197 1.18 thorpej
1198 1.18 thorpej *cp = c;
1199 1.18 thorpej return (dv);
1200 1.48 lukem }
1201 1.48 lukem
/*
 * snprintf() `bytes' into `buf', reformatting it so that the number
 * (plus a possible ` x' prefix extension and the suffix) fits into `len'
 * bytes, including the terminating NUL.
 *
 *   buf      destination buffer; set to "" first whenever len > 0
 *   len      size of `buf'; must be at least 4 + strlen(suffix)
 *   bytes    the value to format
 *   suffix   unit string appended after the multiplier prefix
 *   divisor  step between prefixes; 1024 selects the prefix set " KMGTPE",
 *            any other value selects the SI set " kMGTPE"
 *
 * Returns the value returned by snprintf(), or -1 if `buf' or `suffix'
 * is NULL or `len' is too small.
 *
 * E.g., given a len of 9, a suffix of `B' and a divisor of 1024:
 *	bytes		result
 *	-----		------
 *	   99999	`99999 B'
 *	  100000	`97 KB'
 *	66715648	`65152 KB'
 *     252215296	`240 MB'
 */
int
humanize_number(char *buf, size_t len, uint64_t bytes, const char *suffix,
    int divisor)
{
	/* prefixes are: (none), kilo, Mega, Giga, Tera, Peta, Exa */
	const char *prefixes;
	const uint64_t u64max = ~(uint64_t)0;
	int r;
	uint64_t umax;
	size_t i, ndigits, suffixlen;
	bool unbounded;

	if (buf == NULL || suffix == NULL)
		return (-1);
	if (len > 0)
		buf[0] = '\0';
	suffixlen = strlen(suffix);
	/* check if enough room for `x y' + suffix + `\0' */
	if (len < 4 + suffixlen)
		return (-1);

	if (divisor == 1024) {
		/*
		 * binary multiplies
		 * XXX IEC 60027-2 recommends Ki, Mi, Gi...
		 */
		prefixes = " KMGTPE";
	} else
		prefixes = " kMGTPE"; /* SI for decimal multiplies */

	/*
	 * umax is the smallest value that no longer fits in the digits
	 * available.  If computing it would overflow a uint64_t, every
	 * possible value of `bytes' fits and no scaling is needed.
	 * Without this check umax wraps around (to 0 for very large
	 * buffers) and small values get scaled down to nothing.
	 */
	ndigits = len - suffixlen - 3;
	umax = 1;
	unbounded = false;
	for (i = 0; i < ndigits; i++) {
		if (umax > u64max / 10) {
			unbounded = true;
			break;
		}
		umax *= 10;
	}

	/* Scale down one prefix at a time until the number fits. */
	for (i = 0; !unbounded && bytes >= umax && prefixes[i + 1] != '\0';
	    i++)
		bytes /= divisor;

	/* prefixes[0] is a blank, so the unscaled form prints as `N B'. */
	r = snprintf(buf, len, "%llu%s%c%s", (unsigned long long)bytes,
	    i == 0 ? "" : " ", prefixes[i], suffix);

	return (r);
}
1254 1.49 lukem
/*
 * Format `bytes' into `buf' (of size `len') by calling humanize_number()
 * with a suffix of "B" and a divisor of 1024.  If the resulting string
 * ends in " B", i.e. no multiplier prefix was applied, that tail is cut
 * off so only the number remains.
 *
 * Returns humanize_number()'s return value unchanged, even when the
 * string was shortened afterwards.
 */
int
format_bytes(char *buf, size_t len, uint64_t bytes)
{
	size_t tail;
	int rv;

	rv = humanize_number(buf, len, bytes, "B", 1024);
	if (rv == -1)
		return (rv);

	/* nuke the trailing ` B' if it exists */
	tail = strlen(buf) - 2;
	if (strcmp(buf + tail, " B") == 0)
		buf[tail] = '\0';

	return (rv);
}
1270 1.81 christos
/*
 * Return true if system call tracing is enabled for the specified process.
 *
 * With SYSCALL_DEBUG compiled in the answer is always true.  Otherwise
 * the process is checked for the ktrace syscall/sysret facilities (when
 * KTRACE is configured) and for PSL_SYSCALL (when PTRACE is configured).
 */
bool
trace_is_enabled(struct proc *p)
{
#if defined(SYSCALL_DEBUG)
	return (true);
#else
	bool traced = false;

#ifdef KTRACE
	if (ISSET(p->p_traceflag, (KTRFAC_SYSCALL | KTRFAC_SYSRET)))
		traced = true;
#endif
#ifdef PTRACE
	if (!traced && ISSET(p->p_slflag, PSL_SYSCALL))
		traced = true;
#endif

	return (traced);
#endif
}
1291 1.130 thorpej
1292 1.130 thorpej /*
1293 1.92 jdolecek * Start trace of particular system call. If process is being traced,
1294 1.92 jdolecek * this routine is called by MD syscall dispatch code just before
1295 1.92 jdolecek * a system call is actually executed.
1296 1.92 jdolecek */
1297 1.81 christos int
1298 1.177 dsl trace_enter(register_t code, const register_t *args, int narg)
1299 1.81 christos {
1300 1.81 christos #ifdef SYSCALL_DEBUG
1301 1.171 dsl scdebug_call(code, args);
1302 1.81 christos #endif /* SYSCALL_DEBUG */
1303 1.81 christos
1304 1.177 dsl ktrsyscall(code, args, narg);
1305 1.81 christos
1306 1.142 matt #ifdef PTRACE
1307 1.172 dsl if ((curlwp->l_proc->p_slflag & (PSL_SYSCALL|PSL_TRACED)) ==
1308 1.151 ad (PSL_SYSCALL|PSL_TRACED))
1309 1.172 dsl process_stoptrace();
1310 1.142 matt #endif
1311 1.81 christos return 0;
1312 1.81 christos }
1313 1.81 christos
1314 1.92 jdolecek /*
1315 1.92 jdolecek * End trace of particular system call. If process is being traced,
1316 1.92 jdolecek * this routine is called by MD syscall dispatch code just after
1317 1.92 jdolecek * a system call finishes.
1318 1.92 jdolecek * MD caller guarantees the passed 'code' is within the supported
1319 1.92 jdolecek * system call number range for emulation the process runs under.
1320 1.92 jdolecek */
1321 1.81 christos void
1322 1.177 dsl trace_exit(register_t code, register_t rval[], int error)
1323 1.81 christos {
1324 1.81 christos #ifdef SYSCALL_DEBUG
1325 1.171 dsl scdebug_ret(code, error, rval);
1326 1.81 christos #endif /* SYSCALL_DEBUG */
1327 1.81 christos
1328 1.164 ad ktrsysret(code, error, rval);
1329 1.128 christos
1330 1.142 matt #ifdef PTRACE
1331 1.172 dsl if ((curlwp->l_proc->p_slflag & (PSL_SYSCALL|PSL_TRACED)) ==
1332 1.151 ad (PSL_SYSCALL|PSL_TRACED))
1333 1.172 dsl process_stoptrace();
1334 1.142 matt #endif
1335 1.10 cgd }
1336 1.194 ad
1337 1.194 ad int
1338 1.194 ad syscall_establish(const struct emul *em, const struct syscall_package *sp)
1339 1.194 ad {
1340 1.194 ad struct sysent *sy;
1341 1.194 ad int i;
1342 1.194 ad
1343 1.194 ad KASSERT(mutex_owned(&module_lock));
1344 1.194 ad
1345 1.194 ad if (em == NULL) {
1346 1.194 ad em = &emul_netbsd;
1347 1.194 ad }
1348 1.194 ad sy = em->e_sysent;
1349 1.194 ad
1350 1.194 ad /*
1351 1.194 ad * Ensure that all preconditions are valid, since this is
1352 1.194 ad * an all or nothing deal. Once a system call is entered,
1353 1.194 ad * it can become busy and we could be unable to remove it
1354 1.194 ad * on error.
1355 1.194 ad */
1356 1.194 ad for (i = 0; sp[i].sp_call != NULL; i++) {
1357 1.194 ad if (sy[sp[i].sp_code].sy_call != sys_nomodule) {
1358 1.194 ad return EBUSY;
1359 1.194 ad }
1360 1.194 ad }
1361 1.194 ad /* Everything looks good, patch them in. */
1362 1.194 ad for (i = 0; sp[i].sp_call != NULL; i++) {
1363 1.194 ad sy[sp[i].sp_code].sy_call = sp[i].sp_call;
1364 1.194 ad }
1365 1.194 ad
1366 1.194 ad return 0;
1367 1.194 ad }
1368 1.194 ad
1369 1.194 ad int
1370 1.194 ad syscall_disestablish(const struct emul *em, const struct syscall_package *sp)
1371 1.194 ad {
1372 1.194 ad struct sysent *sy;
1373 1.194 ad uint64_t where;
1374 1.194 ad lwp_t *l;
1375 1.194 ad int i;
1376 1.194 ad
1377 1.194 ad KASSERT(mutex_owned(&module_lock));
1378 1.194 ad
1379 1.194 ad if (em == NULL) {
1380 1.194 ad em = &emul_netbsd;
1381 1.194 ad }
1382 1.194 ad sy = em->e_sysent;
1383 1.194 ad
1384 1.194 ad /*
1385 1.194 ad * First, patch the system calls to sys_nomodule to gate further
1386 1.194 ad * activity.
1387 1.194 ad */
1388 1.194 ad for (i = 0; sp[i].sp_call != NULL; i++) {
1389 1.194 ad KASSERT(sy[sp[i].sp_code].sy_call == sp[i].sp_call);
1390 1.194 ad sy[sp[i].sp_code].sy_call = sys_nomodule;
1391 1.194 ad }
1392 1.194 ad
1393 1.194 ad /*
1394 1.194 ad * Run a cross call to cycle through all CPUs. This does two
1395 1.194 ad * things: lock activity provides a barrier and makes our update
1396 1.194 ad * of sy_call visible to all CPUs, and upon return we can be sure
1397 1.194 ad * that we see pertinent values of l_sysent posted by remote CPUs.
1398 1.194 ad */
1399 1.194 ad where = xc_broadcast(0, (xcfunc_t)nullop, NULL, NULL);
1400 1.194 ad xc_wait(where);
1401 1.194 ad
1402 1.194 ad /*
1403 1.194 ad * Now it's safe to check l_sysent. Run through all LWPs and see
1404 1.194 ad * if anyone is still using the system call.
1405 1.194 ad */
1406 1.194 ad for (i = 0; sp[i].sp_call != NULL; i++) {
1407 1.194 ad mutex_enter(proc_lock);
1408 1.194 ad LIST_FOREACH(l, &alllwp, l_list) {
1409 1.194 ad if (l->l_sysent == &sy[sp[i].sp_code]) {
1410 1.194 ad break;
1411 1.194 ad }
1412 1.194 ad }
1413 1.194 ad mutex_exit(proc_lock);
1414 1.194 ad if (l == NULL) {
1415 1.194 ad continue;
1416 1.194 ad }
1417 1.194 ad /*
1418 1.194 ad * We lose: one or more calls are still in use. Put back
1419 1.194 ad * the old entrypoints and act like nothing happened.
1420 1.194 ad * When we drop module_lock, any system calls held in
1421 1.194 ad * sys_nomodule() will be restarted.
1422 1.194 ad */
1423 1.194 ad for (i = 0; sp[i].sp_call != NULL; i++) {
1424 1.194 ad sy[sp[i].sp_code].sy_call = sp[i].sp_call;
1425 1.194 ad }
1426 1.194 ad return EBUSY;
1427 1.194 ad }
1428 1.194 ad
1429 1.194 ad return 0;
1430 1.194 ad }
1431