kern_subr.c revision 1.139 1 1.139 christos /* $NetBSD: kern_subr.c,v 1.139 2006/08/12 19:58:55 christos Exp $ */
2 1.31 thorpej
3 1.31 thorpej /*-
4 1.78 thorpej * Copyright (c) 1997, 1998, 1999, 2002 The NetBSD Foundation, Inc.
5 1.31 thorpej * All rights reserved.
6 1.31 thorpej *
7 1.31 thorpej * This code is derived from software contributed to The NetBSD Foundation
8 1.31 thorpej * by Jason R. Thorpe of the Numerical Aerospace Simulation Facility,
9 1.48 lukem * NASA Ames Research Center, and by Luke Mewburn.
10 1.31 thorpej *
11 1.31 thorpej * Redistribution and use in source and binary forms, with or without
12 1.31 thorpej * modification, are permitted provided that the following conditions
13 1.31 thorpej * are met:
14 1.31 thorpej * 1. Redistributions of source code must retain the above copyright
15 1.31 thorpej * notice, this list of conditions and the following disclaimer.
16 1.31 thorpej * 2. Redistributions in binary form must reproduce the above copyright
17 1.31 thorpej * notice, this list of conditions and the following disclaimer in the
18 1.31 thorpej * documentation and/or other materials provided with the distribution.
19 1.31 thorpej * 3. All advertising materials mentioning features or use of this software
20 1.31 thorpej * must display the following acknowledgement:
21 1.31 thorpej * This product includes software developed by the NetBSD
22 1.31 thorpej * Foundation, Inc. and its contributors.
23 1.31 thorpej * 4. Neither the name of The NetBSD Foundation nor the names of its
24 1.31 thorpej * contributors may be used to endorse or promote products derived
25 1.31 thorpej * from this software without specific prior written permission.
26 1.31 thorpej *
27 1.31 thorpej * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
28 1.31 thorpej * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
29 1.31 thorpej * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
30 1.31 thorpej * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
31 1.31 thorpej * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
32 1.31 thorpej * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
33 1.31 thorpej * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
34 1.31 thorpej * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
35 1.31 thorpej * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
36 1.31 thorpej * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
37 1.31 thorpej * POSSIBILITY OF SUCH DAMAGE.
38 1.31 thorpej */
39 1.12 cgd
40 1.9 cgd /*
41 1.10 cgd * Copyright (c) 1982, 1986, 1991, 1993
42 1.10 cgd * The Regents of the University of California. All rights reserved.
43 1.9 cgd * (c) UNIX System Laboratories, Inc.
44 1.9 cgd * All or some portions of this file are derived from material licensed
45 1.9 cgd * to the University of California by American Telephone and Telegraph
46 1.9 cgd * Co. or Unix System Laboratories, Inc. and are reproduced herein with
47 1.9 cgd * the permission of UNIX System Laboratories, Inc.
48 1.9 cgd *
49 1.18 thorpej * Copyright (c) 1992, 1993
50 1.18 thorpej * The Regents of the University of California. All rights reserved.
51 1.18 thorpej *
52 1.18 thorpej * This software was developed by the Computer Systems Engineering group
53 1.18 thorpej * at Lawrence Berkeley Laboratory under DARPA contract BG 91-66 and
54 1.18 thorpej * contributed to Berkeley.
55 1.18 thorpej *
56 1.18 thorpej * All advertising materials mentioning features or use of this software
57 1.18 thorpej * must display the following acknowledgement:
58 1.18 thorpej * This product includes software developed by the University of
59 1.18 thorpej * California, Lawrence Berkeley Laboratory.
60 1.18 thorpej *
61 1.9 cgd * Redistribution and use in source and binary forms, with or without
62 1.9 cgd * modification, are permitted provided that the following conditions
63 1.9 cgd * are met:
64 1.9 cgd * 1. Redistributions of source code must retain the above copyright
65 1.9 cgd * notice, this list of conditions and the following disclaimer.
66 1.9 cgd * 2. Redistributions in binary form must reproduce the above copyright
67 1.9 cgd * notice, this list of conditions and the following disclaimer in the
68 1.9 cgd * documentation and/or other materials provided with the distribution.
69 1.103 agc * 3. Neither the name of the University nor the names of its contributors
70 1.9 cgd * may be used to endorse or promote products derived from this software
71 1.9 cgd * without specific prior written permission.
72 1.9 cgd *
73 1.9 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
74 1.9 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
75 1.9 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
76 1.9 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
77 1.9 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
78 1.9 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
79 1.9 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
80 1.9 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
81 1.9 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
82 1.9 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
83 1.9 cgd * SUCH DAMAGE.
84 1.9 cgd *
85 1.38 fvdl * @(#)kern_subr.c 8.4 (Berkeley) 2/14/95
86 1.9 cgd */
87 1.77 lukem
88 1.77 lukem #include <sys/cdefs.h>
89 1.139 christos __KERNEL_RCSID(0, "$NetBSD: kern_subr.c,v 1.139 2006/08/12 19:58:55 christos Exp $");
90 1.34 mrg
91 1.78 thorpej #include "opt_ddb.h"
92 1.43 jonathan #include "opt_md.h"
93 1.81 christos #include "opt_syscall_debug.h"
94 1.81 christos #include "opt_ktrace.h"
95 1.81 christos #include "opt_systrace.h"
96 1.9 cgd
97 1.9 cgd #include <sys/param.h>
98 1.9 cgd #include <sys/systm.h>
99 1.9 cgd #include <sys/proc.h>
100 1.10 cgd #include <sys/malloc.h>
101 1.18 thorpej #include <sys/mount.h>
102 1.18 thorpej #include <sys/device.h>
103 1.18 thorpej #include <sys/reboot.h>
104 1.18 thorpej #include <sys/conf.h>
105 1.18 thorpej #include <sys/disklabel.h>
106 1.10 cgd #include <sys/queue.h>
107 1.81 christos #include <sys/systrace.h>
108 1.81 christos #include <sys/ktrace.h>
109 1.128 christos #include <sys/ptrace.h>
110 1.119 reinoud #include <sys/fcntl.h>
111 1.9 cgd
112 1.82 thorpej #include <uvm/uvm_extern.h>
113 1.82 thorpej
114 1.18 thorpej #include <dev/cons.h>
115 1.18 thorpej
116 1.18 thorpej #include <net/if.h>
117 1.18 thorpej
118 1.18 thorpej /* XXX these should eventually move to subr_autoconf.c */
119 1.109 junyoung static struct device *finddevice(const char *);
120 1.109 junyoung static struct device *getdisk(char *, int, int, dev_t *, int);
121 1.109 junyoung static struct device *parsedisk(char *, int, int, dev_t *);
122 1.18 thorpej
123 1.80 christos /*
124 1.80 christos * A generic linear hook.
125 1.80 christos */
126 1.80 christos struct hook_desc {
127 1.80 christos LIST_ENTRY(hook_desc) hk_list;
128 1.109 junyoung void (*hk_fn)(void *);
129 1.80 christos void *hk_arg;
130 1.80 christos };
131 1.80 christos typedef LIST_HEAD(, hook_desc) hook_list_t;
132 1.80 christos
133 1.97 thorpej MALLOC_DEFINE(M_IOV, "iov", "large iov's");
134 1.97 thorpej
135 1.126 yamt void
136 1.126 yamt uio_setup_sysspace(struct uio *uio)
137 1.126 yamt {
138 1.126 yamt
139 1.126 yamt uio->uio_vmspace = vmspace_kernel();
140 1.126 yamt }
141 1.126 yamt
142 1.11 mycroft int
143 1.117 thorpej uiomove(void *buf, size_t n, struct uio *uio)
144 1.9 cgd {
145 1.126 yamt struct vmspace *vm = uio->uio_vmspace;
146 1.63 augustss struct iovec *iov;
147 1.9 cgd u_int cnt;
148 1.9 cgd int error = 0;
149 1.16 christos char *cp = buf;
150 1.112 yamt int hold_count;
151 1.112 yamt
152 1.112 yamt hold_count = KERNEL_LOCK_RELEASE_ALL();
153 1.112 yamt
154 1.138 yamt ASSERT_SLEEPABLE(NULL, "uiomove");
155 1.68 enami
156 1.68 enami #ifdef DIAGNOSTIC
157 1.9 cgd if (uio->uio_rw != UIO_READ && uio->uio_rw != UIO_WRITE)
158 1.9 cgd panic("uiomove: mode");
159 1.9 cgd #endif
160 1.9 cgd while (n > 0 && uio->uio_resid) {
161 1.9 cgd iov = uio->uio_iov;
162 1.9 cgd cnt = iov->iov_len;
163 1.9 cgd if (cnt == 0) {
164 1.105 yamt KASSERT(uio->uio_iovcnt > 0);
165 1.9 cgd uio->uio_iov++;
166 1.9 cgd uio->uio_iovcnt--;
167 1.9 cgd continue;
168 1.9 cgd }
169 1.9 cgd if (cnt > n)
170 1.9 cgd cnt = n;
171 1.126 yamt if (!VMSPACE_IS_KERNEL_P(vm)) {
172 1.104 yamt if (curcpu()->ci_schedstate.spc_flags &
173 1.67 thorpej SPCF_SHOULDYIELD)
174 1.95 thorpej preempt(1);
175 1.126 yamt }
176 1.9 cgd
177 1.126 yamt if (uio->uio_rw == UIO_READ) {
178 1.126 yamt error = copyout_vmspace(vm, cp, iov->iov_base,
179 1.126 yamt cnt);
180 1.126 yamt } else {
181 1.126 yamt error = copyin_vmspace(vm, iov->iov_base, cp,
182 1.126 yamt cnt);
183 1.126 yamt }
184 1.126 yamt if (error) {
185 1.9 cgd break;
186 1.9 cgd }
187 1.44 kleink iov->iov_base = (caddr_t)iov->iov_base + cnt;
188 1.9 cgd iov->iov_len -= cnt;
189 1.9 cgd uio->uio_resid -= cnt;
190 1.9 cgd uio->uio_offset += cnt;
191 1.9 cgd cp += cnt;
192 1.85 thorpej KDASSERT(cnt <= n);
193 1.9 cgd n -= cnt;
194 1.9 cgd }
195 1.112 yamt KERNEL_LOCK_ACQUIRE_COUNT(hold_count);
196 1.9 cgd return (error);
197 1.9 cgd }
198 1.9 cgd
199 1.9 cgd /*
200 1.110 itojun * Wrapper for uiomove() that validates the arguments against a known-good
201 1.111 matt * kernel buffer.
202 1.110 itojun */
203 1.110 itojun int
204 1.111 matt uiomove_frombuf(void *buf, size_t buflen, struct uio *uio)
205 1.110 itojun {
206 1.111 matt size_t offset;
207 1.110 itojun
208 1.110 itojun if (uio->uio_offset < 0 || uio->uio_resid < 0 ||
209 1.110 itojun (offset = uio->uio_offset) != uio->uio_offset)
210 1.110 itojun return (EINVAL);
211 1.111 matt if (offset >= buflen)
212 1.110 itojun return (0);
213 1.111 matt return (uiomove((char *)buf + offset, buflen - offset, uio));
214 1.110 itojun }
215 1.110 itojun
216 1.110 itojun /*
217 1.9 cgd * Give next character to user as result of read.
218 1.9 cgd */
219 1.11 mycroft int
220 1.117 thorpej ureadc(int c, struct uio *uio)
221 1.9 cgd {
222 1.63 augustss struct iovec *iov;
223 1.9 cgd
224 1.11 mycroft if (uio->uio_resid <= 0)
225 1.11 mycroft panic("ureadc: non-positive resid");
226 1.9 cgd again:
227 1.11 mycroft if (uio->uio_iovcnt <= 0)
228 1.11 mycroft panic("ureadc: non-positive iovcnt");
229 1.9 cgd iov = uio->uio_iov;
230 1.11 mycroft if (iov->iov_len <= 0) {
231 1.9 cgd uio->uio_iovcnt--;
232 1.9 cgd uio->uio_iov++;
233 1.9 cgd goto again;
234 1.9 cgd }
235 1.126 yamt if (!VMSPACE_IS_KERNEL_P(uio->uio_vmspace)) {
236 1.9 cgd if (subyte(iov->iov_base, c) < 0)
237 1.9 cgd return (EFAULT);
238 1.126 yamt } else {
239 1.39 kleink *(char *)iov->iov_base = c;
240 1.9 cgd }
241 1.44 kleink iov->iov_base = (caddr_t)iov->iov_base + 1;
242 1.9 cgd iov->iov_len--;
243 1.9 cgd uio->uio_resid--;
244 1.9 cgd uio->uio_offset++;
245 1.9 cgd return (0);
246 1.82 thorpej }
247 1.82 thorpej
248 1.82 thorpej /*
249 1.126 yamt * Like copyin(), but operates on an arbitrary vmspace.
250 1.82 thorpej */
251 1.82 thorpej int
252 1.126 yamt copyin_vmspace(struct vmspace *vm, const void *uaddr, void *kaddr, size_t len)
253 1.82 thorpej {
254 1.82 thorpej struct iovec iov;
255 1.82 thorpej struct uio uio;
256 1.82 thorpej int error;
257 1.82 thorpej
258 1.82 thorpej if (len == 0)
259 1.82 thorpej return (0);
260 1.82 thorpej
261 1.126 yamt if (VMSPACE_IS_KERNEL_P(vm)) {
262 1.126 yamt return kcopy(uaddr, kaddr, len);
263 1.126 yamt }
264 1.126 yamt if (__predict_true(vm == curproc->p_vmspace)) {
265 1.118 christos return copyin(uaddr, kaddr, len);
266 1.126 yamt }
267 1.118 christos
268 1.82 thorpej iov.iov_base = kaddr;
269 1.82 thorpej iov.iov_len = len;
270 1.82 thorpej uio.uio_iov = &iov;
271 1.82 thorpej uio.uio_iovcnt = 1;
272 1.82 thorpej uio.uio_offset = (off_t)(intptr_t)uaddr;
273 1.82 thorpej uio.uio_resid = len;
274 1.82 thorpej uio.uio_rw = UIO_READ;
275 1.134 yamt UIO_SETUP_SYSSPACE(&uio);
276 1.126 yamt error = uvm_io(&vm->vm_map, &uio);
277 1.82 thorpej
278 1.82 thorpej return (error);
279 1.82 thorpej }
280 1.82 thorpej
281 1.82 thorpej /*
282 1.126 yamt * Like copyout(), but operates on an arbitrary vmspace.
283 1.82 thorpej */
284 1.82 thorpej int
285 1.126 yamt copyout_vmspace(struct vmspace *vm, const void *kaddr, void *uaddr, size_t len)
286 1.82 thorpej {
287 1.82 thorpej struct iovec iov;
288 1.82 thorpej struct uio uio;
289 1.82 thorpej int error;
290 1.82 thorpej
291 1.82 thorpej if (len == 0)
292 1.82 thorpej return (0);
293 1.82 thorpej
294 1.126 yamt if (VMSPACE_IS_KERNEL_P(vm)) {
295 1.126 yamt return kcopy(kaddr, uaddr, len);
296 1.126 yamt }
297 1.126 yamt if (__predict_true(vm == curproc->p_vmspace)) {
298 1.118 christos return copyout(kaddr, uaddr, len);
299 1.126 yamt }
300 1.118 christos
301 1.116 christos iov.iov_base = __UNCONST(kaddr); /* XXXUNCONST cast away const */
302 1.82 thorpej iov.iov_len = len;
303 1.82 thorpej uio.uio_iov = &iov;
304 1.82 thorpej uio.uio_iovcnt = 1;
305 1.82 thorpej uio.uio_offset = (off_t)(intptr_t)uaddr;
306 1.82 thorpej uio.uio_resid = len;
307 1.82 thorpej uio.uio_rw = UIO_WRITE;
308 1.134 yamt UIO_SETUP_SYSSPACE(&uio);
309 1.126 yamt error = uvm_io(&vm->vm_map, &uio);
310 1.126 yamt
311 1.126 yamt return (error);
312 1.126 yamt }
313 1.126 yamt
314 1.126 yamt /*
315 1.126 yamt * Like copyin(), but operates on an arbitrary process.
316 1.126 yamt */
317 1.126 yamt int
318 1.126 yamt copyin_proc(struct proc *p, const void *uaddr, void *kaddr, size_t len)
319 1.126 yamt {
320 1.126 yamt struct vmspace *vm;
321 1.126 yamt int error;
322 1.126 yamt
323 1.126 yamt error = proc_vmspace_getref(p, &vm);
324 1.126 yamt if (error) {
325 1.126 yamt return error;
326 1.126 yamt }
327 1.126 yamt error = copyin_vmspace(vm, uaddr, kaddr, len);
328 1.126 yamt uvmspace_free(vm);
329 1.82 thorpej
330 1.126 yamt return error;
331 1.126 yamt }
332 1.82 thorpej
333 1.126 yamt /*
334 1.126 yamt * Like copyout(), but operates on an arbitrary process.
335 1.126 yamt */
336 1.126 yamt int
337 1.126 yamt copyout_proc(struct proc *p, const void *kaddr, void *uaddr, size_t len)
338 1.126 yamt {
339 1.126 yamt struct vmspace *vm;
340 1.126 yamt int error;
341 1.126 yamt
342 1.126 yamt error = proc_vmspace_getref(p, &vm);
343 1.126 yamt if (error) {
344 1.126 yamt return error;
345 1.126 yamt }
346 1.132 yamt error = copyout_vmspace(vm, kaddr, uaddr, len);
347 1.126 yamt uvmspace_free(vm);
348 1.126 yamt
349 1.126 yamt return error;
350 1.9 cgd }
351 1.10 cgd
352 1.10 cgd /*
353 1.119 reinoud * Like copyin(), except it operates on kernel addresses when the FKIOCTL
354 1.119 reinoud * flag is passed in `ioctlflags' from the ioctl call.
355 1.119 reinoud */
356 1.119 reinoud int
357 1.119 reinoud ioctl_copyin(int ioctlflags, const void *src, void *dst, size_t len)
358 1.119 reinoud {
359 1.119 reinoud if (ioctlflags & FKIOCTL)
360 1.119 reinoud return kcopy(src, dst, len);
361 1.119 reinoud return copyin(src, dst, len);
362 1.119 reinoud }
363 1.119 reinoud
364 1.119 reinoud /*
365 1.119 reinoud * Like copyout(), except it operates on kernel addresses when the FKIOCTL
366 1.119 reinoud * flag is passed in `ioctlflags' from the ioctl call.
367 1.119 reinoud */
368 1.119 reinoud int
369 1.119 reinoud ioctl_copyout(int ioctlflags, const void *src, void *dst, size_t len)
370 1.119 reinoud {
371 1.119 reinoud if (ioctlflags & FKIOCTL)
372 1.119 reinoud return kcopy(src, dst, len);
373 1.119 reinoud return copyout(src, dst, len);
374 1.119 reinoud }
375 1.119 reinoud
376 1.119 reinoud /*
377 1.10 cgd * General routine to allocate a hash table.
378 1.42 chs * Allocate enough memory to hold at least `elements' list-head pointers.
379 1.42 chs * Return a pointer to the allocated space and set *hashmask to a pattern
380 1.42 chs * suitable for masking a value to use as an index into the returned array.
381 1.10 cgd */
382 1.10 cgd void *
383 1.117 thorpej hashinit(u_int elements, enum hashtype htype, struct malloc_type *mtype,
384 1.117 thorpej int mflags, u_long *hashmask)
385 1.10 cgd {
386 1.84 thorpej u_long hashsize, i;
387 1.72 ad LIST_HEAD(, generic) *hashtbl_list;
388 1.72 ad TAILQ_HEAD(, generic) *hashtbl_tailq;
389 1.84 thorpej size_t esize;
390 1.72 ad void *p;
391 1.10 cgd
392 1.84 thorpej if (elements == 0)
393 1.10 cgd panic("hashinit: bad cnt");
394 1.42 chs for (hashsize = 1; hashsize < elements; hashsize <<= 1)
395 1.10 cgd continue;
396 1.72 ad
397 1.72 ad switch (htype) {
398 1.72 ad case HASH_LIST:
399 1.72 ad esize = sizeof(*hashtbl_list);
400 1.72 ad break;
401 1.72 ad case HASH_TAILQ:
402 1.72 ad esize = sizeof(*hashtbl_tailq);
403 1.72 ad break;
404 1.106 christos default:
405 1.72 ad #ifdef DIAGNOSTIC
406 1.72 ad panic("hashinit: invalid table type");
407 1.106 christos #else
408 1.106 christos return NULL;
409 1.72 ad #endif
410 1.72 ad }
411 1.72 ad
412 1.84 thorpej if ((p = malloc(hashsize * esize, mtype, mflags)) == NULL)
413 1.66 enami return (NULL);
414 1.72 ad
415 1.72 ad switch (htype) {
416 1.72 ad case HASH_LIST:
417 1.72 ad hashtbl_list = p;
418 1.72 ad for (i = 0; i < hashsize; i++)
419 1.72 ad LIST_INIT(&hashtbl_list[i]);
420 1.72 ad break;
421 1.72 ad case HASH_TAILQ:
422 1.72 ad hashtbl_tailq = p;
423 1.72 ad for (i = 0; i < hashsize; i++)
424 1.72 ad TAILQ_INIT(&hashtbl_tailq[i]);
425 1.72 ad break;
426 1.72 ad }
427 1.10 cgd *hashmask = hashsize - 1;
428 1.72 ad return (p);
429 1.61 jdolecek }
430 1.61 jdolecek
431 1.61 jdolecek /*
432 1.61 jdolecek * Free memory from hash table previosly allocated via hashinit().
433 1.61 jdolecek */
434 1.61 jdolecek void
435 1.117 thorpej hashdone(void *hashtbl, struct malloc_type *mtype)
436 1.61 jdolecek {
437 1.65 enami
438 1.72 ad free(hashtbl, mtype);
439 1.14 cgd }
440 1.14 cgd
441 1.14 cgd
442 1.80 christos static void *
443 1.117 thorpej hook_establish(hook_list_t *list, void (*fn)(void *), void *arg)
444 1.14 cgd {
445 1.80 christos struct hook_desc *hd;
446 1.14 cgd
447 1.80 christos hd = malloc(sizeof(*hd), M_DEVBUF, M_NOWAIT);
448 1.80 christos if (hd == NULL)
449 1.59 enami return (NULL);
450 1.14 cgd
451 1.80 christos hd->hk_fn = fn;
452 1.80 christos hd->hk_arg = arg;
453 1.80 christos LIST_INSERT_HEAD(list, hd, hk_list);
454 1.14 cgd
455 1.80 christos return (hd);
456 1.14 cgd }
457 1.14 cgd
458 1.80 christos static void
459 1.117 thorpej hook_disestablish(hook_list_t *list, void *vhook)
460 1.14 cgd {
461 1.14 cgd #ifdef DIAGNOSTIC
462 1.80 christos struct hook_desc *hd;
463 1.14 cgd
464 1.83 matt LIST_FOREACH(hd, list, hk_list) {
465 1.80 christos if (hd == vhook)
466 1.14 cgd break;
467 1.83 matt }
468 1.83 matt
469 1.80 christos if (hd == NULL)
470 1.83 matt panic("hook_disestablish: hook %p not established", vhook);
471 1.14 cgd #endif
472 1.80 christos LIST_REMOVE((struct hook_desc *)vhook, hk_list);
473 1.80 christos free(vhook, M_DEVBUF);
474 1.80 christos }
475 1.80 christos
476 1.80 christos static void
477 1.117 thorpej hook_destroy(hook_list_t *list)
478 1.80 christos {
479 1.80 christos struct hook_desc *hd;
480 1.80 christos
481 1.87 matt while ((hd = LIST_FIRST(list)) != NULL) {
482 1.80 christos LIST_REMOVE(hd, hk_list);
483 1.80 christos free(hd, M_DEVBUF);
484 1.80 christos }
485 1.80 christos }
486 1.14 cgd
487 1.80 christos static void
488 1.117 thorpej hook_proc_run(hook_list_t *list, struct proc *p)
489 1.80 christos {
490 1.80 christos struct hook_desc *hd;
491 1.80 christos
492 1.80 christos for (hd = LIST_FIRST(list); hd != NULL; hd = LIST_NEXT(hd, hk_list)) {
493 1.109 junyoung ((void (*)(struct proc *, void *))*hd->hk_fn)(p,
494 1.80 christos hd->hk_arg);
495 1.80 christos }
496 1.80 christos }
497 1.80 christos
498 1.80 christos /*
499 1.80 christos * "Shutdown hook" types, functions, and variables.
500 1.80 christos *
501 1.80 christos * Should be invoked immediately before the
502 1.80 christos * system is halted or rebooted, i.e. after file systems unmounted,
503 1.80 christos * after crash dump done, etc.
504 1.80 christos *
505 1.80 christos * Each shutdown hook is removed from the list before it's run, so that
506 1.80 christos * it won't be run again.
507 1.80 christos */
508 1.80 christos
509 1.117 thorpej static hook_list_t shutdownhook_list;
510 1.80 christos
511 1.80 christos void *
512 1.117 thorpej shutdownhook_establish(void (*fn)(void *), void *arg)
513 1.80 christos {
514 1.80 christos return hook_establish(&shutdownhook_list, fn, arg);
515 1.80 christos }
516 1.80 christos
517 1.80 christos void
518 1.117 thorpej shutdownhook_disestablish(void *vhook)
519 1.80 christos {
520 1.89 simonb hook_disestablish(&shutdownhook_list, vhook);
521 1.14 cgd }
522 1.14 cgd
523 1.14 cgd /*
524 1.14 cgd * Run shutdown hooks. Should be invoked immediately before the
525 1.14 cgd * system is halted or rebooted, i.e. after file systems unmounted,
526 1.14 cgd * after crash dump done, etc.
527 1.17 cgd *
528 1.17 cgd * Each shutdown hook is removed from the list before it's run, so that
529 1.17 cgd * it won't be run again.
530 1.14 cgd */
531 1.14 cgd void
532 1.117 thorpej doshutdownhooks(void)
533 1.14 cgd {
534 1.80 christos struct hook_desc *dp;
535 1.14 cgd
536 1.87 matt while ((dp = LIST_FIRST(&shutdownhook_list)) != NULL) {
537 1.80 christos LIST_REMOVE(dp, hk_list);
538 1.80 christos (*dp->hk_fn)(dp->hk_arg);
539 1.17 cgd #if 0
540 1.17 cgd /*
541 1.17 cgd * Don't bother freeing the hook structure,, since we may
542 1.17 cgd * be rebooting because of a memory corruption problem,
543 1.17 cgd * and this might only make things worse. It doesn't
544 1.17 cgd * matter, anyway, since the system is just about to
545 1.17 cgd * reboot.
546 1.17 cgd */
547 1.17 cgd free(dp, M_DEVBUF);
548 1.17 cgd #endif
549 1.52 augustss }
550 1.52 augustss }
551 1.52 augustss
552 1.52 augustss /*
553 1.80 christos * "Mountroot hook" types, functions, and variables.
554 1.80 christos */
555 1.80 christos
556 1.117 thorpej static hook_list_t mountroothook_list;
557 1.80 christos
558 1.80 christos void *
559 1.117 thorpej mountroothook_establish(void (*fn)(struct device *), struct device *dev)
560 1.80 christos {
561 1.109 junyoung return hook_establish(&mountroothook_list, (void (*)(void *))fn, dev);
562 1.80 christos }
563 1.80 christos
564 1.80 christos void
565 1.117 thorpej mountroothook_disestablish(void *vhook)
566 1.80 christos {
567 1.89 simonb hook_disestablish(&mountroothook_list, vhook);
568 1.80 christos }
569 1.80 christos
570 1.80 christos void
571 1.117 thorpej mountroothook_destroy(void)
572 1.80 christos {
573 1.80 christos hook_destroy(&mountroothook_list);
574 1.80 christos }
575 1.80 christos
576 1.80 christos void
577 1.117 thorpej domountroothook(void)
578 1.80 christos {
579 1.80 christos struct hook_desc *hd;
580 1.80 christos
581 1.83 matt LIST_FOREACH(hd, &mountroothook_list, hk_list) {
582 1.80 christos if (hd->hk_arg == (void *)root_device) {
583 1.80 christos (*hd->hk_fn)(hd->hk_arg);
584 1.80 christos return;
585 1.80 christos }
586 1.80 christos }
587 1.80 christos }
588 1.80 christos
589 1.117 thorpej static hook_list_t exechook_list;
590 1.80 christos
591 1.80 christos void *
592 1.117 thorpej exechook_establish(void (*fn)(struct proc *, void *), void *arg)
593 1.80 christos {
594 1.109 junyoung return hook_establish(&exechook_list, (void (*)(void *))fn, arg);
595 1.80 christos }
596 1.80 christos
597 1.80 christos void
598 1.117 thorpej exechook_disestablish(void *vhook)
599 1.80 christos {
600 1.80 christos hook_disestablish(&exechook_list, vhook);
601 1.80 christos }
602 1.80 christos
603 1.80 christos /*
604 1.80 christos * Run exec hooks.
605 1.80 christos */
606 1.80 christos void
607 1.117 thorpej doexechooks(struct proc *p)
608 1.80 christos {
609 1.80 christos hook_proc_run(&exechook_list, p);
610 1.80 christos }
611 1.80 christos
612 1.117 thorpej static hook_list_t exithook_list;
613 1.80 christos
614 1.80 christos void *
615 1.117 thorpej exithook_establish(void (*fn)(struct proc *, void *), void *arg)
616 1.80 christos {
617 1.109 junyoung return hook_establish(&exithook_list, (void (*)(void *))fn, arg);
618 1.80 christos }
619 1.80 christos
620 1.80 christos void
621 1.117 thorpej exithook_disestablish(void *vhook)
622 1.80 christos {
623 1.80 christos hook_disestablish(&exithook_list, vhook);
624 1.80 christos }
625 1.80 christos
626 1.80 christos /*
627 1.80 christos * Run exit hooks.
628 1.80 christos */
629 1.80 christos void
630 1.117 thorpej doexithooks(struct proc *p)
631 1.80 christos {
632 1.80 christos hook_proc_run(&exithook_list, p);
633 1.96 thorpej }
634 1.96 thorpej
635 1.117 thorpej static hook_list_t forkhook_list;
636 1.96 thorpej
637 1.96 thorpej void *
638 1.117 thorpej forkhook_establish(void (*fn)(struct proc *, struct proc *))
639 1.96 thorpej {
640 1.109 junyoung return hook_establish(&forkhook_list, (void (*)(void *))fn, NULL);
641 1.96 thorpej }
642 1.96 thorpej
643 1.96 thorpej void
644 1.117 thorpej forkhook_disestablish(void *vhook)
645 1.96 thorpej {
646 1.96 thorpej hook_disestablish(&forkhook_list, vhook);
647 1.96 thorpej }
648 1.96 thorpej
649 1.96 thorpej /*
650 1.96 thorpej * Run fork hooks.
651 1.96 thorpej */
652 1.96 thorpej void
653 1.117 thorpej doforkhooks(struct proc *p2, struct proc *p1)
654 1.96 thorpej {
655 1.96 thorpej struct hook_desc *hd;
656 1.96 thorpej
657 1.96 thorpej LIST_FOREACH(hd, &forkhook_list, hk_list) {
658 1.109 junyoung ((void (*)(struct proc *, struct proc *))*hd->hk_fn)
659 1.96 thorpej (p2, p1);
660 1.96 thorpej }
661 1.80 christos }
662 1.80 christos
663 1.80 christos /*
664 1.52 augustss * "Power hook" types, functions, and variables.
665 1.71 augustss * The list of power hooks is kept ordered with the last registered hook
666 1.71 augustss * first.
667 1.71 augustss * When running the hooks on power down the hooks are called in reverse
668 1.71 augustss * registration order, when powering up in registration order.
669 1.52 augustss */
670 1.52 augustss struct powerhook_desc {
671 1.71 augustss CIRCLEQ_ENTRY(powerhook_desc) sfd_list;
672 1.109 junyoung void (*sfd_fn)(int, void *);
673 1.52 augustss void *sfd_arg;
674 1.52 augustss };
675 1.52 augustss
676 1.117 thorpej static CIRCLEQ_HEAD(, powerhook_desc) powerhook_list =
677 1.117 thorpej CIRCLEQ_HEAD_INITIALIZER(powerhook_list);
678 1.52 augustss
679 1.52 augustss void *
680 1.117 thorpej powerhook_establish(void (*fn)(int, void *), void *arg)
681 1.52 augustss {
682 1.52 augustss struct powerhook_desc *ndp;
683 1.52 augustss
684 1.52 augustss ndp = (struct powerhook_desc *)
685 1.52 augustss malloc(sizeof(*ndp), M_DEVBUF, M_NOWAIT);
686 1.52 augustss if (ndp == NULL)
687 1.59 enami return (NULL);
688 1.52 augustss
689 1.52 augustss ndp->sfd_fn = fn;
690 1.52 augustss ndp->sfd_arg = arg;
691 1.71 augustss CIRCLEQ_INSERT_HEAD(&powerhook_list, ndp, sfd_list);
692 1.52 augustss
693 1.52 augustss return (ndp);
694 1.52 augustss }
695 1.52 augustss
696 1.52 augustss void
697 1.117 thorpej powerhook_disestablish(void *vhook)
698 1.52 augustss {
699 1.52 augustss #ifdef DIAGNOSTIC
700 1.52 augustss struct powerhook_desc *dp;
701 1.52 augustss
702 1.71 augustss CIRCLEQ_FOREACH(dp, &powerhook_list, sfd_list)
703 1.52 augustss if (dp == vhook)
704 1.71 augustss goto found;
705 1.83 matt panic("powerhook_disestablish: hook %p not established", vhook);
706 1.71 augustss found:
707 1.52 augustss #endif
708 1.52 augustss
709 1.71 augustss CIRCLEQ_REMOVE(&powerhook_list, (struct powerhook_desc *)vhook,
710 1.71 augustss sfd_list);
711 1.52 augustss free(vhook, M_DEVBUF);
712 1.52 augustss }
713 1.52 augustss
714 1.52 augustss /*
715 1.52 augustss * Run power hooks.
716 1.52 augustss */
717 1.52 augustss void
718 1.117 thorpej dopowerhooks(int why)
719 1.52 augustss {
720 1.52 augustss struct powerhook_desc *dp;
721 1.52 augustss
722 1.73 takemura if (why == PWR_RESUME || why == PWR_SOFTRESUME) {
723 1.71 augustss CIRCLEQ_FOREACH_REVERSE(dp, &powerhook_list, sfd_list) {
724 1.71 augustss (*dp->sfd_fn)(why, dp->sfd_arg);
725 1.71 augustss }
726 1.71 augustss } else {
727 1.71 augustss CIRCLEQ_FOREACH(dp, &powerhook_list, sfd_list) {
728 1.71 augustss (*dp->sfd_fn)(why, dp->sfd_arg);
729 1.71 augustss }
730 1.18 thorpej }
731 1.18 thorpej }
732 1.18 thorpej
733 1.18 thorpej /*
734 1.18 thorpej * Determine the root device and, if instructed to, the root file system.
735 1.18 thorpej */
736 1.18 thorpej
737 1.18 thorpej #include "md.h"
738 1.18 thorpej #if NMD == 0
739 1.18 thorpej #undef MEMORY_DISK_HOOKS
740 1.18 thorpej #endif
741 1.18 thorpej
742 1.18 thorpej #ifdef MEMORY_DISK_HOOKS
743 1.28 leo static struct device fakemdrootdev[NMD];
744 1.127 cube extern struct cfdriver md_cd;
745 1.18 thorpej #endif
746 1.18 thorpej
747 1.108 christos #ifdef MEMORY_DISK_IS_ROOT
748 1.108 christos #define BOOT_FROM_MEMORY_HOOKS 1
749 1.108 christos #endif
750 1.108 christos
751 1.57 oster #include "raid.h"
752 1.57 oster #if NRAID == 1
753 1.109 junyoung #define BOOT_FROM_RAID_HOOKS 1
754 1.57 oster #endif
755 1.57 oster
756 1.57 oster #ifdef BOOT_FROM_RAID_HOOKS
757 1.57 oster extern int numraid;
758 1.57 oster extern struct device *raidrootdev;
759 1.57 oster #endif
760 1.57 oster
/*
 * The device and wedge that we booted from.  If booted_wedge is NULL,
 * then we might consult booted_partition.
 */
struct device *booted_device;
struct device *booted_wedge;
int booted_partition;
768 1.113 thorpej
/*
 * True when `dv' should be named with a partition letter: it is of the
 * disk class and is not a wedge ("dk") device.
 * XXX Check for wedge is kinda gross.
 */
#define	DEV_USES_PARTITIONS(dv)						\
	(device_class(dv) == DV_DISK && !device_is_a(dv, "dk"))
776 1.113 thorpej
777 1.18 thorpej void
778 1.117 thorpej setroot(struct device *bootdv, int bootpartition)
779 1.18 thorpej {
780 1.18 thorpej struct device *dv;
781 1.55 enami int len;
782 1.37 hannken #ifdef MEMORY_DISK_HOOKS
783 1.37 hannken int i;
784 1.37 hannken #endif
785 1.25 mrg dev_t nrootdev;
786 1.26 thorpej dev_t ndumpdev = NODEV;
787 1.18 thorpej char buf[128];
788 1.18 thorpej const char *rootdevname;
789 1.26 thorpej const char *dumpdevname;
790 1.26 thorpej struct device *rootdv = NULL; /* XXX gcc -Wuninitialized */
791 1.26 thorpej struct device *dumpdv = NULL;
792 1.18 thorpej struct ifnet *ifp;
793 1.18 thorpej const char *deffsname;
794 1.18 thorpej struct vfsops *vops;
795 1.18 thorpej
796 1.28 leo #ifdef MEMORY_DISK_HOOKS
797 1.28 leo for (i = 0; i < NMD; i++) {
798 1.28 leo fakemdrootdev[i].dv_class = DV_DISK;
799 1.28 leo fakemdrootdev[i].dv_cfdata = NULL;
800 1.127 cube fakemdrootdev[i].dv_cfdriver = &md_cd;
801 1.28 leo fakemdrootdev[i].dv_unit = i;
802 1.28 leo fakemdrootdev[i].dv_parent = NULL;
803 1.110 itojun snprintf(fakemdrootdev[i].dv_xname,
804 1.110 itojun sizeof(fakemdrootdev[i].dv_xname), "md%d", i);
805 1.28 leo }
806 1.28 leo #endif /* MEMORY_DISK_HOOKS */
807 1.28 leo
808 1.22 leo #ifdef MEMORY_DISK_IS_ROOT
809 1.28 leo bootdv = &fakemdrootdev[0];
810 1.18 thorpej bootpartition = 0;
811 1.18 thorpej #endif
812 1.18 thorpej
813 1.18 thorpej /*
814 1.18 thorpej * If NFS is specified as the file system, and we found
815 1.18 thorpej * a DV_DISK boot device (or no boot device at all), then
816 1.18 thorpej * find a reasonable network interface for "rootspec".
817 1.18 thorpej */
818 1.18 thorpej vops = vfs_getopsbyname("nfs");
819 1.18 thorpej if (vops != NULL && vops->vfs_mountroot == mountroot &&
820 1.18 thorpej rootspec == NULL &&
821 1.124 thorpej (bootdv == NULL || device_class(bootdv) != DV_IFNET)) {
822 1.115 matt IFNET_FOREACH(ifp) {
823 1.18 thorpej if ((ifp->if_flags &
824 1.18 thorpej (IFF_LOOPBACK|IFF_POINTOPOINT)) == 0)
825 1.18 thorpej break;
826 1.83 matt }
827 1.18 thorpej if (ifp == NULL) {
828 1.18 thorpej /*
829 1.18 thorpej * Can't find a suitable interface; ask the
830 1.18 thorpej * user.
831 1.18 thorpej */
832 1.18 thorpej boothowto |= RB_ASKNAME;
833 1.18 thorpej } else {
834 1.18 thorpej /*
835 1.18 thorpej * Have a suitable interface; behave as if
836 1.18 thorpej * the user specified this interface.
837 1.18 thorpej */
838 1.18 thorpej rootspec = (const char *)ifp->if_xname;
839 1.18 thorpej }
840 1.18 thorpej }
841 1.24 thorpej
842 1.24 thorpej /*
843 1.24 thorpej * If wildcarded root and we the boot device wasn't determined,
844 1.24 thorpej * ask the user.
845 1.24 thorpej */
846 1.24 thorpej if (rootspec == NULL && bootdv == NULL)
847 1.24 thorpej boothowto |= RB_ASKNAME;
848 1.18 thorpej
849 1.18 thorpej top:
850 1.18 thorpej if (boothowto & RB_ASKNAME) {
851 1.26 thorpej struct device *defdumpdv;
852 1.26 thorpej
853 1.18 thorpej for (;;) {
854 1.18 thorpej printf("root device");
855 1.18 thorpej if (bootdv != NULL) {
856 1.18 thorpej printf(" (default %s", bootdv->dv_xname);
857 1.113 thorpej if (DEV_USES_PARTITIONS(bootdv))
858 1.18 thorpej printf("%c", bootpartition + 'a');
859 1.18 thorpej printf(")");
860 1.18 thorpej }
861 1.18 thorpej printf(": ");
862 1.64 itojun len = cngetsn(buf, sizeof(buf));
863 1.18 thorpej if (len == 0 && bootdv != NULL) {
864 1.99 itojun strlcpy(buf, bootdv->dv_xname, sizeof(buf));
865 1.18 thorpej len = strlen(buf);
866 1.18 thorpej }
867 1.18 thorpej if (len > 0 && buf[len - 1] == '*') {
868 1.18 thorpej buf[--len] = '\0';
869 1.51 thorpej dv = getdisk(buf, len, 1, &nrootdev, 0);
870 1.18 thorpej if (dv != NULL) {
871 1.18 thorpej rootdv = dv;
872 1.25 mrg break;
873 1.18 thorpej }
874 1.18 thorpej }
875 1.51 thorpej dv = getdisk(buf, len, bootpartition, &nrootdev, 0);
876 1.18 thorpej if (dv != NULL) {
877 1.18 thorpej rootdv = dv;
878 1.18 thorpej break;
879 1.18 thorpej }
880 1.18 thorpej }
881 1.18 thorpej
882 1.26 thorpej /*
883 1.26 thorpej * Set up the default dump device. If root is on
884 1.26 thorpej * a network device, there is no default dump
885 1.26 thorpej * device, since we don't support dumps to the
886 1.26 thorpej * network.
887 1.26 thorpej */
888 1.113 thorpej if (DEV_USES_PARTITIONS(rootdv) == 0)
889 1.26 thorpej defdumpdv = NULL;
890 1.26 thorpej else
891 1.26 thorpej defdumpdv = rootdv;
892 1.26 thorpej
893 1.26 thorpej for (;;) {
894 1.26 thorpej printf("dump device");
895 1.26 thorpej if (defdumpdv != NULL) {
896 1.26 thorpej /*
897 1.26 thorpej * Note, we know it's a disk if we get here.
898 1.26 thorpej */
899 1.26 thorpej printf(" (default %sb)", defdumpdv->dv_xname);
900 1.26 thorpej }
901 1.26 thorpej printf(": ");
902 1.64 itojun len = cngetsn(buf, sizeof(buf));
903 1.26 thorpej if (len == 0) {
904 1.26 thorpej if (defdumpdv != NULL) {
905 1.26 thorpej ndumpdev = MAKEDISKDEV(major(nrootdev),
906 1.26 thorpej DISKUNIT(nrootdev), 1);
907 1.26 thorpej }
908 1.54 enami dumpdv = defdumpdv;
909 1.26 thorpej break;
910 1.26 thorpej }
911 1.26 thorpej if (len == 4 && strcmp(buf, "none") == 0) {
912 1.55 enami dumpdv = NULL;
913 1.54 enami break;
914 1.26 thorpej }
915 1.51 thorpej dv = getdisk(buf, len, 1, &ndumpdev, 1);
916 1.55 enami if (dv != NULL) {
917 1.26 thorpej dumpdv = dv;
918 1.26 thorpej break;
919 1.26 thorpej }
920 1.26 thorpej }
921 1.26 thorpej
922 1.18 thorpej rootdev = nrootdev;
923 1.26 thorpej dumpdev = ndumpdev;
924 1.18 thorpej
925 1.36 thorpej for (vops = LIST_FIRST(&vfs_list); vops != NULL;
926 1.36 thorpej vops = LIST_NEXT(vops, vfs_list)) {
927 1.36 thorpej if (vops->vfs_mountroot != NULL &&
928 1.36 thorpej vops->vfs_mountroot == mountroot)
929 1.38 fvdl break;
930 1.18 thorpej }
931 1.36 thorpej
932 1.36 thorpej if (vops == NULL) {
933 1.18 thorpej mountroot = NULL;
934 1.18 thorpej deffsname = "generic";
935 1.18 thorpej } else
936 1.36 thorpej deffsname = vops->vfs_name;
937 1.36 thorpej
938 1.18 thorpej for (;;) {
939 1.18 thorpej printf("file system (default %s): ", deffsname);
940 1.64 itojun len = cngetsn(buf, sizeof(buf));
941 1.18 thorpej if (len == 0)
942 1.18 thorpej break;
943 1.18 thorpej if (len == 4 && strcmp(buf, "halt") == 0)
944 1.23 gwr cpu_reboot(RB_HALT, NULL);
945 1.76 thorpej else if (len == 6 && strcmp(buf, "reboot") == 0)
946 1.76 thorpej cpu_reboot(0, NULL);
947 1.78 thorpej #if defined(DDB)
948 1.78 thorpej else if (len == 3 && strcmp(buf, "ddb") == 0) {
949 1.78 thorpej console_debugger();
950 1.78 thorpej }
951 1.78 thorpej #endif
952 1.18 thorpej else if (len == 7 && strcmp(buf, "generic") == 0) {
953 1.18 thorpej mountroot = NULL;
954 1.18 thorpej break;
955 1.18 thorpej }
956 1.18 thorpej vops = vfs_getopsbyname(buf);
957 1.18 thorpej if (vops == NULL || vops->vfs_mountroot == NULL) {
958 1.18 thorpej printf("use one of: generic");
959 1.36 thorpej for (vops = LIST_FIRST(&vfs_list);
960 1.36 thorpej vops != NULL;
961 1.36 thorpej vops = LIST_NEXT(vops, vfs_list)) {
962 1.36 thorpej if (vops->vfs_mountroot != NULL)
963 1.36 thorpej printf(" %s", vops->vfs_name);
964 1.36 thorpej }
965 1.78 thorpej #if defined(DDB)
966 1.78 thorpej printf(" ddb");
967 1.78 thorpej #endif
968 1.76 thorpej printf(" halt reboot\n");
969 1.18 thorpej } else {
970 1.18 thorpej mountroot = vops->vfs_mountroot;
971 1.18 thorpej break;
972 1.18 thorpej }
973 1.18 thorpej }
974 1.18 thorpej
975 1.18 thorpej } else if (rootspec == NULL) {
976 1.18 thorpej int majdev;
977 1.18 thorpej
978 1.18 thorpej /*
979 1.18 thorpej * Wildcarded root; use the boot device.
980 1.18 thorpej */
981 1.26 thorpej rootdv = bootdv;
982 1.26 thorpej
983 1.88 gehenna majdev = devsw_name2blk(bootdv->dv_xname, NULL, 0);
984 1.18 thorpej if (majdev >= 0) {
985 1.18 thorpej /*
986 1.113 thorpej * Root is on a disk. `bootpartition' is root,
987 1.113 thorpej * unless the device does not use partitions.
988 1.18 thorpej */
989 1.113 thorpej if (DEV_USES_PARTITIONS(bootdv))
990 1.135 thorpej rootdev = MAKEDISKDEV(majdev,
991 1.135 thorpej device_unit(bootdv),
992 1.135 thorpej bootpartition);
993 1.113 thorpej else
994 1.135 thorpej rootdev = makedev(majdev, device_unit(bootdv));
995 1.18 thorpej }
996 1.18 thorpej } else {
997 1.18 thorpej
998 1.18 thorpej /*
999 1.25 mrg * `root on <dev> ...'
1000 1.18 thorpej */
1001 1.18 thorpej
1002 1.18 thorpej /*
1003 1.18 thorpej * If it's a network interface, we can bail out
1004 1.18 thorpej * early.
1005 1.18 thorpej */
1006 1.56 enami dv = finddevice(rootspec);
1007 1.124 thorpej if (dv != NULL && device_class(dv) == DV_IFNET) {
1008 1.26 thorpej rootdv = dv;
1009 1.26 thorpej goto haveroot;
1010 1.18 thorpej }
1011 1.18 thorpej
1012 1.88 gehenna rootdevname = devsw_blk2name(major(rootdev));
1013 1.18 thorpej if (rootdevname == NULL) {
1014 1.18 thorpej printf("unknown device major 0x%x\n", rootdev);
1015 1.18 thorpej boothowto |= RB_ASKNAME;
1016 1.18 thorpej goto top;
1017 1.18 thorpej }
1018 1.41 perry memset(buf, 0, sizeof(buf));
1019 1.110 itojun snprintf(buf, sizeof(buf), "%s%d", rootdevname,
1020 1.110 itojun DISKUNIT(rootdev));
1021 1.18 thorpej
1022 1.56 enami rootdv = finddevice(buf);
1023 1.26 thorpej if (rootdv == NULL) {
1024 1.18 thorpej printf("device %s (0x%x) not configured\n",
1025 1.18 thorpej buf, rootdev);
1026 1.18 thorpej boothowto |= RB_ASKNAME;
1027 1.18 thorpej goto top;
1028 1.18 thorpej }
1029 1.26 thorpej }
1030 1.18 thorpej
1031 1.26 thorpej haveroot:
1032 1.18 thorpej
1033 1.18 thorpej root_device = rootdv;
1034 1.18 thorpej
1035 1.124 thorpej switch (device_class(rootdv)) {
1036 1.18 thorpej case DV_IFNET:
1037 1.139 christos case DV_DISK:
1038 1.100 thorpej aprint_normal("root on %s", rootdv->dv_xname);
1039 1.139 christos if (DEV_USES_PARTITIONS(bootdv))
1040 1.139 christos aprint_normal("%c", DISKPART(rootdev) + 'a');
1041 1.18 thorpej break;
1042 1.18 thorpej
1043 1.18 thorpej default:
1044 1.18 thorpej printf("can't determine root device\n");
1045 1.18 thorpej boothowto |= RB_ASKNAME;
1046 1.18 thorpej goto top;
1047 1.18 thorpej }
1048 1.26 thorpej
1049 1.26 thorpej /*
1050 1.26 thorpej * Now configure the dump device.
1051 1.55 enami *
1052 1.26 thorpej * If we haven't figured out the dump device, do so, with
1053 1.26 thorpej * the following rules:
1054 1.26 thorpej *
1055 1.26 thorpej * (a) We already know dumpdv in the RB_ASKNAME case.
1056 1.26 thorpej *
1057 1.26 thorpej * (b) If dumpspec is set, try to use it. If the device
1058 1.26 thorpej * is not available, punt.
1059 1.26 thorpej *
1060 1.26 thorpej * (c) If dumpspec is not set, the dump device is
1061 1.26 thorpej * wildcarded or unspecified. If the root device
1062 1.26 thorpej * is DV_IFNET, punt. Otherwise, use partition b
1063 1.26 thorpej * of the root device.
1064 1.26 thorpej */
1065 1.26 thorpej
1066 1.55 enami if (boothowto & RB_ASKNAME) { /* (a) */
1067 1.55 enami if (dumpdv == NULL)
1068 1.55 enami goto nodumpdev;
1069 1.55 enami } else if (dumpspec != NULL) { /* (b) */
1070 1.55 enami if (strcmp(dumpspec, "none") == 0 || dumpdev == NODEV) {
1071 1.26 thorpej /*
1072 1.55 enami * Operator doesn't want a dump device.
1073 1.55 enami * Or looks like they tried to pick a network
1074 1.26 thorpej * device. Oops.
1075 1.26 thorpej */
1076 1.26 thorpej goto nodumpdev;
1077 1.26 thorpej }
1078 1.26 thorpej
1079 1.88 gehenna dumpdevname = devsw_blk2name(major(dumpdev));
1080 1.26 thorpej if (dumpdevname == NULL)
1081 1.26 thorpej goto nodumpdev;
1082 1.41 perry memset(buf, 0, sizeof(buf));
1083 1.110 itojun snprintf(buf, sizeof(buf), "%s%d", dumpdevname,
1084 1.110 itojun DISKUNIT(dumpdev));
1085 1.26 thorpej
1086 1.56 enami dumpdv = finddevice(buf);
1087 1.56 enami if (dumpdv == NULL) {
1088 1.26 thorpej /*
1089 1.26 thorpej * Device not configured.
1090 1.26 thorpej */
1091 1.26 thorpej goto nodumpdev;
1092 1.26 thorpej }
1093 1.55 enami } else { /* (c) */
1094 1.113 thorpej if (DEV_USES_PARTITIONS(rootdv) == 0)
1095 1.55 enami goto nodumpdev;
1096 1.55 enami else {
1097 1.55 enami dumpdv = rootdv;
1098 1.55 enami dumpdev = MAKEDISKDEV(major(rootdev),
1099 1.135 thorpej device_unit(dumpdv), 1);
1100 1.55 enami }
1101 1.26 thorpej }
1102 1.26 thorpej
1103 1.100 thorpej aprint_normal(" dumps on %s%c\n", dumpdv->dv_xname,
1104 1.100 thorpej DISKPART(dumpdev) + 'a');
1105 1.26 thorpej return;
1106 1.26 thorpej
1107 1.26 thorpej nodumpdev:
1108 1.26 thorpej dumpdev = NODEV;
1109 1.100 thorpej aprint_normal("\n");
1110 1.18 thorpej }
1111 1.18 thorpej
1112 1.18 thorpej static struct device *
1113 1.117 thorpej finddevice(const char *name)
1114 1.56 enami {
1115 1.56 enami struct device *dv;
1116 1.108 christos #if defined(BOOT_FROM_RAID_HOOKS) || defined(BOOT_FROM_MEMORY_HOOKS)
1117 1.57 oster int j;
1118 1.108 christos #endif /* BOOT_FROM_RAID_HOOKS || BOOT_FROM_MEMORY_HOOKS */
1119 1.57 oster
1120 1.108 christos #ifdef BOOT_FROM_RAID_HOOKS
1121 1.57 oster for (j = 0; j < numraid; j++) {
1122 1.57 oster if (strcmp(name, raidrootdev[j].dv_xname) == 0) {
1123 1.57 oster dv = &raidrootdev[j];
1124 1.59 enami return (dv);
1125 1.57 oster }
1126 1.57 oster }
1127 1.108 christos #endif /* BOOT_FROM_RAID_HOOKS */
1128 1.108 christos
1129 1.108 christos #ifdef BOOT_FROM_MEMORY_HOOKS
1130 1.108 christos for (j = 0; j < NMD; j++) {
1131 1.108 christos if (strcmp(name, fakemdrootdev[j].dv_xname) == 0) {
1132 1.108 christos dv = &fakemdrootdev[j];
1133 1.108 christos return (dv);
1134 1.108 christos }
1135 1.108 christos }
1136 1.108 christos #endif /* BOOT_FROM_MEMORY_HOOKS */
1137 1.56 enami
1138 1.56 enami for (dv = TAILQ_FIRST(&alldevs); dv != NULL;
1139 1.56 enami dv = TAILQ_NEXT(dv, dv_list))
1140 1.56 enami if (strcmp(dv->dv_xname, name) == 0)
1141 1.56 enami break;
1142 1.56 enami return (dv);
1143 1.56 enami }
1144 1.56 enami
1145 1.56 enami static struct device *
1146 1.117 thorpej getdisk(char *str, int len, int defpart, dev_t *devp, int isdump)
1147 1.18 thorpej {
1148 1.28 leo struct device *dv;
1149 1.29 drochner #ifdef MEMORY_DISK_HOOKS
1150 1.28 leo int i;
1151 1.29 drochner #endif
1152 1.57 oster #ifdef BOOT_FROM_RAID_HOOKS
1153 1.57 oster int j;
1154 1.57 oster #endif
1155 1.18 thorpej
1156 1.51 thorpej if ((dv = parsedisk(str, len, defpart, devp)) == NULL) {
1157 1.18 thorpej printf("use one of:");
1158 1.18 thorpej #ifdef MEMORY_DISK_HOOKS
1159 1.26 thorpej if (isdump == 0)
1160 1.28 leo for (i = 0; i < NMD; i++)
1161 1.28 leo printf(" %s[a-%c]", fakemdrootdev[i].dv_xname,
1162 1.28 leo 'a' + MAXPARTITIONS - 1);
1163 1.18 thorpej #endif
1164 1.57 oster #ifdef BOOT_FROM_RAID_HOOKS
1165 1.57 oster if (isdump == 0)
1166 1.57 oster for (j = 0; j < numraid; j++)
1167 1.59 enami printf(" %s[a-%c]", raidrootdev[j].dv_xname,
1168 1.59 enami 'a' + MAXPARTITIONS - 1);
1169 1.57 oster #endif
1170 1.83 matt TAILQ_FOREACH(dv, &alldevs, dv_list) {
1171 1.113 thorpej if (DEV_USES_PARTITIONS(dv))
1172 1.18 thorpej printf(" %s[a-%c]", dv->dv_xname,
1173 1.19 cgd 'a' + MAXPARTITIONS - 1);
1174 1.124 thorpej else if (device_class(dv) == DV_DISK)
1175 1.113 thorpej printf(" %s", dv->dv_xname);
1176 1.124 thorpej if (isdump == 0 && device_class(dv) == DV_IFNET)
1177 1.18 thorpej printf(" %s", dv->dv_xname);
1178 1.18 thorpej }
1179 1.26 thorpej if (isdump)
1180 1.26 thorpej printf(" none");
1181 1.78 thorpej #if defined(DDB)
1182 1.78 thorpej printf(" ddb");
1183 1.78 thorpej #endif
1184 1.76 thorpej printf(" halt reboot\n");
1185 1.18 thorpej }
1186 1.18 thorpej return (dv);
1187 1.18 thorpej }
1188 1.18 thorpej
1189 1.18 thorpej static struct device *
1190 1.117 thorpej parsedisk(char *str, int len, int defpart, dev_t *devp)
1191 1.18 thorpej {
1192 1.18 thorpej struct device *dv;
1193 1.18 thorpej char *cp, c;
1194 1.29 drochner int majdev, part;
1195 1.29 drochner #ifdef MEMORY_DISK_HOOKS
1196 1.29 drochner int i;
1197 1.29 drochner #endif
1198 1.18 thorpej if (len == 0)
1199 1.18 thorpej return (NULL);
1200 1.18 thorpej
1201 1.18 thorpej if (len == 4 && strcmp(str, "halt") == 0)
1202 1.23 gwr cpu_reboot(RB_HALT, NULL);
1203 1.76 thorpej else if (len == 6 && strcmp(str, "reboot") == 0)
1204 1.76 thorpej cpu_reboot(0, NULL);
1205 1.78 thorpej #if defined(DDB)
1206 1.78 thorpej else if (len == 3 && strcmp(str, "ddb") == 0)
1207 1.78 thorpej console_debugger();
1208 1.78 thorpej #endif
1209 1.18 thorpej
1210 1.18 thorpej cp = str + len - 1;
1211 1.18 thorpej c = *cp;
1212 1.18 thorpej if (c >= 'a' && c <= ('a' + MAXPARTITIONS - 1)) {
1213 1.18 thorpej part = c - 'a';
1214 1.18 thorpej *cp = '\0';
1215 1.18 thorpej } else
1216 1.18 thorpej part = defpart;
1217 1.18 thorpej
1218 1.18 thorpej #ifdef MEMORY_DISK_HOOKS
1219 1.28 leo for (i = 0; i < NMD; i++)
1220 1.28 leo if (strcmp(str, fakemdrootdev[i].dv_xname) == 0) {
1221 1.28 leo dv = &fakemdrootdev[i];
1222 1.28 leo goto gotdisk;
1223 1.28 leo }
1224 1.18 thorpej #endif
1225 1.18 thorpej
1226 1.56 enami dv = finddevice(str);
1227 1.56 enami if (dv != NULL) {
1228 1.124 thorpej if (device_class(dv) == DV_DISK) {
1229 1.18 thorpej #ifdef MEMORY_DISK_HOOKS
1230 1.18 thorpej gotdisk:
1231 1.18 thorpej #endif
1232 1.88 gehenna majdev = devsw_name2blk(dv->dv_xname, NULL, 0);
1233 1.18 thorpej if (majdev < 0)
1234 1.18 thorpej panic("parsedisk");
1235 1.113 thorpej if (DEV_USES_PARTITIONS(dv))
1236 1.135 thorpej *devp = MAKEDISKDEV(majdev, device_unit(dv),
1237 1.135 thorpej part);
1238 1.113 thorpej else
1239 1.135 thorpej *devp = makedev(majdev, device_unit(dv));
1240 1.18 thorpej }
1241 1.18 thorpej
1242 1.124 thorpej if (device_class(dv) == DV_IFNET)
1243 1.18 thorpej *devp = NODEV;
1244 1.18 thorpej }
1245 1.18 thorpej
1246 1.18 thorpej *cp = c;
1247 1.18 thorpej return (dv);
1248 1.48 lukem }
1249 1.48 lukem
/*
 * snprintf() `bytes' into `buf', reformatting it so that the number
 * (plus a possible ` ' + prefix letter + suffix extension) fits into
 * len bytes (including the terminating NUL).
 *
 * `divisor' is the step between prefixes; with 1024 the prefix letters
 * are " KMGTPE", otherwise " kMGTPE".
 *
 * Returns the value returned by snprintf(), or -1 if there was a problem
 * (NULL buf or suffix, divisor <= 0, or len too small for `x y' + suffix
 * + NUL).  On failure buf is set to the empty string when len > 0.
 *
 * E.g., given a len of 9, a suffix of `B' and a divisor of 1024:
 *	bytes		result
 *	-----		------
 *	99999		`99999 B'
 *	100000		`97 KB'
 *	66715648	`65152 KB'
 *	252215296	`240 MB'
 */
int
humanize_number(char *buf, size_t len, uint64_t bytes, const char *suffix,
    int divisor)
{
	/* prefixes are: (none), kilo, Mega, Giga, Tera, Peta, Exa */
	const char *prefixes;
	const uint64_t u64max = ~(uint64_t)0;
	int r, scale;
	uint64_t umax;
	size_t i, suffixlen;

	if (buf == NULL || suffix == NULL)
		return (-1);
	if (len > 0)
		buf[0] = '\0';
	/* A zero divisor would trap; a negative one wraps when unsigned. */
	if (divisor <= 0)
		return (-1);
	suffixlen = strlen(suffix);
	/* check if enough room for `x y' + suffix + `\0' */
	if (len < 4 + suffixlen)
		return (-1);

	if (divisor == 1024) {
		/*
		 * binary multiplies
		 * XXX IEC 60027-2 recommends Ki, Mi, Gi...
		 */
		prefixes = " KMGTPE";
	} else
		prefixes = " kMGTPE"; /* SI for decimal multiplies */

	/*
	 * umax is the smallest value that no longer fits in the digits
	 * available.  Once 10 * umax would exceed 64 bits, every uint64_t
	 * fits and no scaling is needed; stop multiplying so that umax
	 * cannot wrap around (possibly to 0) and force bogus scaling.
	 */
	umax = 1;
	scale = 1;
	for (i = 0; i < len - suffixlen - 3; i++) {
		if (umax > u64max / 10) {
			scale = 0;
			break;
		}
		umax *= 10;
	}

	/* Step through the prefixes until the number fits. */
	i = 0;
	if (scale) {
		for (; bytes >= umax && prefixes[i + 1]; i++)
			bytes /= divisor;
	}

	r = snprintf(buf, len, "%llu%s%c%s", (unsigned long long)bytes,
	    i == 0 ? "" : " ", prefixes[i], suffix);

	return (r);
}
1302 1.49 lukem
/*
 * Format `bytes' into `buf' using humanize_number() with a `B' suffix
 * and a divisor of 1024, then drop a trailing ` B' so that unscaled
 * values are printed as a bare number.
 *
 * Returns whatever humanize_number() returned; the value is not adjusted
 * when the trailing ` B' is removed.
 */
int
format_bytes(char *buf, size_t len, uint64_t bytes)
{
	int written;
	char *tail;

	written = humanize_number(buf, len, bytes, "B", 1024);
	if (written == -1)
		return (written);

	/* nuke the trailing ` B' if it exists */
	tail = &buf[strlen(buf) - 2];
	if (strcmp(tail, " B") == 0)
		*tail = '\0';

	return (written);
}
1318 1.81 christos
1319 1.92 jdolecek /*
1320 1.130 thorpej * Return TRUE if system call tracing is enabled for the specified process.
1321 1.130 thorpej */
1322 1.130 thorpej boolean_t
1323 1.130 thorpej trace_is_enabled(struct proc *p)
1324 1.130 thorpej {
1325 1.131 thorpej #ifdef SYSCALL_DEBUG
1326 1.131 thorpej return (TRUE);
1327 1.131 thorpej #endif
1328 1.130 thorpej #ifdef KTRACE
1329 1.130 thorpej if (ISSET(p->p_traceflag, (KTRFAC_SYSCALL | KTRFAC_SYSRET)))
1330 1.130 thorpej return (TRUE);
1331 1.130 thorpej #endif
1332 1.130 thorpej #ifdef SYSTRACE
1333 1.130 thorpej if (ISSET(p->p_flag, P_SYSTRACE))
1334 1.130 thorpej return (TRUE);
1335 1.130 thorpej #endif
1336 1.130 thorpej if (ISSET(p->p_flag, P_SYSCALL))
1337 1.130 thorpej return (TRUE);
1338 1.130 thorpej
1339 1.130 thorpej return (FALSE);
1340 1.130 thorpej }
1341 1.130 thorpej
1342 1.130 thorpej /*
1343 1.92 jdolecek * Start trace of particular system call. If process is being traced,
1344 1.92 jdolecek * this routine is called by MD syscall dispatch code just before
1345 1.92 jdolecek * a system call is actually executed.
1346 1.92 jdolecek * MD caller guarantees the passed 'code' is within the supported
1347 1.92 jdolecek * system call number range for emulation the process runs under.
1348 1.92 jdolecek */
1349 1.81 christos int
1350 1.95 thorpej trace_enter(struct lwp *l, register_t code,
1351 1.117 thorpej register_t realcode, const struct sysent *callp, void *args)
1352 1.81 christos {
1353 1.95 thorpej struct proc *p = l->l_proc;
1354 1.95 thorpej
1355 1.81 christos #ifdef SYSCALL_DEBUG
1356 1.95 thorpej scdebug_call(l, code, args);
1357 1.81 christos #endif /* SYSCALL_DEBUG */
1358 1.81 christos
1359 1.81 christos #ifdef KTRACE
1360 1.81 christos if (KTRPOINT(p, KTR_SYSCALL))
1361 1.120 christos ktrsyscall(l, code, realcode, callp, args);
1362 1.81 christos #endif /* KTRACE */
1363 1.81 christos
1364 1.128 christos if ((p->p_flag & (P_SYSCALL|P_TRACED)) == (P_SYSCALL|P_TRACED))
1365 1.128 christos process_stoptrace(l);
1366 1.128 christos
1367 1.81 christos #ifdef SYSTRACE
1368 1.81 christos if (ISSET(p->p_flag, P_SYSTRACE))
1369 1.137 ad return systrace_enter(l, code, args);
1370 1.81 christos #endif
1371 1.81 christos return 0;
1372 1.81 christos }
1373 1.81 christos
1374 1.92 jdolecek /*
1375 1.92 jdolecek * End trace of particular system call. If process is being traced,
1376 1.92 jdolecek * this routine is called by MD syscall dispatch code just after
1377 1.92 jdolecek * a system call finishes.
1378 1.92 jdolecek * MD caller guarantees the passed 'code' is within the supported
1379 1.92 jdolecek * system call number range for emulation the process runs under.
1380 1.92 jdolecek */
1381 1.81 christos void
1382 1.95 thorpej trace_exit(struct lwp *l, register_t code, void *args, register_t rval[],
1383 1.81 christos int error)
1384 1.81 christos {
1385 1.95 thorpej struct proc *p = l->l_proc;
1386 1.95 thorpej
1387 1.81 christos #ifdef SYSCALL_DEBUG
1388 1.95 thorpej scdebug_ret(l, code, error, rval);
1389 1.81 christos #endif /* SYSCALL_DEBUG */
1390 1.81 christos
1391 1.81 christos #ifdef KTRACE
1392 1.81 christos if (KTRPOINT(p, KTR_SYSRET)) {
1393 1.95 thorpej KERNEL_PROC_LOCK(l);
1394 1.120 christos ktrsysret(l, code, error, rval);
1395 1.95 thorpej KERNEL_PROC_UNLOCK(l);
1396 1.81 christos }
1397 1.81 christos #endif /* KTRACE */
1398 1.128 christos
1399 1.128 christos if ((p->p_flag & (P_SYSCALL|P_TRACED)) == (P_SYSCALL|P_TRACED))
1400 1.128 christos process_stoptrace(l);
1401 1.81 christos
1402 1.81 christos #ifdef SYSTRACE
1403 1.122 chs if (ISSET(p->p_flag, P_SYSTRACE)) {
1404 1.122 chs KERNEL_PROC_LOCK(l);
1405 1.137 ad systrace_exit(l, code, args, rval, error);
1406 1.122 chs KERNEL_PROC_UNLOCK(l);
1407 1.122 chs }
1408 1.81 christos #endif
1409 1.10 cgd }
1410