Home | History | Annotate | Line # | Download | only in kern
kern_subr.c revision 1.200
      1  1.200    dyoung /*	$NetBSD: kern_subr.c,v 1.200 2009/09/25 19:21:09 dyoung Exp $	*/
      2   1.31   thorpej 
      3   1.31   thorpej /*-
      4  1.185        ad  * Copyright (c) 1997, 1998, 1999, 2002, 2007, 2008 The NetBSD Foundation, Inc.
      5   1.31   thorpej  * All rights reserved.
      6   1.31   thorpej  *
      7   1.31   thorpej  * This code is derived from software contributed to The NetBSD Foundation
      8   1.31   thorpej  * by Jason R. Thorpe of the Numerical Aerospace Simulation Facility,
      9   1.48     lukem  * NASA Ames Research Center, and by Luke Mewburn.
     10   1.31   thorpej  *
     11   1.31   thorpej  * Redistribution and use in source and binary forms, with or without
     12   1.31   thorpej  * modification, are permitted provided that the following conditions
     13   1.31   thorpej  * are met:
     14   1.31   thorpej  * 1. Redistributions of source code must retain the above copyright
     15   1.31   thorpej  *    notice, this list of conditions and the following disclaimer.
     16   1.31   thorpej  * 2. Redistributions in binary form must reproduce the above copyright
     17   1.31   thorpej  *    notice, this list of conditions and the following disclaimer in the
     18   1.31   thorpej  *    documentation and/or other materials provided with the distribution.
     19   1.31   thorpej  *
     20   1.31   thorpej  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     21   1.31   thorpej  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     22   1.31   thorpej  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     23   1.31   thorpej  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     24   1.31   thorpej  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     25   1.31   thorpej  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     26   1.31   thorpej  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     27   1.31   thorpej  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     28   1.31   thorpej  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     29   1.31   thorpej  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     30   1.31   thorpej  * POSSIBILITY OF SUCH DAMAGE.
     31   1.31   thorpej  */
     32   1.12       cgd 
     33    1.9       cgd /*
     34   1.10       cgd  * Copyright (c) 1982, 1986, 1991, 1993
     35   1.10       cgd  *	The Regents of the University of California.  All rights reserved.
     36    1.9       cgd  * (c) UNIX System Laboratories, Inc.
     37    1.9       cgd  * All or some portions of this file are derived from material licensed
     38    1.9       cgd  * to the University of California by American Telephone and Telegraph
     39    1.9       cgd  * Co. or Unix System Laboratories, Inc. and are reproduced herein with
     40    1.9       cgd  * the permission of UNIX System Laboratories, Inc.
     41    1.9       cgd  *
     42   1.18   thorpej  * Copyright (c) 1992, 1993
     43   1.18   thorpej  *	The Regents of the University of California.  All rights reserved.
     44   1.18   thorpej  *
     45   1.18   thorpej  * This software was developed by the Computer Systems Engineering group
     46   1.18   thorpej  * at Lawrence Berkeley Laboratory under DARPA contract BG 91-66 and
     47   1.18   thorpej  * contributed to Berkeley.
     48   1.18   thorpej  *
     49   1.18   thorpej  * All advertising materials mentioning features or use of this software
     50   1.18   thorpej  * must display the following acknowledgement:
     51   1.18   thorpej  *	This product includes software developed by the University of
     52   1.18   thorpej  *	California, Lawrence Berkeley Laboratory.
     53   1.18   thorpej  *
     54    1.9       cgd  * Redistribution and use in source and binary forms, with or without
     55    1.9       cgd  * modification, are permitted provided that the following conditions
     56    1.9       cgd  * are met:
     57    1.9       cgd  * 1. Redistributions of source code must retain the above copyright
     58    1.9       cgd  *    notice, this list of conditions and the following disclaimer.
     59    1.9       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     60    1.9       cgd  *    notice, this list of conditions and the following disclaimer in the
     61    1.9       cgd  *    documentation and/or other materials provided with the distribution.
     62  1.103       agc  * 3. Neither the name of the University nor the names of its contributors
     63    1.9       cgd  *    may be used to endorse or promote products derived from this software
     64    1.9       cgd  *    without specific prior written permission.
     65    1.9       cgd  *
     66    1.9       cgd  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     67    1.9       cgd  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     68    1.9       cgd  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     69    1.9       cgd  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     70    1.9       cgd  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     71    1.9       cgd  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     72    1.9       cgd  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     73    1.9       cgd  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     74    1.9       cgd  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     75    1.9       cgd  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     76    1.9       cgd  * SUCH DAMAGE.
     77    1.9       cgd  *
     78   1.38      fvdl  *	@(#)kern_subr.c	8.4 (Berkeley) 2/14/95
     79    1.9       cgd  */
     80   1.77     lukem 
     81   1.77     lukem #include <sys/cdefs.h>
     82  1.200    dyoung __KERNEL_RCSID(0, "$NetBSD: kern_subr.c,v 1.200 2009/09/25 19:21:09 dyoung Exp $");
     83   1.34       mrg 
     84   1.78   thorpej #include "opt_ddb.h"
     85   1.43  jonathan #include "opt_md.h"
     86   1.81  christos #include "opt_syscall_debug.h"
     87   1.81  christos #include "opt_ktrace.h"
     88  1.142      matt #include "opt_ptrace.h"
     89  1.144  jmcneill #include "opt_powerhook.h"
     90  1.157      manu #include "opt_tftproot.h"
     91    1.9       cgd 
     92    1.9       cgd #include <sys/param.h>
     93    1.9       cgd #include <sys/systm.h>
     94    1.9       cgd #include <sys/proc.h>
     95   1.10       cgd #include <sys/malloc.h>
     96   1.18   thorpej #include <sys/mount.h>
     97   1.18   thorpej #include <sys/device.h>
     98   1.18   thorpej #include <sys/reboot.h>
     99   1.18   thorpej #include <sys/conf.h>
    100  1.159    dyoung #include <sys/disk.h>
    101   1.18   thorpej #include <sys/disklabel.h>
    102   1.10       cgd #include <sys/queue.h>
    103   1.81  christos #include <sys/ktrace.h>
    104  1.128  christos #include <sys/ptrace.h>
    105  1.119   reinoud #include <sys/fcntl.h>
    106  1.160  christos #include <sys/kauth.h>
    107  1.160  christos #include <sys/vnode.h>
    108  1.194        ad #include <sys/syscallvar.h>
    109  1.194        ad #include <sys/xcall.h>
    110  1.194        ad #include <sys/module.h>
    111    1.9       cgd 
    112   1.82   thorpej #include <uvm/uvm_extern.h>
    113   1.82   thorpej 
    114   1.18   thorpej #include <dev/cons.h>
    115   1.18   thorpej 
    116   1.18   thorpej #include <net/if.h>
    117   1.18   thorpej 
    118   1.18   thorpej /* XXX these should eventually move to subr_autoconf.c */
    119  1.200    dyoung static device_t finddevice(const char *);
    120  1.200    dyoung static device_t getdisk(char *, int, int, dev_t *, int);
    121  1.200    dyoung static device_t parsedisk(char *, int, int, dev_t *);
    122  1.159    dyoung static const char *getwedgename(const char *, int);
    123   1.18   thorpej 
    124   1.80  christos /*
    125   1.80  christos  * A generic linear hook.
    126   1.80  christos  */
    127   1.80  christos struct hook_desc {
    128   1.80  christos 	LIST_ENTRY(hook_desc) hk_list;
    129  1.109  junyoung 	void	(*hk_fn)(void *);
    130   1.80  christos 	void	*hk_arg;
    131   1.80  christos };
    132   1.80  christos typedef LIST_HEAD(, hook_desc) hook_list_t;
    133   1.80  christos 
/* Only declared when the kernel is configured with TFTPROOT. */
#ifdef TFTPROOT
int tftproot_dhcpboot(device_t);
#endif
    137  1.157      manu 
    138  1.175        ad dev_t	dumpcdev;	/* for savecore */
    139  1.175        ad 
    140  1.126      yamt void
    141  1.126      yamt uio_setup_sysspace(struct uio *uio)
    142  1.126      yamt {
    143  1.126      yamt 
    144  1.126      yamt 	uio->uio_vmspace = vmspace_kernel();
    145  1.126      yamt }
    146  1.126      yamt 
    147   1.11   mycroft int
    148  1.117   thorpej uiomove(void *buf, size_t n, struct uio *uio)
    149    1.9       cgd {
    150  1.126      yamt 	struct vmspace *vm = uio->uio_vmspace;
    151   1.63  augustss 	struct iovec *iov;
    152  1.180     njoly 	size_t cnt;
    153    1.9       cgd 	int error = 0;
    154   1.16  christos 	char *cp = buf;
    155  1.112      yamt 
    156  1.183      yamt 	ASSERT_SLEEPABLE();
    157   1.68     enami 
    158   1.68     enami #ifdef DIAGNOSTIC
    159    1.9       cgd 	if (uio->uio_rw != UIO_READ && uio->uio_rw != UIO_WRITE)
    160    1.9       cgd 		panic("uiomove: mode");
    161    1.9       cgd #endif
    162    1.9       cgd 	while (n > 0 && uio->uio_resid) {
    163    1.9       cgd 		iov = uio->uio_iov;
    164    1.9       cgd 		cnt = iov->iov_len;
    165    1.9       cgd 		if (cnt == 0) {
    166  1.105      yamt 			KASSERT(uio->uio_iovcnt > 0);
    167    1.9       cgd 			uio->uio_iov++;
    168    1.9       cgd 			uio->uio_iovcnt--;
    169    1.9       cgd 			continue;
    170    1.9       cgd 		}
    171    1.9       cgd 		if (cnt > n)
    172    1.9       cgd 			cnt = n;
    173  1.126      yamt 		if (!VMSPACE_IS_KERNEL_P(vm)) {
    174  1.104      yamt 			if (curcpu()->ci_schedstate.spc_flags &
    175   1.67   thorpej 			    SPCF_SHOULDYIELD)
    176  1.151        ad 				preempt();
    177  1.126      yamt 		}
    178    1.9       cgd 
    179  1.126      yamt 		if (uio->uio_rw == UIO_READ) {
    180  1.126      yamt 			error = copyout_vmspace(vm, cp, iov->iov_base,
    181  1.126      yamt 			    cnt);
    182  1.126      yamt 		} else {
    183  1.126      yamt 			error = copyin_vmspace(vm, iov->iov_base, cp,
    184  1.126      yamt 			    cnt);
    185  1.126      yamt 		}
    186  1.126      yamt 		if (error) {
    187    1.9       cgd 			break;
    188    1.9       cgd 		}
    189  1.155  christos 		iov->iov_base = (char *)iov->iov_base + cnt;
    190    1.9       cgd 		iov->iov_len -= cnt;
    191    1.9       cgd 		uio->uio_resid -= cnt;
    192    1.9       cgd 		uio->uio_offset += cnt;
    193    1.9       cgd 		cp += cnt;
    194   1.85   thorpej 		KDASSERT(cnt <= n);
    195    1.9       cgd 		n -= cnt;
    196    1.9       cgd 	}
    197  1.165        ad 
    198    1.9       cgd 	return (error);
    199    1.9       cgd }
    200    1.9       cgd 
    201    1.9       cgd /*
    202  1.110    itojun  * Wrapper for uiomove() that validates the arguments against a known-good
    203  1.111      matt  * kernel buffer.
    204  1.110    itojun  */
    205  1.110    itojun int
    206  1.111      matt uiomove_frombuf(void *buf, size_t buflen, struct uio *uio)
    207  1.110    itojun {
    208  1.111      matt 	size_t offset;
    209  1.110    itojun 
    210  1.143  christos 	if (uio->uio_offset < 0 || /* uio->uio_resid < 0 || */
    211  1.110    itojun 	    (offset = uio->uio_offset) != uio->uio_offset)
    212  1.110    itojun 		return (EINVAL);
    213  1.111      matt 	if (offset >= buflen)
    214  1.110    itojun 		return (0);
    215  1.111      matt 	return (uiomove((char *)buf + offset, buflen - offset, uio));
    216  1.110    itojun }
    217  1.110    itojun 
    218  1.110    itojun /*
    219    1.9       cgd  * Give next character to user as result of read.
    220    1.9       cgd  */
    221   1.11   mycroft int
    222  1.117   thorpej ureadc(int c, struct uio *uio)
    223    1.9       cgd {
    224   1.63  augustss 	struct iovec *iov;
    225    1.9       cgd 
    226   1.11   mycroft 	if (uio->uio_resid <= 0)
    227   1.11   mycroft 		panic("ureadc: non-positive resid");
    228    1.9       cgd again:
    229   1.11   mycroft 	if (uio->uio_iovcnt <= 0)
    230   1.11   mycroft 		panic("ureadc: non-positive iovcnt");
    231    1.9       cgd 	iov = uio->uio_iov;
    232   1.11   mycroft 	if (iov->iov_len <= 0) {
    233    1.9       cgd 		uio->uio_iovcnt--;
    234    1.9       cgd 		uio->uio_iov++;
    235    1.9       cgd 		goto again;
    236    1.9       cgd 	}
    237  1.126      yamt 	if (!VMSPACE_IS_KERNEL_P(uio->uio_vmspace)) {
    238    1.9       cgd 		if (subyte(iov->iov_base, c) < 0)
    239    1.9       cgd 			return (EFAULT);
    240  1.126      yamt 	} else {
    241   1.39    kleink 		*(char *)iov->iov_base = c;
    242    1.9       cgd 	}
    243  1.155  christos 	iov->iov_base = (char *)iov->iov_base + 1;
    244    1.9       cgd 	iov->iov_len--;
    245    1.9       cgd 	uio->uio_resid--;
    246    1.9       cgd 	uio->uio_offset++;
    247    1.9       cgd 	return (0);
    248   1.82   thorpej }
    249   1.82   thorpej 
    250   1.82   thorpej /*
    251  1.126      yamt  * Like copyin(), but operates on an arbitrary vmspace.
    252   1.82   thorpej  */
    253   1.82   thorpej int
    254  1.126      yamt copyin_vmspace(struct vmspace *vm, const void *uaddr, void *kaddr, size_t len)
    255   1.82   thorpej {
    256   1.82   thorpej 	struct iovec iov;
    257   1.82   thorpej 	struct uio uio;
    258   1.82   thorpej 	int error;
    259   1.82   thorpej 
    260   1.82   thorpej 	if (len == 0)
    261   1.82   thorpej 		return (0);
    262   1.82   thorpej 
    263  1.126      yamt 	if (VMSPACE_IS_KERNEL_P(vm)) {
    264  1.126      yamt 		return kcopy(uaddr, kaddr, len);
    265  1.126      yamt 	}
    266  1.126      yamt 	if (__predict_true(vm == curproc->p_vmspace)) {
    267  1.118  christos 		return copyin(uaddr, kaddr, len);
    268  1.126      yamt 	}
    269  1.118  christos 
    270   1.82   thorpej 	iov.iov_base = kaddr;
    271   1.82   thorpej 	iov.iov_len = len;
    272   1.82   thorpej 	uio.uio_iov = &iov;
    273   1.82   thorpej 	uio.uio_iovcnt = 1;
    274  1.191     rmind 	uio.uio_offset = (off_t)(uintptr_t)uaddr;
    275   1.82   thorpej 	uio.uio_resid = len;
    276   1.82   thorpej 	uio.uio_rw = UIO_READ;
    277  1.134      yamt 	UIO_SETUP_SYSSPACE(&uio);
    278  1.126      yamt 	error = uvm_io(&vm->vm_map, &uio);
    279   1.82   thorpej 
    280   1.82   thorpej 	return (error);
    281   1.82   thorpej }
    282   1.82   thorpej 
    283   1.82   thorpej /*
    284  1.126      yamt  * Like copyout(), but operates on an arbitrary vmspace.
    285   1.82   thorpej  */
    286   1.82   thorpej int
    287  1.126      yamt copyout_vmspace(struct vmspace *vm, const void *kaddr, void *uaddr, size_t len)
    288   1.82   thorpej {
    289   1.82   thorpej 	struct iovec iov;
    290   1.82   thorpej 	struct uio uio;
    291   1.82   thorpej 	int error;
    292   1.82   thorpej 
    293   1.82   thorpej 	if (len == 0)
    294   1.82   thorpej 		return (0);
    295   1.82   thorpej 
    296  1.126      yamt 	if (VMSPACE_IS_KERNEL_P(vm)) {
    297  1.126      yamt 		return kcopy(kaddr, uaddr, len);
    298  1.126      yamt 	}
    299  1.126      yamt 	if (__predict_true(vm == curproc->p_vmspace)) {
    300  1.118  christos 		return copyout(kaddr, uaddr, len);
    301  1.126      yamt 	}
    302  1.118  christos 
    303  1.116  christos 	iov.iov_base = __UNCONST(kaddr); /* XXXUNCONST cast away const */
    304   1.82   thorpej 	iov.iov_len = len;
    305   1.82   thorpej 	uio.uio_iov = &iov;
    306   1.82   thorpej 	uio.uio_iovcnt = 1;
    307  1.191     rmind 	uio.uio_offset = (off_t)(uintptr_t)uaddr;
    308   1.82   thorpej 	uio.uio_resid = len;
    309   1.82   thorpej 	uio.uio_rw = UIO_WRITE;
    310  1.134      yamt 	UIO_SETUP_SYSSPACE(&uio);
    311  1.126      yamt 	error = uvm_io(&vm->vm_map, &uio);
    312  1.126      yamt 
    313  1.126      yamt 	return (error);
    314  1.126      yamt }
    315  1.126      yamt 
/*
 * Like copyin(), but operates on an arbitrary process.
 *
 * Takes a reference on the vmspace of `p' for the duration of the copy
 * and drops it afterwards.  Returns the error from
 * proc_vmspace_getref() if the reference cannot be obtained, otherwise
 * the result of copyin_vmspace().
 */
int
copyin_proc(struct proc *p, const void *uaddr, void *kaddr, size_t len)
{
	struct vmspace *space;
	int rv;

	rv = proc_vmspace_getref(p, &space);
	if (rv == 0) {
		rv = copyin_vmspace(space, uaddr, kaddr, len);
		uvmspace_free(space);
	}

	return rv;
}
    334   1.82   thorpej 
/*
 * Like copyout(), but operates on an arbitrary process.
 *
 * Takes a reference on the vmspace of `p' for the duration of the copy
 * and drops it afterwards.  Returns the error from
 * proc_vmspace_getref() if the reference cannot be obtained, otherwise
 * the result of copyout_vmspace().
 */
int
copyout_proc(struct proc *p, const void *kaddr, void *uaddr, size_t len)
{
	struct vmspace *space;
	int rv;

	rv = proc_vmspace_getref(p, &space);
	if (rv == 0) {
		rv = copyout_vmspace(space, kaddr, uaddr, len);
		uvmspace_free(space);
	}

	return rv;
}
    353   1.10       cgd 
    354   1.10       cgd /*
    355  1.119   reinoud  * Like copyin(), except it operates on kernel addresses when the FKIOCTL
    356  1.119   reinoud  * flag is passed in `ioctlflags' from the ioctl call.
    357  1.119   reinoud  */
    358  1.119   reinoud int
    359  1.119   reinoud ioctl_copyin(int ioctlflags, const void *src, void *dst, size_t len)
    360  1.119   reinoud {
    361  1.119   reinoud 	if (ioctlflags & FKIOCTL)
    362  1.119   reinoud 		return kcopy(src, dst, len);
    363  1.119   reinoud 	return copyin(src, dst, len);
    364  1.119   reinoud }
    365  1.119   reinoud 
    366  1.119   reinoud /*
    367  1.119   reinoud  * Like copyout(), except it operates on kernel addresses when the FKIOCTL
    368  1.119   reinoud  * flag is passed in `ioctlflags' from the ioctl call.
    369  1.119   reinoud  */
    370  1.119   reinoud int
    371  1.119   reinoud ioctl_copyout(int ioctlflags, const void *src, void *dst, size_t len)
    372  1.119   reinoud {
    373  1.119   reinoud 	if (ioctlflags & FKIOCTL)
    374  1.119   reinoud 		return kcopy(src, dst, len);
    375  1.119   reinoud 	return copyout(src, dst, len);
    376  1.119   reinoud }
    377  1.119   reinoud 
    378   1.80  christos static void *
    379  1.117   thorpej hook_establish(hook_list_t *list, void (*fn)(void *), void *arg)
    380   1.14       cgd {
    381   1.80  christos 	struct hook_desc *hd;
    382   1.14       cgd 
    383   1.80  christos 	hd = malloc(sizeof(*hd), M_DEVBUF, M_NOWAIT);
    384   1.80  christos 	if (hd == NULL)
    385   1.59     enami 		return (NULL);
    386   1.14       cgd 
    387   1.80  christos 	hd->hk_fn = fn;
    388   1.80  christos 	hd->hk_arg = arg;
    389   1.80  christos 	LIST_INSERT_HEAD(list, hd, hk_list);
    390   1.14       cgd 
    391   1.80  christos 	return (hd);
    392   1.14       cgd }
    393   1.14       cgd 
    394   1.80  christos static void
    395  1.150      yamt hook_disestablish(hook_list_t *list, void *vhook)
    396   1.14       cgd {
    397   1.14       cgd #ifdef DIAGNOSTIC
    398   1.80  christos 	struct hook_desc *hd;
    399   1.14       cgd 
    400   1.83      matt 	LIST_FOREACH(hd, list, hk_list) {
    401   1.80  christos                 if (hd == vhook)
    402   1.14       cgd 			break;
    403   1.83      matt 	}
    404   1.83      matt 
    405   1.80  christos 	if (hd == NULL)
    406   1.83      matt 		panic("hook_disestablish: hook %p not established", vhook);
    407   1.14       cgd #endif
    408   1.80  christos 	LIST_REMOVE((struct hook_desc *)vhook, hk_list);
    409   1.80  christos 	free(vhook, M_DEVBUF);
    410   1.80  christos }
    411   1.80  christos 
    412   1.80  christos static void
    413  1.117   thorpej hook_destroy(hook_list_t *list)
    414   1.80  christos {
    415   1.80  christos 	struct hook_desc *hd;
    416   1.80  christos 
    417   1.87      matt 	while ((hd = LIST_FIRST(list)) != NULL) {
    418   1.80  christos 		LIST_REMOVE(hd, hk_list);
    419   1.80  christos 		free(hd, M_DEVBUF);
    420   1.80  christos 	}
    421   1.80  christos }
    422   1.14       cgd 
    423   1.80  christos static void
    424  1.117   thorpej hook_proc_run(hook_list_t *list, struct proc *p)
    425   1.80  christos {
    426   1.80  christos 	struct hook_desc *hd;
    427   1.80  christos 
    428  1.178    dyoung 	LIST_FOREACH(hd, list, hk_list)
    429  1.178    dyoung 		((void (*)(struct proc *, void *))*hd->hk_fn)(p, hd->hk_arg);
    430   1.80  christos }
    431   1.80  christos 
    432   1.80  christos /*
    433   1.80  christos  * "Shutdown hook" types, functions, and variables.
    434   1.80  christos  *
    435   1.80  christos  * Should be invoked immediately before the
    436   1.80  christos  * system is halted or rebooted, i.e. after file systems unmounted,
    437   1.80  christos  * after crash dump done, etc.
    438   1.80  christos  *
    439   1.80  christos  * Each shutdown hook is removed from the list before it's run, so that
    440   1.80  christos  * it won't be run again.
    441   1.80  christos  */
    442   1.80  christos 
    443  1.117   thorpej static hook_list_t shutdownhook_list;
    444   1.80  christos 
    445   1.80  christos void *
    446  1.117   thorpej shutdownhook_establish(void (*fn)(void *), void *arg)
    447   1.80  christos {
    448   1.80  christos 	return hook_establish(&shutdownhook_list, fn, arg);
    449   1.80  christos }
    450   1.80  christos 
    451   1.80  christos void
    452  1.117   thorpej shutdownhook_disestablish(void *vhook)
    453   1.80  christos {
    454   1.89    simonb 	hook_disestablish(&shutdownhook_list, vhook);
    455   1.14       cgd }
    456   1.14       cgd 
    457   1.14       cgd /*
    458   1.14       cgd  * Run shutdown hooks.  Should be invoked immediately before the
    459   1.14       cgd  * system is halted or rebooted, i.e. after file systems unmounted,
    460   1.14       cgd  * after crash dump done, etc.
    461   1.17       cgd  *
    462   1.17       cgd  * Each shutdown hook is removed from the list before it's run, so that
    463   1.17       cgd  * it won't be run again.
    464   1.14       cgd  */
    465   1.14       cgd void
    466  1.117   thorpej doshutdownhooks(void)
    467   1.14       cgd {
    468   1.80  christos 	struct hook_desc *dp;
    469   1.14       cgd 
    470   1.87      matt 	while ((dp = LIST_FIRST(&shutdownhook_list)) != NULL) {
    471   1.80  christos 		LIST_REMOVE(dp, hk_list);
    472   1.80  christos 		(*dp->hk_fn)(dp->hk_arg);
    473   1.17       cgd #if 0
    474   1.17       cgd 		/*
    475   1.17       cgd 		 * Don't bother freeing the hook structure,, since we may
    476   1.17       cgd 		 * be rebooting because of a memory corruption problem,
    477   1.17       cgd 		 * and this might only make things worse.  It doesn't
    478   1.17       cgd 		 * matter, anyway, since the system is just about to
    479   1.17       cgd 		 * reboot.
    480   1.17       cgd 		 */
    481   1.17       cgd 		free(dp, M_DEVBUF);
    482   1.17       cgd #endif
    483   1.52  augustss 	}
    484   1.52  augustss }
    485   1.52  augustss 
    486   1.52  augustss /*
    487   1.80  christos  * "Mountroot hook" types, functions, and variables.
    488   1.80  christos  */
    489   1.80  christos 
    490  1.117   thorpej static hook_list_t mountroothook_list;
    491   1.80  christos 
    492   1.80  christos void *
    493  1.200    dyoung mountroothook_establish(void (*fn)(device_t), device_t dev)
    494   1.80  christos {
    495  1.109  junyoung 	return hook_establish(&mountroothook_list, (void (*)(void *))fn, dev);
    496   1.80  christos }
    497   1.80  christos 
    498   1.80  christos void
    499  1.117   thorpej mountroothook_disestablish(void *vhook)
    500   1.80  christos {
    501   1.89    simonb 	hook_disestablish(&mountroothook_list, vhook);
    502   1.80  christos }
    503   1.80  christos 
    504   1.80  christos void
    505  1.117   thorpej mountroothook_destroy(void)
    506   1.80  christos {
    507   1.80  christos 	hook_destroy(&mountroothook_list);
    508   1.80  christos }
    509   1.80  christos 
    510   1.80  christos void
    511  1.117   thorpej domountroothook(void)
    512   1.80  christos {
    513   1.80  christos 	struct hook_desc *hd;
    514   1.80  christos 
    515   1.83      matt 	LIST_FOREACH(hd, &mountroothook_list, hk_list) {
    516   1.80  christos 		if (hd->hk_arg == (void *)root_device) {
    517   1.80  christos 			(*hd->hk_fn)(hd->hk_arg);
    518   1.80  christos 			return;
    519   1.80  christos 		}
    520   1.80  christos 	}
    521   1.80  christos }
    522   1.80  christos 
    523  1.117   thorpej static hook_list_t exechook_list;
    524   1.80  christos 
    525   1.80  christos void *
    526  1.117   thorpej exechook_establish(void (*fn)(struct proc *, void *), void *arg)
    527   1.80  christos {
    528  1.109  junyoung 	return hook_establish(&exechook_list, (void (*)(void *))fn, arg);
    529   1.80  christos }
    530   1.80  christos 
    531   1.80  christos void
    532  1.117   thorpej exechook_disestablish(void *vhook)
    533   1.80  christos {
    534   1.80  christos 	hook_disestablish(&exechook_list, vhook);
    535   1.80  christos }
    536   1.80  christos 
    537   1.80  christos /*
    538   1.80  christos  * Run exec hooks.
    539   1.80  christos  */
    540   1.80  christos void
    541  1.117   thorpej doexechooks(struct proc *p)
    542   1.80  christos {
    543   1.80  christos 	hook_proc_run(&exechook_list, p);
    544   1.80  christos }
    545   1.80  christos 
    546  1.117   thorpej static hook_list_t exithook_list;
    547  1.195        ad extern krwlock_t exec_lock;
    548   1.80  christos 
    549   1.80  christos void *
    550  1.117   thorpej exithook_establish(void (*fn)(struct proc *, void *), void *arg)
    551   1.80  christos {
    552  1.195        ad 	void *rv;
    553  1.195        ad 
    554  1.195        ad 	rw_enter(&exec_lock, RW_WRITER);
    555  1.195        ad 	rv = hook_establish(&exithook_list, (void (*)(void *))fn, arg);
    556  1.195        ad 	rw_exit(&exec_lock);
    557  1.195        ad 	return rv;
    558   1.80  christos }
    559   1.80  christos 
    560   1.80  christos void
    561  1.117   thorpej exithook_disestablish(void *vhook)
    562   1.80  christos {
    563  1.195        ad 
    564  1.195        ad 	rw_enter(&exec_lock, RW_WRITER);
    565   1.80  christos 	hook_disestablish(&exithook_list, vhook);
    566  1.195        ad 	rw_exit(&exec_lock);
    567   1.80  christos }
    568   1.80  christos 
    569   1.80  christos /*
    570   1.80  christos  * Run exit hooks.
    571   1.80  christos  */
    572   1.80  christos void
    573  1.117   thorpej doexithooks(struct proc *p)
    574   1.80  christos {
    575   1.80  christos 	hook_proc_run(&exithook_list, p);
    576   1.96   thorpej }
    577   1.96   thorpej 
    578  1.117   thorpej static hook_list_t forkhook_list;
    579   1.96   thorpej 
    580   1.96   thorpej void *
    581  1.117   thorpej forkhook_establish(void (*fn)(struct proc *, struct proc *))
    582   1.96   thorpej {
    583  1.109  junyoung 	return hook_establish(&forkhook_list, (void (*)(void *))fn, NULL);
    584   1.96   thorpej }
    585   1.96   thorpej 
    586   1.96   thorpej void
    587  1.117   thorpej forkhook_disestablish(void *vhook)
    588   1.96   thorpej {
    589   1.96   thorpej 	hook_disestablish(&forkhook_list, vhook);
    590   1.96   thorpej }
    591   1.96   thorpej 
    592   1.96   thorpej /*
    593   1.96   thorpej  * Run fork hooks.
    594   1.96   thorpej  */
    595   1.96   thorpej void
    596  1.117   thorpej doforkhooks(struct proc *p2, struct proc *p1)
    597   1.96   thorpej {
    598   1.96   thorpej 	struct hook_desc *hd;
    599   1.96   thorpej 
    600   1.96   thorpej 	LIST_FOREACH(hd, &forkhook_list, hk_list) {
    601  1.109  junyoung 		((void (*)(struct proc *, struct proc *))*hd->hk_fn)
    602   1.96   thorpej 		    (p2, p1);
    603   1.96   thorpej 	}
    604   1.80  christos }
    605   1.80  christos 
    606   1.80  christos /*
    607   1.52  augustss  * "Power hook" types, functions, and variables.
    608   1.71  augustss  * The list of power hooks is kept ordered with the last registered hook
    609   1.71  augustss  * first.
    610   1.71  augustss  * When running the hooks on power down the hooks are called in reverse
    611   1.71  augustss  * registration order, when powering up in registration order.
    612   1.52  augustss  */
    613   1.52  augustss struct powerhook_desc {
    614   1.71  augustss 	CIRCLEQ_ENTRY(powerhook_desc) sfd_list;
    615  1.109  junyoung 	void	(*sfd_fn)(int, void *);
    616   1.52  augustss 	void	*sfd_arg;
    617  1.144  jmcneill 	char	sfd_name[16];
    618   1.52  augustss };
    619   1.52  augustss 
    620  1.117   thorpej static CIRCLEQ_HEAD(, powerhook_desc) powerhook_list =
    621  1.117   thorpej     CIRCLEQ_HEAD_INITIALIZER(powerhook_list);
    622   1.52  augustss 
    623   1.52  augustss void *
    624  1.145    dogcow powerhook_establish(const char *name, void (*fn)(int, void *), void *arg)
    625   1.52  augustss {
    626   1.52  augustss 	struct powerhook_desc *ndp;
    627   1.52  augustss 
    628   1.52  augustss 	ndp = (struct powerhook_desc *)
    629   1.52  augustss 	    malloc(sizeof(*ndp), M_DEVBUF, M_NOWAIT);
    630   1.52  augustss 	if (ndp == NULL)
    631   1.59     enami 		return (NULL);
    632   1.52  augustss 
    633   1.52  augustss 	ndp->sfd_fn = fn;
    634   1.52  augustss 	ndp->sfd_arg = arg;
    635  1.144  jmcneill 	strlcpy(ndp->sfd_name, name, sizeof(ndp->sfd_name));
    636   1.71  augustss 	CIRCLEQ_INSERT_HEAD(&powerhook_list, ndp, sfd_list);
    637   1.52  augustss 
    638  1.167  jmcneill 	aprint_error("%s: WARNING: powerhook_establish is deprecated\n", name);
    639   1.52  augustss 	return (ndp);
    640   1.52  augustss }
    641   1.52  augustss 
    642   1.52  augustss void
    643  1.117   thorpej powerhook_disestablish(void *vhook)
    644   1.52  augustss {
    645   1.52  augustss #ifdef DIAGNOSTIC
    646   1.52  augustss 	struct powerhook_desc *dp;
    647   1.52  augustss 
    648   1.71  augustss 	CIRCLEQ_FOREACH(dp, &powerhook_list, sfd_list)
    649   1.52  augustss                 if (dp == vhook)
    650   1.71  augustss 			goto found;
    651   1.83      matt 	panic("powerhook_disestablish: hook %p not established", vhook);
    652   1.71  augustss  found:
    653   1.52  augustss #endif
    654   1.52  augustss 
    655   1.71  augustss 	CIRCLEQ_REMOVE(&powerhook_list, (struct powerhook_desc *)vhook,
    656   1.71  augustss 	    sfd_list);
    657   1.52  augustss 	free(vhook, M_DEVBUF);
    658   1.52  augustss }
    659   1.52  augustss 
    660   1.52  augustss /*
    661   1.52  augustss  * Run power hooks.
    662   1.52  augustss  */
    663   1.52  augustss void
    664  1.117   thorpej dopowerhooks(int why)
    665   1.52  augustss {
    666   1.52  augustss 	struct powerhook_desc *dp;
    667   1.52  augustss 
    668  1.144  jmcneill #ifdef POWERHOOK_DEBUG
    669  1.162  christos 	const char *why_name;
    670  1.163  degroote 	static const char * pwr_names[] = {PWR_NAMES};
    671  1.163  degroote 	why_name = why < __arraycount(pwr_names) ? pwr_names[why] : "???";
    672  1.144  jmcneill #endif
    673  1.144  jmcneill 
    674   1.73  takemura 	if (why == PWR_RESUME || why == PWR_SOFTRESUME) {
    675   1.71  augustss 		CIRCLEQ_FOREACH_REVERSE(dp, &powerhook_list, sfd_list) {
    676  1.144  jmcneill #ifdef POWERHOOK_DEBUG
    677  1.162  christos 			printf("dopowerhooks %s: %s (%p)\n", why_name, dp->sfd_name, dp);
    678  1.144  jmcneill #endif
    679   1.71  augustss 			(*dp->sfd_fn)(why, dp->sfd_arg);
    680   1.71  augustss 		}
    681   1.71  augustss 	} else {
    682   1.71  augustss 		CIRCLEQ_FOREACH(dp, &powerhook_list, sfd_list) {
    683  1.144  jmcneill #ifdef POWERHOOK_DEBUG
    684  1.162  christos 			printf("dopowerhooks %s: %s (%p)\n", why_name, dp->sfd_name, dp);
    685  1.144  jmcneill #endif
    686   1.71  augustss 			(*dp->sfd_fn)(why, dp->sfd_arg);
    687   1.71  augustss 		}
    688   1.18   thorpej 	}
    689  1.144  jmcneill 
    690  1.144  jmcneill #ifdef POWERHOOK_DEBUG
    691  1.162  christos 	printf("dopowerhooks: %s done\n", why_name);
    692  1.144  jmcneill #endif
    693   1.18   thorpej }
    694   1.18   thorpej 
    695  1.160  christos static int
    696  1.200    dyoung isswap(device_t dv)
    697  1.160  christos {
    698  1.160  christos 	struct dkwedge_info wi;
    699  1.160  christos 	struct vnode *vn;
    700  1.160  christos 	int error;
    701  1.160  christos 
    702  1.160  christos 	if (device_class(dv) != DV_DISK || !device_is_a(dv, "dk"))
    703  1.160  christos 		return 0;
    704  1.160  christos 
    705  1.160  christos 	if ((vn = opendisk(dv)) == NULL)
    706  1.160  christos 		return 0;
    707  1.160  christos 
    708  1.166     pooka 	error = VOP_IOCTL(vn, DIOCGWEDGEINFO, &wi, FREAD, NOCRED);
    709  1.166     pooka 	VOP_CLOSE(vn, FREAD, NOCRED);
    710  1.160  christos 	vput(vn);
    711  1.160  christos 	if (error) {
    712  1.160  christos #ifdef DEBUG_WEDGE
    713  1.184    cegger 		printf("%s: Get wedge info returned %d\n", device_xname(dv), error);
    714  1.160  christos #endif
    715  1.160  christos 		return 0;
    716  1.160  christos 	}
    717  1.160  christos 	return strcmp(wi.dkw_ptype, DKW_PTYPE_SWAP) == 0;
    718  1.160  christos }
    719  1.160  christos 
    720   1.18   thorpej /*
    721   1.18   thorpej  * Determine the root device and, if instructed to, the root file system.
    722   1.18   thorpej  */
    723   1.18   thorpej 
    724   1.18   thorpej #include "md.h"
    725   1.18   thorpej 
#if NMD > 0
/* Driver record of the md device; setroot() boots from its unit 0. */
extern struct cfdriver md_cd;
/*
 * When non-zero, setroot() replaces the boot device with md unit 0 and
 * the boot partition with 0.  The initial value is chosen at compile
 * time by MEMORY_DISK_IS_ROOT.
 */
#ifdef MEMORY_DISK_IS_ROOT
int md_is_root = 1;
#else
int md_is_root = 0;
#endif /* MEMORY_DISK_IS_ROOT */
#endif /* NMD > 0 */
    734  1.108  christos 
/*
 * The device and wedge that we booted from.  If booted_wedge is NULL,
 * then we might consult booted_partition.
 */
device_t booted_device;
device_t booted_wedge;
int booted_partition;
    742  1.113   thorpej 
/*
 * Use partition letters if it's a disk class but not a wedge.
 * XXX Check for wedge is kinda gross.
 *
 * Evaluates to non-zero for a DV_DISK device that is not a "dk"
 * (wedge) device.  Note that `dv' is evaluated twice.
 */
#define	DEV_USES_PARTITIONS(dv)						\
	(device_class((dv)) == DV_DISK &&				\
	 !device_is_a((dv), "dk"))
    750  1.113   thorpej 
    751   1.18   thorpej void
    752  1.200    dyoung setroot(device_t bootdv, int bootpartition)
    753   1.18   thorpej {
    754  1.200    dyoung 	device_t dv;
    755  1.159    dyoung 	int len, majdev;
    756   1.25       mrg 	dev_t nrootdev;
    757   1.26   thorpej 	dev_t ndumpdev = NODEV;
    758   1.18   thorpej 	char buf[128];
    759   1.18   thorpej 	const char *rootdevname;
    760   1.26   thorpej 	const char *dumpdevname;
    761  1.200    dyoung 	device_t rootdv = NULL;		/* XXX gcc -Wuninitialized */
    762  1.200    dyoung 	device_t dumpdv = NULL;
    763   1.18   thorpej 	struct ifnet *ifp;
    764   1.18   thorpej 	const char *deffsname;
    765   1.18   thorpej 	struct vfsops *vops;
    766   1.18   thorpej 
    767  1.157      manu #ifdef TFTPROOT
    768  1.157      manu 	if (tftproot_dhcpboot(bootdv) != 0)
    769  1.157      manu 		boothowto |= RB_ASKNAME;
    770  1.157      manu #endif
    771  1.157      manu 
    772  1.187        ad #if NMD > 0
    773  1.187        ad 	if (md_is_root) {
    774  1.190  drochner 		/*
    775  1.190  drochner 		 * XXX there should be "root on md0" in the config file,
    776  1.190  drochner 		 * but it isn't always
    777  1.190  drochner 		 */
    778  1.190  drochner 		bootdv = md_cd.cd_devs[0];
    779  1.187        ad 		bootpartition = 0;
    780   1.28       leo 	}
    781   1.18   thorpej #endif
    782   1.18   thorpej 
    783   1.18   thorpej 	/*
    784   1.18   thorpej 	 * If NFS is specified as the file system, and we found
    785   1.18   thorpej 	 * a DV_DISK boot device (or no boot device at all), then
    786   1.18   thorpej 	 * find a reasonable network interface for "rootspec".
    787   1.18   thorpej 	 */
    788  1.197  pgoyette 	vops = vfs_getopsbyname(MOUNT_NFS);
    789  1.197  pgoyette 	if (vops != NULL && strcmp(rootfstype, MOUNT_NFS) == 0 &&
    790   1.18   thorpej 	    rootspec == NULL &&
    791  1.124   thorpej 	    (bootdv == NULL || device_class(bootdv) != DV_IFNET)) {
    792  1.115      matt 		IFNET_FOREACH(ifp) {
    793   1.18   thorpej 			if ((ifp->if_flags &
    794   1.18   thorpej 			     (IFF_LOOPBACK|IFF_POINTOPOINT)) == 0)
    795   1.18   thorpej 				break;
    796   1.83      matt 		}
    797   1.18   thorpej 		if (ifp == NULL) {
    798   1.18   thorpej 			/*
    799   1.18   thorpej 			 * Can't find a suitable interface; ask the
    800   1.18   thorpej 			 * user.
    801   1.18   thorpej 			 */
    802   1.18   thorpej 			boothowto |= RB_ASKNAME;
    803   1.18   thorpej 		} else {
    804   1.18   thorpej 			/*
    805   1.18   thorpej 			 * Have a suitable interface; behave as if
    806   1.18   thorpej 			 * the user specified this interface.
    807   1.18   thorpej 			 */
    808   1.18   thorpej 			rootspec = (const char *)ifp->if_xname;
    809   1.18   thorpej 		}
    810   1.18   thorpej 	}
    811  1.165        ad 	if (vops != NULL)
    812  1.165        ad 		vfs_delref(vops);
    813   1.24   thorpej 
    814   1.24   thorpej 	/*
    815   1.24   thorpej 	 * If wildcarded root and we the boot device wasn't determined,
    816   1.24   thorpej 	 * ask the user.
    817   1.24   thorpej 	 */
    818   1.24   thorpej 	if (rootspec == NULL && bootdv == NULL)
    819   1.24   thorpej 		boothowto |= RB_ASKNAME;
    820   1.18   thorpej 
    821   1.18   thorpej  top:
    822   1.18   thorpej 	if (boothowto & RB_ASKNAME) {
    823  1.200    dyoung 		device_t defdumpdv;
    824   1.26   thorpej 
    825   1.18   thorpej 		for (;;) {
    826   1.18   thorpej 			printf("root device");
    827   1.18   thorpej 			if (bootdv != NULL) {
    828  1.184    cegger 				printf(" (default %s", device_xname(bootdv));
    829  1.113   thorpej 				if (DEV_USES_PARTITIONS(bootdv))
    830   1.18   thorpej 					printf("%c", bootpartition + 'a');
    831   1.18   thorpej 				printf(")");
    832   1.18   thorpej 			}
    833   1.18   thorpej 			printf(": ");
    834   1.64    itojun 			len = cngetsn(buf, sizeof(buf));
    835   1.18   thorpej 			if (len == 0 && bootdv != NULL) {
    836  1.184    cegger 				strlcpy(buf, device_xname(bootdv), sizeof(buf));
    837   1.18   thorpej 				len = strlen(buf);
    838   1.18   thorpej 			}
    839   1.18   thorpej 			if (len > 0 && buf[len - 1] == '*') {
    840   1.18   thorpej 				buf[--len] = '\0';
    841   1.51   thorpej 				dv = getdisk(buf, len, 1, &nrootdev, 0);
    842   1.18   thorpej 				if (dv != NULL) {
    843   1.18   thorpej 					rootdv = dv;
    844   1.25       mrg 					break;
    845   1.18   thorpej 				}
    846   1.18   thorpej 			}
    847   1.51   thorpej 			dv = getdisk(buf, len, bootpartition, &nrootdev, 0);
    848   1.18   thorpej 			if (dv != NULL) {
    849   1.18   thorpej 				rootdv = dv;
    850   1.18   thorpej 				break;
    851   1.18   thorpej 			}
    852   1.18   thorpej 		}
    853   1.18   thorpej 
    854   1.26   thorpej 		/*
    855   1.26   thorpej 		 * Set up the default dump device.  If root is on
    856   1.26   thorpej 		 * a network device, there is no default dump
    857   1.26   thorpej 		 * device, since we don't support dumps to the
    858   1.26   thorpej 		 * network.
    859   1.26   thorpej 		 */
    860  1.113   thorpej 		if (DEV_USES_PARTITIONS(rootdv) == 0)
    861   1.26   thorpej 			defdumpdv = NULL;
    862   1.26   thorpej 		else
    863   1.26   thorpej 			defdumpdv = rootdv;
    864   1.26   thorpej 
    865   1.26   thorpej 		for (;;) {
    866   1.26   thorpej 			printf("dump device");
    867   1.26   thorpej 			if (defdumpdv != NULL) {
    868   1.26   thorpej 				/*
    869   1.26   thorpej 				 * Note, we know it's a disk if we get here.
    870   1.26   thorpej 				 */
    871  1.184    cegger 				printf(" (default %sb)", device_xname(defdumpdv));
    872   1.26   thorpej 			}
    873   1.26   thorpej 			printf(": ");
    874   1.64    itojun 			len = cngetsn(buf, sizeof(buf));
    875   1.26   thorpej 			if (len == 0) {
    876   1.26   thorpej 				if (defdumpdv != NULL) {
    877   1.26   thorpej 					ndumpdev = MAKEDISKDEV(major(nrootdev),
    878   1.26   thorpej 					    DISKUNIT(nrootdev), 1);
    879   1.26   thorpej 				}
    880   1.54     enami 				dumpdv = defdumpdv;
    881   1.26   thorpej 				break;
    882   1.26   thorpej 			}
    883   1.26   thorpej 			if (len == 4 && strcmp(buf, "none") == 0) {
    884   1.55     enami 				dumpdv = NULL;
    885   1.54     enami 				break;
    886   1.26   thorpej 			}
    887   1.51   thorpej 			dv = getdisk(buf, len, 1, &ndumpdev, 1);
    888   1.55     enami 			if (dv != NULL) {
    889   1.26   thorpej 				dumpdv = dv;
    890   1.26   thorpej 				break;
    891   1.26   thorpej 			}
    892   1.26   thorpej 		}
    893   1.26   thorpej 
    894   1.18   thorpej 		rootdev = nrootdev;
    895   1.26   thorpej 		dumpdev = ndumpdev;
    896   1.18   thorpej 
    897   1.36   thorpej 		for (vops = LIST_FIRST(&vfs_list); vops != NULL;
    898   1.36   thorpej 		     vops = LIST_NEXT(vops, vfs_list)) {
    899   1.36   thorpej 			if (vops->vfs_mountroot != NULL &&
    900  1.197  pgoyette 			    strcmp(rootfstype, vops->vfs_name) == 0)
    901   1.38      fvdl 			break;
    902   1.18   thorpej 		}
    903   1.36   thorpej 
    904   1.36   thorpej 		if (vops == NULL) {
    905   1.18   thorpej 			deffsname = "generic";
    906   1.18   thorpej 		} else
    907   1.36   thorpej 			deffsname = vops->vfs_name;
    908   1.36   thorpej 
    909   1.18   thorpej 		for (;;) {
    910   1.18   thorpej 			printf("file system (default %s): ", deffsname);
    911   1.64    itojun 			len = cngetsn(buf, sizeof(buf));
    912  1.197  pgoyette 			if (len == 0) {
    913  1.197  pgoyette 				if (strcmp(deffsname, "generic") == 0)
    914  1.197  pgoyette 					rootfstype = ROOT_FSTYPE_ANY;
    915   1.18   thorpej 				break;
    916  1.197  pgoyette 			}
    917   1.18   thorpej 			if (len == 4 && strcmp(buf, "halt") == 0)
    918   1.23       gwr 				cpu_reboot(RB_HALT, NULL);
    919   1.76   thorpej 			else if (len == 6 && strcmp(buf, "reboot") == 0)
    920   1.76   thorpej 				cpu_reboot(0, NULL);
    921   1.78   thorpej #if defined(DDB)
    922   1.78   thorpej 			else if (len == 3 && strcmp(buf, "ddb") == 0) {
    923   1.78   thorpej 				console_debugger();
    924   1.78   thorpej 			}
    925   1.78   thorpej #endif
    926   1.18   thorpej 			else if (len == 7 && strcmp(buf, "generic") == 0) {
    927  1.197  pgoyette 				rootfstype = ROOT_FSTYPE_ANY;
    928   1.18   thorpej 				break;
    929   1.18   thorpej 			}
    930   1.18   thorpej 			vops = vfs_getopsbyname(buf);
    931   1.18   thorpej 			if (vops == NULL || vops->vfs_mountroot == NULL) {
    932   1.18   thorpej 				printf("use one of: generic");
    933   1.36   thorpej 				for (vops = LIST_FIRST(&vfs_list);
    934   1.36   thorpej 				     vops != NULL;
    935   1.36   thorpej 				     vops = LIST_NEXT(vops, vfs_list)) {
    936   1.36   thorpej 					if (vops->vfs_mountroot != NULL)
    937   1.36   thorpej 						printf(" %s", vops->vfs_name);
    938   1.36   thorpej 				}
    939  1.197  pgoyette 				if (vops != NULL)
    940  1.197  pgoyette 					vfs_delref(vops);
    941   1.78   thorpej #if defined(DDB)
    942   1.78   thorpej 				printf(" ddb");
    943   1.78   thorpej #endif
    944   1.76   thorpej 				printf(" halt reboot\n");
    945   1.18   thorpej 			} else {
    946  1.197  pgoyette 				/*
    947  1.197  pgoyette 				 * XXX If *vops gets freed between here and
    948  1.197  pgoyette 				 * the call to mountroot(), rootfstype will
    949  1.197  pgoyette 				 * point to something unexpected.  But in
    950  1.197  pgoyette 				 * this case the system will fail anyway.
    951  1.197  pgoyette 				 */
    952  1.197  pgoyette 				rootfstype = vops->vfs_name;
    953  1.165        ad 				vfs_delref(vops);
    954   1.18   thorpej 				break;
    955   1.18   thorpej 			}
    956   1.18   thorpej 		}
    957   1.18   thorpej 
    958   1.18   thorpej 	} else if (rootspec == NULL) {
    959   1.18   thorpej 		/*
    960   1.18   thorpej 		 * Wildcarded root; use the boot device.
    961   1.18   thorpej 		 */
    962   1.26   thorpej 		rootdv = bootdv;
    963   1.26   thorpej 
    964  1.188  christos 		if (bootdv)
    965  1.188  christos 			majdev = devsw_name2blk(device_xname(bootdv), NULL, 0);
    966  1.188  christos 		else
    967  1.188  christos 			majdev = -1;
    968   1.18   thorpej 		if (majdev >= 0) {
    969   1.18   thorpej 			/*
    970  1.113   thorpej 			 * Root is on a disk.  `bootpartition' is root,
    971  1.113   thorpej 			 * unless the device does not use partitions.
    972   1.18   thorpej 			 */
    973  1.113   thorpej 			if (DEV_USES_PARTITIONS(bootdv))
    974  1.135   thorpej 				rootdev = MAKEDISKDEV(majdev,
    975  1.135   thorpej 						      device_unit(bootdv),
    976  1.135   thorpej 						      bootpartition);
    977  1.113   thorpej 			else
    978  1.135   thorpej 				rootdev = makedev(majdev, device_unit(bootdv));
    979   1.18   thorpej 		}
    980   1.18   thorpej 	} else {
    981   1.18   thorpej 
    982   1.18   thorpej 		/*
    983   1.25       mrg 		 * `root on <dev> ...'
    984   1.18   thorpej 		 */
    985   1.18   thorpej 
    986   1.18   thorpej 		/*
    987   1.18   thorpej 		 * If it's a network interface, we can bail out
    988   1.18   thorpej 		 * early.
    989   1.18   thorpej 		 */
    990   1.56     enami 		dv = finddevice(rootspec);
    991  1.124   thorpej 		if (dv != NULL && device_class(dv) == DV_IFNET) {
    992   1.26   thorpej 			rootdv = dv;
    993   1.26   thorpej 			goto haveroot;
    994   1.18   thorpej 		}
    995   1.18   thorpej 
    996  1.159    dyoung 		if (rootdev == NODEV &&
    997  1.159    dyoung 		    device_class(dv) == DV_DISK && device_is_a(dv, "dk") &&
    998  1.184    cegger 		    (majdev = devsw_name2blk(device_xname(dv), NULL, 0)) >= 0)
    999  1.159    dyoung 			rootdev = makedev(majdev, device_unit(dv));
   1000  1.159    dyoung 
   1001   1.88   gehenna 		rootdevname = devsw_blk2name(major(rootdev));
   1002   1.18   thorpej 		if (rootdevname == NULL) {
   1003  1.198  christos 			printf("unknown device major 0x%llx\n",
   1004  1.198  christos 			    (unsigned long long)rootdev);
   1005   1.18   thorpej 			boothowto |= RB_ASKNAME;
   1006   1.18   thorpej 			goto top;
   1007   1.18   thorpej 		}
   1008   1.41     perry 		memset(buf, 0, sizeof(buf));
   1009  1.198  christos 		snprintf(buf, sizeof(buf), "%s%llu", rootdevname,
   1010  1.198  christos 		    (unsigned long long)DISKUNIT(rootdev));
   1011   1.18   thorpej 
   1012   1.56     enami 		rootdv = finddevice(buf);
   1013   1.26   thorpej 		if (rootdv == NULL) {
   1014  1.198  christos 			printf("device %s (0x%llx) not configured\n",
   1015  1.198  christos 			    buf, (unsigned long long)rootdev);
   1016   1.18   thorpej 			boothowto |= RB_ASKNAME;
   1017   1.18   thorpej 			goto top;
   1018   1.18   thorpej 		}
   1019   1.26   thorpej 	}
   1020   1.18   thorpej 
   1021   1.26   thorpej  haveroot:
   1022   1.18   thorpej 
   1023   1.18   thorpej 	root_device = rootdv;
   1024   1.18   thorpej 
   1025  1.124   thorpej 	switch (device_class(rootdv)) {
   1026   1.18   thorpej 	case DV_IFNET:
   1027  1.139  christos 	case DV_DISK:
   1028  1.184    cegger 		aprint_normal("root on %s", device_xname(rootdv));
   1029  1.140  christos 		if (DEV_USES_PARTITIONS(rootdv))
   1030  1.198  christos 			aprint_normal("%c", (int)DISKPART(rootdev) + 'a');
   1031   1.18   thorpej 		break;
   1032   1.18   thorpej 
   1033   1.18   thorpej 	default:
   1034   1.18   thorpej 		printf("can't determine root device\n");
   1035   1.18   thorpej 		boothowto |= RB_ASKNAME;
   1036   1.18   thorpej 		goto top;
   1037   1.18   thorpej 	}
   1038   1.26   thorpej 
   1039   1.26   thorpej 	/*
   1040   1.26   thorpej 	 * Now configure the dump device.
   1041   1.55     enami 	 *
   1042   1.26   thorpej 	 * If we haven't figured out the dump device, do so, with
   1043   1.26   thorpej 	 * the following rules:
   1044   1.26   thorpej 	 *
   1045   1.26   thorpej 	 *	(a) We already know dumpdv in the RB_ASKNAME case.
   1046   1.26   thorpej 	 *
   1047   1.26   thorpej 	 *	(b) If dumpspec is set, try to use it.  If the device
   1048   1.26   thorpej 	 *	    is not available, punt.
   1049   1.26   thorpej 	 *
   1050   1.26   thorpej 	 *	(c) If dumpspec is not set, the dump device is
   1051   1.26   thorpej 	 *	    wildcarded or unspecified.  If the root device
   1052   1.26   thorpej 	 *	    is DV_IFNET, punt.  Otherwise, use partition b
   1053   1.26   thorpej 	 *	    of the root device.
   1054   1.26   thorpej 	 */
   1055   1.26   thorpej 
   1056   1.55     enami 	if (boothowto & RB_ASKNAME) {		/* (a) */
   1057   1.55     enami 		if (dumpdv == NULL)
   1058   1.55     enami 			goto nodumpdev;
   1059   1.55     enami 	} else if (dumpspec != NULL) {		/* (b) */
   1060   1.55     enami 		if (strcmp(dumpspec, "none") == 0 || dumpdev == NODEV) {
   1061   1.26   thorpej 			/*
   1062   1.55     enami 			 * Operator doesn't want a dump device.
   1063   1.55     enami 			 * Or looks like they tried to pick a network
   1064   1.26   thorpej 			 * device.  Oops.
   1065   1.26   thorpej 			 */
   1066   1.26   thorpej 			goto nodumpdev;
   1067   1.26   thorpej 		}
   1068   1.26   thorpej 
   1069   1.88   gehenna 		dumpdevname = devsw_blk2name(major(dumpdev));
   1070   1.26   thorpej 		if (dumpdevname == NULL)
   1071   1.26   thorpej 			goto nodumpdev;
   1072   1.41     perry 		memset(buf, 0, sizeof(buf));
   1073  1.198  christos 		snprintf(buf, sizeof(buf), "%s%llu", dumpdevname,
   1074  1.198  christos 		    (unsigned long long)DISKUNIT(dumpdev));
   1075   1.26   thorpej 
   1076   1.56     enami 		dumpdv = finddevice(buf);
   1077   1.56     enami 		if (dumpdv == NULL) {
   1078   1.26   thorpej 			/*
   1079   1.26   thorpej 			 * Device not configured.
   1080   1.26   thorpej 			 */
   1081   1.26   thorpej 			goto nodumpdev;
   1082   1.26   thorpej 		}
   1083   1.55     enami 	} else {				/* (c) */
   1084  1.160  christos 		if (DEV_USES_PARTITIONS(rootdv) == 0) {
   1085  1.160  christos 			for (dv = TAILQ_FIRST(&alldevs); dv != NULL;
   1086  1.160  christos 			    dv = TAILQ_NEXT(dv, dv_list))
   1087  1.160  christos 				if (isswap(dv))
   1088  1.160  christos 					break;
   1089  1.160  christos 			if (dv == NULL)
   1090  1.160  christos 				goto nodumpdev;
   1091  1.160  christos 
   1092  1.184    cegger 			majdev = devsw_name2blk(device_xname(dv), NULL, 0);
   1093  1.160  christos 			if (majdev < 0)
   1094  1.160  christos 				goto nodumpdev;
   1095  1.160  christos 			dumpdv = dv;
   1096  1.160  christos 			dumpdev = makedev(majdev, device_unit(dumpdv));
   1097  1.160  christos 		} else {
   1098   1.55     enami 			dumpdv = rootdv;
   1099   1.55     enami 			dumpdev = MAKEDISKDEV(major(rootdev),
   1100  1.135   thorpej 			    device_unit(dumpdv), 1);
   1101   1.55     enami 		}
   1102   1.26   thorpej 	}
   1103   1.26   thorpej 
   1104  1.175        ad 	dumpcdev = devsw_blk2chr(dumpdev);
   1105  1.184    cegger 	aprint_normal(" dumps on %s", device_xname(dumpdv));
   1106  1.140  christos 	if (DEV_USES_PARTITIONS(dumpdv))
   1107  1.198  christos 		aprint_normal("%c", (int)DISKPART(dumpdev) + 'a');
   1108  1.140  christos 	aprint_normal("\n");
   1109   1.26   thorpej 	return;
   1110   1.26   thorpej 
   1111   1.26   thorpej  nodumpdev:
   1112   1.26   thorpej 	dumpdev = NODEV;
   1113  1.175        ad 	dumpcdev = NODEV;
   1114  1.100   thorpej 	aprint_normal("\n");
   1115   1.18   thorpej }
   1116   1.18   thorpej 
   1117  1.200    dyoung static device_t
   1118  1.117   thorpej finddevice(const char *name)
   1119   1.56     enami {
   1120  1.159    dyoung 	const char *wname;
   1121  1.108  christos 
   1122  1.159    dyoung 	if ((wname = getwedgename(name, strlen(name))) != NULL)
   1123  1.159    dyoung 		return dkwedge_find_by_wname(wname);
   1124  1.159    dyoung 
   1125  1.179     joerg 	return device_find_by_xname(name);
   1126   1.56     enami }
   1127   1.56     enami 
   1128  1.200    dyoung static device_t
   1129  1.117   thorpej getdisk(char *str, int len, int defpart, dev_t *devp, int isdump)
   1130   1.18   thorpej {
   1131  1.200    dyoung 	device_t dv;
   1132   1.18   thorpej 
   1133   1.51   thorpej 	if ((dv = parsedisk(str, len, defpart, devp)) == NULL) {
   1134   1.18   thorpej 		printf("use one of:");
   1135   1.83      matt 		TAILQ_FOREACH(dv, &alldevs, dv_list) {
   1136  1.113   thorpej 			if (DEV_USES_PARTITIONS(dv))
   1137  1.184    cegger 				printf(" %s[a-%c]", device_xname(dv),
   1138   1.19       cgd 				    'a' + MAXPARTITIONS - 1);
   1139  1.124   thorpej 			else if (device_class(dv) == DV_DISK)
   1140  1.184    cegger 				printf(" %s", device_xname(dv));
   1141  1.124   thorpej 			if (isdump == 0 && device_class(dv) == DV_IFNET)
   1142  1.184    cegger 				printf(" %s", device_xname(dv));
   1143   1.18   thorpej 		}
   1144  1.159    dyoung 		dkwedge_print_wnames();
   1145   1.26   thorpej 		if (isdump)
   1146   1.26   thorpej 			printf(" none");
   1147   1.78   thorpej #if defined(DDB)
   1148   1.78   thorpej 		printf(" ddb");
   1149   1.78   thorpej #endif
   1150   1.76   thorpej 		printf(" halt reboot\n");
   1151   1.18   thorpej 	}
   1152  1.159    dyoung 	return dv;
   1153  1.159    dyoung }
   1154  1.159    dyoung 
/*
 * If `name' (whose length is `namelen') begins with the prefix
 * "wedge:", return a pointer to the text following the prefix;
 * otherwise return NULL.
 */
static const char *
getwedgename(const char *name, int namelen)
{
	static const char prefix[] = "wedge:";
	const int prefixlen = (int)sizeof(prefix) - 1;

	if (namelen >= prefixlen && strncmp(name, prefix, prefixlen) == 0)
		return name + prefixlen;

	return NULL;
}
   1166   1.18   thorpej 
   1167  1.200    dyoung static device_t
   1168  1.117   thorpej parsedisk(char *str, int len, int defpart, dev_t *devp)
   1169   1.18   thorpej {
   1170  1.200    dyoung 	device_t dv;
   1171  1.159    dyoung 	const char *wname;
   1172   1.18   thorpej 	char *cp, c;
   1173   1.29  drochner 	int majdev, part;
   1174   1.18   thorpej 	if (len == 0)
   1175   1.18   thorpej 		return (NULL);
   1176   1.18   thorpej 
   1177   1.18   thorpej 	if (len == 4 && strcmp(str, "halt") == 0)
   1178   1.23       gwr 		cpu_reboot(RB_HALT, NULL);
   1179   1.76   thorpej 	else if (len == 6 && strcmp(str, "reboot") == 0)
   1180   1.76   thorpej 		cpu_reboot(0, NULL);
   1181   1.78   thorpej #if defined(DDB)
   1182   1.78   thorpej 	else if (len == 3 && strcmp(str, "ddb") == 0)
   1183   1.78   thorpej 		console_debugger();
   1184   1.78   thorpej #endif
   1185   1.18   thorpej 
   1186   1.18   thorpej 	cp = str + len - 1;
   1187   1.18   thorpej 	c = *cp;
   1188  1.159    dyoung 
   1189  1.159    dyoung 	if ((wname = getwedgename(str, len)) != NULL) {
   1190  1.159    dyoung 		if ((dv = dkwedge_find_by_wname(wname)) == NULL)
   1191  1.159    dyoung 			return NULL;
   1192  1.159    dyoung 		part = defpart;
   1193  1.159    dyoung 		goto gotdisk;
   1194  1.159    dyoung 	} else if (c >= 'a' && c <= ('a' + MAXPARTITIONS - 1)) {
   1195   1.18   thorpej 		part = c - 'a';
   1196   1.18   thorpej 		*cp = '\0';
   1197   1.18   thorpej 	} else
   1198   1.18   thorpej 		part = defpart;
   1199   1.18   thorpej 
   1200   1.56     enami 	dv = finddevice(str);
   1201   1.56     enami 	if (dv != NULL) {
   1202  1.124   thorpej 		if (device_class(dv) == DV_DISK) {
   1203   1.18   thorpej  gotdisk:
   1204  1.184    cegger 			majdev = devsw_name2blk(device_xname(dv), NULL, 0);
   1205   1.18   thorpej 			if (majdev < 0)
   1206   1.18   thorpej 				panic("parsedisk");
   1207  1.113   thorpej 			if (DEV_USES_PARTITIONS(dv))
   1208  1.135   thorpej 				*devp = MAKEDISKDEV(majdev, device_unit(dv),
   1209  1.135   thorpej 						    part);
   1210  1.113   thorpej 			else
   1211  1.135   thorpej 				*devp = makedev(majdev, device_unit(dv));
   1212   1.18   thorpej 		}
   1213   1.18   thorpej 
   1214  1.124   thorpej 		if (device_class(dv) == DV_IFNET)
   1215   1.18   thorpej 			*devp = NODEV;
   1216   1.18   thorpej 	}
   1217   1.18   thorpej 
   1218   1.18   thorpej 	*cp = c;
   1219   1.18   thorpej 	return (dv);
   1220   1.48     lukem }
   1221   1.48     lukem 
/*
 * snprintf() `bytes' into `buf', reformatting it so that the number
 * (plus a possible ` x' prefix and the suffix) fits into len bytes
 * (including the terminating NUL).
 *
 * `divisor' is the scaling step.  With 1024 the binary prefix letters
 * ` KMGTPE' are used, with any other value the SI letters ` kMGTPE'.
 *
 * Returns the value returned by snprintf(), or -1 if there was a
 * problem: buf or suffix is NULL, divisor is not positive, or len is
 * too small to hold `x y' + suffix + NUL.
 *
 * E.g, given a len of 9, a suffix of `B' and a divisor of 1024:
 *	bytes		result
 *	-----		------
 *	99999		`99999 B'
 *	100000		`97 KB'
 *	66715648	`65152 KB'
 *	252215296	`240 MB'
 */
int
humanize_number(char *buf, size_t len, uint64_t bytes, const char *suffix,
    int divisor)
{
	/* prefixes are: (none), kilo, Mega, Giga, Tera, Peta, Exa */
	const char *prefixes;
	int		r;
	int		unbounded;
	uint64_t	umax;
	size_t		i, suffixlen;

	if (buf == NULL || suffix == NULL)
		return (-1);
	if (len > 0)
		buf[0] = '\0';
	/* A zero or negative divisor cannot scale anything. */
	if (divisor <= 0)
		return (-1);
	suffixlen = strlen(suffix);
	/* check if enough room for `x y' + suffix + `\0' */
	if (len < 4 + suffixlen)
		return (-1);

	if (divisor == 1024) {
		/*
		 * binary multiplies
		 * XXX IEC 60027-2 recommends Ki, Mi, Gi...
		 */
		prefixes = " KMGTPE";
	} else
		prefixes = " kMGTPE"; /* SI for decimal multiplies */

	/*
	 * Find umax, the smallest power of ten that no longer fits in
	 * the digits available (len minus suffix, separator, prefix and
	 * NUL).  Stop early once umax exceeds bytes.  If the next power
	 * of ten would overflow 64 bits, every possible value fits and
	 * no scaling is needed at all.
	 */
	unbounded = 0;
	umax = 1;
	for (i = 0; i < len - suffixlen - 3; i++) {
		if (umax > ~(uint64_t)0 / 10) {
			unbounded = 1;
			break;
		}
		umax *= 10;
		if (umax > bytes)
			break;
	}

	/* Scale down until the number fits or we run out of prefixes. */
	for (i = 0; !unbounded && bytes >= umax && prefixes[i + 1]; i++)
		bytes /= divisor;

	r = snprintf(buf, len, "%llu%s%c%s", (unsigned long long)bytes,
	    i == 0 ? "" : " ", prefixes[i], suffix);

	return (r);
}
   1277   1.49     lukem 
/*
 * Format `bytes' into `buf' (of size `len') using humanize_number()
 * with a `B' suffix and a divisor of 1024.  If the result ends in a
 * bare ` B' (no scaling prefix), that tail is removed.  Returns the
 * value returned by humanize_number(), unchanged.
 */
int
format_bytes(char *buf, size_t len, uint64_t bytes)
{
	size_t	tail;
	int	rv;

	rv = humanize_number(buf, len, bytes, "B", 1024);
	if (rv == -1)
		return (rv);

	/* nuke the trailing ` B' if it exists */
	tail = strlen(buf) - 2;
	if (strcmp(buf + tail, " B") == 0)
		buf[tail] = '\0';

	return (rv);
}
   1293   1.81  christos 
   1294   1.92  jdolecek /*
   1295  1.154   thorpej  * Return true if system call tracing is enabled for the specified process.
   1296  1.130   thorpej  */
   1297  1.153   thorpej bool
   1298  1.130   thorpej trace_is_enabled(struct proc *p)
   1299  1.130   thorpej {
   1300  1.131   thorpej #ifdef SYSCALL_DEBUG
   1301  1.154   thorpej 	return (true);
   1302  1.131   thorpej #endif
   1303  1.130   thorpej #ifdef KTRACE
   1304  1.130   thorpej 	if (ISSET(p->p_traceflag, (KTRFAC_SYSCALL | KTRFAC_SYSRET)))
   1305  1.154   thorpej 		return (true);
   1306  1.130   thorpej #endif
   1307  1.142      matt #ifdef PTRACE
   1308  1.151        ad 	if (ISSET(p->p_slflag, PSL_SYSCALL))
   1309  1.154   thorpej 		return (true);
   1310  1.142      matt #endif
   1311  1.130   thorpej 
   1312  1.154   thorpej 	return (false);
   1313  1.130   thorpej }
   1314  1.130   thorpej 
   1315  1.130   thorpej /*
   1316   1.92  jdolecek  * Start trace of particular system call. If process is being traced,
   1317   1.92  jdolecek  * this routine is called by MD syscall dispatch code just before
   1318   1.92  jdolecek  * a system call is actually executed.
   1319   1.92  jdolecek  */
   1320   1.81  christos int
   1321  1.177       dsl trace_enter(register_t code, const register_t *args, int narg)
   1322   1.81  christos {
   1323   1.81  christos #ifdef SYSCALL_DEBUG
   1324  1.171       dsl 	scdebug_call(code, args);
   1325   1.81  christos #endif /* SYSCALL_DEBUG */
   1326   1.81  christos 
   1327  1.177       dsl 	ktrsyscall(code, args, narg);
   1328   1.81  christos 
   1329  1.142      matt #ifdef PTRACE
   1330  1.172       dsl 	if ((curlwp->l_proc->p_slflag & (PSL_SYSCALL|PSL_TRACED)) ==
   1331  1.151        ad 	    (PSL_SYSCALL|PSL_TRACED))
   1332  1.172       dsl 		process_stoptrace();
   1333  1.142      matt #endif
   1334   1.81  christos 	return 0;
   1335   1.81  christos }
   1336   1.81  christos 
   1337   1.92  jdolecek /*
   1338   1.92  jdolecek  * End trace of particular system call. If process is being traced,
   1339   1.92  jdolecek  * this routine is called by MD syscall dispatch code just after
   1340   1.92  jdolecek  * a system call finishes.
   1341   1.92  jdolecek  * MD caller guarantees the passed 'code' is within the supported
   1342   1.92  jdolecek  * system call number range for emulation the process runs under.
   1343   1.92  jdolecek  */
   1344   1.81  christos void
   1345  1.177       dsl trace_exit(register_t code, register_t rval[], int error)
   1346   1.81  christos {
   1347   1.81  christos #ifdef SYSCALL_DEBUG
   1348  1.171       dsl 	scdebug_ret(code, error, rval);
   1349   1.81  christos #endif /* SYSCALL_DEBUG */
   1350   1.81  christos 
   1351  1.164        ad 	ktrsysret(code, error, rval);
   1352  1.128  christos 
   1353  1.142      matt #ifdef PTRACE
   1354  1.172       dsl 	if ((curlwp->l_proc->p_slflag & (PSL_SYSCALL|PSL_TRACED)) ==
   1355  1.151        ad 	    (PSL_SYSCALL|PSL_TRACED))
   1356  1.172       dsl 		process_stoptrace();
   1357  1.142      matt #endif
   1358   1.10       cgd }
   1359  1.194        ad 
   1360  1.194        ad int
   1361  1.194        ad syscall_establish(const struct emul *em, const struct syscall_package *sp)
   1362  1.194        ad {
   1363  1.194        ad 	struct sysent *sy;
   1364  1.194        ad 	int i;
   1365  1.194        ad 
   1366  1.194        ad 	KASSERT(mutex_owned(&module_lock));
   1367  1.194        ad 
   1368  1.194        ad 	if (em == NULL) {
   1369  1.194        ad 		em = &emul_netbsd;
   1370  1.194        ad 	}
   1371  1.194        ad 	sy = em->e_sysent;
   1372  1.194        ad 
   1373  1.194        ad 	/*
   1374  1.194        ad 	 * Ensure that all preconditions are valid, since this is
   1375  1.194        ad 	 * an all or nothing deal.  Once a system call is entered,
   1376  1.194        ad 	 * it can become busy and we could be unable to remove it
   1377  1.194        ad 	 * on error.
   1378  1.194        ad 	 */
   1379  1.194        ad 	for (i = 0; sp[i].sp_call != NULL; i++) {
   1380  1.194        ad 		if (sy[sp[i].sp_code].sy_call != sys_nomodule) {
   1381  1.196  christos #ifdef DIAGNOSTIC
   1382  1.196  christos 			printf("syscall %d is busy\n", sp[i].sp_code);
   1383  1.196  christos #endif
   1384  1.194        ad 			return EBUSY;
   1385  1.194        ad 		}
   1386  1.194        ad 	}
   1387  1.194        ad 	/* Everything looks good, patch them in. */
   1388  1.194        ad 	for (i = 0; sp[i].sp_call != NULL; i++) {
   1389  1.194        ad 		sy[sp[i].sp_code].sy_call = sp[i].sp_call;
   1390  1.194        ad 	}
   1391  1.194        ad 
   1392  1.194        ad 	return 0;
   1393  1.194        ad }
   1394  1.194        ad 
   1395  1.194        ad int
   1396  1.194        ad syscall_disestablish(const struct emul *em, const struct syscall_package *sp)
   1397  1.194        ad {
   1398  1.194        ad 	struct sysent *sy;
   1399  1.194        ad 	uint64_t where;
   1400  1.194        ad 	lwp_t *l;
   1401  1.194        ad 	int i;
   1402  1.194        ad 
   1403  1.194        ad 	KASSERT(mutex_owned(&module_lock));
   1404  1.194        ad 
   1405  1.194        ad 	if (em == NULL) {
   1406  1.194        ad 		em = &emul_netbsd;
   1407  1.194        ad 	}
   1408  1.194        ad 	sy = em->e_sysent;
   1409  1.194        ad 
   1410  1.194        ad 	/*
   1411  1.194        ad 	 * First, patch the system calls to sys_nomodule to gate further
   1412  1.194        ad 	 * activity.
   1413  1.194        ad 	 */
   1414  1.194        ad 	for (i = 0; sp[i].sp_call != NULL; i++) {
   1415  1.194        ad 		KASSERT(sy[sp[i].sp_code].sy_call == sp[i].sp_call);
   1416  1.194        ad 		sy[sp[i].sp_code].sy_call = sys_nomodule;
   1417  1.194        ad 	}
   1418  1.194        ad 
   1419  1.194        ad 	/*
   1420  1.194        ad 	 * Run a cross call to cycle through all CPUs.  This does two
   1421  1.194        ad 	 * things: lock activity provides a barrier and makes our update
   1422  1.194        ad 	 * of sy_call visible to all CPUs, and upon return we can be sure
   1423  1.194        ad 	 * that we see pertinent values of l_sysent posted by remote CPUs.
   1424  1.194        ad 	 */
   1425  1.194        ad 	where = xc_broadcast(0, (xcfunc_t)nullop, NULL, NULL);
   1426  1.194        ad 	xc_wait(where);
   1427  1.194        ad 
   1428  1.194        ad 	/*
   1429  1.194        ad 	 * Now it's safe to check l_sysent.  Run through all LWPs and see
   1430  1.194        ad 	 * if anyone is still using the system call.
   1431  1.194        ad 	 */
   1432  1.194        ad 	for (i = 0; sp[i].sp_call != NULL; i++) {
   1433  1.194        ad 		mutex_enter(proc_lock);
   1434  1.194        ad 		LIST_FOREACH(l, &alllwp, l_list) {
   1435  1.194        ad 			if (l->l_sysent == &sy[sp[i].sp_code]) {
   1436  1.194        ad 				break;
   1437  1.194        ad 			}
   1438  1.194        ad 		}
   1439  1.194        ad 		mutex_exit(proc_lock);
   1440  1.194        ad 		if (l == NULL) {
   1441  1.194        ad 			continue;
   1442  1.194        ad 		}
   1443  1.194        ad 		/*
   1444  1.194        ad 		 * We lose: one or more calls are still in use.  Put back
   1445  1.194        ad 		 * the old entrypoints and act like nothing happened.
   1446  1.194        ad 		 * When we drop module_lock, any system calls held in
   1447  1.194        ad 		 * sys_nomodule() will be restarted.
   1448  1.194        ad 		 */
   1449  1.194        ad 		for (i = 0; sp[i].sp_call != NULL; i++) {
   1450  1.194        ad 			sy[sp[i].sp_code].sy_call = sp[i].sp_call;
   1451  1.194        ad 		}
   1452  1.194        ad 		return EBUSY;
   1453  1.194        ad 	}
   1454  1.194        ad 
   1455  1.194        ad 	return 0;
   1456  1.194        ad }
   1457