Home | History | Annotate | Line # | Download | only in kern
kern_subr.c revision 1.194
      1  1.194        ad /*	$NetBSD: kern_subr.c,v 1.194 2008/11/12 14:29:31 ad Exp $	*/
      2   1.31   thorpej 
      3   1.31   thorpej /*-
      4  1.185        ad  * Copyright (c) 1997, 1998, 1999, 2002, 2007, 2008 The NetBSD Foundation, Inc.
      5   1.31   thorpej  * All rights reserved.
      6   1.31   thorpej  *
      7   1.31   thorpej  * This code is derived from software contributed to The NetBSD Foundation
      8   1.31   thorpej  * by Jason R. Thorpe of the Numerical Aerospace Simulation Facility,
      9   1.48     lukem  * NASA Ames Research Center, and by Luke Mewburn.
     10   1.31   thorpej  *
     11   1.31   thorpej  * Redistribution and use in source and binary forms, with or without
     12   1.31   thorpej  * modification, are permitted provided that the following conditions
     13   1.31   thorpej  * are met:
     14   1.31   thorpej  * 1. Redistributions of source code must retain the above copyright
     15   1.31   thorpej  *    notice, this list of conditions and the following disclaimer.
     16   1.31   thorpej  * 2. Redistributions in binary form must reproduce the above copyright
     17   1.31   thorpej  *    notice, this list of conditions and the following disclaimer in the
     18   1.31   thorpej  *    documentation and/or other materials provided with the distribution.
     19   1.31   thorpej  *
     20   1.31   thorpej  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     21   1.31   thorpej  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     22   1.31   thorpej  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     23   1.31   thorpej  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     24   1.31   thorpej  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     25   1.31   thorpej  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     26   1.31   thorpej  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     27   1.31   thorpej  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     28   1.31   thorpej  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     29   1.31   thorpej  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     30   1.31   thorpej  * POSSIBILITY OF SUCH DAMAGE.
     31   1.31   thorpej  */
     32   1.12       cgd 
     33    1.9       cgd /*
     34   1.10       cgd  * Copyright (c) 1982, 1986, 1991, 1993
     35   1.10       cgd  *	The Regents of the University of California.  All rights reserved.
     36    1.9       cgd  * (c) UNIX System Laboratories, Inc.
     37    1.9       cgd  * All or some portions of this file are derived from material licensed
     38    1.9       cgd  * to the University of California by American Telephone and Telegraph
     39    1.9       cgd  * Co. or Unix System Laboratories, Inc. and are reproduced herein with
     40    1.9       cgd  * the permission of UNIX System Laboratories, Inc.
     41    1.9       cgd  *
     42   1.18   thorpej  * Copyright (c) 1992, 1993
     43   1.18   thorpej  *	The Regents of the University of California.  All rights reserved.
     44   1.18   thorpej  *
     45   1.18   thorpej  * This software was developed by the Computer Systems Engineering group
     46   1.18   thorpej  * at Lawrence Berkeley Laboratory under DARPA contract BG 91-66 and
     47   1.18   thorpej  * contributed to Berkeley.
     48   1.18   thorpej  *
     49   1.18   thorpej  * All advertising materials mentioning features or use of this software
     50   1.18   thorpej  * must display the following acknowledgement:
     51   1.18   thorpej  *	This product includes software developed by the University of
     52   1.18   thorpej  *	California, Lawrence Berkeley Laboratory.
     53   1.18   thorpej  *
     54    1.9       cgd  * Redistribution and use in source and binary forms, with or without
     55    1.9       cgd  * modification, are permitted provided that the following conditions
     56    1.9       cgd  * are met:
     57    1.9       cgd  * 1. Redistributions of source code must retain the above copyright
     58    1.9       cgd  *    notice, this list of conditions and the following disclaimer.
     59    1.9       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     60    1.9       cgd  *    notice, this list of conditions and the following disclaimer in the
     61    1.9       cgd  *    documentation and/or other materials provided with the distribution.
     62  1.103       agc  * 3. Neither the name of the University nor the names of its contributors
     63    1.9       cgd  *    may be used to endorse or promote products derived from this software
     64    1.9       cgd  *    without specific prior written permission.
     65    1.9       cgd  *
     66    1.9       cgd  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     67    1.9       cgd  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     68    1.9       cgd  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     69    1.9       cgd  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     70    1.9       cgd  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     71    1.9       cgd  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     72    1.9       cgd  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     73    1.9       cgd  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     74    1.9       cgd  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     75    1.9       cgd  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     76    1.9       cgd  * SUCH DAMAGE.
     77    1.9       cgd  *
     78   1.38      fvdl  *	@(#)kern_subr.c	8.4 (Berkeley) 2/14/95
     79    1.9       cgd  */
     80   1.77     lukem 
     81   1.77     lukem #include <sys/cdefs.h>
     82  1.194        ad __KERNEL_RCSID(0, "$NetBSD: kern_subr.c,v 1.194 2008/11/12 14:29:31 ad Exp $");
     83   1.34       mrg 
     84   1.78   thorpej #include "opt_ddb.h"
     85   1.43  jonathan #include "opt_md.h"
     86   1.81  christos #include "opt_syscall_debug.h"
     87   1.81  christos #include "opt_ktrace.h"
     88  1.142      matt #include "opt_ptrace.h"
     89  1.144  jmcneill #include "opt_powerhook.h"
     90  1.157      manu #include "opt_tftproot.h"
     91    1.9       cgd 
     92    1.9       cgd #include <sys/param.h>
     93    1.9       cgd #include <sys/systm.h>
     94    1.9       cgd #include <sys/proc.h>
     95   1.10       cgd #include <sys/malloc.h>
     96   1.18   thorpej #include <sys/mount.h>
     97   1.18   thorpej #include <sys/device.h>
     98   1.18   thorpej #include <sys/reboot.h>
     99   1.18   thorpej #include <sys/conf.h>
    100  1.159    dyoung #include <sys/disk.h>
    101   1.18   thorpej #include <sys/disklabel.h>
    102   1.10       cgd #include <sys/queue.h>
    103   1.81  christos #include <sys/ktrace.h>
    104  1.128  christos #include <sys/ptrace.h>
    105  1.119   reinoud #include <sys/fcntl.h>
    106  1.160  christos #include <sys/kauth.h>
    107  1.160  christos #include <sys/vnode.h>
    108  1.194        ad #include <sys/syscallvar.h>
    109  1.194        ad #include <sys/xcall.h>
    110  1.194        ad #include <sys/module.h>
    111    1.9       cgd 
    112   1.82   thorpej #include <uvm/uvm_extern.h>
    113   1.82   thorpej 
    114   1.18   thorpej #include <dev/cons.h>
    115   1.18   thorpej 
    116   1.18   thorpej #include <net/if.h>
    117   1.18   thorpej 
    118   1.18   thorpej /* XXX these should eventually move to subr_autoconf.c */
    119  1.109  junyoung static struct device *finddevice(const char *);
    120  1.109  junyoung static struct device *getdisk(char *, int, int, dev_t *, int);
    121  1.109  junyoung static struct device *parsedisk(char *, int, int, dev_t *);
    122  1.159    dyoung static const char *getwedgename(const char *, int);
    123   1.18   thorpej 
    124   1.80  christos /*
    125   1.80  christos  * A generic linear hook.
    126   1.80  christos  */
    127   1.80  christos struct hook_desc {
    128   1.80  christos 	LIST_ENTRY(hook_desc) hk_list;
    129  1.109  junyoung 	void	(*hk_fn)(void *);
    130   1.80  christos 	void	*hk_arg;
    131   1.80  christos };
    132   1.80  christos typedef LIST_HEAD(, hook_desc) hook_list_t;
    133   1.80  christos 
    134  1.157      manu #ifdef TFTPROOT
    135  1.157      manu int tftproot_dhcpboot(struct device *);
    136  1.157      manu #endif
    137  1.157      manu 
    138  1.175        ad dev_t	dumpcdev;	/* for savecore */
    139  1.175        ad 
    140  1.126      yamt void
    141  1.126      yamt uio_setup_sysspace(struct uio *uio)
    142  1.126      yamt {
    143  1.126      yamt 
    144  1.126      yamt 	uio->uio_vmspace = vmspace_kernel();
    145  1.126      yamt }
    146  1.126      yamt 
    147   1.11   mycroft int
    148  1.117   thorpej uiomove(void *buf, size_t n, struct uio *uio)
    149    1.9       cgd {
    150  1.126      yamt 	struct vmspace *vm = uio->uio_vmspace;
    151   1.63  augustss 	struct iovec *iov;
    152  1.180     njoly 	size_t cnt;
    153    1.9       cgd 	int error = 0;
    154   1.16  christos 	char *cp = buf;
    155  1.112      yamt 
    156  1.183      yamt 	ASSERT_SLEEPABLE();
    157   1.68     enami 
    158   1.68     enami #ifdef DIAGNOSTIC
    159    1.9       cgd 	if (uio->uio_rw != UIO_READ && uio->uio_rw != UIO_WRITE)
    160    1.9       cgd 		panic("uiomove: mode");
    161    1.9       cgd #endif
    162    1.9       cgd 	while (n > 0 && uio->uio_resid) {
    163    1.9       cgd 		iov = uio->uio_iov;
    164    1.9       cgd 		cnt = iov->iov_len;
    165    1.9       cgd 		if (cnt == 0) {
    166  1.105      yamt 			KASSERT(uio->uio_iovcnt > 0);
    167    1.9       cgd 			uio->uio_iov++;
    168    1.9       cgd 			uio->uio_iovcnt--;
    169    1.9       cgd 			continue;
    170    1.9       cgd 		}
    171    1.9       cgd 		if (cnt > n)
    172    1.9       cgd 			cnt = n;
    173  1.126      yamt 		if (!VMSPACE_IS_KERNEL_P(vm)) {
    174  1.104      yamt 			if (curcpu()->ci_schedstate.spc_flags &
    175   1.67   thorpej 			    SPCF_SHOULDYIELD)
    176  1.151        ad 				preempt();
    177  1.126      yamt 		}
    178    1.9       cgd 
    179  1.126      yamt 		if (uio->uio_rw == UIO_READ) {
    180  1.126      yamt 			error = copyout_vmspace(vm, cp, iov->iov_base,
    181  1.126      yamt 			    cnt);
    182  1.126      yamt 		} else {
    183  1.126      yamt 			error = copyin_vmspace(vm, iov->iov_base, cp,
    184  1.126      yamt 			    cnt);
    185  1.126      yamt 		}
    186  1.126      yamt 		if (error) {
    187    1.9       cgd 			break;
    188    1.9       cgd 		}
    189  1.155  christos 		iov->iov_base = (char *)iov->iov_base + cnt;
    190    1.9       cgd 		iov->iov_len -= cnt;
    191    1.9       cgd 		uio->uio_resid -= cnt;
    192    1.9       cgd 		uio->uio_offset += cnt;
    193    1.9       cgd 		cp += cnt;
    194   1.85   thorpej 		KDASSERT(cnt <= n);
    195    1.9       cgd 		n -= cnt;
    196    1.9       cgd 	}
    197  1.165        ad 
    198    1.9       cgd 	return (error);
    199    1.9       cgd }
    200    1.9       cgd 
    201    1.9       cgd /*
    202  1.110    itojun  * Wrapper for uiomove() that validates the arguments against a known-good
    203  1.111      matt  * kernel buffer.
    204  1.110    itojun  */
    205  1.110    itojun int
    206  1.111      matt uiomove_frombuf(void *buf, size_t buflen, struct uio *uio)
    207  1.110    itojun {
    208  1.111      matt 	size_t offset;
    209  1.110    itojun 
    210  1.143  christos 	if (uio->uio_offset < 0 || /* uio->uio_resid < 0 || */
    211  1.110    itojun 	    (offset = uio->uio_offset) != uio->uio_offset)
    212  1.110    itojun 		return (EINVAL);
    213  1.111      matt 	if (offset >= buflen)
    214  1.110    itojun 		return (0);
    215  1.111      matt 	return (uiomove((char *)buf + offset, buflen - offset, uio));
    216  1.110    itojun }
    217  1.110    itojun 
    218  1.110    itojun /*
    219    1.9       cgd  * Give next character to user as result of read.
    220    1.9       cgd  */
    221   1.11   mycroft int
    222  1.117   thorpej ureadc(int c, struct uio *uio)
    223    1.9       cgd {
    224   1.63  augustss 	struct iovec *iov;
    225    1.9       cgd 
    226   1.11   mycroft 	if (uio->uio_resid <= 0)
    227   1.11   mycroft 		panic("ureadc: non-positive resid");
    228    1.9       cgd again:
    229   1.11   mycroft 	if (uio->uio_iovcnt <= 0)
    230   1.11   mycroft 		panic("ureadc: non-positive iovcnt");
    231    1.9       cgd 	iov = uio->uio_iov;
    232   1.11   mycroft 	if (iov->iov_len <= 0) {
    233    1.9       cgd 		uio->uio_iovcnt--;
    234    1.9       cgd 		uio->uio_iov++;
    235    1.9       cgd 		goto again;
    236    1.9       cgd 	}
    237  1.126      yamt 	if (!VMSPACE_IS_KERNEL_P(uio->uio_vmspace)) {
    238    1.9       cgd 		if (subyte(iov->iov_base, c) < 0)
    239    1.9       cgd 			return (EFAULT);
    240  1.126      yamt 	} else {
    241   1.39    kleink 		*(char *)iov->iov_base = c;
    242    1.9       cgd 	}
    243  1.155  christos 	iov->iov_base = (char *)iov->iov_base + 1;
    244    1.9       cgd 	iov->iov_len--;
    245    1.9       cgd 	uio->uio_resid--;
    246    1.9       cgd 	uio->uio_offset++;
    247    1.9       cgd 	return (0);
    248   1.82   thorpej }
    249   1.82   thorpej 
    250   1.82   thorpej /*
    251  1.126      yamt  * Like copyin(), but operates on an arbitrary vmspace.
    252   1.82   thorpej  */
    253   1.82   thorpej int
    254  1.126      yamt copyin_vmspace(struct vmspace *vm, const void *uaddr, void *kaddr, size_t len)
    255   1.82   thorpej {
    256   1.82   thorpej 	struct iovec iov;
    257   1.82   thorpej 	struct uio uio;
    258   1.82   thorpej 	int error;
    259   1.82   thorpej 
    260   1.82   thorpej 	if (len == 0)
    261   1.82   thorpej 		return (0);
    262   1.82   thorpej 
    263  1.126      yamt 	if (VMSPACE_IS_KERNEL_P(vm)) {
    264  1.126      yamt 		return kcopy(uaddr, kaddr, len);
    265  1.126      yamt 	}
    266  1.126      yamt 	if (__predict_true(vm == curproc->p_vmspace)) {
    267  1.118  christos 		return copyin(uaddr, kaddr, len);
    268  1.126      yamt 	}
    269  1.118  christos 
    270   1.82   thorpej 	iov.iov_base = kaddr;
    271   1.82   thorpej 	iov.iov_len = len;
    272   1.82   thorpej 	uio.uio_iov = &iov;
    273   1.82   thorpej 	uio.uio_iovcnt = 1;
    274  1.191     rmind 	uio.uio_offset = (off_t)(uintptr_t)uaddr;
    275   1.82   thorpej 	uio.uio_resid = len;
    276   1.82   thorpej 	uio.uio_rw = UIO_READ;
    277  1.134      yamt 	UIO_SETUP_SYSSPACE(&uio);
    278  1.126      yamt 	error = uvm_io(&vm->vm_map, &uio);
    279   1.82   thorpej 
    280   1.82   thorpej 	return (error);
    281   1.82   thorpej }
    282   1.82   thorpej 
    283   1.82   thorpej /*
    284  1.126      yamt  * Like copyout(), but operates on an arbitrary vmspace.
    285   1.82   thorpej  */
    286   1.82   thorpej int
    287  1.126      yamt copyout_vmspace(struct vmspace *vm, const void *kaddr, void *uaddr, size_t len)
    288   1.82   thorpej {
    289   1.82   thorpej 	struct iovec iov;
    290   1.82   thorpej 	struct uio uio;
    291   1.82   thorpej 	int error;
    292   1.82   thorpej 
    293   1.82   thorpej 	if (len == 0)
    294   1.82   thorpej 		return (0);
    295   1.82   thorpej 
    296  1.126      yamt 	if (VMSPACE_IS_KERNEL_P(vm)) {
    297  1.126      yamt 		return kcopy(kaddr, uaddr, len);
    298  1.126      yamt 	}
    299  1.126      yamt 	if (__predict_true(vm == curproc->p_vmspace)) {
    300  1.118  christos 		return copyout(kaddr, uaddr, len);
    301  1.126      yamt 	}
    302  1.118  christos 
    303  1.116  christos 	iov.iov_base = __UNCONST(kaddr); /* XXXUNCONST cast away const */
    304   1.82   thorpej 	iov.iov_len = len;
    305   1.82   thorpej 	uio.uio_iov = &iov;
    306   1.82   thorpej 	uio.uio_iovcnt = 1;
    307  1.191     rmind 	uio.uio_offset = (off_t)(uintptr_t)uaddr;
    308   1.82   thorpej 	uio.uio_resid = len;
    309   1.82   thorpej 	uio.uio_rw = UIO_WRITE;
    310  1.134      yamt 	UIO_SETUP_SYSSPACE(&uio);
    311  1.126      yamt 	error = uvm_io(&vm->vm_map, &uio);
    312  1.126      yamt 
    313  1.126      yamt 	return (error);
    314  1.126      yamt }
    315  1.126      yamt 
    316  1.126      yamt /*
    317  1.126      yamt  * Like copyin(), but operates on an arbitrary process.
    318  1.126      yamt  */
/*
 * copyin_vmspace() against the vmspace of process `p'.
 *
 * A vmspace reference is obtained with proc_vmspace_getref() and
 * released with uvmspace_free() after the copy.  Returns the error from
 * obtaining the reference, or otherwise the result of the copy.
 */
int
copyin_proc(struct proc *p, const void *uaddr, void *kaddr, size_t len)
{
	struct vmspace *vm;
	int error;

	error = proc_vmspace_getref(p, &vm);
	if (error == 0) {
		error = copyin_vmspace(vm, uaddr, kaddr, len);
		uvmspace_free(vm);
	}

	return error;
}
    334   1.82   thorpej 
    335  1.126      yamt /*
    336  1.126      yamt  * Like copyout(), but operates on an arbitrary process.
    337  1.126      yamt  */
/*
 * copyout_vmspace() against the vmspace of process `p'.
 *
 * A vmspace reference is obtained with proc_vmspace_getref() and
 * released with uvmspace_free() after the copy.  Returns the error from
 * obtaining the reference, or otherwise the result of the copy.
 */
int
copyout_proc(struct proc *p, const void *kaddr, void *uaddr, size_t len)
{
	struct vmspace *vm;
	int error;

	error = proc_vmspace_getref(p, &vm);
	if (error == 0) {
		error = copyout_vmspace(vm, kaddr, uaddr, len);
		uvmspace_free(vm);
	}

	return error;
}
    353   1.10       cgd 
    354   1.10       cgd /*
    355  1.119   reinoud  * Like copyin(), except it operates on kernel addresses when the FKIOCTL
    356  1.119   reinoud  * flag is passed in `ioctlflags' from the ioctl call.
    357  1.119   reinoud  */
    358  1.119   reinoud int
    359  1.119   reinoud ioctl_copyin(int ioctlflags, const void *src, void *dst, size_t len)
    360  1.119   reinoud {
    361  1.119   reinoud 	if (ioctlflags & FKIOCTL)
    362  1.119   reinoud 		return kcopy(src, dst, len);
    363  1.119   reinoud 	return copyin(src, dst, len);
    364  1.119   reinoud }
    365  1.119   reinoud 
    366  1.119   reinoud /*
    367  1.119   reinoud  * Like copyout(), except it operates on kernel addresses when the FKIOCTL
    368  1.119   reinoud  * flag is passed in `ioctlflags' from the ioctl call.
    369  1.119   reinoud  */
    370  1.119   reinoud int
    371  1.119   reinoud ioctl_copyout(int ioctlflags, const void *src, void *dst, size_t len)
    372  1.119   reinoud {
    373  1.119   reinoud 	if (ioctlflags & FKIOCTL)
    374  1.119   reinoud 		return kcopy(src, dst, len);
    375  1.119   reinoud 	return copyout(src, dst, len);
    376  1.119   reinoud }
    377  1.119   reinoud 
    378   1.80  christos static void *
    379  1.117   thorpej hook_establish(hook_list_t *list, void (*fn)(void *), void *arg)
    380   1.14       cgd {
    381   1.80  christos 	struct hook_desc *hd;
    382   1.14       cgd 
    383   1.80  christos 	hd = malloc(sizeof(*hd), M_DEVBUF, M_NOWAIT);
    384   1.80  christos 	if (hd == NULL)
    385   1.59     enami 		return (NULL);
    386   1.14       cgd 
    387   1.80  christos 	hd->hk_fn = fn;
    388   1.80  christos 	hd->hk_arg = arg;
    389   1.80  christos 	LIST_INSERT_HEAD(list, hd, hk_list);
    390   1.14       cgd 
    391   1.80  christos 	return (hd);
    392   1.14       cgd }
    393   1.14       cgd 
    394   1.80  christos static void
    395  1.150      yamt hook_disestablish(hook_list_t *list, void *vhook)
    396   1.14       cgd {
    397   1.14       cgd #ifdef DIAGNOSTIC
    398   1.80  christos 	struct hook_desc *hd;
    399   1.14       cgd 
    400   1.83      matt 	LIST_FOREACH(hd, list, hk_list) {
    401   1.80  christos                 if (hd == vhook)
    402   1.14       cgd 			break;
    403   1.83      matt 	}
    404   1.83      matt 
    405   1.80  christos 	if (hd == NULL)
    406   1.83      matt 		panic("hook_disestablish: hook %p not established", vhook);
    407   1.14       cgd #endif
    408   1.80  christos 	LIST_REMOVE((struct hook_desc *)vhook, hk_list);
    409   1.80  christos 	free(vhook, M_DEVBUF);
    410   1.80  christos }
    411   1.80  christos 
    412   1.80  christos static void
    413  1.117   thorpej hook_destroy(hook_list_t *list)
    414   1.80  christos {
    415   1.80  christos 	struct hook_desc *hd;
    416   1.80  christos 
    417   1.87      matt 	while ((hd = LIST_FIRST(list)) != NULL) {
    418   1.80  christos 		LIST_REMOVE(hd, hk_list);
    419   1.80  christos 		free(hd, M_DEVBUF);
    420   1.80  christos 	}
    421   1.80  christos }
    422   1.14       cgd 
    423   1.80  christos static void
    424  1.117   thorpej hook_proc_run(hook_list_t *list, struct proc *p)
    425   1.80  christos {
    426   1.80  christos 	struct hook_desc *hd;
    427   1.80  christos 
    428  1.178    dyoung 	LIST_FOREACH(hd, list, hk_list)
    429  1.178    dyoung 		((void (*)(struct proc *, void *))*hd->hk_fn)(p, hd->hk_arg);
    430   1.80  christos }
    431   1.80  christos 
    432   1.80  christos /*
    433   1.80  christos  * "Shutdown hook" types, functions, and variables.
    434   1.80  christos  *
    435   1.80  christos  * Should be invoked immediately before the
    436   1.80  christos  * system is halted or rebooted, i.e. after file systems unmounted,
    437   1.80  christos  * after crash dump done, etc.
    438   1.80  christos  *
    439   1.80  christos  * Each shutdown hook is removed from the list before it's run, so that
    440   1.80  christos  * it won't be run again.
    441   1.80  christos  */
    442   1.80  christos 
    443  1.117   thorpej static hook_list_t shutdownhook_list;
    444   1.80  christos 
    445   1.80  christos void *
    446  1.117   thorpej shutdownhook_establish(void (*fn)(void *), void *arg)
    447   1.80  christos {
    448   1.80  christos 	return hook_establish(&shutdownhook_list, fn, arg);
    449   1.80  christos }
    450   1.80  christos 
    451   1.80  christos void
    452  1.117   thorpej shutdownhook_disestablish(void *vhook)
    453   1.80  christos {
    454   1.89    simonb 	hook_disestablish(&shutdownhook_list, vhook);
    455   1.14       cgd }
    456   1.14       cgd 
    457   1.14       cgd /*
    458   1.14       cgd  * Run shutdown hooks.  Should be invoked immediately before the
    459   1.14       cgd  * system is halted or rebooted, i.e. after file systems unmounted,
    460   1.14       cgd  * after crash dump done, etc.
    461   1.17       cgd  *
    462   1.17       cgd  * Each shutdown hook is removed from the list before it's run, so that
    463   1.17       cgd  * it won't be run again.
    464   1.14       cgd  */
    465   1.14       cgd void
    466  1.117   thorpej doshutdownhooks(void)
    467   1.14       cgd {
    468   1.80  christos 	struct hook_desc *dp;
    469   1.14       cgd 
    470   1.87      matt 	while ((dp = LIST_FIRST(&shutdownhook_list)) != NULL) {
    471   1.80  christos 		LIST_REMOVE(dp, hk_list);
    472   1.80  christos 		(*dp->hk_fn)(dp->hk_arg);
    473   1.17       cgd #if 0
    474   1.17       cgd 		/*
    475   1.17       cgd 		 * Don't bother freeing the hook structure,, since we may
    476   1.17       cgd 		 * be rebooting because of a memory corruption problem,
    477   1.17       cgd 		 * and this might only make things worse.  It doesn't
    478   1.17       cgd 		 * matter, anyway, since the system is just about to
    479   1.17       cgd 		 * reboot.
    480   1.17       cgd 		 */
    481   1.17       cgd 		free(dp, M_DEVBUF);
    482   1.17       cgd #endif
    483   1.52  augustss 	}
    484   1.52  augustss }
    485   1.52  augustss 
    486   1.52  augustss /*
    487   1.80  christos  * "Mountroot hook" types, functions, and variables.
    488   1.80  christos  */
    489   1.80  christos 
    490  1.117   thorpej static hook_list_t mountroothook_list;
    491   1.80  christos 
    492   1.80  christos void *
    493  1.117   thorpej mountroothook_establish(void (*fn)(struct device *), struct device *dev)
    494   1.80  christos {
    495  1.109  junyoung 	return hook_establish(&mountroothook_list, (void (*)(void *))fn, dev);
    496   1.80  christos }
    497   1.80  christos 
    498   1.80  christos void
    499  1.117   thorpej mountroothook_disestablish(void *vhook)
    500   1.80  christos {
    501   1.89    simonb 	hook_disestablish(&mountroothook_list, vhook);
    502   1.80  christos }
    503   1.80  christos 
    504   1.80  christos void
    505  1.117   thorpej mountroothook_destroy(void)
    506   1.80  christos {
    507   1.80  christos 	hook_destroy(&mountroothook_list);
    508   1.80  christos }
    509   1.80  christos 
    510   1.80  christos void
    511  1.117   thorpej domountroothook(void)
    512   1.80  christos {
    513   1.80  christos 	struct hook_desc *hd;
    514   1.80  christos 
    515   1.83      matt 	LIST_FOREACH(hd, &mountroothook_list, hk_list) {
    516   1.80  christos 		if (hd->hk_arg == (void *)root_device) {
    517   1.80  christos 			(*hd->hk_fn)(hd->hk_arg);
    518   1.80  christos 			return;
    519   1.80  christos 		}
    520   1.80  christos 	}
    521   1.80  christos }
    522   1.80  christos 
    523  1.117   thorpej static hook_list_t exechook_list;
    524   1.80  christos 
    525   1.80  christos void *
    526  1.117   thorpej exechook_establish(void (*fn)(struct proc *, void *), void *arg)
    527   1.80  christos {
    528  1.109  junyoung 	return hook_establish(&exechook_list, (void (*)(void *))fn, arg);
    529   1.80  christos }
    530   1.80  christos 
    531   1.80  christos void
    532  1.117   thorpej exechook_disestablish(void *vhook)
    533   1.80  christos {
    534   1.80  christos 	hook_disestablish(&exechook_list, vhook);
    535   1.80  christos }
    536   1.80  christos 
    537   1.80  christos /*
    538   1.80  christos  * Run exec hooks.
    539   1.80  christos  */
    540   1.80  christos void
    541  1.117   thorpej doexechooks(struct proc *p)
    542   1.80  christos {
    543   1.80  christos 	hook_proc_run(&exechook_list, p);
    544   1.80  christos }
    545   1.80  christos 
    546  1.117   thorpej static hook_list_t exithook_list;
    547   1.80  christos 
    548   1.80  christos void *
    549  1.117   thorpej exithook_establish(void (*fn)(struct proc *, void *), void *arg)
    550   1.80  christos {
    551  1.109  junyoung 	return hook_establish(&exithook_list, (void (*)(void *))fn, arg);
    552   1.80  christos }
    553   1.80  christos 
    554   1.80  christos void
    555  1.117   thorpej exithook_disestablish(void *vhook)
    556   1.80  christos {
    557   1.80  christos 	hook_disestablish(&exithook_list, vhook);
    558   1.80  christos }
    559   1.80  christos 
    560   1.80  christos /*
    561   1.80  christos  * Run exit hooks.
    562   1.80  christos  */
    563   1.80  christos void
    564  1.117   thorpej doexithooks(struct proc *p)
    565   1.80  christos {
    566   1.80  christos 	hook_proc_run(&exithook_list, p);
    567   1.96   thorpej }
    568   1.96   thorpej 
    569  1.117   thorpej static hook_list_t forkhook_list;
    570   1.96   thorpej 
    571   1.96   thorpej void *
    572  1.117   thorpej forkhook_establish(void (*fn)(struct proc *, struct proc *))
    573   1.96   thorpej {
    574  1.109  junyoung 	return hook_establish(&forkhook_list, (void (*)(void *))fn, NULL);
    575   1.96   thorpej }
    576   1.96   thorpej 
    577   1.96   thorpej void
    578  1.117   thorpej forkhook_disestablish(void *vhook)
    579   1.96   thorpej {
    580   1.96   thorpej 	hook_disestablish(&forkhook_list, vhook);
    581   1.96   thorpej }
    582   1.96   thorpej 
    583   1.96   thorpej /*
    584   1.96   thorpej  * Run fork hooks.
    585   1.96   thorpej  */
    586   1.96   thorpej void
    587  1.117   thorpej doforkhooks(struct proc *p2, struct proc *p1)
    588   1.96   thorpej {
    589   1.96   thorpej 	struct hook_desc *hd;
    590   1.96   thorpej 
    591   1.96   thorpej 	LIST_FOREACH(hd, &forkhook_list, hk_list) {
    592  1.109  junyoung 		((void (*)(struct proc *, struct proc *))*hd->hk_fn)
    593   1.96   thorpej 		    (p2, p1);
    594   1.96   thorpej 	}
    595   1.80  christos }
    596   1.80  christos 
    597   1.80  christos /*
    598   1.52  augustss  * "Power hook" types, functions, and variables.
    599   1.71  augustss  * The list of power hooks is kept ordered with the last registered hook
    600   1.71  augustss  * first.
    601   1.71  augustss  * When running the hooks on power down the hooks are called in reverse
    602   1.71  augustss  * registration order, when powering up in registration order.
    603   1.52  augustss  */
    604   1.52  augustss struct powerhook_desc {
    605   1.71  augustss 	CIRCLEQ_ENTRY(powerhook_desc) sfd_list;
    606  1.109  junyoung 	void	(*sfd_fn)(int, void *);
    607   1.52  augustss 	void	*sfd_arg;
    608  1.144  jmcneill 	char	sfd_name[16];
    609   1.52  augustss };
    610   1.52  augustss 
    611  1.117   thorpej static CIRCLEQ_HEAD(, powerhook_desc) powerhook_list =
    612  1.117   thorpej     CIRCLEQ_HEAD_INITIALIZER(powerhook_list);
    613   1.52  augustss 
    614   1.52  augustss void *
    615  1.145    dogcow powerhook_establish(const char *name, void (*fn)(int, void *), void *arg)
    616   1.52  augustss {
    617   1.52  augustss 	struct powerhook_desc *ndp;
    618   1.52  augustss 
    619   1.52  augustss 	ndp = (struct powerhook_desc *)
    620   1.52  augustss 	    malloc(sizeof(*ndp), M_DEVBUF, M_NOWAIT);
    621   1.52  augustss 	if (ndp == NULL)
    622   1.59     enami 		return (NULL);
    623   1.52  augustss 
    624   1.52  augustss 	ndp->sfd_fn = fn;
    625   1.52  augustss 	ndp->sfd_arg = arg;
    626  1.144  jmcneill 	strlcpy(ndp->sfd_name, name, sizeof(ndp->sfd_name));
    627   1.71  augustss 	CIRCLEQ_INSERT_HEAD(&powerhook_list, ndp, sfd_list);
    628   1.52  augustss 
    629  1.167  jmcneill 	aprint_error("%s: WARNING: powerhook_establish is deprecated\n", name);
    630   1.52  augustss 	return (ndp);
    631   1.52  augustss }
    632   1.52  augustss 
    633   1.52  augustss void
    634  1.117   thorpej powerhook_disestablish(void *vhook)
    635   1.52  augustss {
    636   1.52  augustss #ifdef DIAGNOSTIC
    637   1.52  augustss 	struct powerhook_desc *dp;
    638   1.52  augustss 
    639   1.71  augustss 	CIRCLEQ_FOREACH(dp, &powerhook_list, sfd_list)
    640   1.52  augustss                 if (dp == vhook)
    641   1.71  augustss 			goto found;
    642   1.83      matt 	panic("powerhook_disestablish: hook %p not established", vhook);
    643   1.71  augustss  found:
    644   1.52  augustss #endif
    645   1.52  augustss 
    646   1.71  augustss 	CIRCLEQ_REMOVE(&powerhook_list, (struct powerhook_desc *)vhook,
    647   1.71  augustss 	    sfd_list);
    648   1.52  augustss 	free(vhook, M_DEVBUF);
    649   1.52  augustss }
    650   1.52  augustss 
    651   1.52  augustss /*
    652   1.52  augustss  * Run power hooks.
    653   1.52  augustss  */
    654   1.52  augustss void
    655  1.117   thorpej dopowerhooks(int why)
    656   1.52  augustss {
    657   1.52  augustss 	struct powerhook_desc *dp;
    658   1.52  augustss 
    659  1.144  jmcneill #ifdef POWERHOOK_DEBUG
    660  1.162  christos 	const char *why_name;
    661  1.163  degroote 	static const char * pwr_names[] = {PWR_NAMES};
    662  1.163  degroote 	why_name = why < __arraycount(pwr_names) ? pwr_names[why] : "???";
    663  1.144  jmcneill #endif
    664  1.144  jmcneill 
    665   1.73  takemura 	if (why == PWR_RESUME || why == PWR_SOFTRESUME) {
    666   1.71  augustss 		CIRCLEQ_FOREACH_REVERSE(dp, &powerhook_list, sfd_list) {
    667  1.144  jmcneill #ifdef POWERHOOK_DEBUG
    668  1.162  christos 			printf("dopowerhooks %s: %s (%p)\n", why_name, dp->sfd_name, dp);
    669  1.144  jmcneill #endif
    670   1.71  augustss 			(*dp->sfd_fn)(why, dp->sfd_arg);
    671   1.71  augustss 		}
    672   1.71  augustss 	} else {
    673   1.71  augustss 		CIRCLEQ_FOREACH(dp, &powerhook_list, sfd_list) {
    674  1.144  jmcneill #ifdef POWERHOOK_DEBUG
    675  1.162  christos 			printf("dopowerhooks %s: %s (%p)\n", why_name, dp->sfd_name, dp);
    676  1.144  jmcneill #endif
    677   1.71  augustss 			(*dp->sfd_fn)(why, dp->sfd_arg);
    678   1.71  augustss 		}
    679   1.18   thorpej 	}
    680  1.144  jmcneill 
    681  1.144  jmcneill #ifdef POWERHOOK_DEBUG
    682  1.162  christos 	printf("dopowerhooks: %s done\n", why_name);
    683  1.144  jmcneill #endif
    684   1.18   thorpej }
    685   1.18   thorpej 
    686  1.160  christos static int
    687  1.160  christos isswap(struct device *dv)
    688  1.160  christos {
    689  1.160  christos 	struct dkwedge_info wi;
    690  1.160  christos 	struct vnode *vn;
    691  1.160  christos 	int error;
    692  1.160  christos 
    693  1.160  christos 	if (device_class(dv) != DV_DISK || !device_is_a(dv, "dk"))
    694  1.160  christos 		return 0;
    695  1.160  christos 
    696  1.160  christos 	if ((vn = opendisk(dv)) == NULL)
    697  1.160  christos 		return 0;
    698  1.160  christos 
    699  1.166     pooka 	error = VOP_IOCTL(vn, DIOCGWEDGEINFO, &wi, FREAD, NOCRED);
    700  1.166     pooka 	VOP_CLOSE(vn, FREAD, NOCRED);
    701  1.160  christos 	vput(vn);
    702  1.160  christos 	if (error) {
    703  1.160  christos #ifdef DEBUG_WEDGE
    704  1.184    cegger 		printf("%s: Get wedge info returned %d\n", device_xname(dv), error);
    705  1.160  christos #endif
    706  1.160  christos 		return 0;
    707  1.160  christos 	}
    708  1.160  christos 	return strcmp(wi.dkw_ptype, DKW_PTYPE_SWAP) == 0;
    709  1.160  christos }
    710  1.160  christos 
    711   1.18   thorpej /*
    712   1.18   thorpej  * Determine the root device and, if instructed to, the root file system.
    713   1.18   thorpej  */
    714   1.18   thorpej 
    715   1.18   thorpej #include "md.h"
    716   1.18   thorpej 
    717  1.187        ad #if NMD > 0	/* at least one md device configured */
    718  1.127      cube extern struct cfdriver md_cd;	/* setroot() takes its boot device from md_cd.cd_devs[0] */
    719  1.108  christos #ifdef MEMORY_DISK_IS_ROOT
    720  1.187        ad int md_is_root = 1;	/* non-zero: setroot() overrides bootdv with md unit 0, partition 0 */
    721  1.187        ad #else
    722  1.187        ad int md_is_root = 0;
    723  1.108  christos #endif	/* MEMORY_DISK_IS_ROOT */
    724  1.190  drochner #endif	/* NMD > 0 */
    725  1.108  christos 
    726  1.113   thorpej /*
    727  1.113   thorpej  * The device and wedge that we booted from.  If booted_wedge is NULL,
    728  1.113   thorpej  * then we might consult booted_partition.
    729  1.113   thorpej  */
    730  1.113   thorpej struct device *booted_device;	/* device we booted from */
    731  1.113   thorpej struct device *booted_wedge;	/* wedge we booted from, or NULL */
    732  1.113   thorpej int booted_partition;	/* may be consulted when booted_wedge is NULL */
    733  1.113   thorpej 
    734  1.113   thorpej /*
    735  1.113   thorpej  * Use partition letters if it's a disk class but not a wedge.
    736  1.113   thorpej  * XXX Check for wedge is kinda gross.
    737  1.113   thorpej  */
    738  1.113   thorpej #define	DEV_USES_PARTITIONS(dv)						\
    739  1.124   thorpej 	(device_class((dv)) == DV_DISK &&				\
    740  1.125   thorpej 	 !device_is_a((dv), "dk"))
    741  1.113   thorpej 
    742   1.18   thorpej void
    743  1.117   thorpej setroot(struct device *bootdv, int bootpartition)
    744   1.18   thorpej {
    745   1.18   thorpej 	struct device *dv;
    746  1.159    dyoung 	int len, majdev;
    747   1.25       mrg 	dev_t nrootdev;
    748   1.26   thorpej 	dev_t ndumpdev = NODEV;
    749   1.18   thorpej 	char buf[128];
    750   1.18   thorpej 	const char *rootdevname;
    751   1.26   thorpej 	const char *dumpdevname;
    752   1.26   thorpej 	struct device *rootdv = NULL;		/* XXX gcc -Wuninitialized */
    753   1.26   thorpej 	struct device *dumpdv = NULL;
    754   1.18   thorpej 	struct ifnet *ifp;
    755   1.18   thorpej 	const char *deffsname;
    756   1.18   thorpej 	struct vfsops *vops;
    757   1.18   thorpej 
    758  1.157      manu #ifdef TFTPROOT
    759  1.157      manu 	if (tftproot_dhcpboot(bootdv) != 0)
    760  1.157      manu 		boothowto |= RB_ASKNAME;
    761  1.157      manu #endif
    762  1.157      manu 
    763  1.187        ad #if NMD > 0
    764  1.187        ad 	if (md_is_root) {
    765  1.190  drochner 		/*
    766  1.190  drochner 		 * XXX there should be "root on md0" in the config file,
    767  1.190  drochner 		 * but it isn't always
    768  1.190  drochner 		 */
    769  1.190  drochner 		bootdv = md_cd.cd_devs[0];
    770  1.187        ad 		bootpartition = 0;
    771   1.28       leo 	}
    772   1.18   thorpej #endif
    773   1.18   thorpej 
    774   1.18   thorpej 	/*
    775   1.18   thorpej 	 * If NFS is specified as the file system, and we found
    776   1.18   thorpej 	 * a DV_DISK boot device (or no boot device at all), then
    777   1.18   thorpej 	 * find a reasonable network interface for "rootspec".
    778   1.18   thorpej 	 */
    779   1.18   thorpej 	vops = vfs_getopsbyname("nfs");
    780   1.18   thorpej 	if (vops != NULL && vops->vfs_mountroot == mountroot &&
    781   1.18   thorpej 	    rootspec == NULL &&
    782  1.124   thorpej 	    (bootdv == NULL || device_class(bootdv) != DV_IFNET)) {
    783  1.115      matt 		IFNET_FOREACH(ifp) {
    784   1.18   thorpej 			if ((ifp->if_flags &
    785   1.18   thorpej 			     (IFF_LOOPBACK|IFF_POINTOPOINT)) == 0)
    786   1.18   thorpej 				break;
    787   1.83      matt 		}
    788   1.18   thorpej 		if (ifp == NULL) {
    789   1.18   thorpej 			/*
    790   1.18   thorpej 			 * Can't find a suitable interface; ask the
    791   1.18   thorpej 			 * user.
    792   1.18   thorpej 			 */
    793   1.18   thorpej 			boothowto |= RB_ASKNAME;
    794   1.18   thorpej 		} else {
    795   1.18   thorpej 			/*
    796   1.18   thorpej 			 * Have a suitable interface; behave as if
    797   1.18   thorpej 			 * the user specified this interface.
    798   1.18   thorpej 			 */
    799   1.18   thorpej 			rootspec = (const char *)ifp->if_xname;
    800   1.18   thorpej 		}
    801   1.18   thorpej 	}
    802  1.165        ad 	if (vops != NULL)
    803  1.165        ad 		vfs_delref(vops);
    804   1.24   thorpej 
    805   1.24   thorpej 	/*
    806   1.24   thorpej 	 * If wildcarded root and we the boot device wasn't determined,
    807   1.24   thorpej 	 * ask the user.
    808   1.24   thorpej 	 */
    809   1.24   thorpej 	if (rootspec == NULL && bootdv == NULL)
    810   1.24   thorpej 		boothowto |= RB_ASKNAME;
    811   1.18   thorpej 
    812   1.18   thorpej  top:
    813   1.18   thorpej 	if (boothowto & RB_ASKNAME) {
    814   1.26   thorpej 		struct device *defdumpdv;
    815   1.26   thorpej 
    816   1.18   thorpej 		for (;;) {
    817   1.18   thorpej 			printf("root device");
    818   1.18   thorpej 			if (bootdv != NULL) {
    819  1.184    cegger 				printf(" (default %s", device_xname(bootdv));
    820  1.113   thorpej 				if (DEV_USES_PARTITIONS(bootdv))
    821   1.18   thorpej 					printf("%c", bootpartition + 'a');
    822   1.18   thorpej 				printf(")");
    823   1.18   thorpej 			}
    824   1.18   thorpej 			printf(": ");
    825   1.64    itojun 			len = cngetsn(buf, sizeof(buf));
    826   1.18   thorpej 			if (len == 0 && bootdv != NULL) {
    827  1.184    cegger 				strlcpy(buf, device_xname(bootdv), sizeof(buf));
    828   1.18   thorpej 				len = strlen(buf);
    829   1.18   thorpej 			}
    830   1.18   thorpej 			if (len > 0 && buf[len - 1] == '*') {
    831   1.18   thorpej 				buf[--len] = '\0';
    832   1.51   thorpej 				dv = getdisk(buf, len, 1, &nrootdev, 0);
    833   1.18   thorpej 				if (dv != NULL) {
    834   1.18   thorpej 					rootdv = dv;
    835   1.25       mrg 					break;
    836   1.18   thorpej 				}
    837   1.18   thorpej 			}
    838   1.51   thorpej 			dv = getdisk(buf, len, bootpartition, &nrootdev, 0);
    839   1.18   thorpej 			if (dv != NULL) {
    840   1.18   thorpej 				rootdv = dv;
    841   1.18   thorpej 				break;
    842   1.18   thorpej 			}
    843   1.18   thorpej 		}
    844   1.18   thorpej 
    845   1.26   thorpej 		/*
    846   1.26   thorpej 		 * Set up the default dump device.  If root is on
    847   1.26   thorpej 		 * a network device, there is no default dump
    848   1.26   thorpej 		 * device, since we don't support dumps to the
    849   1.26   thorpej 		 * network.
    850   1.26   thorpej 		 */
    851  1.113   thorpej 		if (DEV_USES_PARTITIONS(rootdv) == 0)
    852   1.26   thorpej 			defdumpdv = NULL;
    853   1.26   thorpej 		else
    854   1.26   thorpej 			defdumpdv = rootdv;
    855   1.26   thorpej 
    856   1.26   thorpej 		for (;;) {
    857   1.26   thorpej 			printf("dump device");
    858   1.26   thorpej 			if (defdumpdv != NULL) {
    859   1.26   thorpej 				/*
    860   1.26   thorpej 				 * Note, we know it's a disk if we get here.
    861   1.26   thorpej 				 */
    862  1.184    cegger 				printf(" (default %sb)", device_xname(defdumpdv));
    863   1.26   thorpej 			}
    864   1.26   thorpej 			printf(": ");
    865   1.64    itojun 			len = cngetsn(buf, sizeof(buf));
    866   1.26   thorpej 			if (len == 0) {
    867   1.26   thorpej 				if (defdumpdv != NULL) {
    868   1.26   thorpej 					ndumpdev = MAKEDISKDEV(major(nrootdev),
    869   1.26   thorpej 					    DISKUNIT(nrootdev), 1);
    870   1.26   thorpej 				}
    871   1.54     enami 				dumpdv = defdumpdv;
    872   1.26   thorpej 				break;
    873   1.26   thorpej 			}
    874   1.26   thorpej 			if (len == 4 && strcmp(buf, "none") == 0) {
    875   1.55     enami 				dumpdv = NULL;
    876   1.54     enami 				break;
    877   1.26   thorpej 			}
    878   1.51   thorpej 			dv = getdisk(buf, len, 1, &ndumpdev, 1);
    879   1.55     enami 			if (dv != NULL) {
    880   1.26   thorpej 				dumpdv = dv;
    881   1.26   thorpej 				break;
    882   1.26   thorpej 			}
    883   1.26   thorpej 		}
    884   1.26   thorpej 
    885   1.18   thorpej 		rootdev = nrootdev;
    886   1.26   thorpej 		dumpdev = ndumpdev;
    887   1.18   thorpej 
    888   1.36   thorpej 		for (vops = LIST_FIRST(&vfs_list); vops != NULL;
    889   1.36   thorpej 		     vops = LIST_NEXT(vops, vfs_list)) {
    890   1.36   thorpej 			if (vops->vfs_mountroot != NULL &&
    891   1.36   thorpej 			    vops->vfs_mountroot == mountroot)
    892   1.38      fvdl 			break;
    893   1.18   thorpej 		}
    894   1.36   thorpej 
    895   1.36   thorpej 		if (vops == NULL) {
    896   1.18   thorpej 			mountroot = NULL;
    897   1.18   thorpej 			deffsname = "generic";
    898   1.18   thorpej 		} else
    899   1.36   thorpej 			deffsname = vops->vfs_name;
    900   1.36   thorpej 
    901   1.18   thorpej 		for (;;) {
    902   1.18   thorpej 			printf("file system (default %s): ", deffsname);
    903   1.64    itojun 			len = cngetsn(buf, sizeof(buf));
    904   1.18   thorpej 			if (len == 0)
    905   1.18   thorpej 				break;
    906   1.18   thorpej 			if (len == 4 && strcmp(buf, "halt") == 0)
    907   1.23       gwr 				cpu_reboot(RB_HALT, NULL);
    908   1.76   thorpej 			else if (len == 6 && strcmp(buf, "reboot") == 0)
    909   1.76   thorpej 				cpu_reboot(0, NULL);
    910   1.78   thorpej #if defined(DDB)
    911   1.78   thorpej 			else if (len == 3 && strcmp(buf, "ddb") == 0) {
    912   1.78   thorpej 				console_debugger();
    913   1.78   thorpej 			}
    914   1.78   thorpej #endif
    915   1.18   thorpej 			else if (len == 7 && strcmp(buf, "generic") == 0) {
    916   1.18   thorpej 				mountroot = NULL;
    917   1.18   thorpej 				break;
    918   1.18   thorpej 			}
    919   1.18   thorpej 			vops = vfs_getopsbyname(buf);
    920   1.18   thorpej 			if (vops == NULL || vops->vfs_mountroot == NULL) {
    921   1.18   thorpej 				printf("use one of: generic");
    922   1.36   thorpej 				for (vops = LIST_FIRST(&vfs_list);
    923   1.36   thorpej 				     vops != NULL;
    924   1.36   thorpej 				     vops = LIST_NEXT(vops, vfs_list)) {
    925   1.36   thorpej 					if (vops->vfs_mountroot != NULL)
    926   1.36   thorpej 						printf(" %s", vops->vfs_name);
    927   1.36   thorpej 				}
    928   1.78   thorpej #if defined(DDB)
    929   1.78   thorpej 				printf(" ddb");
    930   1.78   thorpej #endif
    931   1.76   thorpej 				printf(" halt reboot\n");
    932   1.18   thorpej 			} else {
    933   1.18   thorpej 				mountroot = vops->vfs_mountroot;
    934  1.165        ad 				vfs_delref(vops);
    935   1.18   thorpej 				break;
    936   1.18   thorpej 			}
    937   1.18   thorpej 		}
    938   1.18   thorpej 
    939   1.18   thorpej 	} else if (rootspec == NULL) {
    940   1.18   thorpej 		/*
    941   1.18   thorpej 		 * Wildcarded root; use the boot device.
    942   1.18   thorpej 		 */
    943   1.26   thorpej 		rootdv = bootdv;
    944   1.26   thorpej 
    945  1.188  christos 		if (bootdv)
    946  1.188  christos 			majdev = devsw_name2blk(device_xname(bootdv), NULL, 0);
    947  1.188  christos 		else
    948  1.188  christos 			majdev = -1;
    949   1.18   thorpej 		if (majdev >= 0) {
    950   1.18   thorpej 			/*
    951  1.113   thorpej 			 * Root is on a disk.  `bootpartition' is root,
    952  1.113   thorpej 			 * unless the device does not use partitions.
    953   1.18   thorpej 			 */
    954  1.113   thorpej 			if (DEV_USES_PARTITIONS(bootdv))
    955  1.135   thorpej 				rootdev = MAKEDISKDEV(majdev,
    956  1.135   thorpej 						      device_unit(bootdv),
    957  1.135   thorpej 						      bootpartition);
    958  1.113   thorpej 			else
    959  1.135   thorpej 				rootdev = makedev(majdev, device_unit(bootdv));
    960   1.18   thorpej 		}
    961   1.18   thorpej 	} else {
    962   1.18   thorpej 
    963   1.18   thorpej 		/*
    964   1.25       mrg 		 * `root on <dev> ...'
    965   1.18   thorpej 		 */
    966   1.18   thorpej 
    967   1.18   thorpej 		/*
    968   1.18   thorpej 		 * If it's a network interface, we can bail out
    969   1.18   thorpej 		 * early.
    970   1.18   thorpej 		 */
    971   1.56     enami 		dv = finddevice(rootspec);
    972  1.124   thorpej 		if (dv != NULL && device_class(dv) == DV_IFNET) {
    973   1.26   thorpej 			rootdv = dv;
    974   1.26   thorpej 			goto haveroot;
    975   1.18   thorpej 		}
    976   1.18   thorpej 
    977  1.159    dyoung 		if (rootdev == NODEV &&
    978  1.159    dyoung 		    device_class(dv) == DV_DISK && device_is_a(dv, "dk") &&
    979  1.184    cegger 		    (majdev = devsw_name2blk(device_xname(dv), NULL, 0)) >= 0)
    980  1.159    dyoung 			rootdev = makedev(majdev, device_unit(dv));
    981  1.159    dyoung 
    982   1.88   gehenna 		rootdevname = devsw_blk2name(major(rootdev));
    983   1.18   thorpej 		if (rootdevname == NULL) {
    984   1.18   thorpej 			printf("unknown device major 0x%x\n", rootdev);
    985   1.18   thorpej 			boothowto |= RB_ASKNAME;
    986   1.18   thorpej 			goto top;
    987   1.18   thorpej 		}
    988   1.41     perry 		memset(buf, 0, sizeof(buf));
    989  1.110    itojun 		snprintf(buf, sizeof(buf), "%s%d", rootdevname,
    990  1.110    itojun 		    DISKUNIT(rootdev));
    991   1.18   thorpej 
    992   1.56     enami 		rootdv = finddevice(buf);
    993   1.26   thorpej 		if (rootdv == NULL) {
    994   1.18   thorpej 			printf("device %s (0x%x) not configured\n",
    995   1.18   thorpej 			    buf, rootdev);
    996   1.18   thorpej 			boothowto |= RB_ASKNAME;
    997   1.18   thorpej 			goto top;
    998   1.18   thorpej 		}
    999   1.26   thorpej 	}
   1000   1.18   thorpej 
   1001   1.26   thorpej  haveroot:
   1002   1.18   thorpej 
   1003   1.18   thorpej 	root_device = rootdv;
   1004   1.18   thorpej 
   1005  1.124   thorpej 	switch (device_class(rootdv)) {
   1006   1.18   thorpej 	case DV_IFNET:
   1007  1.139  christos 	case DV_DISK:
   1008  1.184    cegger 		aprint_normal("root on %s", device_xname(rootdv));
   1009  1.140  christos 		if (DEV_USES_PARTITIONS(rootdv))
   1010  1.139  christos 			aprint_normal("%c", DISKPART(rootdev) + 'a');
   1011   1.18   thorpej 		break;
   1012   1.18   thorpej 
   1013   1.18   thorpej 	default:
   1014   1.18   thorpej 		printf("can't determine root device\n");
   1015   1.18   thorpej 		boothowto |= RB_ASKNAME;
   1016   1.18   thorpej 		goto top;
   1017   1.18   thorpej 	}
   1018   1.26   thorpej 
   1019   1.26   thorpej 	/*
   1020   1.26   thorpej 	 * Now configure the dump device.
   1021   1.55     enami 	 *
   1022   1.26   thorpej 	 * If we haven't figured out the dump device, do so, with
   1023   1.26   thorpej 	 * the following rules:
   1024   1.26   thorpej 	 *
   1025   1.26   thorpej 	 *	(a) We already know dumpdv in the RB_ASKNAME case.
   1026   1.26   thorpej 	 *
   1027   1.26   thorpej 	 *	(b) If dumpspec is set, try to use it.  If the device
   1028   1.26   thorpej 	 *	    is not available, punt.
   1029   1.26   thorpej 	 *
   1030   1.26   thorpej 	 *	(c) If dumpspec is not set, the dump device is
   1031   1.26   thorpej 	 *	    wildcarded or unspecified.  If the root device
   1032   1.26   thorpej 	 *	    is DV_IFNET, punt.  Otherwise, use partition b
   1033   1.26   thorpej 	 *	    of the root device.
   1034   1.26   thorpej 	 */
   1035   1.26   thorpej 
   1036   1.55     enami 	if (boothowto & RB_ASKNAME) {		/* (a) */
   1037   1.55     enami 		if (dumpdv == NULL)
   1038   1.55     enami 			goto nodumpdev;
   1039   1.55     enami 	} else if (dumpspec != NULL) {		/* (b) */
   1040   1.55     enami 		if (strcmp(dumpspec, "none") == 0 || dumpdev == NODEV) {
   1041   1.26   thorpej 			/*
   1042   1.55     enami 			 * Operator doesn't want a dump device.
   1043   1.55     enami 			 * Or looks like they tried to pick a network
   1044   1.26   thorpej 			 * device.  Oops.
   1045   1.26   thorpej 			 */
   1046   1.26   thorpej 			goto nodumpdev;
   1047   1.26   thorpej 		}
   1048   1.26   thorpej 
   1049   1.88   gehenna 		dumpdevname = devsw_blk2name(major(dumpdev));
   1050   1.26   thorpej 		if (dumpdevname == NULL)
   1051   1.26   thorpej 			goto nodumpdev;
   1052   1.41     perry 		memset(buf, 0, sizeof(buf));
   1053  1.110    itojun 		snprintf(buf, sizeof(buf), "%s%d", dumpdevname,
   1054  1.110    itojun 		    DISKUNIT(dumpdev));
   1055   1.26   thorpej 
   1056   1.56     enami 		dumpdv = finddevice(buf);
   1057   1.56     enami 		if (dumpdv == NULL) {
   1058   1.26   thorpej 			/*
   1059   1.26   thorpej 			 * Device not configured.
   1060   1.26   thorpej 			 */
   1061   1.26   thorpej 			goto nodumpdev;
   1062   1.26   thorpej 		}
   1063   1.55     enami 	} else {				/* (c) */
   1064  1.160  christos 		if (DEV_USES_PARTITIONS(rootdv) == 0) {
   1065  1.160  christos 			for (dv = TAILQ_FIRST(&alldevs); dv != NULL;
   1066  1.160  christos 			    dv = TAILQ_NEXT(dv, dv_list))
   1067  1.160  christos 				if (isswap(dv))
   1068  1.160  christos 					break;
   1069  1.160  christos 			if (dv == NULL)
   1070  1.160  christos 				goto nodumpdev;
   1071  1.160  christos 
   1072  1.184    cegger 			majdev = devsw_name2blk(device_xname(dv), NULL, 0);
   1073  1.160  christos 			if (majdev < 0)
   1074  1.160  christos 				goto nodumpdev;
   1075  1.160  christos 			dumpdv = dv;
   1076  1.160  christos 			dumpdev = makedev(majdev, device_unit(dumpdv));
   1077  1.160  christos 		} else {
   1078   1.55     enami 			dumpdv = rootdv;
   1079   1.55     enami 			dumpdev = MAKEDISKDEV(major(rootdev),
   1080  1.135   thorpej 			    device_unit(dumpdv), 1);
   1081   1.55     enami 		}
   1082   1.26   thorpej 	}
   1083   1.26   thorpej 
   1084  1.175        ad 	dumpcdev = devsw_blk2chr(dumpdev);
   1085  1.184    cegger 	aprint_normal(" dumps on %s", device_xname(dumpdv));
   1086  1.140  christos 	if (DEV_USES_PARTITIONS(dumpdv))
   1087  1.140  christos 		aprint_normal("%c", DISKPART(dumpdev) + 'a');
   1088  1.140  christos 	aprint_normal("\n");
   1089   1.26   thorpej 	return;
   1090   1.26   thorpej 
   1091   1.26   thorpej  nodumpdev:
   1092   1.26   thorpej 	dumpdev = NODEV;
   1093  1.175        ad 	dumpcdev = NODEV;
   1094  1.100   thorpej 	aprint_normal("\n");
   1095   1.18   thorpej }
   1096   1.18   thorpej 
   1097   1.18   thorpej static struct device *
   1098  1.117   thorpej finddevice(const char *name)
   1099   1.56     enami {
   1100  1.159    dyoung 	const char *wname;
   1101  1.108  christos 
   1102  1.159    dyoung 	if ((wname = getwedgename(name, strlen(name))) != NULL)
   1103  1.159    dyoung 		return dkwedge_find_by_wname(wname);
   1104  1.159    dyoung 
   1105  1.179     joerg 	return device_find_by_xname(name);
   1106   1.56     enami }
   1107   1.56     enami 
   1108   1.56     enami static struct device *
   1109  1.117   thorpej getdisk(char *str, int len, int defpart, dev_t *devp, int isdump)
   1110   1.18   thorpej {
   1111   1.28       leo 	struct device	*dv;
   1112   1.18   thorpej 
   1113   1.51   thorpej 	if ((dv = parsedisk(str, len, defpart, devp)) == NULL) {
   1114   1.18   thorpej 		printf("use one of:");
   1115   1.83      matt 		TAILQ_FOREACH(dv, &alldevs, dv_list) {
   1116  1.113   thorpej 			if (DEV_USES_PARTITIONS(dv))
   1117  1.184    cegger 				printf(" %s[a-%c]", device_xname(dv),
   1118   1.19       cgd 				    'a' + MAXPARTITIONS - 1);
   1119  1.124   thorpej 			else if (device_class(dv) == DV_DISK)
   1120  1.184    cegger 				printf(" %s", device_xname(dv));
   1121  1.124   thorpej 			if (isdump == 0 && device_class(dv) == DV_IFNET)
   1122  1.184    cegger 				printf(" %s", device_xname(dv));
   1123   1.18   thorpej 		}
   1124  1.159    dyoung 		dkwedge_print_wnames();
   1125   1.26   thorpej 		if (isdump)
   1126   1.26   thorpej 			printf(" none");
   1127   1.78   thorpej #if defined(DDB)
   1128   1.78   thorpej 		printf(" ddb");
   1129   1.78   thorpej #endif
   1130   1.76   thorpej 		printf(" halt reboot\n");
   1131   1.18   thorpej 	}
   1132  1.159    dyoung 	return dv;
   1133  1.159    dyoung }
   1134  1.159    dyoung 
   1135  1.159    dyoung static const char *
   1136  1.159    dyoung getwedgename(const char *name, int namelen)
   1137  1.159    dyoung {
   1138  1.159    dyoung 	const char *wpfx = "wedge:";
   1139  1.159    dyoung 	const int wpfxlen = strlen(wpfx);
   1140  1.159    dyoung 
   1141  1.159    dyoung 	if (namelen < wpfxlen || strncmp(name, wpfx, wpfxlen) != 0)
   1142  1.159    dyoung 		return NULL;
   1143  1.159    dyoung 
   1144  1.159    dyoung 	return name + wpfxlen;
   1145   1.18   thorpej }
   1146   1.18   thorpej 
   1147   1.18   thorpej static struct device *
   1148  1.117   thorpej parsedisk(char *str, int len, int defpart, dev_t *devp)
   1149   1.18   thorpej {
   1150   1.18   thorpej 	struct device *dv;
   1151  1.159    dyoung 	const char *wname;
   1152   1.18   thorpej 	char *cp, c;
   1153   1.29  drochner 	int majdev, part;
   1154   1.18   thorpej 	if (len == 0)
   1155   1.18   thorpej 		return (NULL);
   1156   1.18   thorpej 
   1157   1.18   thorpej 	if (len == 4 && strcmp(str, "halt") == 0)
   1158   1.23       gwr 		cpu_reboot(RB_HALT, NULL);
   1159   1.76   thorpej 	else if (len == 6 && strcmp(str, "reboot") == 0)
   1160   1.76   thorpej 		cpu_reboot(0, NULL);
   1161   1.78   thorpej #if defined(DDB)
   1162   1.78   thorpej 	else if (len == 3 && strcmp(str, "ddb") == 0)
   1163   1.78   thorpej 		console_debugger();
   1164   1.78   thorpej #endif
   1165   1.18   thorpej 
   1166   1.18   thorpej 	cp = str + len - 1;
   1167   1.18   thorpej 	c = *cp;
   1168  1.159    dyoung 
   1169  1.159    dyoung 	if ((wname = getwedgename(str, len)) != NULL) {
   1170  1.159    dyoung 		if ((dv = dkwedge_find_by_wname(wname)) == NULL)
   1171  1.159    dyoung 			return NULL;
   1172  1.159    dyoung 		part = defpart;
   1173  1.159    dyoung 		goto gotdisk;
   1174  1.159    dyoung 	} else if (c >= 'a' && c <= ('a' + MAXPARTITIONS - 1)) {
   1175   1.18   thorpej 		part = c - 'a';
   1176   1.18   thorpej 		*cp = '\0';
   1177   1.18   thorpej 	} else
   1178   1.18   thorpej 		part = defpart;
   1179   1.18   thorpej 
   1180   1.56     enami 	dv = finddevice(str);
   1181   1.56     enami 	if (dv != NULL) {
   1182  1.124   thorpej 		if (device_class(dv) == DV_DISK) {
   1183   1.18   thorpej  gotdisk:
   1184  1.184    cegger 			majdev = devsw_name2blk(device_xname(dv), NULL, 0);
   1185   1.18   thorpej 			if (majdev < 0)
   1186   1.18   thorpej 				panic("parsedisk");
   1187  1.113   thorpej 			if (DEV_USES_PARTITIONS(dv))
   1188  1.135   thorpej 				*devp = MAKEDISKDEV(majdev, device_unit(dv),
   1189  1.135   thorpej 						    part);
   1190  1.113   thorpej 			else
   1191  1.135   thorpej 				*devp = makedev(majdev, device_unit(dv));
   1192   1.18   thorpej 		}
   1193   1.18   thorpej 
   1194  1.124   thorpej 		if (device_class(dv) == DV_IFNET)
   1195   1.18   thorpej 			*devp = NODEV;
   1196   1.18   thorpej 	}
   1197   1.18   thorpej 
   1198   1.18   thorpej 	*cp = c;
   1199   1.18   thorpej 	return (dv);
   1200   1.48     lukem }
   1201   1.48     lukem 
   1202   1.48     lukem /*
   1203   1.49     lukem  * snprintf() `bytes' into `buf', reformatting it so that the number,
   1204   1.49     lukem  * plus a possible `x' + suffix extension) fits into len bytes (including
   1205   1.49     lukem  * the terminating NUL).
   1206   1.60     enami  * Returns the number of bytes stored in buf, or -1 if there was a problem.
   1207  1.109  junyoung  * E.g, given a len of 9 and a suffix of `B':
   1208   1.48     lukem  *	bytes		result
   1209   1.48     lukem  *	-----		------
   1210   1.49     lukem  *	99999		`99999 B'
   1211   1.90       wiz  *	100000		`97 kB'
   1212   1.90       wiz  *	66715648	`65152 kB'
   1213   1.48     lukem  *	252215296	`240 MB'
   1214   1.48     lukem  */
   1215   1.48     lukem int
   1216  1.117   thorpej humanize_number(char *buf, size_t len, uint64_t bytes, const char *suffix,
   1217  1.117   thorpej     int divisor)
   1218   1.48     lukem {
   1219   1.91  drochner        	/* prefixes are: (none), kilo, Mega, Giga, Tera, Peta, Exa */
   1220   1.91  drochner 	const char *prefixes;
   1221   1.86   thorpej 	int		r;
   1222  1.121     perry 	uint64_t	umax;
   1223   1.86   thorpej 	size_t		i, suffixlen;
   1224   1.48     lukem 
   1225   1.49     lukem 	if (buf == NULL || suffix == NULL)
   1226   1.49     lukem 		return (-1);
   1227   1.48     lukem 	if (len > 0)
   1228   1.48     lukem 		buf[0] = '\0';
   1229   1.49     lukem 	suffixlen = strlen(suffix);
   1230   1.91  drochner 	/* check if enough room for `x y' + suffix + `\0' */
   1231   1.49     lukem 	if (len < 4 + suffixlen)
   1232   1.49     lukem 		return (-1);
   1233   1.48     lukem 
   1234   1.91  drochner 	if (divisor == 1024) {
   1235   1.91  drochner 		/*
   1236   1.91  drochner 		 * binary multiplies
   1237   1.91  drochner 		 * XXX IEC 60027-2 recommends Ki, Mi, Gi...
   1238   1.91  drochner 		 */
   1239   1.91  drochner 		prefixes = " KMGTPE";
   1240   1.91  drochner 	} else
   1241   1.91  drochner 		prefixes = " kMGTPE"; /* SI for decimal multiplies */
   1242   1.91  drochner 
   1243  1.116  christos 	umax = 1;
   1244   1.49     lukem 	for (i = 0; i < len - suffixlen - 3; i++)
   1245  1.116  christos 		umax *= 10;
   1246  1.116  christos 	for (i = 0; bytes >= umax && prefixes[i + 1]; i++)
   1247   1.58  sommerfe 		bytes /= divisor;
   1248   1.48     lukem 
   1249   1.50     lukem 	r = snprintf(buf, len, "%qu%s%c%s", (unsigned long long)bytes,
   1250   1.49     lukem 	    i == 0 ? "" : " ", prefixes[i], suffix);
   1251   1.48     lukem 
   1252   1.48     lukem 	return (r);
   1253   1.49     lukem }
   1254   1.49     lukem 
   1255   1.49     lukem int
   1256  1.117   thorpej format_bytes(char *buf, size_t len, uint64_t bytes)
   1257   1.49     lukem {
   1258   1.49     lukem 	int	rv;
   1259   1.49     lukem 	size_t	nlen;
   1260   1.49     lukem 
   1261   1.58  sommerfe 	rv = humanize_number(buf, len, bytes, "B", 1024);
   1262   1.49     lukem 	if (rv != -1) {
   1263   1.49     lukem 			/* nuke the trailing ` B' if it exists */
   1264   1.49     lukem 		nlen = strlen(buf) - 2;
   1265   1.49     lukem 		if (strcmp(&buf[nlen], " B") == 0)
   1266   1.49     lukem 			buf[nlen] = '\0';
   1267   1.49     lukem 	}
   1268   1.49     lukem 	return (rv);
   1269   1.81  christos }
   1270   1.81  christos 
   1271   1.92  jdolecek /*
   1272  1.154   thorpej  * Return true if system call tracing is enabled for the specified process.
   1273  1.130   thorpej  */
   1274  1.153   thorpej bool
   1275  1.130   thorpej trace_is_enabled(struct proc *p)
   1276  1.130   thorpej {
   1277  1.131   thorpej #ifdef SYSCALL_DEBUG
   1278  1.154   thorpej 	return (true);
   1279  1.131   thorpej #endif
   1280  1.130   thorpej #ifdef KTRACE
   1281  1.130   thorpej 	if (ISSET(p->p_traceflag, (KTRFAC_SYSCALL | KTRFAC_SYSRET)))
   1282  1.154   thorpej 		return (true);
   1283  1.130   thorpej #endif
   1284  1.142      matt #ifdef PTRACE
   1285  1.151        ad 	if (ISSET(p->p_slflag, PSL_SYSCALL))
   1286  1.154   thorpej 		return (true);
   1287  1.142      matt #endif
   1288  1.130   thorpej 
   1289  1.154   thorpej 	return (false);
   1290  1.130   thorpej }
   1291  1.130   thorpej 
   1292  1.130   thorpej /*
   1293   1.92  jdolecek  * Start trace of particular system call. If process is being traced,
   1294   1.92  jdolecek  * this routine is called by MD syscall dispatch code just before
   1295   1.92  jdolecek  * a system call is actually executed.
   1296   1.92  jdolecek  */
   1297   1.81  christos int
   1298  1.177       dsl trace_enter(register_t code, const register_t *args, int narg)
   1299   1.81  christos {
   1300   1.81  christos #ifdef SYSCALL_DEBUG
   1301  1.171       dsl 	scdebug_call(code, args);
   1302   1.81  christos #endif /* SYSCALL_DEBUG */
   1303   1.81  christos 
   1304  1.177       dsl 	ktrsyscall(code, args, narg);
   1305   1.81  christos 
   1306  1.142      matt #ifdef PTRACE
   1307  1.172       dsl 	if ((curlwp->l_proc->p_slflag & (PSL_SYSCALL|PSL_TRACED)) ==
   1308  1.151        ad 	    (PSL_SYSCALL|PSL_TRACED))
   1309  1.172       dsl 		process_stoptrace();
   1310  1.142      matt #endif
   1311   1.81  christos 	return 0;
   1312   1.81  christos }
   1313   1.81  christos 
   1314   1.92  jdolecek /*
   1315   1.92  jdolecek  * End trace of particular system call. If process is being traced,
   1316   1.92  jdolecek  * this routine is called by MD syscall dispatch code just after
   1317   1.92  jdolecek  * a system call finishes.
   1318   1.92  jdolecek  * MD caller guarantees the passed 'code' is within the supported
   1319   1.92  jdolecek  * system call number range for emulation the process runs under.
   1320   1.92  jdolecek  */
   1321   1.81  christos void
   1322  1.177       dsl trace_exit(register_t code, register_t rval[], int error)
   1323   1.81  christos {
   1324   1.81  christos #ifdef SYSCALL_DEBUG
   1325  1.171       dsl 	scdebug_ret(code, error, rval);
   1326   1.81  christos #endif /* SYSCALL_DEBUG */
   1327   1.81  christos 
   1328  1.164        ad 	ktrsysret(code, error, rval);
   1329  1.128  christos 
   1330  1.142      matt #ifdef PTRACE
   1331  1.172       dsl 	if ((curlwp->l_proc->p_slflag & (PSL_SYSCALL|PSL_TRACED)) ==
   1332  1.151        ad 	    (PSL_SYSCALL|PSL_TRACED))
   1333  1.172       dsl 		process_stoptrace();
   1334  1.142      matt #endif
   1335   1.10       cgd }
   1336  1.194        ad 
   1337  1.194        ad int
   1338  1.194        ad syscall_establish(const struct emul *em, const struct syscall_package *sp)
   1339  1.194        ad {
   1340  1.194        ad 	struct sysent *sy;
   1341  1.194        ad 	int i;
   1342  1.194        ad 
   1343  1.194        ad 	KASSERT(mutex_owned(&module_lock));
   1344  1.194        ad 
   1345  1.194        ad 	if (em == NULL) {
   1346  1.194        ad 		em = &emul_netbsd;
   1347  1.194        ad 	}
   1348  1.194        ad 	sy = em->e_sysent;
   1349  1.194        ad 
   1350  1.194        ad 	/*
   1351  1.194        ad 	 * Ensure that all preconditions are valid, since this is
   1352  1.194        ad 	 * an all or nothing deal.  Once a system call is entered,
   1353  1.194        ad 	 * it can become busy and we could be unable to remove it
   1354  1.194        ad 	 * on error.
   1355  1.194        ad 	 */
   1356  1.194        ad 	for (i = 0; sp[i].sp_call != NULL; i++) {
   1357  1.194        ad 		if (sy[sp[i].sp_code].sy_call != sys_nomodule) {
   1358  1.194        ad 			return EBUSY;
   1359  1.194        ad 		}
   1360  1.194        ad 	}
   1361  1.194        ad 	/* Everything looks good, patch them in. */
   1362  1.194        ad 	for (i = 0; sp[i].sp_call != NULL; i++) {
   1363  1.194        ad 		sy[sp[i].sp_code].sy_call = sp[i].sp_call;
   1364  1.194        ad 	}
   1365  1.194        ad 
   1366  1.194        ad 	return 0;
   1367  1.194        ad }
   1368  1.194        ad 
   1369  1.194        ad int
   1370  1.194        ad syscall_disestablish(const struct emul *em, const struct syscall_package *sp)
   1371  1.194        ad {
   1372  1.194        ad 	struct sysent *sy;
   1373  1.194        ad 	uint64_t where;
   1374  1.194        ad 	lwp_t *l;
   1375  1.194        ad 	int i;
   1376  1.194        ad 
   1377  1.194        ad 	KASSERT(mutex_owned(&module_lock));
   1378  1.194        ad 
   1379  1.194        ad 	if (em == NULL) {
   1380  1.194        ad 		em = &emul_netbsd;
   1381  1.194        ad 	}
   1382  1.194        ad 	sy = em->e_sysent;
   1383  1.194        ad 
   1384  1.194        ad 	/*
   1385  1.194        ad 	 * First, patch the system calls to sys_nomodule to gate further
   1386  1.194        ad 	 * activity.
   1387  1.194        ad 	 */
   1388  1.194        ad 	for (i = 0; sp[i].sp_call != NULL; i++) {
   1389  1.194        ad 		KASSERT(sy[sp[i].sp_code].sy_call == sp[i].sp_call);
   1390  1.194        ad 		sy[sp[i].sp_code].sy_call = sys_nomodule;
   1391  1.194        ad 	}
   1392  1.194        ad 
   1393  1.194        ad 	/*
   1394  1.194        ad 	 * Run a cross call to cycle through all CPUs.  This does two
   1395  1.194        ad 	 * things: lock activity provides a barrier and makes our update
   1396  1.194        ad 	 * of sy_call visible to all CPUs, and upon return we can be sure
   1397  1.194        ad 	 * that we see pertinent values of l_sysent posted by remote CPUs.
   1398  1.194        ad 	 */
   1399  1.194        ad 	where = xc_broadcast(0, (xcfunc_t)nullop, NULL, NULL);
   1400  1.194        ad 	xc_wait(where);
   1401  1.194        ad 
   1402  1.194        ad 	/*
   1403  1.194        ad 	 * Now it's safe to check l_sysent.  Run through all LWPs and see
   1404  1.194        ad 	 * if anyone is still using the system call.
   1405  1.194        ad 	 */
   1406  1.194        ad 	for (i = 0; sp[i].sp_call != NULL; i++) {
   1407  1.194        ad 		mutex_enter(proc_lock);
   1408  1.194        ad 		LIST_FOREACH(l, &alllwp, l_list) {
   1409  1.194        ad 			if (l->l_sysent == &sy[sp[i].sp_code]) {
   1410  1.194        ad 				break;
   1411  1.194        ad 			}
   1412  1.194        ad 		}
   1413  1.194        ad 		mutex_exit(proc_lock);
   1414  1.194        ad 		if (l == NULL) {
   1415  1.194        ad 			continue;
   1416  1.194        ad 		}
   1417  1.194        ad 		/*
   1418  1.194        ad 		 * We lose: one or more calls are still in use.  Put back
   1419  1.194        ad 		 * the old entrypoints and act like nothing happened.
   1420  1.194        ad 		 * When we drop module_lock, any system calls held in
   1421  1.194        ad 		 * sys_nomodule() will be restarted.
   1422  1.194        ad 		 */
   1423  1.194        ad 		for (i = 0; sp[i].sp_call != NULL; i++) {
   1424  1.194        ad 			sy[sp[i].sp_code].sy_call = sp[i].sp_call;
   1425  1.194        ad 		}
   1426  1.194        ad 		return EBUSY;
   1427  1.194        ad 	}
   1428  1.194        ad 
   1429  1.194        ad 	return 0;
   1430  1.194        ad }
   1431