Home | History | Annotate | Line # | Download | only in kern
kern_ktrace.c revision 1.88.2.1.4.1
      1  1.88.2.1.4.1    bouyer /*	$NetBSD: kern_ktrace.c,v 1.88.2.1.4.1 2007/02/08 23:09:05 bouyer Exp $	*/
      2          1.11       cgd 
      3           1.1       cgd /*
      4           1.9       cgd  * Copyright (c) 1989, 1993
      5           1.9       cgd  *	The Regents of the University of California.  All rights reserved.
      6           1.1       cgd  *
      7           1.1       cgd  * Redistribution and use in source and binary forms, with or without
      8           1.1       cgd  * modification, are permitted provided that the following conditions
      9           1.1       cgd  * are met:
     10           1.1       cgd  * 1. Redistributions of source code must retain the above copyright
     11           1.1       cgd  *    notice, this list of conditions and the following disclaimer.
     12           1.1       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     13           1.1       cgd  *    notice, this list of conditions and the following disclaimer in the
     14           1.1       cgd  *    documentation and/or other materials provided with the distribution.
     15          1.77       agc  * 3. Neither the name of the University nor the names of its contributors
     16           1.1       cgd  *    may be used to endorse or promote products derived from this software
     17           1.1       cgd  *    without specific prior written permission.
     18           1.1       cgd  *
     19           1.1       cgd  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     20           1.1       cgd  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     21           1.1       cgd  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     22           1.1       cgd  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     23           1.1       cgd  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     24           1.1       cgd  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     25           1.1       cgd  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     26           1.1       cgd  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     27           1.1       cgd  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     28           1.1       cgd  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     29           1.1       cgd  * SUCH DAMAGE.
     30           1.1       cgd  *
     31          1.25      fvdl  *	@(#)kern_ktrace.c	8.5 (Berkeley) 5/14/95
     32           1.1       cgd  */
     33          1.55     lukem 
     34          1.55     lukem #include <sys/cdefs.h>
     35  1.88.2.1.4.1    bouyer __KERNEL_RCSID(0, "$NetBSD: kern_ktrace.c,v 1.88.2.1.4.1 2007/02/08 23:09:05 bouyer Exp $");
     36          1.29   thorpej 
     37          1.29   thorpej #include "opt_ktrace.h"
     38          1.62      manu #include "opt_compat_mach.h"
     39           1.1       cgd 
     40           1.7   mycroft #include <sys/param.h>
     41          1.13       cgd #include <sys/systm.h>
     42           1.7   mycroft #include <sys/proc.h>
     43           1.7   mycroft #include <sys/file.h>
     44           1.7   mycroft #include <sys/namei.h>
     45           1.7   mycroft #include <sys/vnode.h>
     46           1.7   mycroft #include <sys/ktrace.h>
     47           1.7   mycroft #include <sys/malloc.h>
     48           1.7   mycroft #include <sys/syslog.h>
     49          1.28  christos #include <sys/filedesc.h>
     50          1.42  sommerfe #include <sys/ioctl.h>
     51           1.1       cgd 
     52          1.13       cgd #include <sys/mount.h>
     53          1.67   thorpej #include <sys/sa.h>
     54          1.13       cgd #include <sys/syscallargs.h>
     55          1.22  christos 
     56          1.51  jdolecek #ifdef KTRACE
     57          1.51  jdolecek 
/*
 * Prototypes for the routines shared between the trace-record writers
 * and the ktrace/fktrace system calls in this file.
 */
void	ktrinitheader(struct ktr_header *kth, struct proc *p, int type);
int	ktrwrite(struct proc *p, struct ktr_header *kth);
int	ktrace_common(struct proc *curp, int ops, int facs, int pid,
	    struct file *fp);
int	ktrops(struct proc *curp, struct proc *p, int ops, int facs,
	    struct file *fp);
int	ktrsetchildren(struct proc *curp, struct proc *top, int ops,
	    int facs, struct file *fp);
int	ktrcanset(struct proc *callp, struct proc *targetp);
int	ktrsamefile(struct file *f1, struct file *f2);
     66          1.44  sommerfe 
     67          1.44  sommerfe /*
     68          1.44  sommerfe  * "deep" compare of two files for the purposes of clearing a trace.
     69          1.44  sommerfe  * Returns true if they're the same open file, or if they point at the
     70          1.44  sommerfe  * same underlying vnode/socket.
     71          1.44  sommerfe  */
     72          1.44  sommerfe 
     73          1.44  sommerfe int
     74      1.88.2.1        he ktrsamefile(struct file *f1, struct file *f2)
     75          1.44  sommerfe {
     76          1.88     enami 
     77          1.44  sommerfe 	return ((f1 == f2) ||
     78          1.45  sommerfe 	    ((f1 != NULL) && (f2 != NULL) &&
     79          1.45  sommerfe 		(f1->f_type == f2->f_type) &&
     80          1.44  sommerfe 		(f1->f_data == f2->f_data)));
     81          1.44  sommerfe }
     82          1.22  christos 
     83          1.28  christos void
     84      1.88.2.1        he ktrderef(struct proc *p)
     85          1.28  christos {
     86          1.42  sommerfe 	struct file *fp = p->p_tracep;
     87          1.42  sommerfe 	p->p_traceflag = 0;
     88          1.42  sommerfe 	if (fp == NULL)
     89          1.28  christos 		return;
     90          1.84       dsl 	p->p_tracep = NULL;
     91          1.84       dsl 
     92          1.68        pk 	simple_lock(&fp->f_slock);
     93          1.42  sommerfe 	FILE_USE(fp);
     94          1.59  jdolecek 
     95          1.59  jdolecek 	/*
     96          1.59  jdolecek 	 * ktrace file descriptor can't be watched (are not visible to
     97          1.59  jdolecek 	 * userspace), so no kqueue stuff here
     98          1.59  jdolecek 	 */
     99          1.42  sommerfe 	closef(fp, NULL);
    100          1.28  christos }
    101          1.28  christos 
    102          1.28  christos void
    103      1.88.2.1        he ktradref(struct proc *p)
    104          1.28  christos {
    105          1.42  sommerfe 	struct file *fp = p->p_tracep;
    106          1.28  christos 
    107          1.42  sommerfe 	fp->f_count++;
    108          1.28  christos }
    109          1.28  christos 
    110          1.39   thorpej void
    111      1.88.2.1        he ktrinitheader(struct ktr_header *kth, struct proc *p, int type)
    112           1.1       cgd {
    113           1.1       cgd 
    114      1.88.2.1        he 	(void)memset(kth, 0, sizeof(*kth));
    115           1.1       cgd 	kth->ktr_type = type;
    116           1.1       cgd 	microtime(&kth->ktr_time);
    117           1.1       cgd 	kth->ktr_pid = p->p_pid;
    118          1.32     perry 	memcpy(kth->ktr_comm, p->p_comm, MAXCOMLEN);
    119           1.1       cgd }
    120           1.1       cgd 
    121      1.88.2.1        he int
    122      1.88.2.1        he ktrsyscall(struct proc *p, register_t code, register_t realcode,
    123      1.88.2.1        he     const struct sysent *callp, register_t args[])
    124           1.1       cgd {
    125          1.74      fvdl 	struct ktr_header kth;
    126          1.72   darrenr 	struct ktr_syscall *ktp;
    127          1.17       cgd 	register_t *argp;
    128      1.88.2.1        he 	int argsize, error;
    129          1.57      fvdl 	size_t len;
    130          1.60   thorpej 	u_int i;
    131          1.57      fvdl 
    132          1.66      manu 	if (callp == NULL)
    133          1.66      manu 		callp = p->p_emul->e_sysent;
    134          1.88     enami 
    135          1.76  drochner 	argsize = callp[code].sy_argsize;
    136          1.86       mrg #ifdef _LP64
    137          1.86       mrg 	if (p->p_flag & P_32)
    138          1.86       mrg 		argsize = argsize << 1;
    139          1.86       mrg #endif
    140          1.57      fvdl 	len = sizeof(struct ktr_syscall) + argsize;
    141           1.1       cgd 
    142           1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    143          1.74      fvdl 	ktrinitheader(&kth, p, KTR_SYSCALL);
    144          1.39   thorpej 	ktp = malloc(len, M_TEMP, M_WAITOK);
    145          1.61      manu 	ktp->ktr_code = realcode;
    146          1.17       cgd 	ktp->ktr_argsize = argsize;
    147          1.17       cgd 	argp = (register_t *)((char *)ktp + sizeof(struct ktr_syscall));
    148          1.31     perry 	for (i = 0; i < (argsize / sizeof(*argp)); i++)
    149           1.1       cgd 		*argp++ = args[i];
    150          1.39   thorpej 	kth.ktr_buf = (caddr_t)ktp;
    151          1.39   thorpej 	kth.ktr_len = len;
    152      1.88.2.1        he 	error = ktrwrite(p, &kth);
    153          1.39   thorpej 	free(ktp, M_TEMP);
    154           1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    155      1.88.2.1        he 	return error;
    156           1.1       cgd }
    157           1.1       cgd 
    158      1.88.2.1        he int
    159      1.88.2.1        he ktrsysret(struct proc *p, register_t code, int error, register_t *retval)
    160           1.1       cgd {
    161          1.39   thorpej 	struct ktr_header kth;
    162           1.1       cgd 	struct ktr_sysret ktp;
    163           1.1       cgd 
    164           1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    165          1.74      fvdl 	ktrinitheader(&kth, p, KTR_SYSRET);
    166           1.1       cgd 	ktp.ktr_code = code;
    167          1.34    kleink 	ktp.ktr_eosys = 0;			/* XXX unused */
    168           1.1       cgd 	ktp.ktr_error = error;
    169          1.71       dsl 	ktp.ktr_retval = retval ? retval[0] : 0;
    170          1.71       dsl 	ktp.ktr_retval_1 = retval ? retval[1] : 0;
    171           1.1       cgd 
    172          1.39   thorpej 	kth.ktr_buf = (caddr_t)&ktp;
    173          1.39   thorpej 	kth.ktr_len = sizeof(struct ktr_sysret);
    174           1.1       cgd 
    175      1.88.2.1        he 	error = ktrwrite(p, &kth);
    176           1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    177      1.88.2.1        he 	return error;
    178           1.1       cgd }
    179           1.1       cgd 
    180      1.88.2.1        he int
    181      1.88.2.1        he ktrnamei(struct proc *p, char *path)
    182           1.1       cgd {
    183          1.39   thorpej 	struct ktr_header kth;
    184      1.88.2.1        he 	int error;
    185           1.1       cgd 
    186           1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    187          1.74      fvdl 	ktrinitheader(&kth, p, KTR_NAMEI);
    188          1.39   thorpej 	kth.ktr_len = strlen(path);
    189          1.39   thorpej 	kth.ktr_buf = path;
    190          1.18  christos 
    191      1.88.2.1        he 	error = ktrwrite(p, &kth);
    192          1.18  christos 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    193      1.88.2.1        he 	return error;
    194          1.18  christos }
    195          1.18  christos 
    196      1.88.2.1        he int
    197      1.88.2.1        he ktremul(struct proc *p)
    198          1.18  christos {
    199          1.39   thorpej 	struct ktr_header kth;
    200          1.74      fvdl 	const char *emul = p->p_emul->e_name;
    201      1.88.2.1        he 	int error;
    202          1.18  christos 
    203          1.18  christos 	p->p_traceflag |= KTRFAC_ACTIVE;
    204          1.74      fvdl 	ktrinitheader(&kth, p, KTR_EMUL);
    205          1.39   thorpej 	kth.ktr_len = strlen(emul);
    206          1.50       scw 	kth.ktr_buf = (caddr_t)emul;
    207           1.1       cgd 
    208      1.88.2.1        he 	error = ktrwrite(p, &kth);
    209           1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    210      1.88.2.1        he 	return error;
    211           1.1       cgd }
    212           1.1       cgd 
    213      1.88.2.1        he int
    214          1.75       dsl ktrkmem(struct proc *p, int ktr, const void *buf, size_t len)
    215          1.75       dsl {
    216          1.75       dsl 	struct ktr_header kth;
    217      1.88.2.1        he 	int error;
    218          1.75       dsl 
    219          1.75       dsl 	p->p_traceflag |= KTRFAC_ACTIVE;
    220          1.75       dsl 	ktrinitheader(&kth, p, ktr);
    221          1.75       dsl 	kth.ktr_len = len;
    222          1.75       dsl 	kth.ktr_buf = buf;
    223          1.75       dsl 
    224      1.88.2.1        he 	error = ktrwrite(p, &kth);
    225          1.75       dsl 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    226      1.88.2.1        he 	return error;
    227          1.75       dsl }
    228          1.75       dsl 
    229      1.88.2.1        he int
    230      1.88.2.1        he ktrgenio(struct proc *p, int fd, enum uio_rw rw, struct iovec *iov,
    231      1.88.2.1        he     int len, int error)
    232           1.1       cgd {
    233          1.39   thorpej 	struct ktr_header kth;
    234          1.28  christos 	struct ktr_genio *ktp;
    235          1.74      fvdl 	caddr_t cp;
    236          1.72   darrenr 	int resid = len, cnt;
    237          1.39   thorpej 	int buflen;
    238          1.39   thorpej 
    239           1.1       cgd 	if (error)
    240      1.88.2.1        he 		return error;
    241          1.39   thorpej 
    242           1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    243          1.39   thorpej 
    244          1.39   thorpej 	buflen = min(PAGE_SIZE, len + sizeof(struct ktr_genio));
    245          1.39   thorpej 
    246          1.74      fvdl 	ktrinitheader(&kth, p, KTR_GENIO);
    247          1.39   thorpej 	ktp = malloc(buflen, M_TEMP, M_WAITOK);
    248           1.1       cgd 	ktp->ktr_fd = fd;
    249           1.1       cgd 	ktp->ktr_rw = rw;
    250          1.39   thorpej 
    251          1.39   thorpej 	kth.ktr_buf = (caddr_t)ktp;
    252          1.39   thorpej 
    253          1.31     perry 	cp = (caddr_t)((char *)ktp + sizeof(struct ktr_genio));
    254          1.39   thorpej 	buflen -= sizeof(struct ktr_genio);
    255          1.39   thorpej 
    256           1.1       cgd 	while (resid > 0) {
    257          1.67   thorpej #if 0 /* XXX NJWLWP */
    258          1.46   thorpej 		KDASSERT(p->p_cpu != NULL);
    259          1.46   thorpej 		KDASSERT(p->p_cpu == curcpu());
    260          1.67   thorpej #endif
    261          1.67   thorpej 		/* XXX NJWLWP */
    262          1.67   thorpej 		if (curcpu()->ci_schedstate.spc_flags & SPCF_SHOULDYIELD)
    263          1.67   thorpej 			preempt(1);
    264          1.39   thorpej 
    265          1.39   thorpej 		cnt = min(iov->iov_len, buflen);
    266          1.39   thorpej 		if (cnt > resid)
    267           1.1       cgd 			cnt = resid;
    268      1.88.2.1        he 		if ((error = copyin(iov->iov_base, cp, cnt)) != 0)
    269          1.39   thorpej 			break;
    270          1.39   thorpej 
    271          1.39   thorpej 		kth.ktr_len = cnt + sizeof(struct ktr_genio);
    272          1.39   thorpej 
    273      1.88.2.1        he 		error = ktrwrite(p, &kth);
    274      1.88.2.1        he 		if (__predict_false(error != 0))
    275          1.39   thorpej 			break;
    276          1.39   thorpej 
    277          1.39   thorpej 		iov->iov_base = (caddr_t)iov->iov_base + cnt;
    278          1.39   thorpej 		iov->iov_len -= cnt;
    279          1.39   thorpej 
    280          1.39   thorpej 		if (iov->iov_len == 0)
    281          1.39   thorpej 			iov++;
    282          1.39   thorpej 
    283           1.1       cgd 		resid -= cnt;
    284           1.1       cgd 	}
    285           1.1       cgd 
    286          1.39   thorpej 	free(ktp, M_TEMP);
    287           1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    288      1.88.2.1        he 	return error;
    289           1.1       cgd }
    290           1.1       cgd 
    291      1.88.2.1        he int
    292      1.88.2.1        he ktrpsig(struct proc *p, int sig, sig_t action, const sigset_t *mask,
    293      1.88.2.1        he     const ksiginfo_t *ksi)
    294           1.1       cgd {
    295      1.88.2.1        he 	int error;
    296      1.88.2.1        he 
    297          1.39   thorpej 	struct ktr_header kth;
    298          1.78  christos 	struct {
    299          1.78  christos 		struct ktr_psig	kp;
    300          1.78  christos 		siginfo_t	si;
    301          1.78  christos 	} kbuf;
    302           1.1       cgd 
    303           1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    304          1.74      fvdl 	ktrinitheader(&kth, p, KTR_PSIG);
    305          1.78  christos 	kbuf.kp.signo = (char)sig;
    306          1.78  christos 	kbuf.kp.action = action;
    307          1.78  christos 	kbuf.kp.mask = *mask;
    308          1.78  christos 	kth.ktr_buf = (caddr_t)&kbuf;
    309          1.78  christos 	if (ksi) {
    310          1.80   thorpej 		kbuf.kp.code = KSI_TRAPCODE(ksi);
    311          1.78  christos 		(void)memset(&kbuf.si, 0, sizeof(kbuf.si));
    312          1.80   thorpej 		kbuf.si._info = ksi->ksi_info;
    313          1.78  christos 		kth.ktr_len = sizeof(kbuf);
    314          1.78  christos 	} else {
    315          1.78  christos 		kbuf.kp.code = 0;
    316          1.78  christos 		kth.ktr_len = sizeof(struct ktr_psig);
    317          1.78  christos 	}
    318      1.88.2.1        he 	error = ktrwrite(p, &kth);
    319           1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    320      1.88.2.1        he 	return error;
    321           1.9       cgd }
    322           1.9       cgd 
    323      1.88.2.1        he int
    324      1.88.2.1        he ktrcsw(struct proc *p, int out, int user)
    325           1.9       cgd {
    326          1.39   thorpej 	struct ktr_header kth;
    327          1.39   thorpej 	struct ktr_csw kc;
    328      1.88.2.1        he 	int error;
    329           1.9       cgd 
    330           1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    331          1.74      fvdl 	ktrinitheader(&kth, p, KTR_CSW);
    332           1.9       cgd 	kc.out = out;
    333           1.9       cgd 	kc.user = user;
    334          1.39   thorpej 	kth.ktr_buf = (caddr_t)&kc;
    335          1.39   thorpej 	kth.ktr_len = sizeof(struct ktr_csw);
    336           1.9       cgd 
    337      1.88.2.1        he 	error = ktrwrite(p, &kth);
    338           1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    339      1.88.2.1        he 	return error;
    340           1.1       cgd }
    341           1.1       cgd 
    342      1.88.2.1        he int
    343      1.88.2.1        he ktruser(struct proc *p, const char *id, void *addr, size_t len, int ustr)
    344          1.51  jdolecek {
    345          1.51  jdolecek 	struct ktr_header kth;
    346          1.51  jdolecek 	struct ktr_user *ktp;
    347          1.51  jdolecek 	caddr_t user_dta;
    348      1.88.2.1        he 	int error;
    349          1.51  jdolecek 
    350  1.88.2.1.4.1    bouyer 	if (len > KTR_USER_MAXLEN)
    351  1.88.2.1.4.1    bouyer 		return ENOSPC;
    352  1.88.2.1.4.1    bouyer 
    353          1.51  jdolecek 	p->p_traceflag |= KTRFAC_ACTIVE;
    354          1.74      fvdl 	ktrinitheader(&kth, p, KTR_USER);
    355          1.51  jdolecek 	ktp = malloc(sizeof(struct ktr_user) + len, M_TEMP, M_WAITOK);
    356          1.51  jdolecek 	if (ustr) {
    357          1.51  jdolecek 		if (copyinstr(id, ktp->ktr_id, KTR_USER_MAXIDLEN, NULL) != 0)
    358          1.51  jdolecek 			ktp->ktr_id[0] = '\0';
    359          1.51  jdolecek 	} else
    360          1.51  jdolecek 		strncpy(ktp->ktr_id, id, KTR_USER_MAXIDLEN);
    361          1.51  jdolecek 	ktp->ktr_id[KTR_USER_MAXIDLEN-1] = '\0';
    362          1.51  jdolecek 
    363          1.51  jdolecek 	user_dta = (caddr_t) ((char *)ktp + sizeof(struct ktr_user));
    364  1.88.2.1.4.1    bouyer 	if ((error = copyin(addr, (void *)user_dta, len)) != 0)
    365          1.51  jdolecek 		len = 0;
    366          1.51  jdolecek 
    367          1.51  jdolecek 	kth.ktr_buf = (void *)ktp;
    368          1.51  jdolecek 	kth.ktr_len = sizeof(struct ktr_user) + len;
    369      1.88.2.1        he 	error = ktrwrite(p, &kth);
    370          1.51  jdolecek 
    371          1.51  jdolecek 	free(ktp, M_TEMP);
    372          1.51  jdolecek 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    373      1.88.2.1        he 	return error;
    374          1.51  jdolecek 
    375          1.51  jdolecek }
    376          1.51  jdolecek 
    377      1.88.2.1        he int
    378      1.88.2.1        he ktrmmsg(struct proc *p, const void *msgh, size_t size)
    379          1.62      manu {
    380          1.62      manu 	struct ktr_header kth;
    381          1.62      manu 	struct ktr_mmsg	*kp;
    382      1.88.2.1        he 	int error;
    383          1.88     enami 
    384          1.62      manu 	p->p_traceflag |= KTRFAC_ACTIVE;
    385          1.74      fvdl 	ktrinitheader(&kth, p, KTR_MMSG);
    386          1.88     enami 
    387          1.64      manu 	kp = (struct ktr_mmsg *)msgh;
    388          1.62      manu 	kth.ktr_buf = (caddr_t)kp;
    389          1.62      manu 	kth.ktr_len = size;
    390      1.88.2.1        he 	error = ktrwrite(p, &kth);
    391          1.62      manu 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    392      1.88.2.1        he 	return error;
    393          1.62      manu }
    394          1.83      manu 
    395      1.88.2.1        he int
    396      1.88.2.1        he ktrmool(struct proc *p, const void *kaddr, size_t size, const void *uaddr)
    397          1.83      manu {
    398          1.83      manu 	struct ktr_header kth;
    399          1.83      manu 	struct ktr_mool *kp;
    400          1.83      manu 	struct ktr_mool *buf;
    401      1.88.2.1        he 	int error;
    402          1.83      manu 
    403          1.83      manu 	p->p_traceflag |= KTRFAC_ACTIVE;
    404          1.83      manu 	ktrinitheader(&kth, p, KTR_MOOL);
    405          1.83      manu 
    406          1.83      manu 	kp = malloc(size + sizeof(*kp), M_TEMP, M_WAITOK);
    407          1.83      manu 	kp->uaddr = uaddr;
    408          1.83      manu 	kp->size = size;
    409          1.83      manu 	buf = kp + 1; /* Skip uaddr and size */
    410      1.88.2.1        he 	(void)memcpy(buf, kaddr, size);
    411          1.88     enami 
    412          1.83      manu 	kth.ktr_buf = (caddr_t)kp;
    413          1.83      manu 	kth.ktr_len = size + sizeof(*kp);
    414      1.88.2.1        he 	error = ktrwrite(p, &kth);
    415          1.83      manu 	free(kp, M_TEMP);
    416          1.83      manu 
    417          1.83      manu 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    418      1.88.2.1        he 	return error;
    419          1.83      manu }
    420          1.83      manu 
    421          1.62      manu 
    422           1.1       cgd /* Interface and common routines */
    423           1.1       cgd 
    424          1.17       cgd int
    425      1.88.2.1        he ktrace_common(struct proc *curp, int ops, int facs, int pid, struct file *fp)
    426          1.28  christos {
    427          1.74      fvdl 	int ret = 0;
    428          1.72   darrenr 	int error = 0;
    429          1.42  sommerfe 	int one = 1;
    430          1.42  sommerfe 	int descend;
    431          1.74      fvdl 	struct proc *p;
    432          1.74      fvdl 	struct pgrp *pg;
    433          1.28  christos 
    434          1.28  christos 	curp->p_traceflag |= KTRFAC_ACTIVE;
    435          1.42  sommerfe 	descend = ops & KTRFLAG_DESCEND;
    436          1.42  sommerfe 	facs = facs & ~((unsigned) KTRFAC_ROOT);
    437          1.28  christos 
    438          1.28  christos 	/*
    439          1.28  christos 	 * Clear all uses of the tracefile
    440          1.28  christos 	 */
    441          1.28  christos 	if (KTROP(ops) == KTROP_CLEARFILE) {
    442          1.37   thorpej 		proclist_lock_read();
    443          1.81  jdolecek 		LIST_FOREACH(p, &allproc, p_list) {
    444          1.44  sommerfe 			if (ktrsamefile(p->p_tracep, fp)) {
    445          1.28  christos 				if (ktrcanset(curp, p))
    446          1.28  christos 					ktrderef(p);
    447          1.28  christos 				else
    448          1.28  christos 					error = EPERM;
    449          1.28  christos 			}
    450          1.28  christos 		}
    451          1.36   thorpej 		proclist_unlock_read();
    452          1.28  christos 		goto done;
    453          1.28  christos 	}
    454          1.42  sommerfe 
    455          1.42  sommerfe 	/*
    456          1.42  sommerfe 	 * Mark fp non-blocking, to avoid problems from possible deadlocks.
    457          1.42  sommerfe 	 */
    458          1.42  sommerfe 
    459          1.43  sommerfe 	if (fp != NULL) {
    460          1.43  sommerfe 		fp->f_flag |= FNONBLOCK;
    461          1.74      fvdl 		(*fp->f_ops->fo_ioctl)(fp, FIONBIO, (caddr_t)&one, curp);
    462          1.43  sommerfe 	}
    463          1.88     enami 
    464          1.28  christos 	/*
    465          1.28  christos 	 * need something to (un)trace (XXX - why is this here?)
    466          1.28  christos 	 */
    467          1.28  christos 	if (!facs) {
    468          1.28  christos 		error = EINVAL;
    469          1.28  christos 		goto done;
    470          1.28  christos 	}
    471          1.88     enami 	/*
    472          1.28  christos 	 * do it
    473          1.28  christos 	 */
    474          1.42  sommerfe 	if (pid < 0) {
    475          1.28  christos 		/*
    476          1.28  christos 		 * by process group
    477          1.28  christos 		 */
    478          1.82       dsl 		pg = pg_find(-pid, PFIND_UNLOCK_FAIL);
    479          1.28  christos 		if (pg == NULL) {
    480          1.28  christos 			error = ESRCH;
    481          1.28  christos 			goto done;
    482          1.28  christos 		}
    483          1.81  jdolecek 		LIST_FOREACH(p, &pg->pg_members, p_pglist) {
    484          1.28  christos 			if (descend)
    485          1.74      fvdl 				ret |= ktrsetchildren(curp, p, ops, facs, fp);
    486          1.88     enami 			else
    487          1.74      fvdl 				ret |= ktrops(curp, p, ops, facs, fp);
    488          1.39   thorpej 		}
    489          1.88     enami 
    490          1.28  christos 	} else {
    491          1.28  christos 		/*
    492          1.28  christos 		 * by pid
    493          1.28  christos 		 */
    494          1.82       dsl 		p = p_find(pid, PFIND_UNLOCK_FAIL);
    495          1.28  christos 		if (p == NULL) {
    496          1.28  christos 			error = ESRCH;
    497          1.28  christos 			goto done;
    498          1.28  christos 		}
    499          1.28  christos 		if (descend)
    500          1.74      fvdl 			ret |= ktrsetchildren(curp, p, ops, facs, fp);
    501          1.28  christos 		else
    502          1.74      fvdl 			ret |= ktrops(curp, p, ops, facs, fp);
    503          1.28  christos 	}
    504          1.82       dsl 	proclist_unlock_read();	/* taken by p{g}_find */
    505          1.28  christos 	if (!ret)
    506          1.28  christos 		error = EPERM;
    507          1.28  christos done:
    508          1.28  christos 	curp->p_traceflag &= ~KTRFAC_ACTIVE;
    509          1.28  christos 	return (error);
    510          1.28  christos }
    511          1.28  christos 
    512          1.28  christos /*
    513          1.28  christos  * ktrace system call
    514          1.28  christos  */
    515          1.28  christos /* ARGSUSED */
    516          1.28  christos int
    517      1.88.2.1        he sys_fktrace(struct lwp *l, void *v, register_t *retval)
    518          1.42  sommerfe {
    519          1.42  sommerfe 	struct sys_fktrace_args /* {
    520          1.42  sommerfe 		syscallarg(int) fd;
    521          1.42  sommerfe 		syscallarg(int) ops;
    522          1.42  sommerfe 		syscallarg(int) facs;
    523          1.42  sommerfe 		syscallarg(int) pid;
    524          1.42  sommerfe 	} */ *uap = v;
    525          1.74      fvdl 	struct proc *curp = l->l_proc;
    526          1.42  sommerfe 	struct file *fp = NULL;
    527          1.74      fvdl 	struct filedesc *fdp = curp->p_fd;
    528          1.70      yamt 	int error;
    529          1.42  sommerfe 
    530          1.54   thorpej 	if ((fp = fd_getfile(fdp, SCARG(uap, fd))) == NULL)
    531          1.54   thorpej 		return (EBADF);
    532          1.54   thorpej 
    533          1.70      yamt 	FILE_USE(fp);
    534          1.70      yamt 
    535          1.54   thorpej 	if ((fp->f_flag & FWRITE) == 0)
    536          1.70      yamt 		error = EBADF;
    537          1.70      yamt 	else
    538          1.74      fvdl 		error = ktrace_common(curp, SCARG(uap, ops),
    539          1.70      yamt 		    SCARG(uap, facs), SCARG(uap, pid), fp);
    540          1.70      yamt 
    541          1.74      fvdl 	FILE_UNUSE(fp, curp);
    542          1.42  sommerfe 
    543          1.70      yamt 	return error;
    544          1.42  sommerfe }
    545          1.42  sommerfe 
    546          1.42  sommerfe /*
    547          1.42  sommerfe  * ktrace system call
    548          1.42  sommerfe  */
    549          1.42  sommerfe /* ARGSUSED */
    550          1.42  sommerfe int
    551      1.88.2.1        he sys_ktrace(struct lwp *l, void *v, register_t *retval)
    552          1.19   thorpej {
    553          1.28  christos 	struct sys_ktrace_args /* {
    554          1.24   mycroft 		syscallarg(const char *) fname;
    555          1.13       cgd 		syscallarg(int) ops;
    556          1.13       cgd 		syscallarg(int) facs;
    557          1.13       cgd 		syscallarg(int) pid;
    558          1.19   thorpej 	} */ *uap = v;
    559          1.67   thorpej 	struct proc *curp = l->l_proc;
    560          1.28  christos 	struct vnode *vp = NULL;
    561          1.42  sommerfe 	struct file *fp = NULL;
    562          1.74      fvdl 	int fd;
    563          1.42  sommerfe 	int ops = SCARG(uap, ops);
    564          1.74      fvdl 	int error = 0;
    565          1.72   darrenr 	struct nameidata nd;
    566           1.1       cgd 
    567          1.42  sommerfe 	ops = KTROP(ops) | (ops & KTRFLAG_DESCEND);
    568          1.42  sommerfe 
    569           1.9       cgd 	curp->p_traceflag |= KTRFAC_ACTIVE;
    570          1.69  christos 	if ((ops & KTROP_CLEAR) == 0) {
    571           1.1       cgd 		/*
    572           1.1       cgd 		 * an operation which requires a file argument.
    573           1.1       cgd 		 */
    574          1.13       cgd 		NDINIT(&nd, LOOKUP, FOLLOW, UIO_USERSPACE, SCARG(uap, fname),
    575          1.74      fvdl 		    curp);
    576          1.22  christos 		if ((error = vn_open(&nd, FREAD|FWRITE, 0)) != 0) {
    577           1.9       cgd 			curp->p_traceflag &= ~KTRFAC_ACTIVE;
    578           1.1       cgd 			return (error);
    579           1.9       cgd 		}
    580           1.1       cgd 		vp = nd.ni_vp;
    581          1.25      fvdl 		VOP_UNLOCK(vp, 0);
    582           1.1       cgd 		if (vp->v_type != VREG) {
    583          1.74      fvdl 			(void) vn_close(vp, FREAD|FWRITE, curp->p_ucred, curp);
    584           1.9       cgd 			curp->p_traceflag &= ~KTRFAC_ACTIVE;
    585           1.1       cgd 			return (EACCES);
    586           1.1       cgd 		}
    587           1.1       cgd 		/*
    588          1.42  sommerfe 		 * XXX This uses up a file descriptor slot in the
    589          1.42  sommerfe 		 * tracing process for the duration of this syscall.
    590          1.42  sommerfe 		 * This is not expected to be a problem.  If
    591          1.42  sommerfe 		 * falloc(NULL, ...) DTRT we could skip that part, but
    592          1.42  sommerfe 		 * that would require changing its interface to allow
    593          1.42  sommerfe 		 * the caller to pass in a ucred..
    594          1.42  sommerfe 		 *
    595          1.88     enami 		 * This will FILE_USE the fp it returns, if any.
    596          1.42  sommerfe 		 * Keep it in use until we return.
    597           1.1       cgd 		 */
    598          1.42  sommerfe 		if ((error = falloc(curp, &fp, &fd)) != 0)
    599           1.1       cgd 			goto done;
    600          1.88     enami 
    601          1.42  sommerfe 		fp->f_flag = FWRITE|FAPPEND;
    602          1.42  sommerfe 		fp->f_type = DTYPE_VNODE;
    603          1.42  sommerfe 		fp->f_ops = &vnops;
    604          1.42  sommerfe 		fp->f_data = (caddr_t)vp;
    605          1.54   thorpej 		FILE_SET_MATURE(fp);
    606          1.42  sommerfe 		vp = NULL;
    607          1.42  sommerfe 	}
    608          1.74      fvdl 	error = ktrace_common(curp, SCARG(uap, ops), SCARG(uap, facs),
    609          1.42  sommerfe 	    SCARG(uap, pid), fp);
    610          1.88     enami done:
    611           1.1       cgd 	if (vp != NULL)
    612          1.74      fvdl 		(void) vn_close(vp, FWRITE, curp->p_ucred, curp);
    613          1.42  sommerfe 	if (fp != NULL) {
    614          1.74      fvdl 		FILE_UNUSE(fp, curp);	/* release file */
    615          1.74      fvdl 		fdrelease(curp, fd); 	/* release fd table slot */
    616          1.42  sommerfe 	}
    617           1.1       cgd 	return (error);
    618           1.1       cgd }
    619           1.1       cgd 
    620           1.4    andrew int
    621      1.88.2.1        he ktrops(struct proc *curp, struct proc *p, int ops, int facs,
    622      1.88.2.1        he     struct file *fp)
    623           1.1       cgd {
    624           1.1       cgd 
    625           1.1       cgd 	if (!ktrcanset(curp, p))
    626           1.1       cgd 		return (0);
    627          1.28  christos 	if (KTROP(ops) == KTROP_SET) {
    628          1.88     enami 		if (p->p_tracep != fp) {
    629           1.1       cgd 			/*
    630           1.1       cgd 			 * if trace file already in use, relinquish
    631           1.1       cgd 			 */
    632          1.28  christos 			ktrderef(p);
    633          1.42  sommerfe 			p->p_tracep = fp;
    634          1.28  christos 			ktradref(p);
    635           1.1       cgd 		}
    636           1.1       cgd 		p->p_traceflag |= facs;
    637           1.1       cgd 		if (curp->p_ucred->cr_uid == 0)
    638           1.1       cgd 			p->p_traceflag |= KTRFAC_ROOT;
    639          1.88     enami 	} else {
    640           1.1       cgd 		/* KTROP_CLEAR */
    641           1.1       cgd 		if (((p->p_traceflag &= ~facs) & KTRFAC_MASK) == 0) {
    642           1.1       cgd 			/* no more tracing */
    643          1.28  christos 			ktrderef(p);
    644           1.1       cgd 		}
    645           1.1       cgd 	}
    646          1.21  christos 
    647          1.21  christos 	/*
    648          1.21  christos 	 * Emit an emulation record, every time there is a ktrace
    649          1.88     enami 	 * change/attach request.
    650          1.21  christos 	 */
    651          1.21  christos 	if (KTRPOINT(p, KTR_EMUL))
    652          1.84       dsl 		p->p_traceflag |= KTRFAC_TRC_EMUL;
    653          1.49    martin #ifdef __HAVE_SYSCALL_INTERN
    654          1.48   mycroft 	(*p->p_emul->e_syscall_intern)(p);
    655          1.49    martin #endif
    656           1.1       cgd 
    657           1.1       cgd 	return (1);
    658           1.1       cgd }
    659           1.1       cgd 
    660          1.22  christos int
    661      1.88.2.1        he ktrsetchildren(struct proc *curp, struct proc *top, int ops, int facs,
    662      1.88.2.1        he     struct file *fp)
    663           1.1       cgd {
    664          1.28  christos 	struct proc *p;
    665          1.28  christos 	int ret = 0;
    666           1.1       cgd 
    667           1.1       cgd 	p = top;
    668           1.1       cgd 	for (;;) {
    669          1.74      fvdl 		ret |= ktrops(curp, p, ops, facs, fp);
    670           1.1       cgd 		/*
    671           1.1       cgd 		 * If this process has children, descend to them next,
    672           1.1       cgd 		 * otherwise do any siblings, and if done with this level,
    673           1.1       cgd 		 * follow back up the tree (but not past top).
    674           1.1       cgd 		 */
    675          1.82       dsl 		if (LIST_FIRST(&p->p_children) != NULL) {
    676          1.39   thorpej 			p = LIST_FIRST(&p->p_children);
    677          1.82       dsl 			continue;
    678          1.82       dsl 		}
    679          1.82       dsl 		for (;;) {
    680           1.1       cgd 			if (p == top)
    681           1.1       cgd 				return (ret);
    682          1.39   thorpej 			if (LIST_NEXT(p, p_sibling) != NULL) {
    683          1.39   thorpej 				p = LIST_NEXT(p, p_sibling);
    684           1.1       cgd 				break;
    685           1.1       cgd 			}
    686          1.12   mycroft 			p = p->p_pptr;
    687           1.1       cgd 		}
    688           1.1       cgd 	}
    689           1.1       cgd 	/*NOTREACHED*/
    690           1.1       cgd }
    691           1.1       cgd 
    692          1.39   thorpej int
    693      1.88.2.1        he ktrwrite(struct proc *p, struct ktr_header *kth)
    694           1.1       cgd {
    695          1.74      fvdl 	struct uio auio;
    696           1.1       cgd 	struct iovec aiov[2];
    697          1.42  sommerfe 	int error, tries;
    698          1.74      fvdl 	struct file *fp = p->p_tracep;
    699           1.1       cgd 
    700          1.42  sommerfe 	if (fp == NULL)
    701          1.42  sommerfe 		return 0;
    702          1.88     enami 
    703          1.84       dsl 	if (p->p_traceflag & KTRFAC_TRC_EMUL) {
    704          1.84       dsl 		/* Add emulation trace before first entry for this process */
    705          1.84       dsl 		p->p_traceflag &= ~KTRFAC_TRC_EMUL;
    706      1.88.2.1        he 		if ((error = ktremul(p)) != 0)
    707      1.88.2.1        he 			return error;
    708          1.84       dsl 	}
    709          1.84       dsl 
    710           1.1       cgd 	auio.uio_iov = &aiov[0];
    711           1.1       cgd 	auio.uio_offset = 0;
    712           1.1       cgd 	auio.uio_segflg = UIO_SYSSPACE;
    713           1.1       cgd 	auio.uio_rw = UIO_WRITE;
    714           1.1       cgd 	aiov[0].iov_base = (caddr_t)kth;
    715           1.1       cgd 	aiov[0].iov_len = sizeof(struct ktr_header);
    716           1.1       cgd 	auio.uio_resid = sizeof(struct ktr_header);
    717           1.1       cgd 	auio.uio_iovcnt = 1;
    718          1.74      fvdl 	auio.uio_procp = (struct proc *)0;
    719           1.1       cgd 	if (kth->ktr_len > 0) {
    720           1.1       cgd 		auio.uio_iovcnt++;
    721          1.75       dsl 		aiov[1].iov_base = (void *)kth->ktr_buf;
    722           1.1       cgd 		aiov[1].iov_len = kth->ktr_len;
    723           1.1       cgd 		auio.uio_resid += kth->ktr_len;
    724           1.1       cgd 	}
    725          1.28  christos 
    726          1.68        pk 	simple_lock(&fp->f_slock);
    727          1.42  sommerfe 	FILE_USE(fp);
    728          1.42  sommerfe 
    729          1.42  sommerfe 	tries = 0;
    730          1.42  sommerfe 	do {
    731          1.30   thorpej 		error = (*fp->f_ops->fo_write)(fp, &fp->f_offset, &auio,
    732          1.30   thorpej 		    fp->f_cred, FOF_UPDATE_OFFSET);
    733          1.74      fvdl 		tries++;
    734          1.88     enami 		if (error == EWOULDBLOCK)
    735          1.88     enami 			preempt(1);
    736          1.42  sommerfe 	} while ((error == EWOULDBLOCK) && (tries < 3));
    737          1.42  sommerfe 	FILE_UNUSE(fp, NULL);
    738          1.28  christos 
    739          1.40   thorpej 	if (__predict_true(error == 0))
    740          1.39   thorpej 		return (0);
    741           1.1       cgd 	/*
    742          1.38   darrenr 	 * If error encountered, give up tracing on this vnode.  Don't report
    743          1.38   darrenr 	 * EPIPE as this can easily happen with fktrace()/ktruss.
    744           1.1       cgd 	 */
    745          1.38   darrenr 	if (error != EPIPE)
    746          1.38   darrenr 		log(LOG_NOTICE,
    747          1.38   darrenr 		    "ktrace write failed, errno %d, tracing stopped\n",
    748          1.38   darrenr 		    error);
    749          1.37   thorpej 	proclist_lock_read();
    750          1.81  jdolecek 	LIST_FOREACH(p, &allproc, p_list) {
    751          1.44  sommerfe 		if (ktrsamefile(p->p_tracep, fp))
    752          1.28  christos 			ktrderef(p);
    753           1.1       cgd 	}
    754          1.36   thorpej 	proclist_unlock_read();
    755          1.39   thorpej 
    756          1.39   thorpej 	return (error);
    757           1.1       cgd }
    758           1.1       cgd 
    759           1.1       cgd /*
    760           1.1       cgd  * Return true if caller has permission to set the ktracing state
    761           1.1       cgd  * of target.  Essentially, the target can't possess any
    762           1.1       cgd  * more permissions than the caller.  KTRFAC_ROOT signifies that
    763          1.88     enami  * root previously set the tracing status on the target process, and
    764           1.1       cgd  * so, only root may further change it.
    765           1.1       cgd  *
    766           1.1       cgd  * TODO: check groups.  use caller effective gid.
    767           1.1       cgd  */
    768          1.22  christos int
    769      1.88.2.1        he ktrcanset(struct proc *callp, struct proc *targetp)
    770           1.1       cgd {
    771          1.28  christos 	struct pcred *caller = callp->p_cred;
    772          1.28  christos 	struct pcred *target = targetp->p_cred;
    773           1.1       cgd 
    774           1.1       cgd 	if ((caller->pc_ucred->cr_uid == target->p_ruid &&
    775          1.88     enami 	    target->p_ruid == target->p_svuid &&
    776          1.88     enami 	    caller->p_rgid == target->p_rgid &&	/* XXX */
    777          1.88     enami 	    target->p_rgid == target->p_svgid &&
    778          1.88     enami 	    (targetp->p_traceflag & KTRFAC_ROOT) == 0 &&
    779          1.88     enami 	    (targetp->p_flag & P_SUGID) == 0) ||
    780          1.88     enami 	    caller->pc_ucred->cr_uid == 0)
    781           1.1       cgd 		return (1);
    782           1.1       cgd 
    783           1.1       cgd 	return (0);
    784           1.1       cgd }
    785          1.47   thorpej #endif /* KTRACE */
    786          1.51  jdolecek 
    787          1.51  jdolecek /*
    788          1.51  jdolecek  * Put user defined entry to ktrace records.
    789          1.51  jdolecek  */
    790          1.51  jdolecek int
    791      1.88.2.1        he sys_utrace(struct lwp *l, void *v, register_t *retval)
    792          1.51  jdolecek {
    793          1.51  jdolecek #ifdef KTRACE
    794          1.51  jdolecek 	struct sys_utrace_args /* {
    795          1.52  jdolecek 		syscallarg(const char *) label;
    796          1.51  jdolecek 		syscallarg(void *) addr;
    797          1.51  jdolecek 		syscallarg(size_t) len;
    798          1.51  jdolecek 	} */ *uap = v;
    799          1.67   thorpej 	struct proc *p = l->l_proc;
    800          1.88     enami 
    801          1.51  jdolecek 	if (!KTRPOINT(p, KTR_USER))
    802          1.51  jdolecek 		return (0);
    803          1.53  jdolecek 
    804  1.88.2.1.4.1    bouyer 	return ktruser(p, SCARG(uap, label), SCARG(uap, addr),
    805  1.88.2.1.4.1    bouyer 		SCARG(uap, len), 1);
    806          1.51  jdolecek 
    807          1.51  jdolecek #else /* !KTRACE */
    808          1.51  jdolecek 	return ENOSYS;
    809          1.51  jdolecek #endif /* KTRACE */
    810          1.51  jdolecek }
    811