Home | History | Annotate | Line # | Download | only in kern
kern_ktrace.c revision 1.86
      1  1.86       mrg /*	$NetBSD: kern_ktrace.c,v 1.86 2004/01/16 05:03:02 mrg Exp $	*/
      2  1.11       cgd 
      3   1.1       cgd /*
      4   1.9       cgd  * Copyright (c) 1989, 1993
      5   1.9       cgd  *	The Regents of the University of California.  All rights reserved.
      6   1.1       cgd  *
      7   1.1       cgd  * Redistribution and use in source and binary forms, with or without
      8   1.1       cgd  * modification, are permitted provided that the following conditions
      9   1.1       cgd  * are met:
     10   1.1       cgd  * 1. Redistributions of source code must retain the above copyright
     11   1.1       cgd  *    notice, this list of conditions and the following disclaimer.
     12   1.1       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     13   1.1       cgd  *    notice, this list of conditions and the following disclaimer in the
     14   1.1       cgd  *    documentation and/or other materials provided with the distribution.
     15  1.77       agc  * 3. Neither the name of the University nor the names of its contributors
     16   1.1       cgd  *    may be used to endorse or promote products derived from this software
     17   1.1       cgd  *    without specific prior written permission.
     18   1.1       cgd  *
     19   1.1       cgd  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     20   1.1       cgd  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     21   1.1       cgd  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     22   1.1       cgd  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     23   1.1       cgd  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     24   1.1       cgd  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     25   1.1       cgd  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     26   1.1       cgd  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     27   1.1       cgd  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     28   1.1       cgd  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     29   1.1       cgd  * SUCH DAMAGE.
     30   1.1       cgd  *
     31  1.25      fvdl  *	@(#)kern_ktrace.c	8.5 (Berkeley) 5/14/95
     32   1.1       cgd  */
     33  1.55     lukem 
     34  1.55     lukem #include <sys/cdefs.h>
     35  1.86       mrg __KERNEL_RCSID(0, "$NetBSD: kern_ktrace.c,v 1.86 2004/01/16 05:03:02 mrg Exp $");
     36  1.29   thorpej 
     37  1.29   thorpej #include "opt_ktrace.h"
     38  1.62      manu #include "opt_compat_mach.h"
     39   1.1       cgd 
     40   1.7   mycroft #include <sys/param.h>
     41  1.13       cgd #include <sys/systm.h>
     42   1.7   mycroft #include <sys/proc.h>
     43   1.7   mycroft #include <sys/file.h>
     44   1.7   mycroft #include <sys/namei.h>
     45   1.7   mycroft #include <sys/vnode.h>
     46   1.7   mycroft #include <sys/ktrace.h>
     47   1.7   mycroft #include <sys/malloc.h>
     48   1.7   mycroft #include <sys/syslog.h>
     49  1.28  christos #include <sys/filedesc.h>
     50  1.42  sommerfe #include <sys/ioctl.h>
     51   1.1       cgd 
     52  1.13       cgd #include <sys/mount.h>
     53  1.67   thorpej #include <sys/sa.h>
     54  1.13       cgd #include <sys/syscallargs.h>
     55  1.22  christos 
     56  1.51  jdolecek #ifdef KTRACE
     57  1.51  jdolecek 
     58  1.74      fvdl int	ktrace_common(struct proc *, int, int, int, struct file *);
     59  1.74      fvdl int	ktrops(struct proc *, struct proc *, int, int, struct file *);
     60  1.74      fvdl int	ktrsetchildren(struct proc *, struct proc *, int, int,
     61  1.47   thorpej 	    struct file *);
     62  1.47   thorpej int	ktrcanset(struct proc *, struct proc *);
     63  1.47   thorpej int	ktrsamefile(struct file *, struct file *);
     64  1.44  sommerfe 
     65  1.44  sommerfe /*
     66  1.44  sommerfe  * "deep" compare of two files for the purposes of clearing a trace.
     67  1.44  sommerfe  * Returns true if they're the same open file, or if they point at the
     68  1.44  sommerfe  * same underlying vnode/socket.
     69  1.44  sommerfe  */
     70  1.44  sommerfe 
     71  1.44  sommerfe int
     72  1.62      manu ktrsamefile(f1, f2)
     73  1.62      manu 	struct file *f1;
     74  1.62      manu 	struct file *f2;
     75  1.44  sommerfe {
     76  1.44  sommerfe 	return ((f1 == f2) ||
     77  1.45  sommerfe 	    ((f1 != NULL) && (f2 != NULL) &&
     78  1.45  sommerfe 		(f1->f_type == f2->f_type) &&
     79  1.44  sommerfe 		(f1->f_data == f2->f_data)));
     80  1.44  sommerfe }
     81  1.22  christos 
     82  1.28  christos void
     83  1.62      manu ktrderef(p)
     84  1.62      manu 	struct proc *p;
     85  1.28  christos {
     86  1.42  sommerfe 	struct file *fp = p->p_tracep;
     87  1.42  sommerfe 	p->p_traceflag = 0;
     88  1.42  sommerfe 	if (fp == NULL)
     89  1.28  christos 		return;
     90  1.84       dsl 	p->p_tracep = NULL;
     91  1.84       dsl 
     92  1.68        pk 	simple_lock(&fp->f_slock);
     93  1.42  sommerfe 	FILE_USE(fp);
     94  1.59  jdolecek 
     95  1.59  jdolecek 	/*
     96  1.59  jdolecek 	 * ktrace file descriptor can't be watched (are not visible to
     97  1.59  jdolecek 	 * userspace), so no kqueue stuff here
     98  1.59  jdolecek 	 */
     99  1.42  sommerfe 	closef(fp, NULL);
    100  1.28  christos }
    101  1.28  christos 
    102  1.28  christos void
    103  1.62      manu ktradref(p)
    104  1.62      manu 	struct proc *p;
    105  1.28  christos {
    106  1.42  sommerfe 	struct file *fp = p->p_tracep;
    107  1.28  christos 
    108  1.42  sommerfe 	fp->f_count++;
    109  1.28  christos }
    110  1.28  christos 
    111  1.39   thorpej void
    112  1.74      fvdl ktrinitheader(kth, p, type)
    113  1.62      manu 	struct ktr_header *kth;
    114  1.74      fvdl 	struct proc *p;
    115  1.62      manu 	int type;
    116   1.1       cgd {
    117   1.1       cgd 
    118  1.39   thorpej 	memset(kth, 0, sizeof(*kth));
    119   1.1       cgd 	kth->ktr_type = type;
    120   1.1       cgd 	microtime(&kth->ktr_time);
    121   1.1       cgd 	kth->ktr_pid = p->p_pid;
    122  1.32     perry 	memcpy(kth->ktr_comm, p->p_comm, MAXCOMLEN);
    123   1.1       cgd }
    124   1.1       cgd 
    125  1.17       cgd void
    126  1.74      fvdl ktrsyscall(p, code, realcode, callp, args)
    127  1.74      fvdl 	struct proc *p;
    128  1.62      manu 	register_t code;
    129  1.62      manu 	register_t realcode;
    130  1.66      manu 	const struct sysent *callp;
    131  1.62      manu 	register_t args[];
    132   1.1       cgd {
    133  1.74      fvdl 	struct ktr_header kth;
    134  1.72   darrenr 	struct ktr_syscall *ktp;
    135  1.17       cgd 	register_t *argp;
    136  1.57      fvdl 	int argsize;
    137  1.57      fvdl 	size_t len;
    138  1.60   thorpej 	u_int i;
    139  1.57      fvdl 
    140  1.66      manu 	if (callp == NULL)
    141  1.66      manu 		callp = p->p_emul->e_sysent;
    142  1.66      manu 
    143  1.76  drochner 	argsize = callp[code].sy_argsize;
    144  1.86       mrg #ifdef _LP64
    145  1.86       mrg 	if (p->p_flag & P_32)
    146  1.86       mrg 		argsize = argsize << 1;
    147  1.86       mrg #endif
    148  1.57      fvdl 	len = sizeof(struct ktr_syscall) + argsize;
    149   1.1       cgd 
    150   1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    151  1.74      fvdl 	ktrinitheader(&kth, p, KTR_SYSCALL);
    152  1.39   thorpej 	ktp = malloc(len, M_TEMP, M_WAITOK);
    153  1.61      manu 	ktp->ktr_code = realcode;
    154  1.17       cgd 	ktp->ktr_argsize = argsize;
    155  1.17       cgd 	argp = (register_t *)((char *)ktp + sizeof(struct ktr_syscall));
    156  1.31     perry 	for (i = 0; i < (argsize / sizeof(*argp)); i++)
    157   1.1       cgd 		*argp++ = args[i];
    158  1.39   thorpej 	kth.ktr_buf = (caddr_t)ktp;
    159  1.39   thorpej 	kth.ktr_len = len;
    160  1.74      fvdl 	(void) ktrwrite(p, &kth);
    161  1.39   thorpej 	free(ktp, M_TEMP);
    162   1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    163   1.1       cgd }
    164   1.1       cgd 
    165  1.17       cgd void
    166  1.74      fvdl ktrsysret(p, code, error, retval)
    167  1.74      fvdl 	struct proc *p;
    168  1.62      manu 	register_t code;
    169  1.62      manu 	int error;
    170  1.71       dsl 	register_t *retval;
    171   1.1       cgd {
    172  1.39   thorpej 	struct ktr_header kth;
    173   1.1       cgd 	struct ktr_sysret ktp;
    174   1.1       cgd 
    175   1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    176  1.74      fvdl 	ktrinitheader(&kth, p, KTR_SYSRET);
    177   1.1       cgd 	ktp.ktr_code = code;
    178  1.34    kleink 	ktp.ktr_eosys = 0;			/* XXX unused */
    179   1.1       cgd 	ktp.ktr_error = error;
    180  1.71       dsl 	ktp.ktr_retval = retval ? retval[0] : 0;
    181  1.71       dsl 	ktp.ktr_retval_1 = retval ? retval[1] : 0;
    182   1.1       cgd 
    183  1.39   thorpej 	kth.ktr_buf = (caddr_t)&ktp;
    184  1.39   thorpej 	kth.ktr_len = sizeof(struct ktr_sysret);
    185   1.1       cgd 
    186  1.74      fvdl 	(void) ktrwrite(p, &kth);
    187   1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    188   1.1       cgd }
    189   1.1       cgd 
    190  1.17       cgd void
    191  1.74      fvdl ktrnamei(p, path)
    192  1.74      fvdl 	struct proc *p;
    193  1.62      manu 	char *path;
    194   1.1       cgd {
    195  1.39   thorpej 	struct ktr_header kth;
    196   1.1       cgd 
    197   1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    198  1.74      fvdl 	ktrinitheader(&kth, p, KTR_NAMEI);
    199  1.39   thorpej 	kth.ktr_len = strlen(path);
    200  1.39   thorpej 	kth.ktr_buf = path;
    201  1.18  christos 
    202  1.74      fvdl 	(void) ktrwrite(p, &kth);
    203  1.18  christos 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    204  1.18  christos }
    205  1.18  christos 
    206  1.18  christos void
    207  1.74      fvdl ktremul(p)
    208  1.74      fvdl 	struct proc *p;
    209  1.18  christos {
    210  1.39   thorpej 	struct ktr_header kth;
    211  1.74      fvdl 	const char *emul = p->p_emul->e_name;
    212  1.18  christos 
    213  1.18  christos 	p->p_traceflag |= KTRFAC_ACTIVE;
    214  1.74      fvdl 	ktrinitheader(&kth, p, KTR_EMUL);
    215  1.39   thorpej 	kth.ktr_len = strlen(emul);
    216  1.50       scw 	kth.ktr_buf = (caddr_t)emul;
    217   1.1       cgd 
    218  1.74      fvdl 	(void) ktrwrite(p, &kth);
    219   1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    220   1.1       cgd }
    221   1.1       cgd 
    222  1.17       cgd void
    223  1.75       dsl ktrkmem(struct proc *p, int ktr, const void *buf, size_t len)
    224  1.75       dsl {
    225  1.75       dsl 	struct ktr_header kth;
    226  1.75       dsl 
    227  1.75       dsl 	p->p_traceflag |= KTRFAC_ACTIVE;
    228  1.75       dsl 	ktrinitheader(&kth, p, ktr);
    229  1.75       dsl 	kth.ktr_len = len;
    230  1.75       dsl 	kth.ktr_buf = buf;
    231  1.75       dsl 
    232  1.75       dsl 	(void)ktrwrite(p, &kth);
    233  1.75       dsl 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    234  1.75       dsl }
    235  1.75       dsl 
    236  1.75       dsl void
    237  1.74      fvdl ktrgenio(p, fd, rw, iov, len, error)
    238  1.74      fvdl 	struct proc *p;
    239  1.62      manu 	int fd;
    240  1.62      manu 	enum uio_rw rw;
    241  1.62      manu 	struct iovec *iov;
    242  1.62      manu 	int len;
    243  1.62      manu 	int error;
    244   1.1       cgd {
    245  1.39   thorpej 	struct ktr_header kth;
    246  1.28  christos 	struct ktr_genio *ktp;
    247  1.74      fvdl 	caddr_t cp;
    248  1.72   darrenr 	int resid = len, cnt;
    249  1.39   thorpej 	int buflen;
    250  1.39   thorpej 
    251   1.1       cgd 	if (error)
    252   1.1       cgd 		return;
    253  1.39   thorpej 
    254   1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    255  1.39   thorpej 
    256  1.39   thorpej 	buflen = min(PAGE_SIZE, len + sizeof(struct ktr_genio));
    257  1.39   thorpej 
    258  1.74      fvdl 	ktrinitheader(&kth, p, KTR_GENIO);
    259  1.39   thorpej 	ktp = malloc(buflen, M_TEMP, M_WAITOK);
    260   1.1       cgd 	ktp->ktr_fd = fd;
    261   1.1       cgd 	ktp->ktr_rw = rw;
    262  1.39   thorpej 
    263  1.39   thorpej 	kth.ktr_buf = (caddr_t)ktp;
    264  1.39   thorpej 
    265  1.31     perry 	cp = (caddr_t)((char *)ktp + sizeof(struct ktr_genio));
    266  1.39   thorpej 	buflen -= sizeof(struct ktr_genio);
    267  1.39   thorpej 
    268   1.1       cgd 	while (resid > 0) {
    269  1.67   thorpej #if 0 /* XXX NJWLWP */
    270  1.46   thorpej 		KDASSERT(p->p_cpu != NULL);
    271  1.46   thorpej 		KDASSERT(p->p_cpu == curcpu());
    272  1.67   thorpej #endif
    273  1.67   thorpej 		/* XXX NJWLWP */
    274  1.67   thorpej 		if (curcpu()->ci_schedstate.spc_flags & SPCF_SHOULDYIELD)
    275  1.67   thorpej 			preempt(1);
    276  1.39   thorpej 
    277  1.39   thorpej 		cnt = min(iov->iov_len, buflen);
    278  1.39   thorpej 		if (cnt > resid)
    279   1.1       cgd 			cnt = resid;
    280  1.39   thorpej 		if (copyin(iov->iov_base, cp, cnt))
    281  1.39   thorpej 			break;
    282  1.39   thorpej 
    283  1.39   thorpej 		kth.ktr_len = cnt + sizeof(struct ktr_genio);
    284  1.39   thorpej 
    285  1.74      fvdl 		if (__predict_false(ktrwrite(p, &kth) != 0))
    286  1.39   thorpej 			break;
    287  1.39   thorpej 
    288  1.39   thorpej 		iov->iov_base = (caddr_t)iov->iov_base + cnt;
    289  1.39   thorpej 		iov->iov_len -= cnt;
    290  1.39   thorpej 
    291  1.39   thorpej 		if (iov->iov_len == 0)
    292  1.39   thorpej 			iov++;
    293  1.39   thorpej 
    294   1.1       cgd 		resid -= cnt;
    295   1.1       cgd 	}
    296   1.1       cgd 
    297  1.39   thorpej 	free(ktp, M_TEMP);
    298   1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    299   1.1       cgd }
    300   1.1       cgd 
    301  1.17       cgd void
    302  1.78  christos ktrpsig(p, sig, action, mask, ksi)
    303  1.74      fvdl 	struct proc *p;
    304  1.62      manu 	int sig;
    305  1.62      manu 	sig_t action;
    306  1.79  christos 	const sigset_t *mask;
    307  1.79  christos 	const ksiginfo_t *ksi;
    308   1.1       cgd {
    309  1.39   thorpej 	struct ktr_header kth;
    310  1.78  christos 	struct {
    311  1.78  christos 		struct ktr_psig	kp;
    312  1.78  christos 		siginfo_t	si;
    313  1.78  christos 	} kbuf;
    314   1.1       cgd 
    315   1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    316  1.74      fvdl 	ktrinitheader(&kth, p, KTR_PSIG);
    317  1.78  christos 	kbuf.kp.signo = (char)sig;
    318  1.78  christos 	kbuf.kp.action = action;
    319  1.78  christos 	kbuf.kp.mask = *mask;
    320  1.78  christos 	kth.ktr_buf = (caddr_t)&kbuf;
    321  1.78  christos 	if (ksi) {
    322  1.80   thorpej 		kbuf.kp.code = KSI_TRAPCODE(ksi);
    323  1.78  christos 		(void)memset(&kbuf.si, 0, sizeof(kbuf.si));
    324  1.80   thorpej 		kbuf.si._info = ksi->ksi_info;
    325  1.78  christos 		kth.ktr_len = sizeof(kbuf);
    326  1.78  christos 	} else {
    327  1.78  christos 		kbuf.kp.code = 0;
    328  1.78  christos 		kth.ktr_len = sizeof(struct ktr_psig);
    329  1.78  christos 	}
    330  1.74      fvdl 	(void) ktrwrite(p, &kth);
    331   1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    332   1.9       cgd }
    333   1.9       cgd 
    334  1.17       cgd void
    335  1.74      fvdl ktrcsw(p, out, user)
    336  1.74      fvdl 	struct proc *p;
    337  1.62      manu 	int out;
    338  1.62      manu 	int user;
    339   1.9       cgd {
    340  1.39   thorpej 	struct ktr_header kth;
    341  1.39   thorpej 	struct ktr_csw kc;
    342   1.9       cgd 
    343   1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    344  1.74      fvdl 	ktrinitheader(&kth, p, KTR_CSW);
    345   1.9       cgd 	kc.out = out;
    346   1.9       cgd 	kc.user = user;
    347  1.39   thorpej 	kth.ktr_buf = (caddr_t)&kc;
    348  1.39   thorpej 	kth.ktr_len = sizeof(struct ktr_csw);
    349   1.9       cgd 
    350  1.74      fvdl 	(void) ktrwrite(p, &kth);
    351   1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    352   1.1       cgd }
    353   1.1       cgd 
    354  1.51  jdolecek void
    355  1.74      fvdl ktruser(p, id, addr, len, ustr)
    356  1.74      fvdl 	struct proc *p;
    357  1.51  jdolecek 	const char *id;
    358  1.51  jdolecek 	void *addr;
    359  1.51  jdolecek 	size_t len;
    360  1.51  jdolecek 	int ustr;
    361  1.51  jdolecek {
    362  1.51  jdolecek 	struct ktr_header kth;
    363  1.51  jdolecek 	struct ktr_user *ktp;
    364  1.51  jdolecek 	caddr_t user_dta;
    365  1.51  jdolecek 
    366  1.51  jdolecek 	p->p_traceflag |= KTRFAC_ACTIVE;
    367  1.74      fvdl 	ktrinitheader(&kth, p, KTR_USER);
    368  1.51  jdolecek 	ktp = malloc(sizeof(struct ktr_user) + len, M_TEMP, M_WAITOK);
    369  1.51  jdolecek 	if (ustr) {
    370  1.51  jdolecek 		if (copyinstr(id, ktp->ktr_id, KTR_USER_MAXIDLEN, NULL) != 0)
    371  1.51  jdolecek 			ktp->ktr_id[0] = '\0';
    372  1.51  jdolecek 	} else
    373  1.51  jdolecek 		strncpy(ktp->ktr_id, id, KTR_USER_MAXIDLEN);
    374  1.51  jdolecek 	ktp->ktr_id[KTR_USER_MAXIDLEN-1] = '\0';
    375  1.51  jdolecek 
    376  1.51  jdolecek 	user_dta = (caddr_t) ((char *)ktp + sizeof(struct ktr_user));
    377  1.51  jdolecek 	if (copyin(addr, (void *) user_dta, len) != 0)
    378  1.51  jdolecek 		len = 0;
    379  1.51  jdolecek 
    380  1.51  jdolecek 	kth.ktr_buf = (void *)ktp;
    381  1.51  jdolecek 	kth.ktr_len = sizeof(struct ktr_user) + len;
    382  1.74      fvdl 	(void) ktrwrite(p, &kth);
    383  1.51  jdolecek 
    384  1.51  jdolecek 	free(ktp, M_TEMP);
    385  1.51  jdolecek 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    386  1.51  jdolecek 
    387  1.51  jdolecek }
    388  1.51  jdolecek 
    389  1.62      manu void
    390  1.74      fvdl ktrmmsg(p, msgh, size)
    391  1.74      fvdl 	struct proc *p;
    392  1.63  christos 	const void *msgh;
    393  1.62      manu 	size_t size;
    394  1.62      manu {
    395  1.62      manu 	struct ktr_header kth;
    396  1.62      manu 	struct ktr_mmsg	*kp;
    397  1.62      manu 
    398  1.62      manu 	p->p_traceflag |= KTRFAC_ACTIVE;
    399  1.74      fvdl 	ktrinitheader(&kth, p, KTR_MMSG);
    400  1.64      manu 
    401  1.64      manu 	kp = (struct ktr_mmsg *)msgh;
    402  1.62      manu 	kth.ktr_buf = (caddr_t)kp;
    403  1.62      manu 	kth.ktr_len = size;
    404  1.74      fvdl 	(void) ktrwrite(p, &kth);
    405  1.62      manu 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    406  1.62      manu }
    407  1.83      manu 
    408  1.83      manu void
    409  1.83      manu ktrmool(p, kaddr, size, uaddr)
    410  1.83      manu 	struct proc *p;
    411  1.83      manu 	const void *kaddr;
    412  1.83      manu 	size_t size;
    413  1.83      manu 	const void *uaddr;
    414  1.83      manu {
    415  1.83      manu 	struct ktr_header kth;
    416  1.83      manu 	struct ktr_mool *kp;
    417  1.83      manu 	struct ktr_mool *buf;
    418  1.83      manu 
    419  1.83      manu 	p->p_traceflag |= KTRFAC_ACTIVE;
    420  1.83      manu 	ktrinitheader(&kth, p, KTR_MOOL);
    421  1.83      manu 
    422  1.83      manu 	kp = malloc(size + sizeof(*kp), M_TEMP, M_WAITOK);
    423  1.83      manu 	kp->uaddr = uaddr;
    424  1.83      manu 	kp->size = size;
    425  1.83      manu 	buf = kp + 1; /* Skip uaddr and size */
    426  1.83      manu 	memcpy(buf, kaddr, size);
    427  1.83      manu 
    428  1.83      manu 	kth.ktr_buf = (caddr_t)kp;
    429  1.83      manu 	kth.ktr_len = size + sizeof(*kp);
    430  1.83      manu 	(void) ktrwrite(p, &kth);
    431  1.83      manu 	free(kp, M_TEMP);
    432  1.83      manu 
    433  1.83      manu 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    434  1.83      manu }
    435  1.83      manu 
    436  1.62      manu 
    437   1.1       cgd /* Interface and common routines */
    438   1.1       cgd 
    439  1.17       cgd int
    440  1.74      fvdl ktrace_common(curp, ops, facs, pid, fp)
    441  1.74      fvdl 	struct proc *curp;
    442  1.62      manu 	int ops;
    443  1.62      manu 	int facs;
    444  1.62      manu 	int pid;
    445  1.62      manu 	struct file *fp;
    446  1.28  christos {
    447  1.74      fvdl 	int ret = 0;
    448  1.72   darrenr 	int error = 0;
    449  1.42  sommerfe 	int one = 1;
    450  1.42  sommerfe 	int descend;
    451  1.74      fvdl 	struct proc *p;
    452  1.74      fvdl 	struct pgrp *pg;
    453  1.28  christos 
    454  1.28  christos 	curp->p_traceflag |= KTRFAC_ACTIVE;
    455  1.42  sommerfe 	descend = ops & KTRFLAG_DESCEND;
    456  1.42  sommerfe 	facs = facs & ~((unsigned) KTRFAC_ROOT);
    457  1.28  christos 
    458  1.28  christos 	/*
    459  1.28  christos 	 * Clear all uses of the tracefile
    460  1.28  christos 	 */
    461  1.28  christos 	if (KTROP(ops) == KTROP_CLEARFILE) {
    462  1.37   thorpej 		proclist_lock_read();
    463  1.81  jdolecek 		LIST_FOREACH(p, &allproc, p_list) {
    464  1.44  sommerfe 			if (ktrsamefile(p->p_tracep, fp)) {
    465  1.28  christos 				if (ktrcanset(curp, p))
    466  1.28  christos 					ktrderef(p);
    467  1.28  christos 				else
    468  1.28  christos 					error = EPERM;
    469  1.28  christos 			}
    470  1.28  christos 		}
    471  1.36   thorpej 		proclist_unlock_read();
    472  1.28  christos 		goto done;
    473  1.28  christos 	}
    474  1.42  sommerfe 
    475  1.42  sommerfe 	/*
    476  1.42  sommerfe 	 * Mark fp non-blocking, to avoid problems from possible deadlocks.
    477  1.42  sommerfe 	 */
    478  1.42  sommerfe 
    479  1.43  sommerfe 	if (fp != NULL) {
    480  1.43  sommerfe 		fp->f_flag |= FNONBLOCK;
    481  1.74      fvdl 		(*fp->f_ops->fo_ioctl)(fp, FIONBIO, (caddr_t)&one, curp);
    482  1.43  sommerfe 	}
    483  1.42  sommerfe 
    484  1.28  christos 	/*
    485  1.28  christos 	 * need something to (un)trace (XXX - why is this here?)
    486  1.28  christos 	 */
    487  1.28  christos 	if (!facs) {
    488  1.28  christos 		error = EINVAL;
    489  1.28  christos 		goto done;
    490  1.28  christos 	}
    491  1.28  christos 	/*
    492  1.28  christos 	 * do it
    493  1.28  christos 	 */
    494  1.42  sommerfe 	if (pid < 0) {
    495  1.28  christos 		/*
    496  1.28  christos 		 * by process group
    497  1.28  christos 		 */
    498  1.82       dsl 		pg = pg_find(-pid, PFIND_UNLOCK_FAIL);
    499  1.28  christos 		if (pg == NULL) {
    500  1.28  christos 			error = ESRCH;
    501  1.28  christos 			goto done;
    502  1.28  christos 		}
    503  1.81  jdolecek 		LIST_FOREACH(p, &pg->pg_members, p_pglist) {
    504  1.28  christos 			if (descend)
    505  1.74      fvdl 				ret |= ktrsetchildren(curp, p, ops, facs, fp);
    506  1.28  christos 			else
    507  1.74      fvdl 				ret |= ktrops(curp, p, ops, facs, fp);
    508  1.39   thorpej 		}
    509  1.28  christos 
    510  1.28  christos 	} else {
    511  1.28  christos 		/*
    512  1.28  christos 		 * by pid
    513  1.28  christos 		 */
    514  1.82       dsl 		p = p_find(pid, PFIND_UNLOCK_FAIL);
    515  1.28  christos 		if (p == NULL) {
    516  1.28  christos 			error = ESRCH;
    517  1.28  christos 			goto done;
    518  1.28  christos 		}
    519  1.28  christos 		if (descend)
    520  1.74      fvdl 			ret |= ktrsetchildren(curp, p, ops, facs, fp);
    521  1.28  christos 		else
    522  1.74      fvdl 			ret |= ktrops(curp, p, ops, facs, fp);
    523  1.28  christos 	}
    524  1.82       dsl 	proclist_unlock_read();	/* taken by p{g}_find */
    525  1.28  christos 	if (!ret)
    526  1.28  christos 		error = EPERM;
    527  1.28  christos done:
    528  1.28  christos 	curp->p_traceflag &= ~KTRFAC_ACTIVE;
    529  1.28  christos 	return (error);
    530  1.28  christos }
    531  1.28  christos 
    532  1.28  christos /*
     533  1.28  christos  * fktrace system call
    534  1.28  christos  */
    535  1.28  christos /* ARGSUSED */
    536  1.28  christos int
    537  1.67   thorpej sys_fktrace(l, v, retval)
    538  1.67   thorpej 	struct lwp *l;
    539  1.62      manu 	void *v;
    540  1.62      manu 	register_t *retval;
    541  1.42  sommerfe {
    542  1.42  sommerfe 	struct sys_fktrace_args /* {
    543  1.42  sommerfe 		syscallarg(int) fd;
    544  1.42  sommerfe 		syscallarg(int) ops;
    545  1.42  sommerfe 		syscallarg(int) facs;
    546  1.42  sommerfe 		syscallarg(int) pid;
    547  1.42  sommerfe 	} */ *uap = v;
    548  1.74      fvdl 	struct proc *curp = l->l_proc;
    549  1.42  sommerfe 	struct file *fp = NULL;
    550  1.74      fvdl 	struct filedesc *fdp = curp->p_fd;
    551  1.70      yamt 	int error;
    552  1.42  sommerfe 
    553  1.54   thorpej 	if ((fp = fd_getfile(fdp, SCARG(uap, fd))) == NULL)
    554  1.54   thorpej 		return (EBADF);
    555  1.54   thorpej 
    556  1.70      yamt 	FILE_USE(fp);
    557  1.70      yamt 
    558  1.54   thorpej 	if ((fp->f_flag & FWRITE) == 0)
    559  1.70      yamt 		error = EBADF;
    560  1.70      yamt 	else
    561  1.74      fvdl 		error = ktrace_common(curp, SCARG(uap, ops),
    562  1.70      yamt 		    SCARG(uap, facs), SCARG(uap, pid), fp);
    563  1.70      yamt 
    564  1.74      fvdl 	FILE_UNUSE(fp, curp);
    565  1.42  sommerfe 
    566  1.70      yamt 	return error;
    567  1.42  sommerfe }
    568  1.42  sommerfe 
    569  1.42  sommerfe /*
    570  1.42  sommerfe  * ktrace system call
    571  1.42  sommerfe  */
    572  1.42  sommerfe /* ARGSUSED */
    573  1.42  sommerfe int
    574  1.67   thorpej sys_ktrace(l, v, retval)
    575  1.67   thorpej 	struct lwp *l;
    576  1.62      manu 	void *v;
    577  1.62      manu 	register_t *retval;
    578  1.19   thorpej {
    579  1.28  christos 	struct sys_ktrace_args /* {
    580  1.24   mycroft 		syscallarg(const char *) fname;
    581  1.13       cgd 		syscallarg(int) ops;
    582  1.13       cgd 		syscallarg(int) facs;
    583  1.13       cgd 		syscallarg(int) pid;
    584  1.19   thorpej 	} */ *uap = v;
    585  1.67   thorpej 	struct proc *curp = l->l_proc;
    586  1.28  christos 	struct vnode *vp = NULL;
    587  1.42  sommerfe 	struct file *fp = NULL;
    588  1.74      fvdl 	int fd;
    589  1.42  sommerfe 	int ops = SCARG(uap, ops);
    590  1.74      fvdl 	int error = 0;
    591  1.72   darrenr 	struct nameidata nd;
    592   1.1       cgd 
    593  1.42  sommerfe 	ops = KTROP(ops) | (ops & KTRFLAG_DESCEND);
    594  1.42  sommerfe 
    595   1.9       cgd 	curp->p_traceflag |= KTRFAC_ACTIVE;
    596  1.69  christos 	if ((ops & KTROP_CLEAR) == 0) {
    597   1.1       cgd 		/*
    598   1.1       cgd 		 * an operation which requires a file argument.
    599   1.1       cgd 		 */
    600  1.13       cgd 		NDINIT(&nd, LOOKUP, FOLLOW, UIO_USERSPACE, SCARG(uap, fname),
    601  1.74      fvdl 		    curp);
    602  1.22  christos 		if ((error = vn_open(&nd, FREAD|FWRITE, 0)) != 0) {
    603   1.9       cgd 			curp->p_traceflag &= ~KTRFAC_ACTIVE;
    604   1.1       cgd 			return (error);
    605   1.9       cgd 		}
    606   1.1       cgd 		vp = nd.ni_vp;
    607  1.25      fvdl 		VOP_UNLOCK(vp, 0);
    608   1.1       cgd 		if (vp->v_type != VREG) {
    609  1.74      fvdl 			(void) vn_close(vp, FREAD|FWRITE, curp->p_ucred, curp);
    610   1.9       cgd 			curp->p_traceflag &= ~KTRFAC_ACTIVE;
    611   1.1       cgd 			return (EACCES);
    612   1.1       cgd 		}
    613   1.1       cgd 		/*
    614  1.42  sommerfe 		 * XXX This uses up a file descriptor slot in the
    615  1.42  sommerfe 		 * tracing process for the duration of this syscall.
    616  1.42  sommerfe 		 * This is not expected to be a problem.  If
    617  1.42  sommerfe 		 * falloc(NULL, ...) DTRT we could skip that part, but
    618  1.42  sommerfe 		 * that would require changing its interface to allow
    619  1.42  sommerfe 		 * the caller to pass in a ucred..
    620  1.42  sommerfe 		 *
    621  1.42  sommerfe 		 * This will FILE_USE the fp it returns, if any.
    622  1.42  sommerfe 		 * Keep it in use until we return.
    623   1.1       cgd 		 */
    624  1.42  sommerfe 		if ((error = falloc(curp, &fp, &fd)) != 0)
    625   1.1       cgd 			goto done;
    626  1.42  sommerfe 
    627  1.42  sommerfe 		fp->f_flag = FWRITE|FAPPEND;
    628  1.42  sommerfe 		fp->f_type = DTYPE_VNODE;
    629  1.42  sommerfe 		fp->f_ops = &vnops;
    630  1.42  sommerfe 		fp->f_data = (caddr_t)vp;
    631  1.54   thorpej 		FILE_SET_MATURE(fp);
    632  1.42  sommerfe 		vp = NULL;
    633  1.42  sommerfe 	}
    634  1.74      fvdl 	error = ktrace_common(curp, SCARG(uap, ops), SCARG(uap, facs),
    635  1.42  sommerfe 	    SCARG(uap, pid), fp);
    636  1.42  sommerfe done:
    637   1.1       cgd 	if (vp != NULL)
    638  1.74      fvdl 		(void) vn_close(vp, FWRITE, curp->p_ucred, curp);
    639  1.42  sommerfe 	if (fp != NULL) {
    640  1.74      fvdl 		FILE_UNUSE(fp, curp);	/* release file */
    641  1.74      fvdl 		fdrelease(curp, fd); 	/* release fd table slot */
    642  1.42  sommerfe 	}
    643   1.1       cgd 	return (error);
    644   1.1       cgd }
    645   1.1       cgd 
    646   1.4    andrew int
    647  1.74      fvdl ktrops(curp, p, ops, facs, fp)
    648  1.74      fvdl 	struct proc *curp;
    649  1.62      manu 	struct proc *p;
    650  1.62      manu 	int ops;
    651  1.62      manu 	int facs;
    652  1.62      manu 	struct file *fp;
    653   1.1       cgd {
    654   1.1       cgd 
    655   1.1       cgd 	if (!ktrcanset(curp, p))
    656   1.1       cgd 		return (0);
    657  1.28  christos 	if (KTROP(ops) == KTROP_SET) {
    658  1.42  sommerfe 		if (p->p_tracep != fp) {
    659   1.1       cgd 			/*
    660   1.1       cgd 			 * if trace file already in use, relinquish
    661   1.1       cgd 			 */
    662  1.28  christos 			ktrderef(p);
    663  1.42  sommerfe 			p->p_tracep = fp;
    664  1.28  christos 			ktradref(p);
    665   1.1       cgd 		}
    666   1.1       cgd 		p->p_traceflag |= facs;
    667   1.1       cgd 		if (curp->p_ucred->cr_uid == 0)
    668   1.1       cgd 			p->p_traceflag |= KTRFAC_ROOT;
    669   1.1       cgd 	} else {
    670   1.1       cgd 		/* KTROP_CLEAR */
    671   1.1       cgd 		if (((p->p_traceflag &= ~facs) & KTRFAC_MASK) == 0) {
    672   1.1       cgd 			/* no more tracing */
    673  1.28  christos 			ktrderef(p);
    674   1.1       cgd 		}
    675   1.1       cgd 	}
    676  1.21  christos 
    677  1.21  christos 	/*
    678  1.21  christos 	 * Emit an emulation record, every time there is a ktrace
    679  1.21  christos 	 * change/attach request.
    680  1.21  christos 	 */
    681  1.21  christos 	if (KTRPOINT(p, KTR_EMUL))
    682  1.84       dsl 		p->p_traceflag |= KTRFAC_TRC_EMUL;
    683  1.49    martin #ifdef __HAVE_SYSCALL_INTERN
    684  1.48   mycroft 	(*p->p_emul->e_syscall_intern)(p);
    685  1.49    martin #endif
    686   1.1       cgd 
    687   1.1       cgd 	return (1);
    688   1.1       cgd }
    689   1.1       cgd 
                        /*
                         * Apply ktrops() to the process `top' and to every process below it
                         * in the process tree.  The tree is walked iteratively through the
                         * p_children and p_sibling lists and the p_pptr back pointer; there
                         * is no recursion.
                         *
                         * curp, ops, facs and fp are handed unchanged to each ktrops() call.
                         *
                         * Returns the bitwise OR of every ktrops() result, so the value is
                         * non-zero if at least one call returned non-zero.
                         *
                         * NOTE(review): no lock is taken here while the tree is walked;
                         * presumably the caller serializes against process list changes --
                         * TODO confirm.
                         */
    690  1.22  christos int
    691  1.74      fvdl ktrsetchildren(curp, top, ops, facs, fp)
    692  1.74      fvdl 	struct proc *curp;
    693  1.62      manu 	struct proc *top;
    694  1.62      manu 	int ops;
    695  1.62      manu 	int facs;
    696  1.62      manu 	struct file *fp;
    697   1.1       cgd {
    698  1.28  christos 	struct proc *p;
    699  1.28  christos 	int ret = 0;
    700   1.1       cgd 
    701   1.1       cgd 	p = top;
    702   1.1       cgd 	for (;;) {
    703  1.74      fvdl 		ret |= ktrops(curp, p, ops, facs, fp);
    704   1.1       cgd 		/*
    705   1.1       cgd 		 * If this process has children, descend to them next,
    706   1.1       cgd 		 * otherwise do any siblings, and if done with this level,
    707   1.1       cgd 		 * follow back up the tree (but not past top).
    708   1.1       cgd 		 */
    709  1.82       dsl 		if (LIST_FIRST(&p->p_children) != NULL) {
    710  1.39   thorpej 			p = LIST_FIRST(&p->p_children);
    711  1.82       dsl 			continue;
    712  1.82       dsl 		}
                        		/*
                        		 * p has no children.  Climb until a process with a next
                        		 * sibling is found (break out to process that sibling), or
                        		 * until we are back at top (everything has been visited).
                        		 */
    713  1.82       dsl 		for (;;) {
    714   1.1       cgd 			if (p == top)
    715   1.1       cgd 				return (ret);
    716  1.39   thorpej 			if (LIST_NEXT(p, p_sibling) != NULL) {
    717  1.39   thorpej 				p = LIST_NEXT(p, p_sibling);
    718   1.1       cgd 				break;
    719   1.1       cgd 			}
    720  1.12   mycroft 			p = p->p_pptr;
    721   1.1       cgd 		}
    722   1.1       cgd 	}
    723   1.1       cgd 	/*NOTREACHED*/
    724   1.1       cgd }
    725   1.1       cgd 
                        /*
                         * Write one trace record to the trace file of process p.
                         *
                         * The record is the ktr_header that kth points to, followed by the
                         * kth->ktr_len bytes at kth->ktr_buf when ktr_len is greater than
                         * zero.
                         *
                         * Returns 0 when p has no trace file (p_tracep is NULL) or when the
                         * write succeeds.  On failure the error from the file's fo_write
                         * routine is returned, after ktrderef() has been called on every
                         * process in allproc for which ktrsamefile() matches the failed file.
                         */
    726  1.39   thorpej int
    727  1.74      fvdl ktrwrite(p, kth)
    728  1.74      fvdl 	struct proc *p;
    729  1.62      manu 	struct ktr_header *kth;
    730   1.1       cgd {
    731  1.74      fvdl 	struct uio auio;
    732   1.1       cgd 	struct iovec aiov[2];
    733  1.42  sommerfe 	int error, tries;
    734  1.74      fvdl 	struct file *fp = p->p_tracep;
    735   1.1       cgd 
    736  1.42  sommerfe 	if (fp == NULL)
    737  1.42  sommerfe 		return 0;
    738  1.42  sommerfe 
                        	/*
                        	 * NOTE(review): fp was sampled from p->p_tracep above, before
                        	 * ktremul() runs.  If ktremul() can replace or release the trace
                        	 * file, fp would be stale below -- TODO confirm.
                        	 */
    739  1.84       dsl 	if (p->p_traceflag & KTRFAC_TRC_EMUL) {
    740  1.84       dsl 		/* Add emulation trace before first entry for this process */
    741  1.84       dsl 		p->p_traceflag &= ~KTRFAC_TRC_EMUL;
    742  1.84       dsl 		ktremul(p);
    743  1.84       dsl 	}
    744  1.84       dsl 
                        	/*
                        	 * Build a kernel-space (UIO_SYSSPACE) write request: iovec 0 is
                        	 * the header; iovec 1 is added only when ktr_len > 0 and covers
                        	 * the payload at kth->ktr_buf.
                        	 */
    745   1.1       cgd 	auio.uio_iov = &aiov[0];
    746   1.1       cgd 	auio.uio_offset = 0;
    747   1.1       cgd 	auio.uio_segflg = UIO_SYSSPACE;
    748   1.1       cgd 	auio.uio_rw = UIO_WRITE;
    749   1.1       cgd 	aiov[0].iov_base = (caddr_t)kth;
    750   1.1       cgd 	aiov[0].iov_len = sizeof(struct ktr_header);
    751   1.1       cgd 	auio.uio_resid = sizeof(struct ktr_header);
    752   1.1       cgd 	auio.uio_iovcnt = 1;
    753  1.74      fvdl 	auio.uio_procp = (struct proc *)0;
    754   1.1       cgd 	if (kth->ktr_len > 0) {
    755   1.1       cgd 		auio.uio_iovcnt++;
    756  1.75       dsl 		aiov[1].iov_base = (void *)kth->ktr_buf;
    757   1.1       cgd 		aiov[1].iov_len = kth->ktr_len;
    758   1.1       cgd 		auio.uio_resid += kth->ktr_len;
    759   1.1       cgd 	}
    760  1.28  christos 
                        	/*
                        	 * NOTE(review): no matching unlock of f_slock is visible in this
                        	 * function; presumably FILE_USE() drops it -- confirm against the
                        	 * macro definition.
                        	 */
    761  1.68        pk 	simple_lock(&fp->f_slock);
    762  1.42  sommerfe 	FILE_USE(fp);
    763  1.42  sommerfe 
                        	/*
                        	 * Try the write at most three times.  preempt(1) is called after
                        	 * every EWOULDBLOCK result, before the loop condition is tested.
                        	 */
    764  1.42  sommerfe 	tries = 0;
    765  1.42  sommerfe 	do {
    766  1.30   thorpej 		error = (*fp->f_ops->fo_write)(fp, &fp->f_offset, &auio,
    767  1.30   thorpej 		    fp->f_cred, FOF_UPDATE_OFFSET);
    768  1.74      fvdl 		tries++;
    769  1.42  sommerfe 		if (error == EWOULDBLOCK)
    770  1.67   thorpej 		  	preempt(1);
    771  1.42  sommerfe 	} while ((error == EWOULDBLOCK) && (tries < 3));
    772  1.42  sommerfe 	FILE_UNUSE(fp, NULL);
    773  1.28  christos 
    774  1.40   thorpej 	if (__predict_true(error == 0))
    775  1.39   thorpej 		return (0);
    776   1.1       cgd 	/*
    777  1.38   darrenr 	 * If error encountered, give up tracing on this vnode.  Don't report
    778  1.38   darrenr 	 * EPIPE as this can easily happen with fktrace()/ktruss.
    779   1.1       cgd 	 */
    780  1.38   darrenr 	if (error != EPIPE)
    781  1.38   darrenr 		log(LOG_NOTICE,
    782  1.38   darrenr 		    "ktrace write failed, errno %d, tracing stopped\n",
    783  1.38   darrenr 		    error);
                        	/*
                        	 * Drop tracing on every process whose trace file matches fp.
                        	 * The walk reuses the parameter p as its iterator, so p no longer
                        	 * names the caller's process from here on.
                        	 */
    784  1.37   thorpej 	proclist_lock_read();
    785  1.81  jdolecek 	LIST_FOREACH(p, &allproc, p_list) {
    786  1.44  sommerfe 		if (ktrsamefile(p->p_tracep, fp))
    787  1.28  christos 			ktrderef(p);
    788   1.1       cgd 	}
    789  1.36   thorpej 	proclist_unlock_read();
    790  1.39   thorpej 
    791  1.39   thorpej 	return (error);
    792   1.1       cgd }
    793   1.1       cgd 
    794   1.1       cgd /*
    795   1.1       cgd  * Return true if caller has permission to set the ktracing state
    796   1.1       cgd  * of target.  Essentially, the target can't possess any
    797   1.1       cgd  * more permissions than the caller.  KTRFAC_ROOT signifies that
    798   1.1       cgd  * root previously set the tracing status on the target process, and
    799   1.1       cgd  * so, only root may further change it.
    800   1.1       cgd  *
    801   1.1       cgd  * TODO: check groups.  use caller effective gid.
                         *
                         * callp is the process requesting the change and targetp the process
                         * whose tracing state would change.  Returns 1 when the change is
                         * permitted and 0 otherwise.
    802   1.1       cgd  */
    803  1.22  christos int
    804  1.62      manu ktrcanset(callp, targetp)
    805  1.62      manu 	struct proc *callp;
    806  1.62      manu 	struct proc *targetp;
    807   1.1       cgd {
    808  1.28  christos 	struct pcred *caller = callp->p_cred;
    809  1.28  christos 	struct pcred *target = targetp->p_cred;
    810   1.1       cgd 
                        	/*
                        	 * Permit when the caller's cr_uid is 0, or when all of these hold:
                        	 *  - caller's cr_uid equals target's p_ruid, which in turn equals
                        	 *    target's p_svuid;
                        	 *  - caller's p_rgid equals target's p_rgid, which in turn equals
                        	 *    target's p_svgid;
                        	 *  - target has neither KTRFAC_ROOT in p_traceflag nor P_SUGID in
                        	 *    p_flag.
                        	 */
    811   1.1       cgd 	if ((caller->pc_ucred->cr_uid == target->p_ruid &&
    812   1.1       cgd 	     target->p_ruid == target->p_svuid &&
    813   1.1       cgd 	     caller->p_rgid == target->p_rgid &&	/* XXX */
    814   1.1       cgd 	     target->p_rgid == target->p_svgid &&
    815  1.58    itojun 	     (targetp->p_traceflag & KTRFAC_ROOT) == 0 &&
    816  1.58    itojun 	     (targetp->p_flag & P_SUGID) == 0) ||
    817   1.1       cgd 	     caller->pc_ucred->cr_uid == 0)
    818   1.1       cgd 		return (1);
    819   1.1       cgd 
    820   1.1       cgd 	return (0);
    821   1.1       cgd }
    822  1.47   thorpej #endif /* KTRACE */
    823  1.51  jdolecek 
    824  1.51  jdolecek /*
    825  1.51  jdolecek  * Put a user-defined entry into the ktrace records.
                         *
                         * v points to a struct sys_utrace_args carrying label, addr and len.
                         * retval is not used.
                         *
                         * With KTRACE compiled in:
                         *  - returns 0 without recording anything when KTRPOINT(p, KTR_USER)
                         *    is false for the calling process;
                         *  - returns EINVAL when len exceeds KTR_USER_MAXLEN;
                         *  - otherwise calls ktruser() and returns 0.  Nothing from ktruser()
                         *    is propagated to the caller.
                         * Without KTRACE, returns ENOSYS.
    826  1.51  jdolecek  */
    827  1.51  jdolecek int
    828  1.67   thorpej sys_utrace(l, v, retval)
    829  1.67   thorpej 	struct lwp *l;
    830  1.51  jdolecek 	void *v;
    831  1.51  jdolecek 	register_t *retval;
    832  1.51  jdolecek {
    833  1.51  jdolecek #ifdef KTRACE
    834  1.51  jdolecek 	struct sys_utrace_args /* {
    835  1.52  jdolecek 		syscallarg(const char *) label;
    836  1.51  jdolecek 		syscallarg(void *) addr;
    837  1.51  jdolecek 		syscallarg(size_t) len;
    838  1.51  jdolecek 	} */ *uap = v;
    839  1.67   thorpej 	struct proc *p = l->l_proc;
    840  1.51  jdolecek 	if (!KTRPOINT(p, KTR_USER))
    841  1.51  jdolecek 		return (0);
    842  1.53  jdolecek 
                        	/* Reject oversized payloads before handing them to ktruser(). */
    843  1.53  jdolecek 	if (SCARG(uap, len) > KTR_USER_MAXLEN)
    844  1.53  jdolecek 		return (EINVAL);
    845  1.51  jdolecek 
                        	/*
                        	 * NOTE(review): the trailing 1 presumably tells ktruser() that
                        	 * label is a user-space pointer -- confirm against ktruser().
                        	 */
    846  1.74      fvdl 	ktruser(p, SCARG(uap, label), SCARG(uap, addr), SCARG(uap, len), 1);
    847  1.51  jdolecek 
    848  1.51  jdolecek 	return (0);
    849  1.51  jdolecek #else /* !KTRACE */
    850  1.51  jdolecek 	return ENOSYS;
    851  1.51  jdolecek #endif /* KTRACE */
    852  1.51  jdolecek }
    853