Home | History | Annotate | Line # | Download | only in kern
kern_ktrace.c revision 1.53.2.8
      1  1.53.2.7   nathanw /*	$NetBSD: kern_ktrace.c,v 1.53.2.8 2002/11/11 22:13:43 nathanw Exp $	*/
      2      1.11       cgd 
      3       1.1       cgd /*
      4       1.9       cgd  * Copyright (c) 1989, 1993
      5       1.9       cgd  *	The Regents of the University of California.  All rights reserved.
      6       1.1       cgd  *
      7       1.1       cgd  * Redistribution and use in source and binary forms, with or without
      8       1.1       cgd  * modification, are permitted provided that the following conditions
      9       1.1       cgd  * are met:
     10       1.1       cgd  * 1. Redistributions of source code must retain the above copyright
     11       1.1       cgd  *    notice, this list of conditions and the following disclaimer.
     12       1.1       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     13       1.1       cgd  *    notice, this list of conditions and the following disclaimer in the
     14       1.1       cgd  *    documentation and/or other materials provided with the distribution.
     15       1.1       cgd  * 3. All advertising materials mentioning features or use of this software
     16       1.1       cgd  *    must display the following acknowledgement:
     17       1.1       cgd  *	This product includes software developed by the University of
     18       1.1       cgd  *	California, Berkeley and its contributors.
     19       1.1       cgd  * 4. Neither the name of the University nor the names of its contributors
     20       1.1       cgd  *    may be used to endorse or promote products derived from this software
     21       1.1       cgd  *    without specific prior written permission.
     22       1.1       cgd  *
     23       1.1       cgd  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     24       1.1       cgd  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     25       1.1       cgd  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     26       1.1       cgd  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     27       1.1       cgd  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     28       1.1       cgd  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     29       1.1       cgd  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     30       1.1       cgd  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     31       1.1       cgd  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     32       1.1       cgd  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     33       1.1       cgd  * SUCH DAMAGE.
     34       1.1       cgd  *
     35      1.25      fvdl  *	@(#)kern_ktrace.c	8.5 (Berkeley) 5/14/95
     36       1.1       cgd  */
     37  1.53.2.3   nathanw 
     38  1.53.2.3   nathanw #include <sys/cdefs.h>
     39  1.53.2.7   nathanw __KERNEL_RCSID(0, "$NetBSD: kern_ktrace.c,v 1.53.2.8 2002/11/11 22:13:43 nathanw Exp $");
     40      1.29   thorpej 
     41      1.29   thorpej #include "opt_ktrace.h"
     42       1.1       cgd 
     43       1.7   mycroft #include <sys/param.h>
     44      1.13       cgd #include <sys/systm.h>
     45       1.7   mycroft #include <sys/proc.h>
     46       1.7   mycroft #include <sys/file.h>
     47       1.7   mycroft #include <sys/namei.h>
     48       1.7   mycroft #include <sys/vnode.h>
     49       1.7   mycroft #include <sys/ktrace.h>
     50       1.7   mycroft #include <sys/malloc.h>
     51       1.7   mycroft #include <sys/syslog.h>
     52      1.28  christos #include <sys/filedesc.h>
     53      1.42  sommerfe #include <sys/ioctl.h>
     54       1.1       cgd 
     55      1.13       cgd #include <sys/mount.h>
     56  1.53.2.4   nathanw #include <sys/sa.h>
     57      1.13       cgd #include <sys/syscallargs.h>
     58      1.22  christos 
     59      1.51  jdolecek #ifdef KTRACE
     60      1.51  jdolecek 
/*
 * Forward declarations for the routines defined in this file that are
 * referenced before their definition.
 */
int	ktrace_common(struct proc *curp, int ops, int facs, int pid,
	    struct file *fp);
void	ktrinitheader(struct ktr_header *kth, struct proc *p, int type);
int	ktrops(struct proc *curp, struct proc *p, int ops, int facs,
	    struct file *fp);
int	ktrsetchildren(struct proc *curp, struct proc *top, int ops, int facs,
	    struct file *fp);
int	ktrwrite(struct proc *p, struct ktr_header *kth);
int	ktrcanset(struct proc *callp, struct proc *targetp);
int	ktrsamefile(struct file *f1, struct file *f2);
     69      1.44  sommerfe 
     70      1.44  sommerfe /*
     71      1.44  sommerfe  * "deep" compare of two files for the purposes of clearing a trace.
     72      1.44  sommerfe  * Returns true if they're the same open file, or if they point at the
     73      1.44  sommerfe  * same underlying vnode/socket.
     74      1.44  sommerfe  */
     75      1.44  sommerfe 
     76      1.44  sommerfe int
     77      1.47   thorpej ktrsamefile(struct file *f1, struct file *f2)
     78      1.44  sommerfe {
     79      1.44  sommerfe 	return ((f1 == f2) ||
     80      1.45  sommerfe 	    ((f1 != NULL) && (f2 != NULL) &&
     81      1.45  sommerfe 		(f1->f_type == f2->f_type) &&
     82      1.44  sommerfe 		(f1->f_data == f2->f_data)));
     83      1.44  sommerfe }
     84      1.22  christos 
     85      1.28  christos void
     86      1.47   thorpej ktrderef(struct proc *p)
     87      1.28  christos {
     88      1.42  sommerfe 	struct file *fp = p->p_tracep;
     89      1.42  sommerfe 	p->p_traceflag = 0;
     90      1.42  sommerfe 	if (fp == NULL)
     91      1.28  christos 		return;
     92      1.42  sommerfe 	FILE_USE(fp);
     93  1.53.2.8   nathanw 
     94  1.53.2.8   nathanw 	/*
     95  1.53.2.8   nathanw 	 * ktrace file descriptor can't be watched (are not visible to
     96  1.53.2.8   nathanw 	 * userspace), so no kqueue stuff here
     97  1.53.2.8   nathanw 	 */
     98      1.42  sommerfe 	closef(fp, NULL);
     99      1.28  christos 
    100      1.28  christos 	p->p_tracep = NULL;
    101      1.28  christos }
    102      1.28  christos 
    103      1.28  christos void
    104      1.47   thorpej ktradref(struct proc *p)
    105      1.28  christos {
    106      1.42  sommerfe 	struct file *fp = p->p_tracep;
    107      1.28  christos 
    108      1.42  sommerfe 	fp->f_count++;
    109      1.28  christos }
    110      1.28  christos 
    111      1.39   thorpej void
    112      1.47   thorpej ktrinitheader(struct ktr_header *kth, struct proc *p, int type)
    113       1.1       cgd {
    114       1.1       cgd 
    115      1.39   thorpej 	memset(kth, 0, sizeof(*kth));
    116       1.1       cgd 	kth->ktr_type = type;
    117       1.1       cgd 	microtime(&kth->ktr_time);
    118       1.1       cgd 	kth->ktr_pid = p->p_pid;
    119      1.32     perry 	memcpy(kth->ktr_comm, p->p_comm, MAXCOMLEN);
    120       1.1       cgd }
    121       1.1       cgd 
    122      1.17       cgd void
    123  1.53.2.5   nathanw ktrsyscall(struct proc *p, register_t code, register_t args[])
    124       1.1       cgd {
    125      1.39   thorpej 	struct ktr_header kth;
    126      1.39   thorpej 	struct ktr_syscall *ktp;
    127      1.17       cgd 	register_t *argp;
    128  1.53.2.5   nathanw 	int argsize;
    129  1.53.2.5   nathanw 	size_t len;
    130  1.53.2.8   nathanw 	u_int i;
    131  1.53.2.5   nathanw 
    132  1.53.2.5   nathanw 	argsize = p->p_emul->e_sysent[code].sy_narg * sizeof (register_t);
    133  1.53.2.5   nathanw 	len = sizeof(struct ktr_syscall) + argsize;
    134       1.1       cgd 
    135       1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    136      1.39   thorpej 	ktrinitheader(&kth, p, KTR_SYSCALL);
    137      1.39   thorpej 	ktp = malloc(len, M_TEMP, M_WAITOK);
    138       1.1       cgd 	ktp->ktr_code = code;
    139      1.17       cgd 	ktp->ktr_argsize = argsize;
    140      1.17       cgd 	argp = (register_t *)((char *)ktp + sizeof(struct ktr_syscall));
    141      1.31     perry 	for (i = 0; i < (argsize / sizeof(*argp)); i++)
    142       1.1       cgd 		*argp++ = args[i];
    143      1.39   thorpej 	kth.ktr_buf = (caddr_t)ktp;
    144      1.39   thorpej 	kth.ktr_len = len;
    145      1.42  sommerfe 	(void) ktrwrite(p, &kth);
    146      1.39   thorpej 	free(ktp, M_TEMP);
    147       1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    148       1.1       cgd }
    149       1.1       cgd 
    150      1.17       cgd void
    151      1.47   thorpej ktrsysret(struct proc *p, register_t code, int error, register_t retval)
    152       1.1       cgd {
    153      1.39   thorpej 	struct ktr_header kth;
    154       1.1       cgd 	struct ktr_sysret ktp;
    155       1.1       cgd 
    156       1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    157      1.39   thorpej 	ktrinitheader(&kth, p, KTR_SYSRET);
    158       1.1       cgd 	ktp.ktr_code = code;
    159      1.34    kleink 	ktp.ktr_eosys = 0;			/* XXX unused */
    160       1.1       cgd 	ktp.ktr_error = error;
    161       1.1       cgd 	ktp.ktr_retval = retval;		/* what about val2 ? */
    162       1.1       cgd 
    163      1.39   thorpej 	kth.ktr_buf = (caddr_t)&ktp;
    164      1.39   thorpej 	kth.ktr_len = sizeof(struct ktr_sysret);
    165       1.1       cgd 
    166      1.42  sommerfe 	(void) ktrwrite(p, &kth);
    167       1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    168       1.1       cgd }
    169       1.1       cgd 
    170      1.17       cgd void
    171      1.47   thorpej ktrnamei(struct proc *p, char *path)
    172       1.1       cgd {
    173      1.39   thorpej 	struct ktr_header kth;
    174       1.1       cgd 
    175       1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    176      1.39   thorpej 	ktrinitheader(&kth, p, KTR_NAMEI);
    177      1.39   thorpej 	kth.ktr_len = strlen(path);
    178      1.39   thorpej 	kth.ktr_buf = path;
    179      1.18  christos 
    180      1.42  sommerfe 	(void) ktrwrite(p, &kth);
    181      1.18  christos 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    182      1.18  christos }
    183      1.18  christos 
    184      1.18  christos void
    185      1.47   thorpej ktremul(struct proc *p)
    186      1.18  christos {
    187      1.39   thorpej 	struct ktr_header kth;
    188      1.50       scw 	const char *emul = p->p_emul->e_name;
    189      1.18  christos 
    190      1.18  christos 	p->p_traceflag |= KTRFAC_ACTIVE;
    191      1.39   thorpej 	ktrinitheader(&kth, p, KTR_EMUL);
    192      1.39   thorpej 	kth.ktr_len = strlen(emul);
    193      1.50       scw 	kth.ktr_buf = (caddr_t)emul;
    194       1.1       cgd 
    195      1.42  sommerfe 	(void) ktrwrite(p, &kth);
    196       1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    197       1.1       cgd }
    198       1.1       cgd 
    199      1.17       cgd void
    200      1.47   thorpej ktrgenio(struct proc *p, int fd, enum uio_rw rw, struct iovec *iov,
    201      1.47   thorpej     int len, int error)
    202       1.1       cgd {
    203      1.39   thorpej 	struct ktr_header kth;
    204      1.28  christos 	struct ktr_genio *ktp;
    205      1.28  christos 	caddr_t cp;
    206      1.28  christos 	int resid = len, cnt;
    207      1.39   thorpej 	int buflen;
    208      1.39   thorpej 
    209       1.1       cgd 	if (error)
    210       1.1       cgd 		return;
    211      1.39   thorpej 
    212       1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    213      1.39   thorpej 
    214      1.39   thorpej 	buflen = min(PAGE_SIZE, len + sizeof(struct ktr_genio));
    215      1.39   thorpej 
    216      1.39   thorpej 	ktrinitheader(&kth, p, KTR_GENIO);
    217      1.39   thorpej 	ktp = malloc(buflen, M_TEMP, M_WAITOK);
    218       1.1       cgd 	ktp->ktr_fd = fd;
    219       1.1       cgd 	ktp->ktr_rw = rw;
    220      1.39   thorpej 
    221      1.39   thorpej 	kth.ktr_buf = (caddr_t)ktp;
    222      1.39   thorpej 
    223      1.31     perry 	cp = (caddr_t)((char *)ktp + sizeof(struct ktr_genio));
    224      1.39   thorpej 	buflen -= sizeof(struct ktr_genio);
    225      1.39   thorpej 
    226       1.1       cgd 	while (resid > 0) {
    227  1.53.2.1   nathanw #if 0 /* XXX NJWLWP */
    228      1.46   thorpej 		KDASSERT(p->p_cpu != NULL);
    229      1.46   thorpej 		KDASSERT(p->p_cpu == curcpu());
    230  1.53.2.1   nathanw #endif
    231  1.53.2.1   nathanw 		/* XXX NJWLWP */
    232  1.53.2.1   nathanw 		if (curcpu()->ci_schedstate.spc_flags & SPCF_SHOULDYIELD)
    233      1.39   thorpej 			preempt(NULL);
    234      1.39   thorpej 
    235      1.39   thorpej 		cnt = min(iov->iov_len, buflen);
    236      1.39   thorpej 		if (cnt > resid)
    237       1.1       cgd 			cnt = resid;
    238      1.39   thorpej 		if (copyin(iov->iov_base, cp, cnt))
    239      1.39   thorpej 			break;
    240      1.39   thorpej 
    241      1.39   thorpej 		kth.ktr_len = cnt + sizeof(struct ktr_genio);
    242      1.39   thorpej 
    243      1.42  sommerfe 		if (__predict_false(ktrwrite(p, &kth) != 0))
    244      1.39   thorpej 			break;
    245      1.39   thorpej 
    246      1.39   thorpej 		iov->iov_base = (caddr_t)iov->iov_base + cnt;
    247      1.39   thorpej 		iov->iov_len -= cnt;
    248      1.39   thorpej 
    249      1.39   thorpej 		if (iov->iov_len == 0)
    250      1.39   thorpej 			iov++;
    251      1.39   thorpej 
    252       1.1       cgd 		resid -= cnt;
    253       1.1       cgd 	}
    254       1.1       cgd 
    255      1.39   thorpej 	free(ktp, M_TEMP);
    256       1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    257       1.1       cgd }
    258       1.1       cgd 
    259      1.17       cgd void
    260      1.47   thorpej ktrpsig(struct proc *p, int sig, sig_t action, sigset_t *mask, int code)
    261       1.1       cgd {
    262      1.39   thorpej 	struct ktr_header kth;
    263       1.1       cgd 	struct ktr_psig	kp;
    264       1.1       cgd 
    265       1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    266      1.39   thorpej 	ktrinitheader(&kth, p, KTR_PSIG);
    267       1.1       cgd 	kp.signo = (char)sig;
    268       1.1       cgd 	kp.action = action;
    269      1.33   mycroft 	kp.mask = *mask;
    270       1.1       cgd 	kp.code = code;
    271      1.39   thorpej 	kth.ktr_buf = (caddr_t)&kp;
    272      1.39   thorpej 	kth.ktr_len = sizeof(struct ktr_psig);
    273       1.1       cgd 
    274      1.42  sommerfe 	(void) ktrwrite(p, &kth);
    275       1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    276       1.9       cgd }
    277       1.9       cgd 
    278      1.17       cgd void
    279      1.47   thorpej ktrcsw(struct proc *p, int out, int user)
    280       1.9       cgd {
    281      1.39   thorpej 	struct ktr_header kth;
    282      1.39   thorpej 	struct ktr_csw kc;
    283       1.9       cgd 
    284       1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    285      1.39   thorpej 	ktrinitheader(&kth, p, KTR_CSW);
    286       1.9       cgd 	kc.out = out;
    287       1.9       cgd 	kc.user = user;
    288      1.39   thorpej 	kth.ktr_buf = (caddr_t)&kc;
    289      1.39   thorpej 	kth.ktr_len = sizeof(struct ktr_csw);
    290       1.9       cgd 
    291      1.42  sommerfe 	(void) ktrwrite(p, &kth);
    292       1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    293       1.1       cgd }
    294       1.1       cgd 
    295      1.51  jdolecek void
    296      1.51  jdolecek ktruser(p, id, addr, len, ustr)
    297      1.51  jdolecek 	struct proc *p;
    298      1.51  jdolecek 	const char *id;
    299      1.51  jdolecek 	void *addr;
    300      1.51  jdolecek 	size_t len;
    301      1.51  jdolecek 	int ustr;
    302      1.51  jdolecek {
    303      1.51  jdolecek 	struct ktr_header kth;
    304      1.51  jdolecek 	struct ktr_user *ktp;
    305      1.51  jdolecek 	caddr_t user_dta;
    306      1.51  jdolecek 
    307      1.51  jdolecek 	p->p_traceflag |= KTRFAC_ACTIVE;
    308      1.51  jdolecek 	ktrinitheader(&kth, p, KTR_USER);
    309      1.51  jdolecek 	ktp = malloc(sizeof(struct ktr_user) + len, M_TEMP, M_WAITOK);
    310      1.51  jdolecek 	if (ustr) {
    311      1.51  jdolecek 		if (copyinstr(id, ktp->ktr_id, KTR_USER_MAXIDLEN, NULL) != 0)
    312      1.51  jdolecek 			ktp->ktr_id[0] = '\0';
    313      1.51  jdolecek 	} else
    314      1.51  jdolecek 		strncpy(ktp->ktr_id, id, KTR_USER_MAXIDLEN);
    315      1.51  jdolecek 	ktp->ktr_id[KTR_USER_MAXIDLEN-1] = '\0';
    316      1.51  jdolecek 
    317      1.51  jdolecek 	user_dta = (caddr_t) ((char *)ktp + sizeof(struct ktr_user));
    318      1.51  jdolecek 	if (copyin(addr, (void *) user_dta, len) != 0)
    319      1.51  jdolecek 		len = 0;
    320      1.51  jdolecek 
    321      1.51  jdolecek 	kth.ktr_buf = (void *)ktp;
    322      1.51  jdolecek 	kth.ktr_len = sizeof(struct ktr_user) + len;
    323      1.51  jdolecek 	(void) ktrwrite(p, &kth);
    324      1.51  jdolecek 
    325      1.51  jdolecek 	free(ktp, M_TEMP);
    326      1.51  jdolecek 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    327      1.51  jdolecek 
    328      1.51  jdolecek }
    329      1.51  jdolecek 
    330       1.1       cgd /* Interface and common routines */
    331       1.1       cgd 
    332      1.17       cgd int
    333      1.47   thorpej ktrace_common(struct proc *curp, int ops, int facs, int pid, struct file *fp)
    334      1.28  christos {
    335      1.42  sommerfe 	int ret = 0;
    336      1.42  sommerfe 	int error = 0;
    337      1.42  sommerfe 	int one = 1;
    338      1.42  sommerfe 	int descend;
    339      1.28  christos 	struct proc *p;
    340      1.28  christos 	struct pgrp *pg;
    341      1.28  christos 
    342      1.28  christos 	curp->p_traceflag |= KTRFAC_ACTIVE;
    343      1.42  sommerfe 	descend = ops & KTRFLAG_DESCEND;
    344      1.42  sommerfe 	facs = facs & ~((unsigned) KTRFAC_ROOT);
    345      1.28  christos 
    346      1.28  christos 	/*
    347      1.28  christos 	 * Clear all uses of the tracefile
    348      1.28  christos 	 */
    349      1.28  christos 	if (KTROP(ops) == KTROP_CLEARFILE) {
    350      1.37   thorpej 		proclist_lock_read();
    351      1.39   thorpej 		for (p = LIST_FIRST(&allproc); p != NULL;
    352      1.39   thorpej 		     p = LIST_NEXT(p, p_list)) {
    353      1.44  sommerfe 			if (ktrsamefile(p->p_tracep, fp)) {
    354      1.28  christos 				if (ktrcanset(curp, p))
    355      1.28  christos 					ktrderef(p);
    356      1.28  christos 				else
    357      1.28  christos 					error = EPERM;
    358      1.28  christos 			}
    359      1.28  christos 		}
    360      1.36   thorpej 		proclist_unlock_read();
    361      1.28  christos 		goto done;
    362      1.28  christos 	}
    363      1.42  sommerfe 
    364      1.42  sommerfe 	/*
    365      1.42  sommerfe 	 * Mark fp non-blocking, to avoid problems from possible deadlocks.
    366      1.42  sommerfe 	 */
    367      1.42  sommerfe 
    368      1.43  sommerfe 	if (fp != NULL) {
    369      1.43  sommerfe 		fp->f_flag |= FNONBLOCK;
    370      1.43  sommerfe 		(*fp->f_ops->fo_ioctl)(fp, FIONBIO, (caddr_t)&one, curp);
    371      1.43  sommerfe 	}
    372      1.42  sommerfe 
    373      1.28  christos 	/*
    374      1.28  christos 	 * need something to (un)trace (XXX - why is this here?)
    375      1.28  christos 	 */
    376      1.28  christos 	if (!facs) {
    377      1.28  christos 		error = EINVAL;
    378      1.28  christos 		goto done;
    379      1.28  christos 	}
    380      1.28  christos 	/*
    381      1.28  christos 	 * do it
    382      1.28  christos 	 */
    383      1.42  sommerfe 	if (pid < 0) {
    384      1.28  christos 		/*
    385      1.28  christos 		 * by process group
    386      1.28  christos 		 */
    387      1.42  sommerfe 		pg = pgfind(-pid);
    388      1.28  christos 		if (pg == NULL) {
    389      1.28  christos 			error = ESRCH;
    390      1.28  christos 			goto done;
    391      1.28  christos 		}
    392      1.39   thorpej 		for (p = LIST_FIRST(&pg->pg_members); p != NULL;
    393      1.39   thorpej 		     p = LIST_NEXT(p, p_pglist)) {
    394      1.28  christos 			if (descend)
    395      1.28  christos 				ret |= ktrsetchildren(curp, p, ops, facs, fp);
    396      1.28  christos 			else
    397      1.28  christos 				ret |= ktrops(curp, p, ops, facs, fp);
    398      1.39   thorpej 		}
    399      1.28  christos 
    400      1.28  christos 	} else {
    401      1.28  christos 		/*
    402      1.28  christos 		 * by pid
    403      1.28  christos 		 */
    404      1.42  sommerfe 		p = pfind(pid);
    405      1.28  christos 		if (p == NULL) {
    406      1.28  christos 			error = ESRCH;
    407      1.28  christos 			goto done;
    408      1.28  christos 		}
    409      1.28  christos 		if (descend)
    410      1.28  christos 			ret |= ktrsetchildren(curp, p, ops, facs, fp);
    411      1.28  christos 		else
    412      1.28  christos 			ret |= ktrops(curp, p, ops, facs, fp);
    413      1.28  christos 	}
    414      1.28  christos 	if (!ret)
    415      1.28  christos 		error = EPERM;
    416      1.28  christos done:
    417      1.28  christos 	curp->p_traceflag &= ~KTRFAC_ACTIVE;
    418      1.28  christos 	return (error);
    419      1.28  christos }
    420      1.28  christos 
    421      1.28  christos /*
    422      1.28  christos  * ktrace system call
    423      1.28  christos  */
    424      1.28  christos /* ARGSUSED */
    425      1.28  christos int
    426  1.53.2.1   nathanw sys_fktrace(struct lwp *l, void *v, register_t *retval)
    427      1.42  sommerfe {
    428      1.42  sommerfe 	struct sys_fktrace_args /* {
    429      1.42  sommerfe 		syscallarg(int) fd;
    430      1.42  sommerfe 		syscallarg(int) ops;
    431      1.42  sommerfe 		syscallarg(int) facs;
    432      1.42  sommerfe 		syscallarg(int) pid;
    433      1.42  sommerfe 	} */ *uap = v;
    434  1.53.2.1   nathanw 	struct proc *curp = l->l_proc;
    435      1.42  sommerfe 	struct file *fp = NULL;
    436      1.42  sommerfe 	struct filedesc *fdp = curp->p_fd;
    437      1.42  sommerfe 
    438  1.53.2.2   nathanw 	if ((fp = fd_getfile(fdp, SCARG(uap, fd))) == NULL)
    439  1.53.2.2   nathanw 		return (EBADF);
    440  1.53.2.2   nathanw 
    441  1.53.2.2   nathanw 	if ((fp->f_flag & FWRITE) == 0)
    442      1.42  sommerfe 		return (EBADF);
    443      1.42  sommerfe 
    444      1.42  sommerfe 	return ktrace_common(curp, SCARG(uap, ops),
    445      1.42  sommerfe 	    SCARG(uap, facs), SCARG(uap, pid), fp);
    446      1.42  sommerfe }
    447      1.42  sommerfe 
    448      1.42  sommerfe /*
    449      1.42  sommerfe  * ktrace system call
    450      1.42  sommerfe  */
    451      1.42  sommerfe /* ARGSUSED */
    452      1.42  sommerfe int
    453  1.53.2.1   nathanw sys_ktrace(struct lwp *l, void *v, register_t *retval)
    454      1.19   thorpej {
    455      1.28  christos 	struct sys_ktrace_args /* {
    456      1.24   mycroft 		syscallarg(const char *) fname;
    457      1.13       cgd 		syscallarg(int) ops;
    458      1.13       cgd 		syscallarg(int) facs;
    459      1.13       cgd 		syscallarg(int) pid;
    460      1.19   thorpej 	} */ *uap = v;
    461  1.53.2.1   nathanw 	struct proc *curp = l->l_proc;
    462      1.28  christos 	struct vnode *vp = NULL;
    463      1.42  sommerfe 	struct file *fp = NULL;
    464      1.42  sommerfe 	int fd;
    465      1.42  sommerfe 	int ops = SCARG(uap, ops);
    466       1.1       cgd 	int error = 0;
    467       1.1       cgd 	struct nameidata nd;
    468       1.1       cgd 
    469      1.42  sommerfe 	ops = KTROP(ops) | (ops & KTRFLAG_DESCEND);
    470      1.42  sommerfe 
    471       1.9       cgd 	curp->p_traceflag |= KTRFAC_ACTIVE;
    472       1.1       cgd 	if (ops != KTROP_CLEAR) {
    473       1.1       cgd 		/*
    474       1.1       cgd 		 * an operation which requires a file argument.
    475       1.1       cgd 		 */
    476      1.13       cgd 		NDINIT(&nd, LOOKUP, FOLLOW, UIO_USERSPACE, SCARG(uap, fname),
    477      1.13       cgd 		    curp);
    478      1.22  christos 		if ((error = vn_open(&nd, FREAD|FWRITE, 0)) != 0) {
    479       1.9       cgd 			curp->p_traceflag &= ~KTRFAC_ACTIVE;
    480       1.1       cgd 			return (error);
    481       1.9       cgd 		}
    482       1.1       cgd 		vp = nd.ni_vp;
    483      1.25      fvdl 		VOP_UNLOCK(vp, 0);
    484       1.1       cgd 		if (vp->v_type != VREG) {
    485       1.1       cgd 			(void) vn_close(vp, FREAD|FWRITE, curp->p_ucred, curp);
    486       1.9       cgd 			curp->p_traceflag &= ~KTRFAC_ACTIVE;
    487       1.1       cgd 			return (EACCES);
    488       1.1       cgd 		}
    489       1.1       cgd 		/*
    490      1.42  sommerfe 		 * XXX This uses up a file descriptor slot in the
    491      1.42  sommerfe 		 * tracing process for the duration of this syscall.
    492      1.42  sommerfe 		 * This is not expected to be a problem.  If
    493      1.42  sommerfe 		 * falloc(NULL, ...) DTRT we could skip that part, but
    494      1.42  sommerfe 		 * that would require changing its interface to allow
    495      1.42  sommerfe 		 * the caller to pass in a ucred..
    496      1.42  sommerfe 		 *
    497      1.42  sommerfe 		 * This will FILE_USE the fp it returns, if any.
    498      1.42  sommerfe 		 * Keep it in use until we return.
    499       1.1       cgd 		 */
    500      1.42  sommerfe 		if ((error = falloc(curp, &fp, &fd)) != 0)
    501       1.1       cgd 			goto done;
    502      1.42  sommerfe 
    503      1.42  sommerfe 		fp->f_flag = FWRITE|FAPPEND;
    504      1.42  sommerfe 		fp->f_type = DTYPE_VNODE;
    505      1.42  sommerfe 		fp->f_ops = &vnops;
    506      1.42  sommerfe 		fp->f_data = (caddr_t)vp;
    507  1.53.2.2   nathanw 		FILE_SET_MATURE(fp);
    508      1.42  sommerfe 		vp = NULL;
    509      1.42  sommerfe 	}
    510      1.42  sommerfe 	error = ktrace_common(curp, SCARG(uap, ops), SCARG(uap, facs),
    511      1.42  sommerfe 	    SCARG(uap, pid), fp);
    512      1.42  sommerfe done:
    513       1.1       cgd 	if (vp != NULL)
    514       1.1       cgd 		(void) vn_close(vp, FWRITE, curp->p_ucred, curp);
    515      1.42  sommerfe 	if (fp != NULL) {
    516      1.44  sommerfe 		FILE_UNUSE(fp, curp);	/* release file */
    517      1.42  sommerfe 		fdrelease(curp, fd); 	/* release fd table slot */
    518      1.42  sommerfe 	}
    519       1.1       cgd 	return (error);
    520       1.1       cgd }
    521       1.1       cgd 
    522       1.4    andrew int
    523      1.47   thorpej ktrops(struct proc *curp, struct proc *p, int ops, int facs, struct file *fp)
    524       1.1       cgd {
    525       1.1       cgd 
    526       1.1       cgd 	if (!ktrcanset(curp, p))
    527       1.1       cgd 		return (0);
    528      1.28  christos 	if (KTROP(ops) == KTROP_SET) {
    529      1.42  sommerfe 		if (p->p_tracep != fp) {
    530       1.1       cgd 			/*
    531       1.1       cgd 			 * if trace file already in use, relinquish
    532       1.1       cgd 			 */
    533      1.28  christos 			ktrderef(p);
    534      1.42  sommerfe 			p->p_tracep = fp;
    535      1.28  christos 			ktradref(p);
    536       1.1       cgd 		}
    537       1.1       cgd 		p->p_traceflag |= facs;
    538       1.1       cgd 		if (curp->p_ucred->cr_uid == 0)
    539       1.1       cgd 			p->p_traceflag |= KTRFAC_ROOT;
    540       1.1       cgd 	} else {
    541       1.1       cgd 		/* KTROP_CLEAR */
    542       1.1       cgd 		if (((p->p_traceflag &= ~facs) & KTRFAC_MASK) == 0) {
    543       1.1       cgd 			/* no more tracing */
    544      1.28  christos 			ktrderef(p);
    545       1.1       cgd 		}
    546       1.1       cgd 	}
    547      1.21  christos 
    548      1.21  christos 	/*
    549      1.21  christos 	 * Emit an emulation record, every time there is a ktrace
    550      1.21  christos 	 * change/attach request.
    551      1.21  christos 	 */
    552      1.21  christos 	if (KTRPOINT(p, KTR_EMUL))
    553      1.42  sommerfe 		ktremul(p);
    554      1.49    martin #ifdef __HAVE_SYSCALL_INTERN
    555      1.48   mycroft 	(*p->p_emul->e_syscall_intern)(p);
    556      1.49    martin #endif
    557       1.1       cgd 
    558       1.1       cgd 	return (1);
    559       1.1       cgd }
    560       1.1       cgd 
    561      1.22  christos int
    562      1.47   thorpej ktrsetchildren(struct proc *curp, struct proc *top, int ops, int facs,
    563      1.47   thorpej     struct file *fp)
    564       1.1       cgd {
    565      1.28  christos 	struct proc *p;
    566      1.28  christos 	int ret = 0;
    567       1.1       cgd 
    568       1.1       cgd 	p = top;
    569       1.1       cgd 	for (;;) {
    570      1.42  sommerfe 		ret |= ktrops(curp, p, ops, facs, fp);
    571       1.1       cgd 		/*
    572       1.1       cgd 		 * If this process has children, descend to them next,
    573       1.1       cgd 		 * otherwise do any siblings, and if done with this level,
    574       1.1       cgd 		 * follow back up the tree (but not past top).
    575       1.1       cgd 		 */
    576      1.39   thorpej 		if (LIST_FIRST(&p->p_children) != NULL)
    577      1.39   thorpej 			p = LIST_FIRST(&p->p_children);
    578       1.1       cgd 		else for (;;) {
    579       1.1       cgd 			if (p == top)
    580       1.1       cgd 				return (ret);
    581      1.39   thorpej 			if (LIST_NEXT(p, p_sibling) != NULL) {
    582      1.39   thorpej 				p = LIST_NEXT(p, p_sibling);
    583       1.1       cgd 				break;
    584       1.1       cgd 			}
    585      1.12   mycroft 			p = p->p_pptr;
    586       1.1       cgd 		}
    587       1.1       cgd 	}
    588       1.1       cgd 	/*NOTREACHED*/
    589       1.1       cgd }
    590       1.1       cgd 
    591      1.39   thorpej int
    592      1.47   thorpej ktrwrite(struct proc *p, struct ktr_header *kth)
    593       1.1       cgd {
    594       1.1       cgd 	struct uio auio;
    595       1.1       cgd 	struct iovec aiov[2];
    596      1.42  sommerfe 	int error, tries;
    597      1.42  sommerfe 	struct file *fp = p->p_tracep;
    598       1.1       cgd 
    599      1.42  sommerfe 	if (fp == NULL)
    600      1.42  sommerfe 		return 0;
    601      1.42  sommerfe 
    602       1.1       cgd 	auio.uio_iov = &aiov[0];
    603       1.1       cgd 	auio.uio_offset = 0;
    604       1.1       cgd 	auio.uio_segflg = UIO_SYSSPACE;
    605       1.1       cgd 	auio.uio_rw = UIO_WRITE;
    606       1.1       cgd 	aiov[0].iov_base = (caddr_t)kth;
    607       1.1       cgd 	aiov[0].iov_len = sizeof(struct ktr_header);
    608       1.1       cgd 	auio.uio_resid = sizeof(struct ktr_header);
    609       1.1       cgd 	auio.uio_iovcnt = 1;
    610       1.1       cgd 	auio.uio_procp = (struct proc *)0;
    611       1.1       cgd 	if (kth->ktr_len > 0) {
    612       1.1       cgd 		auio.uio_iovcnt++;
    613       1.1       cgd 		aiov[1].iov_base = kth->ktr_buf;
    614       1.1       cgd 		aiov[1].iov_len = kth->ktr_len;
    615       1.1       cgd 		auio.uio_resid += kth->ktr_len;
    616       1.1       cgd 	}
    617      1.28  christos 
    618      1.42  sommerfe 	FILE_USE(fp);
    619      1.42  sommerfe 
    620      1.42  sommerfe 	tries = 0;
    621      1.42  sommerfe 	do {
    622      1.30   thorpej 		error = (*fp->f_ops->fo_write)(fp, &fp->f_offset, &auio,
    623      1.30   thorpej 		    fp->f_cred, FOF_UPDATE_OFFSET);
    624      1.42  sommerfe 		tries++;
    625      1.42  sommerfe 		if (error == EWOULDBLOCK)
    626      1.42  sommerfe 		  	yield();
    627      1.42  sommerfe 	} while ((error == EWOULDBLOCK) && (tries < 3));
    628      1.42  sommerfe 	FILE_UNUSE(fp, NULL);
    629      1.28  christos 
    630      1.40   thorpej 	if (__predict_true(error == 0))
    631      1.39   thorpej 		return (0);
    632       1.1       cgd 	/*
    633      1.38   darrenr 	 * If error encountered, give up tracing on this vnode.  Don't report
    634      1.38   darrenr 	 * EPIPE as this can easily happen with fktrace()/ktruss.
    635       1.1       cgd 	 */
    636      1.38   darrenr 	if (error != EPIPE)
    637      1.38   darrenr 		log(LOG_NOTICE,
    638      1.38   darrenr 		    "ktrace write failed, errno %d, tracing stopped\n",
    639      1.38   darrenr 		    error);
    640      1.37   thorpej 	proclist_lock_read();
    641      1.39   thorpej 	for (p = LIST_FIRST(&allproc); p != NULL; p = LIST_NEXT(p, p_list)) {
    642      1.44  sommerfe 		if (ktrsamefile(p->p_tracep, fp))
    643      1.28  christos 			ktrderef(p);
    644       1.1       cgd 	}
    645      1.36   thorpej 	proclist_unlock_read();
    646      1.39   thorpej 
    647      1.39   thorpej 	return (error);
    648       1.1       cgd }
    649       1.1       cgd 
    650       1.1       cgd /*
    651       1.1       cgd  * Return true if caller has permission to set the ktracing state
    652       1.1       cgd  * of target.  Essentially, the target can't possess any
    653       1.1       cgd  * more permissions than the caller.  KTRFAC_ROOT signifies that
    654       1.1       cgd  * root previously set the tracing status on the target process, and
    655       1.1       cgd  * so, only root may further change it.
    656       1.1       cgd  *
    657       1.1       cgd  * TODO: check groups.  use caller effective gid.
    658       1.1       cgd  */
    659      1.22  christos int
    660      1.47   thorpej ktrcanset(struct proc *callp, struct proc *targetp)
    661       1.1       cgd {
    662      1.28  christos 	struct pcred *caller = callp->p_cred;
    663      1.28  christos 	struct pcred *target = targetp->p_cred;
    664       1.1       cgd 
    665       1.1       cgd 	if ((caller->pc_ucred->cr_uid == target->p_ruid &&
    666       1.1       cgd 	     target->p_ruid == target->p_svuid &&
    667       1.1       cgd 	     caller->p_rgid == target->p_rgid &&	/* XXX */
    668       1.1       cgd 	     target->p_rgid == target->p_svgid &&
    669  1.53.2.7   nathanw 	     (targetp->p_traceflag & KTRFAC_ROOT) == 0 &&
    670  1.53.2.7   nathanw 	     (targetp->p_flag & P_SUGID) == 0) ||
    671       1.1       cgd 	     caller->pc_ucred->cr_uid == 0)
    672       1.1       cgd 		return (1);
    673       1.1       cgd 
    674       1.1       cgd 	return (0);
    675       1.1       cgd }
    676      1.47   thorpej #endif /* KTRACE */
    677      1.51  jdolecek 
    678      1.51  jdolecek /*
    679      1.51  jdolecek  * Put user defined entry to ktrace records.
    680      1.51  jdolecek  */
    681      1.51  jdolecek int
    682  1.53.2.1   nathanw sys_utrace(l, v, retval)
    683  1.53.2.1   nathanw 	struct lwp *l;
    684      1.51  jdolecek 	void *v;
    685      1.51  jdolecek 	register_t *retval;
    686      1.51  jdolecek {
    687      1.51  jdolecek #ifdef KTRACE
    688      1.51  jdolecek 	struct sys_utrace_args /* {
    689      1.52  jdolecek 		syscallarg(const char *) label;
    690      1.51  jdolecek 		syscallarg(void *) addr;
    691      1.51  jdolecek 		syscallarg(size_t) len;
    692      1.51  jdolecek 	} */ *uap = v;
    693  1.53.2.1   nathanw 	struct proc *p = l->l_proc;
    694      1.51  jdolecek 	if (!KTRPOINT(p, KTR_USER))
    695      1.51  jdolecek 		return (0);
    696      1.53  jdolecek 
    697      1.53  jdolecek 	if (SCARG(uap, len) > KTR_USER_MAXLEN)
    698      1.53  jdolecek 		return (EINVAL);
    699      1.51  jdolecek 
    700      1.52  jdolecek 	ktruser(p, SCARG(uap, label), SCARG(uap, addr), SCARG(uap, len), 1);
    701      1.51  jdolecek 
    702      1.51  jdolecek 	return (0);
    703      1.51  jdolecek #else /* !KTRACE */
    704      1.51  jdolecek 	return ENOSYS;
    705      1.51  jdolecek #endif /* KTRACE */
    706      1.51  jdolecek }
    707