Home | History | Annotate | Line # | Download | only in kern
kern_ktrace.c revision 1.93
      1  1.93     enami /*	$NetBSD: kern_ktrace.c,v 1.93 2004/09/22 22:15:03 enami Exp $	*/
      2  1.11       cgd 
      3   1.1       cgd /*
      4   1.9       cgd  * Copyright (c) 1989, 1993
      5   1.9       cgd  *	The Regents of the University of California.  All rights reserved.
      6   1.1       cgd  *
      7   1.1       cgd  * Redistribution and use in source and binary forms, with or without
      8   1.1       cgd  * modification, are permitted provided that the following conditions
      9   1.1       cgd  * are met:
     10   1.1       cgd  * 1. Redistributions of source code must retain the above copyright
     11   1.1       cgd  *    notice, this list of conditions and the following disclaimer.
     12   1.1       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     13   1.1       cgd  *    notice, this list of conditions and the following disclaimer in the
     14   1.1       cgd  *    documentation and/or other materials provided with the distribution.
     15  1.77       agc  * 3. Neither the name of the University nor the names of its contributors
     16   1.1       cgd  *    may be used to endorse or promote products derived from this software
     17   1.1       cgd  *    without specific prior written permission.
     18   1.1       cgd  *
     19   1.1       cgd  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     20   1.1       cgd  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     21   1.1       cgd  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     22   1.1       cgd  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     23   1.1       cgd  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     24   1.1       cgd  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     25   1.1       cgd  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     26   1.1       cgd  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     27   1.1       cgd  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     28   1.1       cgd  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     29   1.1       cgd  * SUCH DAMAGE.
     30   1.1       cgd  *
     31  1.25      fvdl  *	@(#)kern_ktrace.c	8.5 (Berkeley) 5/14/95
     32   1.1       cgd  */
     33  1.55     lukem 
     34  1.55     lukem #include <sys/cdefs.h>
     35  1.93     enami __KERNEL_RCSID(0, "$NetBSD: kern_ktrace.c,v 1.93 2004/09/22 22:15:03 enami Exp $");
     36  1.29   thorpej 
     37  1.29   thorpej #include "opt_ktrace.h"
     38  1.62      manu #include "opt_compat_mach.h"
     39   1.1       cgd 
     40   1.7   mycroft #include <sys/param.h>
     41  1.13       cgd #include <sys/systm.h>
     42   1.7   mycroft #include <sys/proc.h>
     43   1.7   mycroft #include <sys/file.h>
     44   1.7   mycroft #include <sys/namei.h>
     45   1.7   mycroft #include <sys/vnode.h>
     46  1.93     enami #include <sys/kernel.h>
     47  1.93     enami #include <sys/kthread.h>
     48   1.7   mycroft #include <sys/ktrace.h>
     49   1.7   mycroft #include <sys/malloc.h>
     50   1.7   mycroft #include <sys/syslog.h>
     51  1.28  christos #include <sys/filedesc.h>
     52  1.42  sommerfe #include <sys/ioctl.h>
     53  1.93     enami #include <sys/callout.h>
     54   1.1       cgd 
     55  1.13       cgd #include <sys/mount.h>
     56  1.67   thorpej #include <sys/sa.h>
     57  1.13       cgd #include <sys/syscallargs.h>
     58  1.22  christos 
     59  1.51  jdolecek #ifdef KTRACE
     60  1.51  jdolecek 
     61  1.93     enami /*
     62  1.93     enami  * XXX:
     63  1.93     enami  *	- need better error reporting?
     64  1.93     enami  *	- p->p_tracep access lock.  lock p_lock, lock ktd if !NULL, inc ref.
     65  1.93     enami  *	- userland utility to sort ktrace.out by timestamp.
     66  1.93     enami  *	- keep minimum information in ktrace_entry when rest of alloc failed.
     67  1.93     enami  *	- enlarge ktrace_entry so that small entry won't require additional
     68  1.93     enami  *	  alloc?
     69  1.93     enami  *	- per trace control of configurable parameters.
     70  1.93     enami  */
     71  1.93     enami 
/*
 * One queued trace record: the fixed ktrace header plus a pointer to
 * its separately allocated (M_KTRACE) payload.  Entries themselves come
 * from kte_pool.
 */
struct ktrace_entry {
	TAILQ_ENTRY(ktrace_entry) kte_list;	/* link on ktr_desc.ktd_queue */
	struct ktr_header kte_kth;	/* header; ktr_len is the payload size */
	void *kte_buf;			/* ktr_buf */
};
     77  1.93     enami 
/*
 * Per-trace-file descriptor.  Traced processes point at one of these
 * through p_tracep and append entries to ktd_queue.  The mutable
 * fields are accessed with ktd_slock held.
 */
struct ktr_desc {
	TAILQ_ENTRY(ktr_desc) ktd_list;	/* link on the global ktdq list */
	int ktd_flags;
#define	KTDF_WAIT		0x0001	/* a tracee is sleeping in "ktrsync" */
#define	KTDF_DONE		0x0002	/* last reference was released */
#define	KTDF_BLOCKING		0x0004	/* a sync timed out; stop syncing */
#define	KTDF_INTERACTIVE	0x0008	/* use ktd_intrwakdl as wakeup delay */
	int ktd_error;			/* OR of the KTDE_* bits seen so far */
#define	KTDE_ENOMEM		0x0001	/* an allocation failed */
#define	KTDE_ENOSPC		0x0002	/* queue was over ktd_maxentry */
	int ktd_errcnt;			/* # of errors logged */
	int ktd_ref;			/* # of reference */
	int ktd_qcount;			/* # of entry in the queue */

	/*
	 * Params to control behaviour.
	 */
	int ktd_delayqcnt;		/* # of entry allowed to delay */
	int ktd_wakedelay;		/* delay of wakeup in *tick* */
	int ktd_intrwakdl;		/* ditto, but when interactive */

	struct file *ktd_fp;		/* trace output file */
	struct proc *ktd_proc;		/* our kernel thread */
	TAILQ_HEAD(, ktrace_entry) ktd_queue;	/* entries not yet written */
	struct callout ktd_wakch;	/* delayed wakeup */
	struct simplelock ktd_slock;	/* protects this descriptor */
};
    105  1.93     enami 
/*
 * Forward declarations of the file-local helpers.
 */
static void	ktrinitheader(struct ktr_header *, struct proc *, int);
static void	ktrwrite(struct ktr_desc *, struct ktrace_entry *);
static int	ktrace_common(struct proc *, int, int, int, struct file *);
static int	ktrops(struct proc *, struct proc *, int, int,
		    struct ktr_desc *);
static int	ktrsetchildren(struct proc *, struct proc *, int, int,
		    struct ktr_desc *);
static int	ktrcanset(struct proc *, struct proc *);
static int	ktrsamefile(struct file *, struct file *);

static struct ktr_desc *
		ktd_lookup(struct file *);
static void	ktdrel(struct ktr_desc *);
static void	ktdref(struct ktr_desc *);
static void	ktraddentry(struct proc *, struct ktrace_entry *, int);
/*
 * Flags for ktraddentry (3rd arg):
 *	KTA_NOWAIT	never sleep to synchronize with the writer.
 *	KTA_WAITOK	the caller may sleep until the writer catches up.
 *	KTA_LARGE	passed for genio records; the test for it in
 *			ktraddentry is currently commented out.
 */
#define	KTA_NOWAIT		0x0000
#define	KTA_WAITOK		0x0001
#define	KTA_LARGE		0x0002
static void	ktefree(struct ktrace_entry *);
static void	ktd_logerrl(struct ktr_desc *, int);
static void	ktd_logerr(struct proc *, int);
static void	ktrace_thread(void *);
    129  1.93     enami 
/*
 * Default values.
 */
#define	KTD_MAXENTRY		1000	/* XXX: tune */
#define	KTD_TIMEOUT		5	/* XXX: tune */
#define	KTD_DELAYQCNT		100	/* XXX: tune */
#define	KTD_WAKEDELAY		5000	/* XXX: tune */
#define	KTD_INTRWAKDL		100	/* XXX: tune */

/*
 * Patchable variables.
 */
int ktd_maxentry = KTD_MAXENTRY;	/* max # of entry in the queue */
int ktd_timeout = KTD_TIMEOUT;		/* timeout in seconds */
int ktd_delayqcnt = KTD_DELAYQCNT;	/* # of entry allowed to delay */
int ktd_wakedelay = KTD_WAKEDELAY;	/* delay of wakeup in *ms* */
int ktd_intrwakdl = KTD_INTRWAKDL;	/* ditto, but when interactive */

/* Global list of trace descriptors; ktd_lookup() walks it under ktdq_slock. */
static struct simplelock ktdq_slock = SIMPLELOCK_INITIALIZER;
static TAILQ_HEAD(, ktr_desc) ktdq = TAILQ_HEAD_INITIALIZER(ktdq);

/* Malloc type for record payloads and pool for struct ktrace_entry. */
MALLOC_DEFINE(M_KTRACE, "ktrace", "ktrace data buffer");
POOL_INIT(kte_pool, sizeof(struct ktrace_entry), 0, 0, 0,
    "ktepl", &pool_allocator_nointr);
    154  1.93     enami 
    155  1.93     enami static __inline void
    156  1.93     enami ktd_wakeup(struct ktr_desc *ktd)
    157  1.93     enami {
    158  1.93     enami 
    159  1.93     enami 	callout_stop(&ktd->ktd_wakch);
    160  1.93     enami 	wakeup(ktd);
    161  1.93     enami }
    162  1.93     enami 
    163  1.93     enami static void
    164  1.93     enami ktd_logerrl(struct ktr_desc *ktd, int error)
    165  1.93     enami {
    166  1.93     enami 
    167  1.93     enami 	ktd->ktd_error |= error;
    168  1.93     enami 	ktd->ktd_errcnt++;
    169  1.93     enami }
    170  1.93     enami 
    171  1.93     enami static void
    172  1.93     enami ktd_logerr(struct proc *p, int error)
    173  1.93     enami {
    174  1.93     enami 	struct ktr_desc *ktd = p->p_tracep;
    175  1.93     enami 
    176  1.93     enami 	if (ktd == NULL)
    177  1.93     enami 		return;
    178  1.93     enami 
    179  1.93     enami 	simple_lock(&ktd->ktd_slock);
    180  1.93     enami 	ktd_logerrl(ktd, error);
    181  1.93     enami 	simple_unlock(&ktd->ktd_slock);
    182  1.93     enami }
    183  1.93     enami 
    184  1.93     enami /*
    185  1.93     enami  * Release a reference.  Called with ktd_slock held.
    186  1.93     enami  */
    187  1.93     enami void
    188  1.93     enami ktdrel(struct ktr_desc *ktd)
    189  1.93     enami {
    190  1.93     enami 
    191  1.93     enami 	KDASSERT(ktd->ktd_ref != 0);
    192  1.93     enami 	KASSERT(ktd->ktd_ref > 0);
    193  1.93     enami 	if (--ktd->ktd_ref <= 0) {
    194  1.93     enami 		ktd->ktd_flags |= KTDF_DONE;
    195  1.93     enami 		wakeup(ktd);
    196  1.93     enami 	}
    197  1.93     enami 	simple_unlock(&ktd->ktd_slock);
    198  1.93     enami }
    199  1.93     enami 
    200  1.93     enami void
    201  1.93     enami ktdref(struct ktr_desc *ktd)
    202  1.93     enami {
    203  1.93     enami 
    204  1.93     enami 	simple_lock(&ktd->ktd_slock);
    205  1.93     enami 	ktd->ktd_ref++;
    206  1.93     enami 	simple_unlock(&ktd->ktd_slock);
    207  1.93     enami }
    208  1.93     enami 
    209  1.93     enami struct ktr_desc *
    210  1.93     enami ktd_lookup(struct file *fp)
    211  1.93     enami {
    212  1.93     enami 	struct ktr_desc *ktd;
    213  1.93     enami 
    214  1.93     enami 	simple_lock(&ktdq_slock);
    215  1.93     enami 	for (ktd = TAILQ_FIRST(&ktdq); ktd != NULL;
    216  1.93     enami 	    ktd = TAILQ_NEXT(ktd, ktd_list)) {
    217  1.93     enami 		simple_lock(&ktd->ktd_slock);
    218  1.93     enami 		if (ktrsamefile(ktd->ktd_fp, fp)) {
    219  1.93     enami 			ktd->ktd_ref++;
    220  1.93     enami 			simple_unlock(&ktd->ktd_slock);
    221  1.93     enami 			break;
    222  1.93     enami 		}
    223  1.93     enami 		simple_unlock(&ktd->ktd_slock);
    224  1.93     enami 	}
    225  1.93     enami 	simple_unlock(&ktdq_slock);
    226  1.93     enami 	return (ktd);
    227  1.93     enami }
    228  1.93     enami 
/*
 * Queue the trace entry `kte' on the descriptor process `p' is traced
 * to.  Ownership of `kte' passes to this function: it is either
 * appended to the descriptor's queue or freed with ktefree().
 *
 * If KTRFAC_TRC_EMUL is pending on the process, an emulation record is
 * emitted first (via ktremul()).
 *
 * `flags' is a combination of KTA_* values.  With KTA_WAITOK, and when
 * the queue is more than half of ktd_maxentry or another tracee is
 * already waiting, the caller sleeps on &ktd->ktd_flags (up to
 * ktd_timeout seconds per round).  Otherwise an immediate or delayed
 * wakeup is issued on the descriptor.
 */
void
ktraddentry(struct proc *p, struct ktrace_entry *kte, int flags)
{
	struct ktr_desc *ktd;
#ifdef DEBUG
	struct timeval t;
	int s;
#endif

	if (p->p_traceflag & KTRFAC_TRC_EMUL) {
		/* Add emulation trace before first entry for this process */
		p->p_traceflag &= ~KTRFAC_TRC_EMUL;
		ktremul(p);
	}

	/*
	 * Tracing may be canceled while we were sleeping waiting for
	 * memory.
	 */
	ktd = p->p_tracep;
	if (ktd == NULL)
		goto freekte;

	/*
	 * Bump reference count so that the object will remain while
	 * we are here.  Note that the trace is controlled by other
	 * process.
	 */
	ktdref(ktd);

	simple_lock(&ktd->ktd_slock);
	if (ktd->ktd_flags & KTDF_DONE)
		goto relktd;

	/* Queue is over its limit: drop the entry and log the overflow. */
	if (ktd->ktd_qcount > ktd_maxentry) {
		ktd_logerrl(ktd, KTDE_ENOSPC);
		goto relktd;
	}
	TAILQ_INSERT_TAIL(&ktd->ktd_queue, kte, kte_list);
	ktd->ktd_qcount++;
	/* An earlier sync timed out; never block on this descriptor again. */
	if (ktd->ktd_flags & KTDF_BLOCKING)
		goto skip_sync;

	if (flags & KTA_WAITOK &&
	    (/* flags & KTA_LARGE */0 || ktd->ktd_flags & KTDF_WAIT ||
	    ktd->ktd_qcount > ktd_maxentry >> 1))
		/*
		 * Sync with writer thread since we're requesting rather
		 * big one or many requests are pending.
		 */
		do {
			ktd->ktd_flags |= KTDF_WAIT;
			ktd_wakeup(ktd);
#ifdef DEBUG
			s = splclock();
			t = mono_time;
			splx(s);
#endif
			/* ktd_slock is passed to ltsleep() as the interlock. */
			if (ltsleep(&ktd->ktd_flags, PWAIT, "ktrsync",
			    ktd_timeout * hz, &ktd->ktd_slock) != 0) {
				ktd->ktd_flags |= KTDF_BLOCKING;
				/*
				 * Maybe the writer thread is blocking
				 * completely for some reason, but
				 * don't stop target process forever.
				 */
				log(LOG_NOTICE, "ktrace timeout\n");
				break;
			}
#ifdef DEBUG
			s = splclock();
			timersub(&mono_time, &t, &t);
			splx(s);
			if (t.tv_sec > 0)
				log(LOG_NOTICE,
				    "ktrace long wait: %ld.%06ld\n",
				    t.tv_sec, t.tv_usec);
#endif
		/* Keep waiting only while still traced here and WAIT is set. */
		} while (p->p_tracep == ktd &&
		    (ktd->ktd_flags & (KTDF_WAIT | KTDF_DONE)) == KTDF_WAIT);
	else {
		/* Schedule delayed wakeup */
		if (ktd->ktd_qcount > ktd->ktd_delayqcnt)
			ktd_wakeup(ktd);	/* Wakeup now */
		else if (!callout_pending(&ktd->ktd_wakch))
			callout_reset(&ktd->ktd_wakch,
			    ktd->ktd_flags & KTDF_INTERACTIVE ?
			    ktd->ktd_intrwakdl : ktd->ktd_wakedelay,
			    (void (*)(void *))wakeup, ktd);
	}

skip_sync:
	/* Entry is queued: drop our reference (also releases ktd_slock). */
	ktdrel(ktd);
	return;

relktd:
	/* Entry was not queued: drop our reference, then free the entry. */
	ktdrel(ktd);

freekte:
	ktefree(kte);
}
    330  1.93     enami 
    331  1.93     enami void
    332  1.93     enami ktefree(struct ktrace_entry *kte)
    333  1.93     enami {
    334  1.93     enami 	struct ktr_header *kth = &kte->kte_kth;
    335  1.93     enami 
    336  1.93     enami 	if (kth->ktr_len > 0)
    337  1.93     enami 		free(kte->kte_buf, M_KTRACE);
    338  1.93     enami 	pool_put(&kte_pool, kte);
    339  1.93     enami }
    340  1.44  sommerfe 
    341  1.44  sommerfe /*
    342  1.44  sommerfe  * "deep" compare of two files for the purposes of clearing a trace.
    343  1.44  sommerfe  * Returns true if they're the same open file, or if they point at the
    344  1.44  sommerfe  * same underlying vnode/socket.
    345  1.44  sommerfe  */
    346  1.44  sommerfe 
    347  1.44  sommerfe int
    348  1.89     enami ktrsamefile(struct file *f1, struct file *f2)
    349  1.44  sommerfe {
    350  1.88     enami 
    351  1.44  sommerfe 	return ((f1 == f2) ||
    352  1.45  sommerfe 	    ((f1 != NULL) && (f2 != NULL) &&
    353  1.45  sommerfe 		(f1->f_type == f2->f_type) &&
    354  1.44  sommerfe 		(f1->f_data == f2->f_data)));
    355  1.44  sommerfe }
    356  1.22  christos 
    357  1.28  christos void
    358  1.89     enami ktrderef(struct proc *p)
    359  1.28  christos {
    360  1.93     enami 	struct ktr_desc *ktd = p->p_tracep;
    361  1.93     enami 
    362  1.42  sommerfe 	p->p_traceflag = 0;
    363  1.93     enami 	if (ktd == NULL)
    364  1.28  christos 		return;
    365  1.84       dsl 	p->p_tracep = NULL;
    366  1.84       dsl 
    367  1.93     enami 	simple_lock(&ktd->ktd_slock);
    368  1.93     enami 	wakeup(&ktd->ktd_flags);
    369  1.93     enami 	ktdrel(ktd);
    370  1.28  christos }
    371  1.28  christos 
    372  1.28  christos void
    373  1.89     enami ktradref(struct proc *p)
    374  1.28  christos {
    375  1.93     enami 	struct ktr_desc *ktd = p->p_tracep;
    376  1.28  christos 
    377  1.93     enami 	ktdref(ktd);
    378  1.28  christos }
    379  1.28  christos 
    380  1.39   thorpej void
    381  1.89     enami ktrinitheader(struct ktr_header *kth, struct proc *p, int type)
    382   1.1       cgd {
    383   1.1       cgd 
    384  1.90  christos 	(void)memset(kth, 0, sizeof(*kth));
    385   1.1       cgd 	kth->ktr_type = type;
    386   1.1       cgd 	microtime(&kth->ktr_time);
    387   1.1       cgd 	kth->ktr_pid = p->p_pid;
    388  1.32     perry 	memcpy(kth->ktr_comm, p->p_comm, MAXCOMLEN);
    389   1.1       cgd }
    390   1.1       cgd 
    391  1.93     enami void
    392  1.89     enami ktrsyscall(struct proc *p, register_t code, register_t realcode,
    393  1.89     enami     const struct sysent *callp, register_t args[])
    394   1.1       cgd {
    395  1.93     enami 	struct ktrace_entry *kte;
    396  1.93     enami 	struct ktr_header *kth;
    397  1.72   darrenr 	struct ktr_syscall *ktp;
    398  1.17       cgd 	register_t *argp;
    399  1.93     enami 	int argsize;
    400  1.57      fvdl 	size_t len;
    401  1.60   thorpej 	u_int i;
    402  1.57      fvdl 
    403  1.66      manu 	if (callp == NULL)
    404  1.66      manu 		callp = p->p_emul->e_sysent;
    405  1.88     enami 
    406  1.76  drochner 	argsize = callp[code].sy_argsize;
    407  1.86       mrg #ifdef _LP64
    408  1.86       mrg 	if (p->p_flag & P_32)
    409  1.86       mrg 		argsize = argsize << 1;
    410  1.86       mrg #endif
    411  1.57      fvdl 	len = sizeof(struct ktr_syscall) + argsize;
    412   1.1       cgd 
    413   1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    414  1.93     enami 	kte = pool_get(&kte_pool, PR_WAITOK);
    415  1.93     enami 	kth = &kte->kte_kth;
    416  1.93     enami 	ktrinitheader(kth, p, KTR_SYSCALL);
    417  1.93     enami 
    418  1.93     enami 	ktp = malloc(len, M_KTRACE, M_WAITOK);
    419  1.61      manu 	ktp->ktr_code = realcode;
    420  1.17       cgd 	ktp->ktr_argsize = argsize;
    421  1.93     enami 	argp = (register_t *)(ktp + 1);
    422  1.31     perry 	for (i = 0; i < (argsize / sizeof(*argp)); i++)
    423   1.1       cgd 		*argp++ = args[i];
    424  1.93     enami 	kth->ktr_len = len;
    425  1.93     enami 	kte->kte_buf = ktp;
    426  1.93     enami 
    427  1.93     enami 	ktraddentry(p, kte, KTA_WAITOK);
    428   1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    429   1.1       cgd }
    430   1.1       cgd 
    431  1.93     enami void
    432  1.89     enami ktrsysret(struct proc *p, register_t code, int error, register_t *retval)
    433   1.1       cgd {
    434  1.93     enami 	struct ktrace_entry *kte;
    435  1.93     enami 	struct ktr_header *kth;
    436  1.93     enami 	struct ktr_sysret *ktp;
    437   1.1       cgd 
    438   1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    439  1.93     enami 	kte = pool_get(&kte_pool, PR_WAITOK);
    440  1.93     enami 	kth = &kte->kte_kth;
    441  1.93     enami 	ktrinitheader(kth, p, KTR_SYSRET);
    442  1.93     enami 
    443  1.93     enami 	ktp = malloc(sizeof(struct ktr_sysret), M_KTRACE, M_WAITOK);
    444  1.93     enami 	ktp->ktr_code = code;
    445  1.93     enami 	ktp->ktr_eosys = 0;			/* XXX unused */
    446  1.93     enami 	ktp->ktr_error = error;
    447  1.93     enami 	ktp->ktr_retval = retval ? retval[0] : 0;
    448  1.93     enami 	ktp->ktr_retval_1 = retval ? retval[1] : 0;
    449   1.1       cgd 
    450  1.93     enami 	kth->ktr_len = sizeof(struct ktr_sysret);
    451  1.93     enami 	kte->kte_buf = ktp;
    452   1.1       cgd 
    453  1.93     enami 	ktraddentry(p, kte, KTA_WAITOK);
    454   1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    455   1.1       cgd }
    456   1.1       cgd 
    457  1.93     enami /*
    458  1.93     enami  * XXX: ndp->ni_pathlen should be passed.
    459  1.93     enami  */
    460  1.93     enami void
    461  1.89     enami ktrnamei(struct proc *p, char *path)
    462   1.1       cgd {
    463   1.1       cgd 
    464  1.93     enami 	ktrkmem(p, KTR_NAMEI, path, strlen(path));
    465  1.18  christos }
    466  1.18  christos 
    467  1.93     enami void
    468  1.89     enami ktremul(struct proc *p)
    469  1.18  christos {
    470  1.74      fvdl 	const char *emul = p->p_emul->e_name;
    471   1.1       cgd 
    472  1.93     enami 	ktrkmem(p, KTR_EMUL, emul, strlen(emul));
    473   1.1       cgd }
    474   1.1       cgd 
    475  1.93     enami void
    476  1.93     enami ktrkmem(struct proc *p, int type, const void *buf, size_t len)
    477  1.75       dsl {
    478  1.93     enami 	struct ktrace_entry *kte;
    479  1.93     enami 	struct ktr_header *kth;
    480  1.75       dsl 
    481  1.75       dsl 	p->p_traceflag |= KTRFAC_ACTIVE;
    482  1.93     enami 	kte = pool_get(&kte_pool, PR_WAITOK);
    483  1.93     enami 	kth = &kte->kte_kth;
    484  1.93     enami 	ktrinitheader(kth, p, type);
    485  1.93     enami 
    486  1.93     enami 	kth->ktr_len = len;
    487  1.93     enami 	kte->kte_buf = malloc(len, M_KTRACE, M_WAITOK);
    488  1.93     enami 	memcpy(kte->kte_buf, buf, len);
    489  1.75       dsl 
    490  1.93     enami 	ktraddentry(p, kte, KTA_WAITOK);
    491  1.75       dsl 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    492  1.75       dsl }
    493  1.75       dsl 
    494  1.93     enami void
    495  1.89     enami ktrgenio(struct proc *p, int fd, enum uio_rw rw, struct iovec *iov,
    496  1.89     enami     int len, int error)
    497   1.1       cgd {
    498  1.93     enami 	struct ktrace_entry *kte;
    499  1.93     enami 	struct ktr_header *kth;
    500  1.28  christos 	struct ktr_genio *ktp;
    501  1.74      fvdl 	caddr_t cp;
    502  1.72   darrenr 	int resid = len, cnt;
    503  1.39   thorpej 	int buflen;
    504  1.39   thorpej 
    505   1.1       cgd 	if (error)
    506  1.93     enami 		return;
    507  1.39   thorpej 
    508   1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    509  1.39   thorpej 
    510  1.93     enami next:
    511  1.93     enami 	buflen = min(PAGE_SIZE, resid + sizeof(struct ktr_genio));
    512  1.39   thorpej 
    513  1.93     enami 	kte = pool_get(&kte_pool, PR_WAITOK);
    514  1.93     enami 	kth = &kte->kte_kth;
    515  1.93     enami 	ktrinitheader(kth, p, KTR_GENIO);
    516  1.93     enami 
    517  1.93     enami 	ktp = malloc(buflen, M_KTRACE, M_WAITOK);
    518   1.1       cgd 	ktp->ktr_fd = fd;
    519   1.1       cgd 	ktp->ktr_rw = rw;
    520  1.39   thorpej 
    521  1.93     enami 	kte->kte_buf = ktp;
    522  1.39   thorpej 
    523  1.93     enami 	cp = (caddr_t)(ktp + 1);
    524  1.39   thorpej 	buflen -= sizeof(struct ktr_genio);
    525  1.93     enami 	kth->ktr_len = sizeof(struct ktr_genio);
    526  1.93     enami 
    527  1.93     enami 	while (buflen > 0) {
    528  1.93     enami 		cnt = min(iov->iov_len, buflen);
    529  1.93     enami 		if (copyin(iov->iov_base, cp, cnt) != 0)
    530  1.93     enami 			goto out;
    531  1.93     enami 		kth->ktr_len += cnt;
    532  1.93     enami 		buflen -= cnt;
    533  1.93     enami 		resid -= cnt;
    534  1.93     enami 		iov->iov_len -= cnt;
    535  1.93     enami 		if (iov->iov_len == 0)
    536  1.93     enami 			iov++;
    537  1.93     enami 		else
    538  1.93     enami 			iov->iov_base = (caddr_t)iov->iov_base + cnt;
    539  1.93     enami 	}
    540  1.39   thorpej 
    541  1.93     enami 	/*
    542  1.93     enami 	 * Don't push so many entry at once.  It will cause kmem map
    543  1.93     enami 	 * shortage.
    544  1.93     enami 	 */
    545  1.93     enami 	ktraddentry(p, kte, KTA_WAITOK | KTA_LARGE);
    546  1.93     enami 	if (resid > 0) {
    547  1.67   thorpej #if 0 /* XXX NJWLWP */
    548  1.46   thorpej 		KDASSERT(p->p_cpu != NULL);
    549  1.46   thorpej 		KDASSERT(p->p_cpu == curcpu());
    550  1.67   thorpej #endif
    551  1.67   thorpej 		/* XXX NJWLWP */
    552  1.67   thorpej 		if (curcpu()->ci_schedstate.spc_flags & SPCF_SHOULDYIELD)
    553  1.67   thorpej 			preempt(1);
    554  1.39   thorpej 
    555  1.93     enami 		goto next;
    556  1.93     enami 	}
    557  1.39   thorpej 
    558  1.93     enami 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    559  1.93     enami 	return;
    560  1.39   thorpej 
    561  1.93     enami out:
    562  1.93     enami 	ktefree(kte);
    563   1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    564   1.1       cgd }
    565   1.1       cgd 
    566  1.93     enami void
    567  1.89     enami ktrpsig(struct proc *p, int sig, sig_t action, const sigset_t *mask,
    568  1.89     enami     const ksiginfo_t *ksi)
    569   1.1       cgd {
    570  1.93     enami 	struct ktrace_entry *kte;
    571  1.93     enami 	struct ktr_header *kth;
    572  1.78  christos 	struct {
    573  1.78  christos 		struct ktr_psig	kp;
    574  1.78  christos 		siginfo_t	si;
    575  1.93     enami 	} *kbuf;
    576   1.1       cgd 
    577   1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    578  1.93     enami 	kte = pool_get(&kte_pool, PR_WAITOK);
    579  1.93     enami 	kth = &kte->kte_kth;
    580  1.93     enami 	ktrinitheader(kth, p, KTR_PSIG);
    581  1.93     enami 
    582  1.93     enami 	kbuf = malloc(sizeof(*kbuf), M_KTRACE, M_WAITOK);
    583  1.93     enami 	kbuf->kp.signo = (char)sig;
    584  1.93     enami 	kbuf->kp.action = action;
    585  1.93     enami 	kbuf->kp.mask = *mask;
    586  1.93     enami 	kte->kte_buf = kbuf;
    587  1.78  christos 	if (ksi) {
    588  1.93     enami 		kbuf->kp.code = KSI_TRAPCODE(ksi);
    589  1.93     enami 		(void)memset(&kbuf->si, 0, sizeof(kbuf->si));
    590  1.93     enami 		kbuf->si._info = ksi->ksi_info;
    591  1.93     enami 		kth->ktr_len = sizeof(kbuf);
    592  1.78  christos 	} else {
    593  1.93     enami 		kbuf->kp.code = 0;
    594  1.93     enami 		kth->ktr_len = sizeof(struct ktr_psig);
    595  1.78  christos 	}
    596  1.93     enami 
    597  1.93     enami 	ktraddentry(p, kte, KTA_WAITOK);
    598   1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    599   1.9       cgd }
    600   1.9       cgd 
    601  1.93     enami void
    602  1.89     enami ktrcsw(struct proc *p, int out, int user)
    603   1.9       cgd {
    604  1.93     enami 	struct ktrace_entry *kte;
    605  1.93     enami 	struct ktr_header *kth;
    606  1.93     enami 	struct ktr_csw *kc;
    607   1.9       cgd 
    608   1.9       cgd 	p->p_traceflag |= KTRFAC_ACTIVE;
    609   1.9       cgd 
    610  1.93     enami 	/*
    611  1.93     enami 	 * We can't sleep if we're already going to sleep (if original
    612  1.93     enami 	 * condition is met during sleep, we hang up).
    613  1.93     enami 	 */
    614  1.93     enami 	kte = pool_get(&kte_pool, out ? PR_NOWAIT : PR_WAITOK);
    615  1.93     enami 	if (kte == NULL) {
    616  1.93     enami 		ktd_logerr(p, KTDE_ENOMEM);
    617  1.93     enami 		goto out;
    618  1.93     enami 	}
    619  1.93     enami 	kth = &kte->kte_kth;
    620  1.93     enami 	ktrinitheader(kth, p, KTR_CSW);
    621  1.93     enami 
    622  1.93     enami 	kc = malloc(sizeof(struct ktr_csw), M_KTRACE,
    623  1.93     enami 	    out ? M_NOWAIT : M_WAITOK);
    624  1.93     enami 	if (kc == NULL) {
    625  1.93     enami 		ktd_logerr(p, KTDE_ENOMEM);
    626  1.93     enami 		goto free_kte;
    627  1.93     enami 	}
    628  1.93     enami 	kc->out = out;
    629  1.93     enami 	kc->user = user;
    630  1.93     enami 	kth->ktr_len = sizeof(struct ktr_csw);
    631  1.93     enami 	kte->kte_buf = kc;
    632  1.93     enami 
    633  1.93     enami 	ktraddentry(p, kte, out ? KTA_NOWAIT : KTA_WAITOK);
    634  1.93     enami 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    635  1.93     enami 	return;
    636  1.93     enami 
    637  1.93     enami free_kte:
    638  1.93     enami 	pool_put(&kte_pool, kte);
    639  1.93     enami out:
    640   1.9       cgd 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    641   1.1       cgd }
    642   1.1       cgd 
    643  1.93     enami void
    644  1.89     enami ktruser(struct proc *p, const char *id, void *addr, size_t len, int ustr)
    645  1.51  jdolecek {
    646  1.93     enami 	struct ktrace_entry *kte;
    647  1.93     enami 	struct ktr_header *kth;
    648  1.51  jdolecek 	struct ktr_user *ktp;
    649  1.51  jdolecek 	caddr_t user_dta;
    650  1.51  jdolecek 
    651  1.51  jdolecek 	p->p_traceflag |= KTRFAC_ACTIVE;
    652  1.93     enami 	kte = pool_get(&kte_pool, PR_WAITOK);
    653  1.93     enami 	kth = &kte->kte_kth;
    654  1.93     enami 	ktrinitheader(kth, p, KTR_USER);
    655  1.93     enami 
    656  1.93     enami 	ktp = malloc(sizeof(struct ktr_user) + len, M_KTRACE, M_WAITOK);
    657  1.51  jdolecek 	if (ustr) {
    658  1.51  jdolecek 		if (copyinstr(id, ktp->ktr_id, KTR_USER_MAXIDLEN, NULL) != 0)
    659  1.51  jdolecek 			ktp->ktr_id[0] = '\0';
    660  1.51  jdolecek 	} else
    661  1.51  jdolecek 		strncpy(ktp->ktr_id, id, KTR_USER_MAXIDLEN);
    662  1.51  jdolecek 	ktp->ktr_id[KTR_USER_MAXIDLEN-1] = '\0';
    663  1.51  jdolecek 
    664  1.93     enami 	user_dta = (caddr_t)(ktp + 1);
    665  1.93     enami 	if (copyin(addr, (void *)user_dta, len) != 0)
    666  1.51  jdolecek 		len = 0;
    667  1.51  jdolecek 
    668  1.93     enami 	kth->ktr_len = sizeof(struct ktr_user) + len;
    669  1.93     enami 	kte->kte_buf = ktp;
    670  1.51  jdolecek 
    671  1.93     enami 	ktraddentry(p, kte, KTA_WAITOK);
    672  1.51  jdolecek 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    673  1.51  jdolecek }
    674  1.51  jdolecek 
    675  1.93     enami void
    676  1.89     enami ktrmmsg(struct proc *p, const void *msgh, size_t size)
    677  1.62      manu {
    678  1.88     enami 
    679  1.93     enami 	ktrkmem(p, KTR_MMSG, msgh, size);
    680  1.62      manu }
    681  1.83      manu 
    682  1.93     enami void
    683  1.89     enami ktrmool(struct proc *p, const void *kaddr, size_t size, const void *uaddr)
    684  1.83      manu {
    685  1.93     enami 	struct ktrace_entry *kte;
    686  1.93     enami 	struct ktr_header *kth;
    687  1.83      manu 	struct ktr_mool *kp;
    688  1.83      manu 	struct ktr_mool *buf;
    689  1.83      manu 
    690  1.83      manu 	p->p_traceflag |= KTRFAC_ACTIVE;
    691  1.93     enami 	kte = pool_get(&kte_pool, PR_WAITOK);
    692  1.93     enami 	kth = &kte->kte_kth;
    693  1.93     enami 	ktrinitheader(kth, p, KTR_MOOL);
    694  1.83      manu 
    695  1.93     enami 	kp = malloc(size + sizeof(*kp), M_KTRACE, M_WAITOK);
    696  1.83      manu 	kp->uaddr = uaddr;
    697  1.83      manu 	kp->size = size;
    698  1.83      manu 	buf = kp + 1; /* Skip uaddr and size */
    699  1.90  christos 	(void)memcpy(buf, kaddr, size);
    700  1.88     enami 
    701  1.93     enami 	kth->ktr_len = size + sizeof(*kp);
    702  1.93     enami 	kte->kte_buf = kp;
    703  1.83      manu 
    704  1.93     enami 	ktraddentry(p, kte, KTA_WAITOK);
    705  1.83      manu 	p->p_traceflag &= ~KTRFAC_ACTIVE;
    706  1.83      manu }
    707  1.83      manu 
    708  1.62      manu 
    709   1.1       cgd /* Interface and common routines */
    710   1.1       cgd 
    711  1.17       cgd int
    712  1.89     enami ktrace_common(struct proc *curp, int ops, int facs, int pid, struct file *fp)
    713  1.28  christos {
    714  1.93     enami 	struct proc *p;
    715  1.93     enami 	struct pgrp *pg;
    716  1.93     enami 	struct ktr_desc *ktd = NULL;
    717  1.74      fvdl 	int ret = 0;
    718  1.72   darrenr 	int error = 0;
    719  1.42  sommerfe 	int descend;
    720  1.28  christos 
    721  1.28  christos 	curp->p_traceflag |= KTRFAC_ACTIVE;
    722  1.42  sommerfe 	descend = ops & KTRFLAG_DESCEND;
    723  1.42  sommerfe 	facs = facs & ~((unsigned) KTRFAC_ROOT);
    724  1.28  christos 
    725  1.93     enami 	switch (KTROP(ops)) {
    726  1.93     enami 
    727  1.93     enami 	case KTROP_CLEARFILE:
    728  1.93     enami 		/*
    729  1.93     enami 		 * Clear all uses of the tracefile
    730  1.93     enami 		 */
    731  1.93     enami 
    732  1.93     enami 		ktd = ktd_lookup(fp);
    733  1.93     enami 		if (ktd == NULL)
    734  1.93     enami 			goto done;
    735  1.93     enami 
    736  1.37   thorpej 		proclist_lock_read();
    737  1.81  jdolecek 		LIST_FOREACH(p, &allproc, p_list) {
    738  1.93     enami 			if (p->p_tracep == ktd) {
    739  1.28  christos 				if (ktrcanset(curp, p))
    740  1.28  christos 					ktrderef(p);
    741  1.28  christos 				else
    742  1.28  christos 					error = EPERM;
    743  1.28  christos 			}
    744  1.28  christos 		}
    745  1.36   thorpej 		proclist_unlock_read();
    746  1.28  christos 		goto done;
    747  1.42  sommerfe 
    748  1.93     enami 	case KTROP_SET:
    749  1.93     enami 		ktd = ktd_lookup(fp);
    750  1.93     enami 		if (ktd == NULL) {
    751  1.93     enami 			ktd = malloc(sizeof(struct ktr_desc),
    752  1.93     enami 			    M_KTRACE, M_WAITOK);
    753  1.93     enami 			TAILQ_INIT(&ktd->ktd_queue);
    754  1.93     enami 			simple_lock_init(&ktd->ktd_slock);
    755  1.93     enami 			callout_init(&ktd->ktd_wakch);
    756  1.93     enami 			ktd->ktd_flags = ktd->ktd_qcount =
    757  1.93     enami 			    ktd->ktd_error = ktd->ktd_errcnt = 0;
    758  1.93     enami 			ktd->ktd_ref = 1;
    759  1.93     enami 			ktd->ktd_delayqcnt = ktd_delayqcnt;
    760  1.93     enami 			ktd->ktd_wakedelay = mstohz(ktd_wakedelay);
    761  1.93     enami 			ktd->ktd_intrwakdl = mstohz(ktd_intrwakdl);
    762  1.93     enami 			/*
    763  1.93     enami 			 * XXX: not correct.  needs an way to detect
    764  1.93     enami 			 * whether ktruss or ktrace.
    765  1.93     enami 			 */
    766  1.93     enami 			if (fp->f_type == DTYPE_PIPE)
    767  1.93     enami 				ktd->ktd_flags |= KTDF_INTERACTIVE;
    768  1.93     enami 
    769  1.93     enami 			error = kthread_create1(ktrace_thread, ktd,
    770  1.93     enami 			    &ktd->ktd_proc, "ktr %p", ktd);
    771  1.93     enami 			if (error != 0) {
    772  1.93     enami 				free(ktd, M_KTRACE);
    773  1.93     enami 				goto done;
    774  1.93     enami 			}
    775  1.93     enami 
    776  1.93     enami 			simple_lock(&fp->f_slock);
    777  1.93     enami 			fp->f_count++;
    778  1.93     enami 			simple_unlock(&fp->f_slock);
    779  1.93     enami 			ktd->ktd_fp = fp;
    780  1.93     enami 
    781  1.93     enami 			simple_lock(&ktdq_slock);
    782  1.93     enami 			TAILQ_INSERT_TAIL(&ktdq, ktd, ktd_list);
    783  1.93     enami 			simple_unlock(&ktdq_slock);
    784  1.93     enami 		}
    785  1.93     enami 		break;
    786  1.42  sommerfe 
    787  1.93     enami 	case KTROP_CLEAR:
    788  1.93     enami 		break;
    789  1.43  sommerfe 	}
    790  1.88     enami 
    791  1.28  christos 	/*
    792  1.28  christos 	 * need something to (un)trace (XXX - why is this here?)
    793  1.28  christos 	 */
    794  1.28  christos 	if (!facs) {
    795  1.28  christos 		error = EINVAL;
    796  1.28  christos 		goto done;
    797  1.28  christos 	}
    798  1.93     enami 
    799  1.88     enami 	/*
    800  1.28  christos 	 * do it
    801  1.28  christos 	 */
    802  1.42  sommerfe 	if (pid < 0) {
    803  1.28  christos 		/*
    804  1.28  christos 		 * by process group
    805  1.28  christos 		 */
    806  1.82       dsl 		pg = pg_find(-pid, PFIND_UNLOCK_FAIL);
    807  1.28  christos 		if (pg == NULL) {
    808  1.28  christos 			error = ESRCH;
    809  1.28  christos 			goto done;
    810  1.28  christos 		}
    811  1.81  jdolecek 		LIST_FOREACH(p, &pg->pg_members, p_pglist) {
    812  1.28  christos 			if (descend)
    813  1.93     enami 				ret |= ktrsetchildren(curp, p, ops, facs, ktd);
    814  1.88     enami 			else
    815  1.93     enami 				ret |= ktrops(curp, p, ops, facs, ktd);
    816  1.39   thorpej 		}
    817  1.88     enami 
    818  1.28  christos 	} else {
    819  1.28  christos 		/*
    820  1.28  christos 		 * by pid
    821  1.28  christos 		 */
    822  1.82       dsl 		p = p_find(pid, PFIND_UNLOCK_FAIL);
    823  1.28  christos 		if (p == NULL) {
    824  1.28  christos 			error = ESRCH;
    825  1.28  christos 			goto done;
    826  1.28  christos 		}
    827  1.28  christos 		if (descend)
    828  1.93     enami 			ret |= ktrsetchildren(curp, p, ops, facs, ktd);
    829  1.28  christos 		else
    830  1.93     enami 			ret |= ktrops(curp, p, ops, facs, ktd);
    831  1.28  christos 	}
    832  1.82       dsl 	proclist_unlock_read();	/* taken by p{g}_find */
    833  1.28  christos 	if (!ret)
    834  1.28  christos 		error = EPERM;
    835  1.28  christos done:
    836  1.93     enami 	if (error != 0 && ktd != NULL)
    837  1.93     enami 		/*
    838  1.93     enami 		 * Wakup the thread so that it can be die if we
    839  1.93     enami 		 * can't trace any process.
    840  1.93     enami 		 */
    841  1.93     enami 		ktd_wakeup(ktd);
    842  1.93     enami 	if (KTROP(ops) == KTROP_SET ||
    843  1.93     enami 	    KTROP(ops) == KTROP_CLEARFILE) {
    844  1.93     enami 		simple_lock(&ktd->ktd_slock);
    845  1.93     enami 		ktdrel(ktd);
    846  1.93     enami 	}
    847  1.28  christos 	curp->p_traceflag &= ~KTRFAC_ACTIVE;
    848  1.28  christos 	return (error);
    849  1.28  christos }
    850  1.28  christos 
    851  1.28  christos /*
    852  1.93     enami  * fktrace system call
    853  1.28  christos  */
    854  1.28  christos /* ARGSUSED */
    855  1.28  christos int
    856  1.89     enami sys_fktrace(struct lwp *l, void *v, register_t *retval)
    857  1.42  sommerfe {
    858  1.42  sommerfe 	struct sys_fktrace_args /* {
    859  1.42  sommerfe 		syscallarg(int) fd;
    860  1.42  sommerfe 		syscallarg(int) ops;
    861  1.42  sommerfe 		syscallarg(int) facs;
    862  1.42  sommerfe 		syscallarg(int) pid;
    863  1.42  sommerfe 	} */ *uap = v;
    864  1.74      fvdl 	struct proc *curp = l->l_proc;
    865  1.42  sommerfe 	struct file *fp = NULL;
    866  1.74      fvdl 	struct filedesc *fdp = curp->p_fd;
    867  1.70      yamt 	int error;
    868  1.42  sommerfe 
    869  1.54   thorpej 	if ((fp = fd_getfile(fdp, SCARG(uap, fd))) == NULL)
    870  1.54   thorpej 		return (EBADF);
    871  1.54   thorpej 
    872  1.70      yamt 	FILE_USE(fp);
    873  1.70      yamt 
    874  1.54   thorpej 	if ((fp->f_flag & FWRITE) == 0)
    875  1.70      yamt 		error = EBADF;
    876  1.70      yamt 	else
    877  1.74      fvdl 		error = ktrace_common(curp, SCARG(uap, ops),
    878  1.70      yamt 		    SCARG(uap, facs), SCARG(uap, pid), fp);
    879  1.70      yamt 
    880  1.74      fvdl 	FILE_UNUSE(fp, curp);
    881  1.42  sommerfe 
    882  1.70      yamt 	return error;
    883  1.42  sommerfe }
    884  1.42  sommerfe 
    885  1.42  sommerfe /*
    886  1.42  sommerfe  * ktrace system call
    887  1.42  sommerfe  */
    888  1.42  sommerfe /* ARGSUSED */
    889  1.42  sommerfe int
    890  1.89     enami sys_ktrace(struct lwp *l, void *v, register_t *retval)
    891  1.19   thorpej {
    892  1.28  christos 	struct sys_ktrace_args /* {
    893  1.24   mycroft 		syscallarg(const char *) fname;
    894  1.13       cgd 		syscallarg(int) ops;
    895  1.13       cgd 		syscallarg(int) facs;
    896  1.13       cgd 		syscallarg(int) pid;
    897  1.19   thorpej 	} */ *uap = v;
    898  1.67   thorpej 	struct proc *curp = l->l_proc;
    899  1.28  christos 	struct vnode *vp = NULL;
    900  1.42  sommerfe 	struct file *fp = NULL;
    901  1.74      fvdl 	int fd;
    902  1.42  sommerfe 	int ops = SCARG(uap, ops);
    903  1.74      fvdl 	int error = 0;
    904  1.72   darrenr 	struct nameidata nd;
    905   1.1       cgd 
    906  1.42  sommerfe 	ops = KTROP(ops) | (ops & KTRFLAG_DESCEND);
    907  1.42  sommerfe 
    908   1.9       cgd 	curp->p_traceflag |= KTRFAC_ACTIVE;
    909  1.69  christos 	if ((ops & KTROP_CLEAR) == 0) {
    910   1.1       cgd 		/*
    911   1.1       cgd 		 * an operation which requires a file argument.
    912   1.1       cgd 		 */
    913  1.13       cgd 		NDINIT(&nd, LOOKUP, FOLLOW, UIO_USERSPACE, SCARG(uap, fname),
    914  1.74      fvdl 		    curp);
    915  1.22  christos 		if ((error = vn_open(&nd, FREAD|FWRITE, 0)) != 0) {
    916   1.9       cgd 			curp->p_traceflag &= ~KTRFAC_ACTIVE;
    917   1.1       cgd 			return (error);
    918   1.9       cgd 		}
    919   1.1       cgd 		vp = nd.ni_vp;
    920  1.25      fvdl 		VOP_UNLOCK(vp, 0);
    921   1.1       cgd 		if (vp->v_type != VREG) {
    922  1.74      fvdl 			(void) vn_close(vp, FREAD|FWRITE, curp->p_ucred, curp);
    923   1.9       cgd 			curp->p_traceflag &= ~KTRFAC_ACTIVE;
    924   1.1       cgd 			return (EACCES);
    925   1.1       cgd 		}
    926   1.1       cgd 		/*
    927  1.42  sommerfe 		 * XXX This uses up a file descriptor slot in the
    928  1.42  sommerfe 		 * tracing process for the duration of this syscall.
    929  1.42  sommerfe 		 * This is not expected to be a problem.  If
    930  1.42  sommerfe 		 * falloc(NULL, ...) DTRT we could skip that part, but
    931  1.42  sommerfe 		 * that would require changing its interface to allow
    932  1.42  sommerfe 		 * the caller to pass in a ucred..
    933  1.42  sommerfe 		 *
    934  1.88     enami 		 * This will FILE_USE the fp it returns, if any.
    935  1.42  sommerfe 		 * Keep it in use until we return.
    936   1.1       cgd 		 */
    937  1.42  sommerfe 		if ((error = falloc(curp, &fp, &fd)) != 0)
    938   1.1       cgd 			goto done;
    939  1.88     enami 
    940  1.93     enami 		fp->f_flag = FWRITE;
    941  1.42  sommerfe 		fp->f_type = DTYPE_VNODE;
    942  1.42  sommerfe 		fp->f_ops = &vnops;
    943  1.42  sommerfe 		fp->f_data = (caddr_t)vp;
    944  1.54   thorpej 		FILE_SET_MATURE(fp);
    945  1.42  sommerfe 		vp = NULL;
    946  1.42  sommerfe 	}
    947  1.74      fvdl 	error = ktrace_common(curp, SCARG(uap, ops), SCARG(uap, facs),
    948  1.42  sommerfe 	    SCARG(uap, pid), fp);
    949  1.88     enami done:
    950   1.1       cgd 	if (vp != NULL)
    951  1.74      fvdl 		(void) vn_close(vp, FWRITE, curp->p_ucred, curp);
    952  1.42  sommerfe 	if (fp != NULL) {
    953  1.74      fvdl 		FILE_UNUSE(fp, curp);	/* release file */
    954  1.74      fvdl 		fdrelease(curp, fd); 	/* release fd table slot */
    955  1.42  sommerfe 	}
    956   1.1       cgd 	return (error);
    957   1.1       cgd }
    958   1.1       cgd 
    959   1.4    andrew int
    960  1.89     enami ktrops(struct proc *curp, struct proc *p, int ops, int facs,
    961  1.93     enami     struct ktr_desc *ktd)
    962   1.1       cgd {
    963   1.1       cgd 
    964   1.1       cgd 	if (!ktrcanset(curp, p))
    965   1.1       cgd 		return (0);
    966  1.28  christos 	if (KTROP(ops) == KTROP_SET) {
    967  1.93     enami 		if (p->p_tracep != ktd) {
    968   1.1       cgd 			/*
    969   1.1       cgd 			 * if trace file already in use, relinquish
    970   1.1       cgd 			 */
    971  1.28  christos 			ktrderef(p);
    972  1.93     enami 			p->p_tracep = ktd;
    973  1.28  christos 			ktradref(p);
    974   1.1       cgd 		}
    975   1.1       cgd 		p->p_traceflag |= facs;
    976   1.1       cgd 		if (curp->p_ucred->cr_uid == 0)
    977   1.1       cgd 			p->p_traceflag |= KTRFAC_ROOT;
    978  1.88     enami 	} else {
    979   1.1       cgd 		/* KTROP_CLEAR */
    980   1.1       cgd 		if (((p->p_traceflag &= ~facs) & KTRFAC_MASK) == 0) {
    981   1.1       cgd 			/* no more tracing */
    982  1.28  christos 			ktrderef(p);
    983   1.1       cgd 		}
    984   1.1       cgd 	}
    985  1.21  christos 
    986  1.21  christos 	/*
    987  1.21  christos 	 * Emit an emulation record, every time there is a ktrace
    988  1.88     enami 	 * change/attach request.
    989  1.21  christos 	 */
    990  1.21  christos 	if (KTRPOINT(p, KTR_EMUL))
    991  1.84       dsl 		p->p_traceflag |= KTRFAC_TRC_EMUL;
    992  1.49    martin #ifdef __HAVE_SYSCALL_INTERN
    993  1.48   mycroft 	(*p->p_emul->e_syscall_intern)(p);
    994  1.49    martin #endif
    995   1.1       cgd 
    996   1.1       cgd 	return (1);
    997   1.1       cgd }
    998   1.1       cgd 
    999  1.22  christos int
   1000  1.89     enami ktrsetchildren(struct proc *curp, struct proc *top, int ops, int facs,
   1001  1.93     enami     struct ktr_desc *ktd)
   1002   1.1       cgd {
   1003  1.28  christos 	struct proc *p;
   1004  1.28  christos 	int ret = 0;
   1005   1.1       cgd 
   1006   1.1       cgd 	p = top;
   1007   1.1       cgd 	for (;;) {
   1008  1.93     enami 		ret |= ktrops(curp, p, ops, facs, ktd);
   1009   1.1       cgd 		/*
   1010   1.1       cgd 		 * If this process has children, descend to them next,
   1011   1.1       cgd 		 * otherwise do any siblings, and if done with this level,
   1012   1.1       cgd 		 * follow back up the tree (but not past top).
   1013   1.1       cgd 		 */
   1014  1.82       dsl 		if (LIST_FIRST(&p->p_children) != NULL) {
   1015  1.39   thorpej 			p = LIST_FIRST(&p->p_children);
   1016  1.82       dsl 			continue;
   1017  1.82       dsl 		}
   1018  1.82       dsl 		for (;;) {
   1019   1.1       cgd 			if (p == top)
   1020   1.1       cgd 				return (ret);
   1021  1.39   thorpej 			if (LIST_NEXT(p, p_sibling) != NULL) {
   1022  1.39   thorpej 				p = LIST_NEXT(p, p_sibling);
   1023   1.1       cgd 				break;
   1024   1.1       cgd 			}
   1025  1.12   mycroft 			p = p->p_pptr;
   1026   1.1       cgd 		}
   1027   1.1       cgd 	}
   1028   1.1       cgd 	/*NOTREACHED*/
   1029   1.1       cgd }
   1030   1.1       cgd 
   1031  1.93     enami void
   1032  1.93     enami ktrwrite(struct ktr_desc *ktd, struct ktrace_entry *kte)
   1033   1.1       cgd {
   1034  1.74      fvdl 	struct uio auio;
   1035  1.93     enami 	struct iovec aiov[64], *iov;
   1036  1.93     enami 	struct ktrace_entry *top = kte;
   1037  1.93     enami 	struct ktr_header *kth;
   1038  1.93     enami 	struct file *fp = ktd->ktd_fp;
   1039  1.93     enami 	struct proc *p;
   1040  1.93     enami 	int error;
   1041  1.88     enami 
   1042  1.93     enami next:
   1043  1.93     enami 	auio.uio_iov = iov = &aiov[0];
   1044   1.1       cgd 	auio.uio_offset = 0;
   1045   1.1       cgd 	auio.uio_segflg = UIO_SYSSPACE;
   1046   1.1       cgd 	auio.uio_rw = UIO_WRITE;
   1047  1.93     enami 	auio.uio_resid = 0;
   1048  1.93     enami 	auio.uio_iovcnt = 0;
   1049  1.92     skrll 	auio.uio_procp = NULL;
   1050  1.93     enami 	do {
   1051  1.93     enami 		kth = &kte->kte_kth;
   1052  1.93     enami 		iov->iov_base = (caddr_t)kth;
   1053  1.93     enami 		iov++->iov_len = sizeof(struct ktr_header);
   1054  1.93     enami 		auio.uio_resid += sizeof(struct ktr_header);
   1055   1.1       cgd 		auio.uio_iovcnt++;
   1056  1.93     enami 		if (kth->ktr_len > 0) {
   1057  1.93     enami 			iov->iov_base = kte->kte_buf;
   1058  1.93     enami 			iov++->iov_len = kth->ktr_len;
   1059  1.93     enami 			auio.uio_resid += kth->ktr_len;
   1060  1.93     enami 			auio.uio_iovcnt++;
   1061  1.93     enami 		}
   1062  1.93     enami 	} while ((kte = TAILQ_NEXT(kte, kte_list)) != NULL &&
   1063  1.93     enami 	    auio.uio_iovcnt < sizeof(aiov) / sizeof(aiov[0]) - 1);
   1064  1.93     enami 
   1065  1.93     enami again:
   1066  1.93     enami 	simple_lock(&fp->f_slock);
   1067  1.93     enami 	FILE_USE(fp);
   1068  1.93     enami 	error = (*fp->f_ops->fo_write)(fp, &fp->f_offset, &auio,
   1069  1.93     enami 	    fp->f_cred, FOF_UPDATE_OFFSET);
   1070  1.93     enami 	FILE_UNUSE(fp, NULL);
   1071  1.93     enami 	switch (error) {
   1072  1.93     enami 
   1073  1.93     enami 	case 0:
   1074  1.93     enami 		if (auio.uio_resid > 0)
   1075  1.93     enami 			goto again;
   1076  1.93     enami 		if (kte != NULL)
   1077  1.93     enami 			goto next;
   1078  1.93     enami 		break;
   1079  1.93     enami 
   1080  1.93     enami 	case EWOULDBLOCK:
   1081  1.93     enami 		preempt(1);
   1082  1.93     enami 		goto again;
   1083  1.93     enami 
   1084  1.93     enami 	default:
   1085  1.93     enami 		/*
   1086  1.93     enami 		 * If error encountered, give up tracing on this
   1087  1.93     enami 		 * vnode.  Don't report EPIPE as this can easily
   1088  1.93     enami 		 * happen with fktrace()/ktruss.
   1089  1.93     enami 		 */
   1090  1.93     enami #ifndef DEBUG
   1091  1.93     enami 		if (error != EPIPE)
   1092  1.93     enami #endif
   1093  1.93     enami 			log(LOG_NOTICE,
   1094  1.93     enami 			    "ktrace write failed, errno %d, tracing stopped\n",
   1095  1.93     enami 			    error);
   1096  1.93     enami 		proclist_lock_read();
   1097  1.93     enami 		LIST_FOREACH(p, &allproc, p_list) {
   1098  1.93     enami 			if (p->p_tracep == ktd)
   1099  1.93     enami 				ktrderef(p);
   1100  1.93     enami 		}
   1101  1.93     enami 		proclist_unlock_read();
   1102  1.93     enami 	}
   1103  1.93     enami 
   1104  1.93     enami 	while ((kte = top) != NULL) {
   1105  1.93     enami 		top = TAILQ_NEXT(top, kte_list);
   1106  1.93     enami 		ktefree(kte);
   1107  1.93     enami 	}
   1108  1.93     enami }
   1109  1.93     enami 
   1110  1.93     enami void
   1111  1.93     enami ktrace_thread(void *arg)
   1112  1.93     enami {
   1113  1.93     enami 	struct ktr_desc *ktd = arg;
   1114  1.93     enami 	struct file *fp = ktd->ktd_fp;
   1115  1.93     enami 	struct ktrace_entry *kte;
   1116  1.93     enami 	int ktrerr, errcnt;
   1117  1.93     enami 
   1118  1.93     enami 	for (;;) {
   1119  1.93     enami 		simple_lock(&ktd->ktd_slock);
   1120  1.93     enami 		kte = TAILQ_FIRST(&ktd->ktd_queue);
   1121  1.93     enami 		if (kte == NULL) {
   1122  1.93     enami 			if (ktd->ktd_flags & KTDF_WAIT) {
   1123  1.93     enami 				ktd->ktd_flags &= ~(KTDF_WAIT | KTDF_BLOCKING);
   1124  1.93     enami 				wakeup(&ktd->ktd_flags);
   1125  1.93     enami 			}
   1126  1.93     enami 			if (ktd->ktd_ref == 0)
   1127  1.93     enami 				break;
   1128  1.93     enami 			ltsleep(ktd, PWAIT | PNORELOCK, "ktrwait", 0,
   1129  1.93     enami 			    &ktd->ktd_slock);
   1130  1.93     enami 			continue;
   1131  1.93     enami 		}
   1132  1.93     enami 		TAILQ_INIT(&ktd->ktd_queue);
   1133  1.93     enami 		ktd->ktd_qcount = 0;
   1134  1.93     enami 		ktrerr = ktd->ktd_error;
   1135  1.93     enami 		errcnt = ktd->ktd_errcnt;
   1136  1.93     enami 		ktd->ktd_error = ktd->ktd_errcnt = 0;
   1137  1.93     enami 		simple_unlock(&ktd->ktd_slock);
   1138  1.93     enami 
   1139  1.93     enami 		if (ktrerr) {
   1140  1.93     enami 			log(LOG_NOTICE,
   1141  1.93     enami 			    "ktrace failed, fp %p, error 0x%x, total %d\n",
   1142  1.93     enami 			    fp, ktrerr, errcnt);
   1143  1.93     enami 		}
   1144  1.93     enami 		ktrwrite(ktd, kte);
   1145   1.1       cgd 	}
   1146  1.93     enami 	simple_unlock(&ktd->ktd_slock);
   1147  1.93     enami 
   1148  1.93     enami 	simple_lock(&ktdq_slock);
   1149  1.93     enami 	TAILQ_REMOVE(&ktdq, ktd, ktd_list);
   1150  1.93     enami 	simple_unlock(&ktdq_slock);
   1151  1.28  christos 
   1152  1.68        pk 	simple_lock(&fp->f_slock);
   1153  1.42  sommerfe 	FILE_USE(fp);
   1154  1.42  sommerfe 
   1155   1.1       cgd 	/*
   1156  1.93     enami 	 * ktrace file descriptor can't be watched (are not visible to
   1157  1.93     enami 	 * userspace), so no kqueue stuff here
   1158  1.93     enami 	 * XXX: The above comment is wrong, because the fktrace file
   1159  1.93     enami 	 * descriptor is available in userland.
   1160   1.1       cgd 	 */
   1161  1.93     enami 	closef(fp, NULL);
   1162  1.93     enami 
   1163  1.93     enami 	callout_stop(&ktd->ktd_wakch);
   1164  1.93     enami 	free(ktd, M_KTRACE);
   1165  1.39   thorpej 
   1166  1.93     enami 	kthread_exit(0);
   1167   1.1       cgd }
   1168   1.1       cgd 
   1169   1.1       cgd /*
   1170   1.1       cgd  * Return true if caller has permission to set the ktracing state
   1171   1.1       cgd  * of target.  Essentially, the target can't possess any
   1172   1.1       cgd  * more permissions than the caller.  KTRFAC_ROOT signifies that
   1173  1.88     enami  * root previously set the tracing status on the target process, and
   1174   1.1       cgd  * so, only root may further change it.
   1175   1.1       cgd  *
   1176   1.1       cgd  * TODO: check groups.  use caller effective gid.
   1177   1.1       cgd  */
   1178  1.22  christos int
   1179  1.89     enami ktrcanset(struct proc *callp, struct proc *targetp)
   1180   1.1       cgd {
   1181  1.28  christos 	struct pcred *caller = callp->p_cred;
   1182  1.28  christos 	struct pcred *target = targetp->p_cred;
   1183   1.1       cgd 
   1184   1.1       cgd 	if ((caller->pc_ucred->cr_uid == target->p_ruid &&
   1185  1.88     enami 	    target->p_ruid == target->p_svuid &&
   1186  1.88     enami 	    caller->p_rgid == target->p_rgid &&	/* XXX */
   1187  1.88     enami 	    target->p_rgid == target->p_svgid &&
   1188  1.88     enami 	    (targetp->p_traceflag & KTRFAC_ROOT) == 0 &&
   1189  1.88     enami 	    (targetp->p_flag & P_SUGID) == 0) ||
   1190  1.88     enami 	    caller->pc_ucred->cr_uid == 0)
   1191   1.1       cgd 		return (1);
   1192   1.1       cgd 
   1193   1.1       cgd 	return (0);
   1194   1.1       cgd }
   1195  1.47   thorpej #endif /* KTRACE */
   1196  1.51  jdolecek 
   1197  1.51  jdolecek /*
   1198  1.51  jdolecek  * Put user defined entry to ktrace records.
   1199  1.51  jdolecek  */
   1200  1.51  jdolecek int
   1201  1.89     enami sys_utrace(struct lwp *l, void *v, register_t *retval)
   1202  1.51  jdolecek {
   1203  1.51  jdolecek #ifdef KTRACE
   1204  1.51  jdolecek 	struct sys_utrace_args /* {
   1205  1.52  jdolecek 		syscallarg(const char *) label;
   1206  1.51  jdolecek 		syscallarg(void *) addr;
   1207  1.51  jdolecek 		syscallarg(size_t) len;
   1208  1.51  jdolecek 	} */ *uap = v;
   1209  1.67   thorpej 	struct proc *p = l->l_proc;
   1210  1.88     enami 
   1211  1.51  jdolecek 	if (!KTRPOINT(p, KTR_USER))
   1212  1.51  jdolecek 		return (0);
   1213  1.53  jdolecek 
   1214  1.53  jdolecek 	if (SCARG(uap, len) > KTR_USER_MAXLEN)
   1215  1.53  jdolecek 		return (EINVAL);
   1216  1.51  jdolecek 
   1217  1.74      fvdl 	ktruser(p, SCARG(uap, label), SCARG(uap, addr), SCARG(uap, len), 1);
   1218  1.51  jdolecek 
   1219  1.51  jdolecek 	return (0);
   1220  1.51  jdolecek #else /* !KTRACE */
   1221  1.51  jdolecek 	return ENOSYS;
   1222  1.51  jdolecek #endif /* KTRACE */
   1223  1.51  jdolecek }
   1224