kern_ktrace.c revision 1.106 1 1.106 manu /* $NetBSD: kern_ktrace.c,v 1.106 2006/09/23 22:01:04 manu Exp $ */
2 1.11 cgd
3 1.1 cgd /*
4 1.9 cgd * Copyright (c) 1989, 1993
5 1.9 cgd * The Regents of the University of California. All rights reserved.
6 1.1 cgd *
7 1.1 cgd * Redistribution and use in source and binary forms, with or without
8 1.1 cgd * modification, are permitted provided that the following conditions
9 1.1 cgd * are met:
10 1.1 cgd * 1. Redistributions of source code must retain the above copyright
11 1.1 cgd * notice, this list of conditions and the following disclaimer.
12 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
13 1.1 cgd * notice, this list of conditions and the following disclaimer in the
14 1.1 cgd * documentation and/or other materials provided with the distribution.
15 1.77 agc * 3. Neither the name of the University nor the names of its contributors
16 1.1 cgd * may be used to endorse or promote products derived from this software
17 1.1 cgd * without specific prior written permission.
18 1.1 cgd *
19 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
20 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
23 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 1.1 cgd * SUCH DAMAGE.
30 1.1 cgd *
31 1.25 fvdl * @(#)kern_ktrace.c 8.5 (Berkeley) 5/14/95
32 1.1 cgd */
33 1.55 lukem
34 1.55 lukem #include <sys/cdefs.h>
35 1.106 manu __KERNEL_RCSID(0, "$NetBSD: kern_ktrace.c,v 1.106 2006/09/23 22:01:04 manu Exp $");
36 1.29 thorpej
37 1.29 thorpej #include "opt_ktrace.h"
38 1.62 manu #include "opt_compat_mach.h"
39 1.1 cgd
40 1.7 mycroft #include <sys/param.h>
41 1.13 cgd #include <sys/systm.h>
42 1.7 mycroft #include <sys/proc.h>
43 1.7 mycroft #include <sys/file.h>
44 1.7 mycroft #include <sys/namei.h>
45 1.7 mycroft #include <sys/vnode.h>
46 1.93 enami #include <sys/kernel.h>
47 1.93 enami #include <sys/kthread.h>
48 1.7 mycroft #include <sys/ktrace.h>
49 1.7 mycroft #include <sys/malloc.h>
50 1.7 mycroft #include <sys/syslog.h>
51 1.28 christos #include <sys/filedesc.h>
52 1.42 sommerfe #include <sys/ioctl.h>
53 1.93 enami #include <sys/callout.h>
54 1.103 elad #include <sys/kauth.h>
55 1.1 cgd
56 1.13 cgd #include <sys/mount.h>
57 1.67 thorpej #include <sys/sa.h>
58 1.13 cgd #include <sys/syscallargs.h>
59 1.22 christos
60 1.51 jdolecek #ifdef KTRACE
61 1.51 jdolecek
62 1.93 enami /*
63 1.93 enami * XXX:
64 1.93 enami * - need better error reporting?
65 1.93 enami * - p->p_tracep access lock. lock p_lock, lock ktd if !NULL, inc ref.
66 1.93 enami * - userland utility to sort ktrace.out by timestamp.
67 1.93 enami * - keep minimum information in ktrace_entry when rest of alloc failed.
68 1.93 enami * - enlarge ktrace_entry so that small entry won't require additional
69 1.93 enami * alloc?
70 1.93 enami * - per trace control of configurable parameters.
71 1.93 enami */
72 1.93 enami
73 1.93 enami struct ktrace_entry {
74 1.93 enami TAILQ_ENTRY(ktrace_entry) kte_list;
75 1.93 enami struct ktr_header kte_kth;
76 1.98 christos void *kte_buf;
77 1.93 enami };
78 1.93 enami
79 1.93 enami struct ktr_desc {
80 1.93 enami TAILQ_ENTRY(ktr_desc) ktd_list;
81 1.93 enami int ktd_flags;
82 1.93 enami #define KTDF_WAIT 0x0001
83 1.93 enami #define KTDF_DONE 0x0002
84 1.93 enami #define KTDF_BLOCKING 0x0004
85 1.93 enami #define KTDF_INTERACTIVE 0x0008
86 1.93 enami int ktd_error;
87 1.93 enami #define KTDE_ENOMEM 0x0001
88 1.93 enami #define KTDE_ENOSPC 0x0002
89 1.93 enami int ktd_errcnt;
90 1.93 enami int ktd_ref; /* # of reference */
91 1.93 enami int ktd_qcount; /* # of entry in the queue */
92 1.93 enami
93 1.93 enami /*
94 1.93 enami * Params to control behaviour.
95 1.93 enami */
96 1.93 enami int ktd_delayqcnt; /* # of entry allowed to delay */
97 1.93 enami int ktd_wakedelay; /* delay of wakeup in *tick* */
98 1.93 enami int ktd_intrwakdl; /* ditto, but when interactive */
99 1.93 enami
100 1.93 enami struct file *ktd_fp; /* trace output file */
101 1.93 enami struct proc *ktd_proc; /* our kernel thread */
102 1.93 enami TAILQ_HEAD(, ktrace_entry) ktd_queue;
103 1.93 enami struct callout ktd_wakch; /* delayed wakeup */
104 1.93 enami struct simplelock ktd_slock;
105 1.93 enami };
106 1.93 enami
/*
 * File-local helpers: record construction and output.
 */
static void	ktrinitheader(struct ktr_header *, struct lwp *, int);
static void	ktrwrite(struct ktr_desc *, struct ktrace_entry *);

/*
 * File-local helpers: ktrace(2)/fktrace(2) back end.
 */
static int	ktrace_common(struct lwp *, int, int, int, struct file *);
static int	ktrops(struct lwp *, struct proc *, int, int,
		    struct ktr_desc *);
static int	ktrsetchildren(struct lwp *, struct proc *, int, int,
		    struct ktr_desc *);
static int	ktrcanset(struct lwp *, struct proc *);
static int	ktrsamefile(struct file *, struct file *);

/*
 * File-local helpers: descriptor and entry management.
 */
static struct ktr_desc *ktd_lookup(struct file *);
static void	ktdrel(struct ktr_desc *);
static void	ktdref(struct ktr_desc *);
static void	ktraddentry(struct lwp *, struct ktrace_entry *, int);
/* Flags for ktraddentry (3rd arg) */
#define	KTA_NOWAIT		0x0000
#define	KTA_WAITOK		0x0001
#define	KTA_LARGE		0x0002
static void	ktefree(struct ktrace_entry *);
static void	ktd_logerrl(struct ktr_desc *, int);
static void	ktd_logerr(struct proc *, int);
static void	ktrace_thread(void *);

131 1.93 enami /*
132 1.93 enami * Default vaules.
133 1.93 enami */
134 1.93 enami #define KTD_MAXENTRY 1000 /* XXX: tune */
135 1.93 enami #define KTD_TIMEOUT 5 /* XXX: tune */
136 1.93 enami #define KTD_DELAYQCNT 100 /* XXX: tune */
137 1.93 enami #define KTD_WAKEDELAY 5000 /* XXX: tune */
138 1.93 enami #define KTD_INTRWAKDL 100 /* XXX: tune */
139 1.93 enami
140 1.93 enami /*
141 1.93 enami * Patchable variables.
142 1.93 enami */
143 1.93 enami int ktd_maxentry = KTD_MAXENTRY; /* max # of entry in the queue */
144 1.93 enami int ktd_timeout = KTD_TIMEOUT; /* timeout in seconds */
145 1.93 enami int ktd_delayqcnt = KTD_DELAYQCNT; /* # of entry allowed to delay */
146 1.93 enami int ktd_wakedelay = KTD_WAKEDELAY; /* delay of wakeup in *ms* */
147 1.93 enami int ktd_intrwakdl = KTD_INTRWAKDL; /* ditto, but when interactive */
148 1.93 enami
149 1.93 enami static struct simplelock ktdq_slock = SIMPLELOCK_INITIALIZER;
150 1.93 enami static TAILQ_HEAD(, ktr_desc) ktdq = TAILQ_HEAD_INITIALIZER(ktdq);
151 1.93 enami
152 1.93 enami MALLOC_DEFINE(M_KTRACE, "ktrace", "ktrace data buffer");
153 1.93 enami POOL_INIT(kte_pool, sizeof(struct ktrace_entry), 0, 0, 0,
154 1.93 enami "ktepl", &pool_allocator_nointr);
155 1.93 enami
156 1.100 perry static inline void
157 1.93 enami ktd_wakeup(struct ktr_desc *ktd)
158 1.93 enami {
159 1.93 enami
160 1.93 enami callout_stop(&ktd->ktd_wakch);
161 1.93 enami wakeup(ktd);
162 1.93 enami }
163 1.93 enami
164 1.93 enami static void
165 1.93 enami ktd_logerrl(struct ktr_desc *ktd, int error)
166 1.93 enami {
167 1.93 enami
168 1.93 enami ktd->ktd_error |= error;
169 1.93 enami ktd->ktd_errcnt++;
170 1.93 enami }
171 1.93 enami
172 1.93 enami static void
173 1.93 enami ktd_logerr(struct proc *p, int error)
174 1.93 enami {
175 1.93 enami struct ktr_desc *ktd = p->p_tracep;
176 1.93 enami
177 1.93 enami if (ktd == NULL)
178 1.93 enami return;
179 1.93 enami
180 1.93 enami simple_lock(&ktd->ktd_slock);
181 1.93 enami ktd_logerrl(ktd, error);
182 1.93 enami simple_unlock(&ktd->ktd_slock);
183 1.93 enami }
184 1.93 enami
185 1.93 enami /*
186 1.93 enami * Release a reference. Called with ktd_slock held.
187 1.93 enami */
188 1.93 enami void
189 1.93 enami ktdrel(struct ktr_desc *ktd)
190 1.93 enami {
191 1.93 enami
192 1.93 enami KDASSERT(ktd->ktd_ref != 0);
193 1.93 enami KASSERT(ktd->ktd_ref > 0);
194 1.93 enami if (--ktd->ktd_ref <= 0) {
195 1.93 enami ktd->ktd_flags |= KTDF_DONE;
196 1.93 enami wakeup(ktd);
197 1.93 enami }
198 1.93 enami simple_unlock(&ktd->ktd_slock);
199 1.93 enami }
200 1.93 enami
201 1.93 enami void
202 1.93 enami ktdref(struct ktr_desc *ktd)
203 1.93 enami {
204 1.93 enami
205 1.93 enami simple_lock(&ktd->ktd_slock);
206 1.93 enami ktd->ktd_ref++;
207 1.93 enami simple_unlock(&ktd->ktd_slock);
208 1.93 enami }
209 1.93 enami
210 1.93 enami struct ktr_desc *
211 1.93 enami ktd_lookup(struct file *fp)
212 1.93 enami {
213 1.93 enami struct ktr_desc *ktd;
214 1.93 enami
215 1.93 enami simple_lock(&ktdq_slock);
216 1.93 enami for (ktd = TAILQ_FIRST(&ktdq); ktd != NULL;
217 1.93 enami ktd = TAILQ_NEXT(ktd, ktd_list)) {
218 1.93 enami simple_lock(&ktd->ktd_slock);
219 1.93 enami if (ktrsamefile(ktd->ktd_fp, fp)) {
220 1.93 enami ktd->ktd_ref++;
221 1.93 enami simple_unlock(&ktd->ktd_slock);
222 1.93 enami break;
223 1.93 enami }
224 1.93 enami simple_unlock(&ktd->ktd_slock);
225 1.93 enami }
226 1.93 enami simple_unlock(&ktdq_slock);
227 1.93 enami return (ktd);
228 1.93 enami }
229 1.93 enami
230 1.93 enami void
231 1.98 christos ktraddentry(struct lwp *l, struct ktrace_entry *kte, int flags)
232 1.93 enami {
233 1.98 christos struct proc *p = l->l_proc;
234 1.93 enami struct ktr_desc *ktd;
235 1.93 enami #ifdef DEBUG
236 1.104 kardel struct timeval t1, t2;
237 1.93 enami #endif
238 1.93 enami
239 1.93 enami if (p->p_traceflag & KTRFAC_TRC_EMUL) {
240 1.93 enami /* Add emulation trace before first entry for this process */
241 1.93 enami p->p_traceflag &= ~KTRFAC_TRC_EMUL;
242 1.98 christos ktremul(l);
243 1.93 enami }
244 1.93 enami
245 1.93 enami /*
246 1.93 enami * Tracing may be canceled while we were sleeping waiting for
247 1.93 enami * memory.
248 1.93 enami */
249 1.93 enami ktd = p->p_tracep;
250 1.93 enami if (ktd == NULL)
251 1.93 enami goto freekte;
252 1.93 enami
253 1.93 enami /*
254 1.93 enami * Bump reference count so that the object will remain while
255 1.93 enami * we are here. Note that the trace is controlled by other
256 1.93 enami * process.
257 1.93 enami */
258 1.93 enami ktdref(ktd);
259 1.93 enami
260 1.93 enami simple_lock(&ktd->ktd_slock);
261 1.93 enami if (ktd->ktd_flags & KTDF_DONE)
262 1.93 enami goto relktd;
263 1.93 enami
264 1.93 enami if (ktd->ktd_qcount > ktd_maxentry) {
265 1.93 enami ktd_logerrl(ktd, KTDE_ENOSPC);
266 1.93 enami goto relktd;
267 1.93 enami }
268 1.93 enami TAILQ_INSERT_TAIL(&ktd->ktd_queue, kte, kte_list);
269 1.93 enami ktd->ktd_qcount++;
270 1.93 enami if (ktd->ktd_flags & KTDF_BLOCKING)
271 1.93 enami goto skip_sync;
272 1.93 enami
273 1.93 enami if (flags & KTA_WAITOK &&
274 1.93 enami (/* flags & KTA_LARGE */0 || ktd->ktd_flags & KTDF_WAIT ||
275 1.93 enami ktd->ktd_qcount > ktd_maxentry >> 1))
276 1.93 enami /*
277 1.93 enami * Sync with writer thread since we're requesting rather
278 1.93 enami * big one or many requests are pending.
279 1.93 enami */
280 1.93 enami do {
281 1.93 enami ktd->ktd_flags |= KTDF_WAIT;
282 1.93 enami ktd_wakeup(ktd);
283 1.93 enami #ifdef DEBUG
284 1.104 kardel getmicrouptime(&t1);
285 1.93 enami #endif
286 1.93 enami if (ltsleep(&ktd->ktd_flags, PWAIT, "ktrsync",
287 1.93 enami ktd_timeout * hz, &ktd->ktd_slock) != 0) {
288 1.93 enami ktd->ktd_flags |= KTDF_BLOCKING;
289 1.93 enami /*
290 1.93 enami * Maybe the writer thread is blocking
291 1.93 enami * completely for some reason, but
292 1.93 enami * don't stop target process forever.
293 1.93 enami */
294 1.93 enami log(LOG_NOTICE, "ktrace timeout\n");
295 1.93 enami break;
296 1.93 enami }
297 1.93 enami #ifdef DEBUG
298 1.104 kardel getmicrouptime(&t2);
299 1.104 kardel timersub(&t2, &t1, &t2);
300 1.104 kardel if (t2.tv_sec > 0)
301 1.93 enami log(LOG_NOTICE,
302 1.93 enami "ktrace long wait: %ld.%06ld\n",
303 1.104 kardel t2.tv_sec, t2.tv_usec);
304 1.93 enami #endif
305 1.93 enami } while (p->p_tracep == ktd &&
306 1.93 enami (ktd->ktd_flags & (KTDF_WAIT | KTDF_DONE)) == KTDF_WAIT);
307 1.93 enami else {
308 1.93 enami /* Schedule delayed wakeup */
309 1.93 enami if (ktd->ktd_qcount > ktd->ktd_delayqcnt)
310 1.93 enami ktd_wakeup(ktd); /* Wakeup now */
311 1.93 enami else if (!callout_pending(&ktd->ktd_wakch))
312 1.93 enami callout_reset(&ktd->ktd_wakch,
313 1.93 enami ktd->ktd_flags & KTDF_INTERACTIVE ?
314 1.93 enami ktd->ktd_intrwakdl : ktd->ktd_wakedelay,
315 1.93 enami (void (*)(void *))wakeup, ktd);
316 1.93 enami }
317 1.93 enami
318 1.93 enami skip_sync:
319 1.93 enami ktdrel(ktd);
320 1.93 enami return;
321 1.93 enami
322 1.93 enami relktd:
323 1.93 enami ktdrel(ktd);
324 1.93 enami
325 1.93 enami freekte:
326 1.93 enami ktefree(kte);
327 1.93 enami }
328 1.93 enami
329 1.93 enami void
330 1.93 enami ktefree(struct ktrace_entry *kte)
331 1.93 enami {
332 1.93 enami
333 1.98 christos if (kte->kte_buf != NULL)
334 1.93 enami free(kte->kte_buf, M_KTRACE);
335 1.93 enami pool_put(&kte_pool, kte);
336 1.93 enami }
337 1.44 sommerfe
338 1.44 sommerfe /*
339 1.44 sommerfe * "deep" compare of two files for the purposes of clearing a trace.
340 1.44 sommerfe * Returns true if they're the same open file, or if they point at the
341 1.44 sommerfe * same underlying vnode/socket.
342 1.44 sommerfe */
343 1.44 sommerfe
344 1.44 sommerfe int
345 1.89 enami ktrsamefile(struct file *f1, struct file *f2)
346 1.44 sommerfe {
347 1.88 enami
348 1.44 sommerfe return ((f1 == f2) ||
349 1.45 sommerfe ((f1 != NULL) && (f2 != NULL) &&
350 1.45 sommerfe (f1->f_type == f2->f_type) &&
351 1.44 sommerfe (f1->f_data == f2->f_data)));
352 1.44 sommerfe }
353 1.22 christos
354 1.28 christos void
355 1.89 enami ktrderef(struct proc *p)
356 1.28 christos {
357 1.93 enami struct ktr_desc *ktd = p->p_tracep;
358 1.93 enami
359 1.42 sommerfe p->p_traceflag = 0;
360 1.93 enami if (ktd == NULL)
361 1.28 christos return;
362 1.84 dsl p->p_tracep = NULL;
363 1.84 dsl
364 1.93 enami simple_lock(&ktd->ktd_slock);
365 1.93 enami wakeup(&ktd->ktd_flags);
366 1.93 enami ktdrel(ktd);
367 1.28 christos }
368 1.28 christos
369 1.28 christos void
370 1.89 enami ktradref(struct proc *p)
371 1.28 christos {
372 1.93 enami struct ktr_desc *ktd = p->p_tracep;
373 1.28 christos
374 1.93 enami ktdref(ktd);
375 1.28 christos }
376 1.28 christos
377 1.39 thorpej void
378 1.98 christos ktrinitheader(struct ktr_header *kth, struct lwp *l, int type)
379 1.1 cgd {
380 1.98 christos struct proc *p = l->l_proc;
381 1.1 cgd
382 1.90 christos (void)memset(kth, 0, sizeof(*kth));
383 1.1 cgd kth->ktr_type = type;
384 1.1 cgd kth->ktr_pid = p->p_pid;
385 1.32 perry memcpy(kth->ktr_comm, p->p_comm, MAXCOMLEN);
386 1.98 christos
387 1.98 christos kth->ktr_version = KTRFAC_VERSION(p->p_traceflag);
388 1.98 christos
389 1.98 christos switch (KTRFAC_VERSION(p->p_traceflag)) {
390 1.98 christos case 0:
391 1.98 christos /* This is the original format */
392 1.98 christos microtime(&kth->ktr_tv);
393 1.98 christos break;
394 1.98 christos case 1:
395 1.98 christos kth->ktr_lid = l->l_lid;
396 1.98 christos nanotime(&kth->ktr_time);
397 1.98 christos break;
398 1.98 christos default:
399 1.98 christos break;
400 1.98 christos }
401 1.1 cgd }
402 1.1 cgd
403 1.93 enami void
404 1.98 christos ktrsyscall(struct lwp *l, register_t code, register_t realcode,
405 1.89 enami const struct sysent *callp, register_t args[])
406 1.1 cgd {
407 1.98 christos struct proc *p = l->l_proc;
408 1.93 enami struct ktrace_entry *kte;
409 1.93 enami struct ktr_header *kth;
410 1.72 darrenr struct ktr_syscall *ktp;
411 1.17 cgd register_t *argp;
412 1.93 enami int argsize;
413 1.57 fvdl size_t len;
414 1.60 thorpej u_int i;
415 1.57 fvdl
416 1.66 manu if (callp == NULL)
417 1.66 manu callp = p->p_emul->e_sysent;
418 1.88 enami
419 1.76 drochner argsize = callp[code].sy_argsize;
420 1.86 mrg #ifdef _LP64
421 1.86 mrg if (p->p_flag & P_32)
422 1.86 mrg argsize = argsize << 1;
423 1.86 mrg #endif
424 1.57 fvdl len = sizeof(struct ktr_syscall) + argsize;
425 1.1 cgd
426 1.9 cgd p->p_traceflag |= KTRFAC_ACTIVE;
427 1.93 enami kte = pool_get(&kte_pool, PR_WAITOK);
428 1.93 enami kth = &kte->kte_kth;
429 1.98 christos ktrinitheader(kth, l, KTR_SYSCALL);
430 1.93 enami
431 1.93 enami ktp = malloc(len, M_KTRACE, M_WAITOK);
432 1.61 manu ktp->ktr_code = realcode;
433 1.17 cgd ktp->ktr_argsize = argsize;
434 1.93 enami argp = (register_t *)(ktp + 1);
435 1.31 perry for (i = 0; i < (argsize / sizeof(*argp)); i++)
436 1.1 cgd *argp++ = args[i];
437 1.93 enami kth->ktr_len = len;
438 1.93 enami kte->kte_buf = ktp;
439 1.93 enami
440 1.98 christos ktraddentry(l, kte, KTA_WAITOK);
441 1.9 cgd p->p_traceflag &= ~KTRFAC_ACTIVE;
442 1.1 cgd }
443 1.1 cgd
444 1.93 enami void
445 1.98 christos ktrsysret(struct lwp *l, register_t code, int error, register_t *retval)
446 1.1 cgd {
447 1.98 christos struct proc *p = l->l_proc;
448 1.93 enami struct ktrace_entry *kte;
449 1.93 enami struct ktr_header *kth;
450 1.93 enami struct ktr_sysret *ktp;
451 1.1 cgd
452 1.9 cgd p->p_traceflag |= KTRFAC_ACTIVE;
453 1.93 enami kte = pool_get(&kte_pool, PR_WAITOK);
454 1.93 enami kth = &kte->kte_kth;
455 1.98 christos ktrinitheader(kth, l, KTR_SYSRET);
456 1.93 enami
457 1.93 enami ktp = malloc(sizeof(struct ktr_sysret), M_KTRACE, M_WAITOK);
458 1.93 enami ktp->ktr_code = code;
459 1.93 enami ktp->ktr_eosys = 0; /* XXX unused */
460 1.93 enami ktp->ktr_error = error;
461 1.93 enami ktp->ktr_retval = retval ? retval[0] : 0;
462 1.93 enami ktp->ktr_retval_1 = retval ? retval[1] : 0;
463 1.1 cgd
464 1.93 enami kth->ktr_len = sizeof(struct ktr_sysret);
465 1.93 enami kte->kte_buf = ktp;
466 1.1 cgd
467 1.98 christos ktraddentry(l, kte, KTA_WAITOK);
468 1.9 cgd p->p_traceflag &= ~KTRFAC_ACTIVE;
469 1.1 cgd }
470 1.1 cgd
471 1.93 enami /*
472 1.93 enami * XXX: ndp->ni_pathlen should be passed.
473 1.93 enami */
474 1.93 enami void
475 1.98 christos ktrnamei(struct lwp *l, char *path)
476 1.1 cgd {
477 1.1 cgd
478 1.98 christos ktrkmem(l, KTR_NAMEI, path, strlen(path));
479 1.18 christos }
480 1.18 christos
481 1.93 enami void
482 1.98 christos ktremul(struct lwp *l)
483 1.18 christos {
484 1.98 christos const char *emul = l->l_proc->p_emul->e_name;
485 1.1 cgd
486 1.98 christos ktrkmem(l, KTR_EMUL, emul, strlen(emul));
487 1.1 cgd }
488 1.1 cgd
489 1.93 enami void
490 1.98 christos ktrkmem(struct lwp *l, int type, const void *bf, size_t len)
491 1.75 dsl {
492 1.98 christos struct proc *p = l->l_proc;
493 1.93 enami struct ktrace_entry *kte;
494 1.93 enami struct ktr_header *kth;
495 1.75 dsl
496 1.75 dsl p->p_traceflag |= KTRFAC_ACTIVE;
497 1.93 enami kte = pool_get(&kte_pool, PR_WAITOK);
498 1.93 enami kth = &kte->kte_kth;
499 1.98 christos ktrinitheader(kth, l, type);
500 1.93 enami
501 1.93 enami kth->ktr_len = len;
502 1.93 enami kte->kte_buf = malloc(len, M_KTRACE, M_WAITOK);
503 1.97 christos memcpy(kte->kte_buf, bf, len);
504 1.75 dsl
505 1.98 christos ktraddentry(l, kte, KTA_WAITOK);
506 1.75 dsl p->p_traceflag &= ~KTRFAC_ACTIVE;
507 1.75 dsl }
508 1.75 dsl
509 1.93 enami void
510 1.98 christos ktrgenio(struct lwp *l, int fd, enum uio_rw rw, struct iovec *iov,
511 1.89 enami int len, int error)
512 1.1 cgd {
513 1.98 christos struct proc *p = l->l_proc;
514 1.93 enami struct ktrace_entry *kte;
515 1.93 enami struct ktr_header *kth;
516 1.28 christos struct ktr_genio *ktp;
517 1.98 christos int resid = len, cnt;
518 1.74 fvdl caddr_t cp;
519 1.39 thorpej int buflen;
520 1.39 thorpej
521 1.1 cgd if (error)
522 1.93 enami return;
523 1.39 thorpej
524 1.9 cgd p->p_traceflag |= KTRFAC_ACTIVE;
525 1.39 thorpej
526 1.93 enami next:
527 1.93 enami buflen = min(PAGE_SIZE, resid + sizeof(struct ktr_genio));
528 1.39 thorpej
529 1.93 enami kte = pool_get(&kte_pool, PR_WAITOK);
530 1.93 enami kth = &kte->kte_kth;
531 1.98 christos ktrinitheader(kth, l, KTR_GENIO);
532 1.93 enami
533 1.93 enami ktp = malloc(buflen, M_KTRACE, M_WAITOK);
534 1.1 cgd ktp->ktr_fd = fd;
535 1.1 cgd ktp->ktr_rw = rw;
536 1.39 thorpej
537 1.93 enami kte->kte_buf = ktp;
538 1.39 thorpej
539 1.93 enami cp = (caddr_t)(ktp + 1);
540 1.39 thorpej buflen -= sizeof(struct ktr_genio);
541 1.93 enami kth->ktr_len = sizeof(struct ktr_genio);
542 1.93 enami
543 1.93 enami while (buflen > 0) {
544 1.93 enami cnt = min(iov->iov_len, buflen);
545 1.93 enami if (copyin(iov->iov_base, cp, cnt) != 0)
546 1.93 enami goto out;
547 1.93 enami kth->ktr_len += cnt;
548 1.93 enami buflen -= cnt;
549 1.93 enami resid -= cnt;
550 1.93 enami iov->iov_len -= cnt;
551 1.93 enami if (iov->iov_len == 0)
552 1.93 enami iov++;
553 1.93 enami else
554 1.93 enami iov->iov_base = (caddr_t)iov->iov_base + cnt;
555 1.93 enami }
556 1.39 thorpej
557 1.93 enami /*
558 1.93 enami * Don't push so many entry at once. It will cause kmem map
559 1.93 enami * shortage.
560 1.93 enami */
561 1.98 christos ktraddentry(l, kte, KTA_WAITOK | KTA_LARGE);
562 1.93 enami if (resid > 0) {
563 1.67 thorpej #if 0 /* XXX NJWLWP */
564 1.46 thorpej KDASSERT(p->p_cpu != NULL);
565 1.46 thorpej KDASSERT(p->p_cpu == curcpu());
566 1.67 thorpej #endif
567 1.67 thorpej /* XXX NJWLWP */
568 1.67 thorpej if (curcpu()->ci_schedstate.spc_flags & SPCF_SHOULDYIELD)
569 1.67 thorpej preempt(1);
570 1.39 thorpej
571 1.93 enami goto next;
572 1.93 enami }
573 1.39 thorpej
574 1.93 enami p->p_traceflag &= ~KTRFAC_ACTIVE;
575 1.93 enami return;
576 1.39 thorpej
577 1.93 enami out:
578 1.93 enami ktefree(kte);
579 1.9 cgd p->p_traceflag &= ~KTRFAC_ACTIVE;
580 1.1 cgd }
581 1.1 cgd
582 1.93 enami void
583 1.98 christos ktrpsig(struct lwp *l, int sig, sig_t action, const sigset_t *mask,
584 1.89 enami const ksiginfo_t *ksi)
585 1.1 cgd {
586 1.98 christos struct proc *p = l->l_proc;
587 1.93 enami struct ktrace_entry *kte;
588 1.93 enami struct ktr_header *kth;
589 1.78 christos struct {
590 1.78 christos struct ktr_psig kp;
591 1.78 christos siginfo_t si;
592 1.93 enami } *kbuf;
593 1.1 cgd
594 1.9 cgd p->p_traceflag |= KTRFAC_ACTIVE;
595 1.93 enami kte = pool_get(&kte_pool, PR_WAITOK);
596 1.93 enami kth = &kte->kte_kth;
597 1.98 christos ktrinitheader(kth, l, KTR_PSIG);
598 1.93 enami
599 1.93 enami kbuf = malloc(sizeof(*kbuf), M_KTRACE, M_WAITOK);
600 1.93 enami kbuf->kp.signo = (char)sig;
601 1.93 enami kbuf->kp.action = action;
602 1.93 enami kbuf->kp.mask = *mask;
603 1.93 enami kte->kte_buf = kbuf;
604 1.78 christos if (ksi) {
605 1.93 enami kbuf->kp.code = KSI_TRAPCODE(ksi);
606 1.93 enami (void)memset(&kbuf->si, 0, sizeof(kbuf->si));
607 1.93 enami kbuf->si._info = ksi->ksi_info;
608 1.95 skrll kth->ktr_len = sizeof(*kbuf);
609 1.78 christos } else {
610 1.93 enami kbuf->kp.code = 0;
611 1.93 enami kth->ktr_len = sizeof(struct ktr_psig);
612 1.78 christos }
613 1.93 enami
614 1.98 christos ktraddentry(l, kte, KTA_WAITOK);
615 1.9 cgd p->p_traceflag &= ~KTRFAC_ACTIVE;
616 1.9 cgd }
617 1.9 cgd
618 1.93 enami void
619 1.98 christos ktrcsw(struct lwp *l, int out, int user)
620 1.9 cgd {
621 1.98 christos struct proc *p = l->l_proc;
622 1.93 enami struct ktrace_entry *kte;
623 1.93 enami struct ktr_header *kth;
624 1.93 enami struct ktr_csw *kc;
625 1.9 cgd
626 1.9 cgd p->p_traceflag |= KTRFAC_ACTIVE;
627 1.9 cgd
628 1.93 enami /*
629 1.93 enami * We can't sleep if we're already going to sleep (if original
630 1.93 enami * condition is met during sleep, we hang up).
631 1.93 enami */
632 1.93 enami kte = pool_get(&kte_pool, out ? PR_NOWAIT : PR_WAITOK);
633 1.93 enami if (kte == NULL) {
634 1.93 enami ktd_logerr(p, KTDE_ENOMEM);
635 1.93 enami goto out;
636 1.93 enami }
637 1.93 enami kth = &kte->kte_kth;
638 1.98 christos ktrinitheader(kth, l, KTR_CSW);
639 1.93 enami
640 1.93 enami kc = malloc(sizeof(struct ktr_csw), M_KTRACE,
641 1.93 enami out ? M_NOWAIT : M_WAITOK);
642 1.93 enami if (kc == NULL) {
643 1.93 enami ktd_logerr(p, KTDE_ENOMEM);
644 1.93 enami goto free_kte;
645 1.93 enami }
646 1.93 enami kc->out = out;
647 1.93 enami kc->user = user;
648 1.93 enami kth->ktr_len = sizeof(struct ktr_csw);
649 1.93 enami kte->kte_buf = kc;
650 1.93 enami
651 1.98 christos ktraddentry(l, kte, out ? KTA_NOWAIT : KTA_WAITOK);
652 1.93 enami p->p_traceflag &= ~KTRFAC_ACTIVE;
653 1.93 enami return;
654 1.93 enami
655 1.93 enami free_kte:
656 1.93 enami pool_put(&kte_pool, kte);
657 1.93 enami out:
658 1.9 cgd p->p_traceflag &= ~KTRFAC_ACTIVE;
659 1.1 cgd }
660 1.1 cgd
661 1.93 enami void
662 1.98 christos ktruser(struct lwp *l, const char *id, void *addr, size_t len, int ustr)
663 1.51 jdolecek {
664 1.98 christos struct proc *p = l->l_proc;
665 1.93 enami struct ktrace_entry *kte;
666 1.93 enami struct ktr_header *kth;
667 1.51 jdolecek struct ktr_user *ktp;
668 1.51 jdolecek caddr_t user_dta;
669 1.51 jdolecek
670 1.51 jdolecek p->p_traceflag |= KTRFAC_ACTIVE;
671 1.93 enami kte = pool_get(&kte_pool, PR_WAITOK);
672 1.93 enami kth = &kte->kte_kth;
673 1.98 christos ktrinitheader(kth, l, KTR_USER);
674 1.93 enami
675 1.93 enami ktp = malloc(sizeof(struct ktr_user) + len, M_KTRACE, M_WAITOK);
676 1.51 jdolecek if (ustr) {
677 1.51 jdolecek if (copyinstr(id, ktp->ktr_id, KTR_USER_MAXIDLEN, NULL) != 0)
678 1.51 jdolecek ktp->ktr_id[0] = '\0';
679 1.51 jdolecek } else
680 1.51 jdolecek strncpy(ktp->ktr_id, id, KTR_USER_MAXIDLEN);
681 1.51 jdolecek ktp->ktr_id[KTR_USER_MAXIDLEN-1] = '\0';
682 1.51 jdolecek
683 1.93 enami user_dta = (caddr_t)(ktp + 1);
684 1.93 enami if (copyin(addr, (void *)user_dta, len) != 0)
685 1.51 jdolecek len = 0;
686 1.51 jdolecek
687 1.93 enami kth->ktr_len = sizeof(struct ktr_user) + len;
688 1.93 enami kte->kte_buf = ktp;
689 1.51 jdolecek
690 1.98 christos ktraddentry(l, kte, KTA_WAITOK);
691 1.51 jdolecek p->p_traceflag &= ~KTRFAC_ACTIVE;
692 1.51 jdolecek }
693 1.51 jdolecek
694 1.93 enami void
695 1.98 christos ktrmmsg(struct lwp *l, const void *msgh, size_t size)
696 1.62 manu {
697 1.98 christos ktrkmem(l, KTR_MMSG, msgh, size);
698 1.62 manu }
699 1.83 manu
700 1.93 enami void
701 1.98 christos ktrmool(struct lwp *l, const void *kaddr, size_t size, const void *uaddr)
702 1.83 manu {
703 1.98 christos struct proc *p = l->l_proc;
704 1.93 enami struct ktrace_entry *kte;
705 1.93 enami struct ktr_header *kth;
706 1.83 manu struct ktr_mool *kp;
707 1.97 christos struct ktr_mool *bf;
708 1.83 manu
709 1.83 manu p->p_traceflag |= KTRFAC_ACTIVE;
710 1.93 enami kte = pool_get(&kte_pool, PR_WAITOK);
711 1.93 enami kth = &kte->kte_kth;
712 1.98 christos ktrinitheader(kth, l, KTR_MOOL);
713 1.83 manu
714 1.93 enami kp = malloc(size + sizeof(*kp), M_KTRACE, M_WAITOK);
715 1.83 manu kp->uaddr = uaddr;
716 1.83 manu kp->size = size;
717 1.97 christos bf = kp + 1; /* Skip uaddr and size */
718 1.97 christos (void)memcpy(bf, kaddr, size);
719 1.88 enami
720 1.93 enami kth->ktr_len = size + sizeof(*kp);
721 1.93 enami kte->kte_buf = kp;
722 1.83 manu
723 1.98 christos ktraddentry(l, kte, KTA_WAITOK);
724 1.83 manu p->p_traceflag &= ~KTRFAC_ACTIVE;
725 1.83 manu }
726 1.83 manu
727 1.98 christos void
728 1.98 christos ktrsaupcall(struct lwp *l, int type, int nevent, int nint, void *sas,
729 1.98 christos void *ap)
730 1.98 christos {
731 1.98 christos struct proc *p = l->l_proc;
732 1.98 christos struct ktrace_entry *kte;
733 1.98 christos struct ktr_header *kth;
734 1.98 christos struct ktr_saupcall *ktp;
735 1.98 christos size_t len;
736 1.98 christos struct sa_t **sapp;
737 1.98 christos int i;
738 1.98 christos
739 1.98 christos p->p_traceflag |= KTRFAC_ACTIVE;
740 1.98 christos kte = pool_get(&kte_pool, PR_WAITOK);
741 1.98 christos kth = &kte->kte_kth;
742 1.98 christos ktrinitheader(kth, l, KTR_SAUPCALL);
743 1.98 christos
744 1.98 christos len = sizeof(struct ktr_saupcall);
745 1.98 christos ktp = malloc(len + sizeof(struct sa_t) * (nevent + nint + 1), M_KTRACE,
746 1.98 christos M_WAITOK);
747 1.98 christos
748 1.98 christos ktp->ktr_type = type;
749 1.98 christos ktp->ktr_nevent = nevent;
750 1.98 christos ktp->ktr_nint = nint;
751 1.98 christos ktp->ktr_sas = sas;
752 1.98 christos ktp->ktr_ap = ap;
753 1.98 christos /*
754 1.98 christos * Copy the sa_t's
755 1.98 christos */
756 1.98 christos sapp = (struct sa_t **) sas;
757 1.98 christos
758 1.98 christos for (i = nevent + nint; i >= 0; i--) {
759 1.98 christos if (copyin(*sapp, (char *)ktp + len, sizeof(struct sa_t)) == 0)
760 1.98 christos len += sizeof(struct sa_t);
761 1.98 christos sapp++;
762 1.98 christos }
763 1.98 christos
764 1.98 christos kth->ktr_len = len;
765 1.98 christos kte->kte_buf = ktp;
766 1.98 christos
767 1.98 christos ktraddentry(l, kte, KTA_WAITOK);
768 1.98 christos p->p_traceflag &= ~KTRFAC_ACTIVE;
769 1.98 christos }
770 1.62 manu
771 1.106 manu void
772 1.106 manu ktrmib(l, name, namelen)
773 1.106 manu struct lwp *l;
774 1.106 manu const int *name;
775 1.106 manu u_int namelen;
776 1.106 manu {
777 1.106 manu struct proc *p = l->l_proc;
778 1.106 manu struct ktrace_entry *kte;
779 1.106 manu struct ktr_header *kth;
780 1.106 manu int *namep;
781 1.106 manu size_t size;
782 1.106 manu
783 1.106 manu p->p_traceflag |= KTRFAC_ACTIVE;
784 1.106 manu kte = pool_get(&kte_pool, PR_WAITOK);
785 1.106 manu kth = &kte->kte_kth;
786 1.106 manu ktrinitheader(kth, l, KTR_MIB);
787 1.106 manu
788 1.106 manu size = namelen * sizeof(*name);
789 1.106 manu namep = malloc(size, M_KTRACE, M_WAITOK);
790 1.106 manu (void)memcpy(namep, name, namelen * sizeof(*name));
791 1.106 manu
792 1.106 manu kth->ktr_len = size;
793 1.106 manu kte->kte_buf = namep;
794 1.106 manu
795 1.106 manu ktraddentry(l, kte, KTA_WAITOK);
796 1.106 manu p->p_traceflag &= ~KTRFAC_ACTIVE;
797 1.106 manu }
798 1.106 manu
799 1.1 cgd /* Interface and common routines */
800 1.1 cgd
801 1.17 cgd int
802 1.105 ad ktrace_common(struct lwp *curl, int ops, int facs, int pid, struct file *fp)
803 1.28 christos {
804 1.105 ad struct proc *curp;
805 1.93 enami struct proc *p;
806 1.93 enami struct pgrp *pg;
807 1.93 enami struct ktr_desc *ktd = NULL;
808 1.74 fvdl int ret = 0;
809 1.72 darrenr int error = 0;
810 1.42 sommerfe int descend;
811 1.28 christos
812 1.105 ad curp = curl->l_proc;
813 1.28 christos curp->p_traceflag |= KTRFAC_ACTIVE;
814 1.42 sommerfe descend = ops & KTRFLAG_DESCEND;
815 1.42 sommerfe facs = facs & ~((unsigned) KTRFAC_ROOT);
816 1.28 christos
817 1.93 enami switch (KTROP(ops)) {
818 1.93 enami
819 1.93 enami case KTROP_CLEARFILE:
820 1.93 enami /*
821 1.93 enami * Clear all uses of the tracefile
822 1.93 enami */
823 1.93 enami
824 1.93 enami ktd = ktd_lookup(fp);
825 1.93 enami if (ktd == NULL)
826 1.93 enami goto done;
827 1.93 enami
828 1.37 thorpej proclist_lock_read();
829 1.94 yamt PROCLIST_FOREACH(p, &allproc) {
830 1.93 enami if (p->p_tracep == ktd) {
831 1.105 ad if (ktrcanset(curl, p))
832 1.28 christos ktrderef(p);
833 1.28 christos else
834 1.28 christos error = EPERM;
835 1.28 christos }
836 1.28 christos }
837 1.36 thorpej proclist_unlock_read();
838 1.28 christos goto done;
839 1.42 sommerfe
840 1.93 enami case KTROP_SET:
841 1.93 enami ktd = ktd_lookup(fp);
842 1.93 enami if (ktd == NULL) {
843 1.93 enami ktd = malloc(sizeof(struct ktr_desc),
844 1.93 enami M_KTRACE, M_WAITOK);
845 1.93 enami TAILQ_INIT(&ktd->ktd_queue);
846 1.93 enami simple_lock_init(&ktd->ktd_slock);
847 1.93 enami callout_init(&ktd->ktd_wakch);
848 1.93 enami ktd->ktd_flags = ktd->ktd_qcount =
849 1.93 enami ktd->ktd_error = ktd->ktd_errcnt = 0;
850 1.93 enami ktd->ktd_ref = 1;
851 1.93 enami ktd->ktd_delayqcnt = ktd_delayqcnt;
852 1.93 enami ktd->ktd_wakedelay = mstohz(ktd_wakedelay);
853 1.93 enami ktd->ktd_intrwakdl = mstohz(ktd_intrwakdl);
854 1.93 enami /*
855 1.93 enami * XXX: not correct. needs an way to detect
856 1.93 enami * whether ktruss or ktrace.
857 1.93 enami */
858 1.93 enami if (fp->f_type == DTYPE_PIPE)
859 1.93 enami ktd->ktd_flags |= KTDF_INTERACTIVE;
860 1.93 enami
861 1.93 enami error = kthread_create1(ktrace_thread, ktd,
862 1.93 enami &ktd->ktd_proc, "ktr %p", ktd);
863 1.93 enami if (error != 0) {
864 1.93 enami free(ktd, M_KTRACE);
865 1.93 enami goto done;
866 1.93 enami }
867 1.93 enami
868 1.93 enami simple_lock(&fp->f_slock);
869 1.93 enami fp->f_count++;
870 1.93 enami simple_unlock(&fp->f_slock);
871 1.93 enami ktd->ktd_fp = fp;
872 1.93 enami
873 1.93 enami simple_lock(&ktdq_slock);
874 1.93 enami TAILQ_INSERT_TAIL(&ktdq, ktd, ktd_list);
875 1.93 enami simple_unlock(&ktdq_slock);
876 1.93 enami }
877 1.93 enami break;
878 1.42 sommerfe
879 1.93 enami case KTROP_CLEAR:
880 1.93 enami break;
881 1.43 sommerfe }
882 1.88 enami
883 1.28 christos /*
884 1.28 christos * need something to (un)trace (XXX - why is this here?)
885 1.28 christos */
886 1.28 christos if (!facs) {
887 1.28 christos error = EINVAL;
888 1.28 christos goto done;
889 1.28 christos }
890 1.93 enami
891 1.88 enami /*
892 1.28 christos * do it
893 1.28 christos */
894 1.42 sommerfe if (pid < 0) {
895 1.28 christos /*
896 1.28 christos * by process group
897 1.28 christos */
898 1.82 dsl pg = pg_find(-pid, PFIND_UNLOCK_FAIL);
899 1.28 christos if (pg == NULL) {
900 1.28 christos error = ESRCH;
901 1.28 christos goto done;
902 1.28 christos }
903 1.81 jdolecek LIST_FOREACH(p, &pg->pg_members, p_pglist) {
904 1.28 christos if (descend)
905 1.105 ad ret |= ktrsetchildren(curl, p, ops, facs, ktd);
906 1.88 enami else
907 1.105 ad ret |= ktrops(curl, p, ops, facs, ktd);
908 1.39 thorpej }
909 1.88 enami
910 1.28 christos } else {
911 1.28 christos /*
912 1.28 christos * by pid
913 1.28 christos */
914 1.82 dsl p = p_find(pid, PFIND_UNLOCK_FAIL);
915 1.28 christos if (p == NULL) {
916 1.28 christos error = ESRCH;
917 1.28 christos goto done;
918 1.28 christos }
919 1.28 christos if (descend)
920 1.105 ad ret |= ktrsetchildren(curl, p, ops, facs, ktd);
921 1.28 christos else
922 1.105 ad ret |= ktrops(curl, p, ops, facs, ktd);
923 1.28 christos }
924 1.82 dsl proclist_unlock_read(); /* taken by p{g}_find */
925 1.28 christos if (!ret)
926 1.28 christos error = EPERM;
927 1.28 christos done:
928 1.96 christos if (ktd != NULL) {
929 1.96 christos if (error != 0) {
930 1.96 christos /*
931 1.96 christos * Wakeup the thread so that it can be die if we
932 1.96 christos * can't trace any process.
933 1.96 christos */
934 1.96 christos ktd_wakeup(ktd);
935 1.96 christos }
936 1.96 christos if (KTROP(ops) == KTROP_SET || KTROP(ops) == KTROP_CLEARFILE) {
937 1.96 christos simple_lock(&ktd->ktd_slock);
938 1.96 christos ktdrel(ktd);
939 1.96 christos }
940 1.93 enami }
941 1.28 christos curp->p_traceflag &= ~KTRFAC_ACTIVE;
942 1.28 christos return (error);
943 1.28 christos }
944 1.28 christos
945 1.28 christos /*
946 1.93 enami * fktrace system call
947 1.28 christos */
948 1.28 christos /* ARGSUSED */
949 1.28 christos int
950 1.89 enami sys_fktrace(struct lwp *l, void *v, register_t *retval)
951 1.42 sommerfe {
952 1.42 sommerfe struct sys_fktrace_args /* {
953 1.42 sommerfe syscallarg(int) fd;
954 1.42 sommerfe syscallarg(int) ops;
955 1.42 sommerfe syscallarg(int) facs;
956 1.42 sommerfe syscallarg(int) pid;
957 1.42 sommerfe } */ *uap = v;
958 1.42 sommerfe struct file *fp = NULL;
959 1.98 christos struct filedesc *fdp = l->l_proc->p_fd;
960 1.70 yamt int error;
961 1.42 sommerfe
962 1.105 ad fdp = l->l_proc->p_fd;
963 1.54 thorpej if ((fp = fd_getfile(fdp, SCARG(uap, fd))) == NULL)
964 1.54 thorpej return (EBADF);
965 1.54 thorpej
966 1.70 yamt FILE_USE(fp);
967 1.70 yamt
968 1.54 thorpej if ((fp->f_flag & FWRITE) == 0)
969 1.70 yamt error = EBADF;
970 1.70 yamt else
971 1.105 ad error = ktrace_common(l, SCARG(uap, ops),
972 1.70 yamt SCARG(uap, facs), SCARG(uap, pid), fp);
973 1.70 yamt
974 1.98 christos FILE_UNUSE(fp, l);
975 1.42 sommerfe
976 1.70 yamt return error;
977 1.42 sommerfe }
978 1.42 sommerfe
979 1.42 sommerfe /*
980 1.42 sommerfe * ktrace system call
981 1.42 sommerfe */
982 1.42 sommerfe /* ARGSUSED */
983 1.42 sommerfe int
984 1.89 enami sys_ktrace(struct lwp *l, void *v, register_t *retval)
985 1.19 thorpej {
986 1.28 christos struct sys_ktrace_args /* {
987 1.24 mycroft syscallarg(const char *) fname;
988 1.13 cgd syscallarg(int) ops;
989 1.13 cgd syscallarg(int) facs;
990 1.13 cgd syscallarg(int) pid;
991 1.19 thorpej } */ *uap = v;
992 1.67 thorpej struct proc *curp = l->l_proc;
993 1.28 christos struct vnode *vp = NULL;
994 1.42 sommerfe struct file *fp = NULL;
995 1.98 christos struct nameidata nd;
996 1.74 fvdl int error = 0;
997 1.98 christos int fd;
998 1.1 cgd
999 1.9 cgd curp->p_traceflag |= KTRFAC_ACTIVE;
1000 1.102 christos if (KTROP(SCARG(uap, ops)) != KTROP_CLEAR) {
1001 1.1 cgd /*
1002 1.1 cgd * an operation which requires a file argument.
1003 1.1 cgd */
1004 1.13 cgd NDINIT(&nd, LOOKUP, FOLLOW, UIO_USERSPACE, SCARG(uap, fname),
1005 1.98 christos l);
1006 1.22 christos if ((error = vn_open(&nd, FREAD|FWRITE, 0)) != 0) {
1007 1.9 cgd curp->p_traceflag &= ~KTRFAC_ACTIVE;
1008 1.1 cgd return (error);
1009 1.9 cgd }
1010 1.1 cgd vp = nd.ni_vp;
1011 1.25 fvdl VOP_UNLOCK(vp, 0);
1012 1.1 cgd if (vp->v_type != VREG) {
1013 1.105 ad (void) vn_close(vp, FREAD|FWRITE, l->l_cred, l);
1014 1.9 cgd curp->p_traceflag &= ~KTRFAC_ACTIVE;
1015 1.1 cgd return (EACCES);
1016 1.1 cgd }
1017 1.1 cgd /*
1018 1.42 sommerfe * XXX This uses up a file descriptor slot in the
1019 1.42 sommerfe * tracing process for the duration of this syscall.
1020 1.42 sommerfe * This is not expected to be a problem. If
1021 1.42 sommerfe * falloc(NULL, ...) DTRT we could skip that part, but
1022 1.42 sommerfe * that would require changing its interface to allow
1023 1.42 sommerfe * the caller to pass in a ucred..
1024 1.42 sommerfe *
1025 1.88 enami * This will FILE_USE the fp it returns, if any.
1026 1.42 sommerfe * Keep it in use until we return.
1027 1.1 cgd */
1028 1.105 ad if ((error = falloc(l, &fp, &fd)) != 0)
1029 1.1 cgd goto done;
1030 1.88 enami
1031 1.93 enami fp->f_flag = FWRITE;
1032 1.42 sommerfe fp->f_type = DTYPE_VNODE;
1033 1.42 sommerfe fp->f_ops = &vnops;
1034 1.42 sommerfe fp->f_data = (caddr_t)vp;
1035 1.54 thorpej FILE_SET_MATURE(fp);
1036 1.42 sommerfe vp = NULL;
1037 1.42 sommerfe }
1038 1.105 ad error = ktrace_common(l, SCARG(uap, ops), SCARG(uap, facs),
1039 1.42 sommerfe SCARG(uap, pid), fp);
1040 1.88 enami done:
1041 1.1 cgd if (vp != NULL)
1042 1.105 ad (void) vn_close(vp, FWRITE, l->l_cred, l);
1043 1.42 sommerfe if (fp != NULL) {
1044 1.98 christos FILE_UNUSE(fp, l); /* release file */
1045 1.98 christos fdrelease(l, fd); /* release fd table slot */
1046 1.42 sommerfe }
1047 1.1 cgd return (error);
1048 1.1 cgd }
1049 1.1 cgd
1050 1.4 andrew int
1051 1.105 ad ktrops(struct lwp *curl, struct proc *p, int ops, int facs,
1052 1.93 enami struct ktr_desc *ktd)
1053 1.1 cgd {
1054 1.98 christos int vers = ops & KTRFAC_VER_MASK;
1055 1.98 christos
1056 1.105 ad if (!ktrcanset(curl, p))
1057 1.1 cgd return (0);
1058 1.98 christos
1059 1.98 christos switch (vers) {
1060 1.98 christos case KTRFACv0:
1061 1.98 christos case KTRFACv1:
1062 1.98 christos break;
1063 1.98 christos default:
1064 1.98 christos return EINVAL;
1065 1.98 christos }
1066 1.98 christos
1067 1.28 christos if (KTROP(ops) == KTROP_SET) {
1068 1.93 enami if (p->p_tracep != ktd) {
1069 1.1 cgd /*
1070 1.1 cgd * if trace file already in use, relinquish
1071 1.1 cgd */
1072 1.28 christos ktrderef(p);
1073 1.93 enami p->p_tracep = ktd;
1074 1.28 christos ktradref(p);
1075 1.1 cgd }
1076 1.1 cgd p->p_traceflag |= facs;
1077 1.105 ad if (kauth_cred_geteuid(curl->l_cred) == 0)
1078 1.1 cgd p->p_traceflag |= KTRFAC_ROOT;
1079 1.88 enami } else {
1080 1.1 cgd /* KTROP_CLEAR */
1081 1.1 cgd if (((p->p_traceflag &= ~facs) & KTRFAC_MASK) == 0) {
1082 1.1 cgd /* no more tracing */
1083 1.28 christos ktrderef(p);
1084 1.1 cgd }
1085 1.1 cgd }
1086 1.21 christos
1087 1.98 christos if (p->p_traceflag)
1088 1.98 christos p->p_traceflag |= vers;
1089 1.21 christos /*
1090 1.21 christos * Emit an emulation record, every time there is a ktrace
1091 1.88 enami * change/attach request.
1092 1.21 christos */
1093 1.21 christos if (KTRPOINT(p, KTR_EMUL))
1094 1.84 dsl p->p_traceflag |= KTRFAC_TRC_EMUL;
1095 1.49 martin #ifdef __HAVE_SYSCALL_INTERN
1096 1.48 mycroft (*p->p_emul->e_syscall_intern)(p);
1097 1.49 martin #endif
1098 1.1 cgd
1099 1.1 cgd return (1);
1100 1.1 cgd }
1101 1.1 cgd
1102 1.22 christos int
1103 1.105 ad ktrsetchildren(struct lwp *curl, struct proc *top, int ops, int facs,
1104 1.93 enami struct ktr_desc *ktd)
1105 1.1 cgd {
1106 1.28 christos struct proc *p;
1107 1.28 christos int ret = 0;
1108 1.1 cgd
1109 1.1 cgd p = top;
1110 1.1 cgd for (;;) {
1111 1.105 ad ret |= ktrops(curl, p, ops, facs, ktd);
1112 1.1 cgd /*
1113 1.1 cgd * If this process has children, descend to them next,
1114 1.1 cgd * otherwise do any siblings, and if done with this level,
1115 1.1 cgd * follow back up the tree (but not past top).
1116 1.1 cgd */
1117 1.82 dsl if (LIST_FIRST(&p->p_children) != NULL) {
1118 1.39 thorpej p = LIST_FIRST(&p->p_children);
1119 1.82 dsl continue;
1120 1.82 dsl }
1121 1.82 dsl for (;;) {
1122 1.1 cgd if (p == top)
1123 1.1 cgd return (ret);
1124 1.39 thorpej if (LIST_NEXT(p, p_sibling) != NULL) {
1125 1.39 thorpej p = LIST_NEXT(p, p_sibling);
1126 1.1 cgd break;
1127 1.1 cgd }
1128 1.12 mycroft p = p->p_pptr;
1129 1.1 cgd }
1130 1.1 cgd }
1131 1.1 cgd /*NOTREACHED*/
1132 1.1 cgd }
1133 1.1 cgd
1134 1.93 enami void
1135 1.93 enami ktrwrite(struct ktr_desc *ktd, struct ktrace_entry *kte)
1136 1.1 cgd {
1137 1.74 fvdl struct uio auio;
1138 1.93 enami struct iovec aiov[64], *iov;
1139 1.93 enami struct ktrace_entry *top = kte;
1140 1.93 enami struct ktr_header *kth;
1141 1.93 enami struct file *fp = ktd->ktd_fp;
1142 1.93 enami struct proc *p;
1143 1.93 enami int error;
1144 1.93 enami next:
1145 1.93 enami auio.uio_iov = iov = &aiov[0];
1146 1.1 cgd auio.uio_offset = 0;
1147 1.1 cgd auio.uio_rw = UIO_WRITE;
1148 1.93 enami auio.uio_resid = 0;
1149 1.93 enami auio.uio_iovcnt = 0;
1150 1.101 yamt UIO_SETUP_SYSSPACE(&auio);
1151 1.93 enami do {
1152 1.93 enami kth = &kte->kte_kth;
1153 1.98 christos
1154 1.98 christos if (kth->ktr_version == 0) {
1155 1.98 christos /*
1156 1.98 christos * Convert back to the old format fields
1157 1.98 christos */
1158 1.98 christos TIMESPEC_TO_TIMEVAL(&kth->ktr_tv, &kth->ktr_time);
1159 1.98 christos kth->ktr_unused = NULL;
1160 1.98 christos }
1161 1.93 enami iov->iov_base = (caddr_t)kth;
1162 1.93 enami iov++->iov_len = sizeof(struct ktr_header);
1163 1.93 enami auio.uio_resid += sizeof(struct ktr_header);
1164 1.1 cgd auio.uio_iovcnt++;
1165 1.93 enami if (kth->ktr_len > 0) {
1166 1.93 enami iov->iov_base = kte->kte_buf;
1167 1.93 enami iov++->iov_len = kth->ktr_len;
1168 1.93 enami auio.uio_resid += kth->ktr_len;
1169 1.93 enami auio.uio_iovcnt++;
1170 1.93 enami }
1171 1.93 enami } while ((kte = TAILQ_NEXT(kte, kte_list)) != NULL &&
1172 1.93 enami auio.uio_iovcnt < sizeof(aiov) / sizeof(aiov[0]) - 1);
1173 1.93 enami
1174 1.93 enami again:
1175 1.93 enami simple_lock(&fp->f_slock);
1176 1.93 enami FILE_USE(fp);
1177 1.93 enami error = (*fp->f_ops->fo_write)(fp, &fp->f_offset, &auio,
1178 1.93 enami fp->f_cred, FOF_UPDATE_OFFSET);
1179 1.93 enami FILE_UNUSE(fp, NULL);
1180 1.93 enami switch (error) {
1181 1.93 enami
1182 1.93 enami case 0:
1183 1.93 enami if (auio.uio_resid > 0)
1184 1.93 enami goto again;
1185 1.93 enami if (kte != NULL)
1186 1.93 enami goto next;
1187 1.93 enami break;
1188 1.93 enami
1189 1.93 enami case EWOULDBLOCK:
1190 1.93 enami preempt(1);
1191 1.93 enami goto again;
1192 1.93 enami
1193 1.93 enami default:
1194 1.93 enami /*
1195 1.93 enami * If error encountered, give up tracing on this
1196 1.93 enami * vnode. Don't report EPIPE as this can easily
1197 1.93 enami * happen with fktrace()/ktruss.
1198 1.93 enami */
1199 1.93 enami #ifndef DEBUG
1200 1.93 enami if (error != EPIPE)
1201 1.93 enami #endif
1202 1.93 enami log(LOG_NOTICE,
1203 1.93 enami "ktrace write failed, errno %d, tracing stopped\n",
1204 1.93 enami error);
1205 1.93 enami proclist_lock_read();
1206 1.94 yamt PROCLIST_FOREACH(p, &allproc) {
1207 1.93 enami if (p->p_tracep == ktd)
1208 1.93 enami ktrderef(p);
1209 1.93 enami }
1210 1.93 enami proclist_unlock_read();
1211 1.93 enami }
1212 1.93 enami
1213 1.93 enami while ((kte = top) != NULL) {
1214 1.93 enami top = TAILQ_NEXT(top, kte_list);
1215 1.93 enami ktefree(kte);
1216 1.93 enami }
1217 1.93 enami }
1218 1.93 enami
1219 1.93 enami void
1220 1.93 enami ktrace_thread(void *arg)
1221 1.93 enami {
1222 1.93 enami struct ktr_desc *ktd = arg;
1223 1.93 enami struct file *fp = ktd->ktd_fp;
1224 1.93 enami struct ktrace_entry *kte;
1225 1.93 enami int ktrerr, errcnt;
1226 1.93 enami
1227 1.93 enami for (;;) {
1228 1.93 enami simple_lock(&ktd->ktd_slock);
1229 1.93 enami kte = TAILQ_FIRST(&ktd->ktd_queue);
1230 1.93 enami if (kte == NULL) {
1231 1.93 enami if (ktd->ktd_flags & KTDF_WAIT) {
1232 1.93 enami ktd->ktd_flags &= ~(KTDF_WAIT | KTDF_BLOCKING);
1233 1.93 enami wakeup(&ktd->ktd_flags);
1234 1.93 enami }
1235 1.93 enami if (ktd->ktd_ref == 0)
1236 1.93 enami break;
1237 1.93 enami ltsleep(ktd, PWAIT | PNORELOCK, "ktrwait", 0,
1238 1.93 enami &ktd->ktd_slock);
1239 1.93 enami continue;
1240 1.93 enami }
1241 1.93 enami TAILQ_INIT(&ktd->ktd_queue);
1242 1.93 enami ktd->ktd_qcount = 0;
1243 1.93 enami ktrerr = ktd->ktd_error;
1244 1.93 enami errcnt = ktd->ktd_errcnt;
1245 1.93 enami ktd->ktd_error = ktd->ktd_errcnt = 0;
1246 1.93 enami simple_unlock(&ktd->ktd_slock);
1247 1.93 enami
1248 1.93 enami if (ktrerr) {
1249 1.93 enami log(LOG_NOTICE,
1250 1.93 enami "ktrace failed, fp %p, error 0x%x, total %d\n",
1251 1.93 enami fp, ktrerr, errcnt);
1252 1.93 enami }
1253 1.93 enami ktrwrite(ktd, kte);
1254 1.1 cgd }
1255 1.93 enami simple_unlock(&ktd->ktd_slock);
1256 1.93 enami
1257 1.93 enami simple_lock(&ktdq_slock);
1258 1.93 enami TAILQ_REMOVE(&ktdq, ktd, ktd_list);
1259 1.93 enami simple_unlock(&ktdq_slock);
1260 1.28 christos
1261 1.68 pk simple_lock(&fp->f_slock);
1262 1.42 sommerfe FILE_USE(fp);
1263 1.42 sommerfe
1264 1.1 cgd /*
1265 1.93 enami * ktrace file descriptor can't be watched (are not visible to
1266 1.93 enami * userspace), so no kqueue stuff here
1267 1.93 enami * XXX: The above comment is wrong, because the fktrace file
1268 1.93 enami * descriptor is available in userland.
1269 1.1 cgd */
1270 1.93 enami closef(fp, NULL);
1271 1.93 enami
1272 1.93 enami callout_stop(&ktd->ktd_wakch);
1273 1.93 enami free(ktd, M_KTRACE);
1274 1.39 thorpej
1275 1.93 enami kthread_exit(0);
1276 1.1 cgd }
1277 1.1 cgd
1278 1.1 cgd /*
1279 1.1 cgd * Return true if caller has permission to set the ktracing state
1280 1.1 cgd * of target. Essentially, the target can't possess any
1281 1.1 cgd * more permissions than the caller. KTRFAC_ROOT signifies that
1282 1.88 enami * root previously set the tracing status on the target process, and
1283 1.1 cgd * so, only root may further change it.
1284 1.1 cgd *
1285 1.1 cgd * TODO: check groups. use caller effective gid.
1286 1.1 cgd */
1287 1.22 christos int
1288 1.105 ad ktrcanset(struct lwp *calll, struct proc *targetp)
1289 1.1 cgd {
1290 1.105 ad kauth_cred_t caller = calll->l_cred;
1291 1.103 elad kauth_cred_t target = targetp->p_cred;
1292 1.1 cgd
1293 1.103 elad if ((kauth_cred_geteuid(caller) == kauth_cred_getuid(target) &&
1294 1.103 elad kauth_cred_getuid(target) == kauth_cred_getsvuid(target) &&
1295 1.103 elad kauth_cred_getgid(caller) == kauth_cred_getgid(target) && /* XXX */
1296 1.103 elad kauth_cred_getgid(target) == kauth_cred_getsvgid(target) &&
1297 1.88 enami (targetp->p_traceflag & KTRFAC_ROOT) == 0 &&
1298 1.88 enami (targetp->p_flag & P_SUGID) == 0) ||
1299 1.103 elad kauth_cred_geteuid(caller) == 0)
1300 1.1 cgd return (1);
1301 1.1 cgd
1302 1.1 cgd return (0);
1303 1.1 cgd }
1304 1.47 thorpej #endif /* KTRACE */
1305 1.51 jdolecek
1306 1.51 jdolecek /*
1307 1.51 jdolecek * Put user defined entry to ktrace records.
1308 1.51 jdolecek */
1309 1.51 jdolecek int
1310 1.89 enami sys_utrace(struct lwp *l, void *v, register_t *retval)
1311 1.51 jdolecek {
1312 1.51 jdolecek #ifdef KTRACE
1313 1.51 jdolecek struct sys_utrace_args /* {
1314 1.52 jdolecek syscallarg(const char *) label;
1315 1.51 jdolecek syscallarg(void *) addr;
1316 1.51 jdolecek syscallarg(size_t) len;
1317 1.51 jdolecek } */ *uap = v;
1318 1.67 thorpej struct proc *p = l->l_proc;
1319 1.88 enami
1320 1.51 jdolecek if (!KTRPOINT(p, KTR_USER))
1321 1.51 jdolecek return (0);
1322 1.53 jdolecek
1323 1.53 jdolecek if (SCARG(uap, len) > KTR_USER_MAXLEN)
1324 1.53 jdolecek return (EINVAL);
1325 1.51 jdolecek
1326 1.98 christos ktruser(l, SCARG(uap, label), SCARG(uap, addr), SCARG(uap, len), 1);
1327 1.51 jdolecek
1328 1.51 jdolecek return (0);
1329 1.51 jdolecek #else /* !KTRACE */
1330 1.51 jdolecek return ENOSYS;
1331 1.51 jdolecek #endif /* KTRACE */
1332 1.51 jdolecek }
1333