Home | History | Annotate | Line # | Download | only in dtrace
      1 /*	$NetBSD: dtrace_ioctl.c,v 1.7 2018/05/28 21:05:03 chs Exp $	*/
      2 
      3 /*
      4  * CDDL HEADER START
      5  *
      6  * The contents of this file are subject to the terms of the
      7  * Common Development and Distribution License (the "License").
      8  * You may not use this file except in compliance with the License.
      9  *
     10  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
     11  * or http://www.opensolaris.org/os/licensing.
     12  * See the License for the specific language governing permissions
     13  * and limitations under the License.
     14  *
     15  * When distributing Covered Code, include this CDDL HEADER in each
     16  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
     17  * If applicable, add the following below this CDDL HEADER, with the
     18  * fields enclosed by brackets "[]" replaced with your own identifying
     19  * information: Portions Copyright [yyyy] [name of copyright owner]
     20  *
     21  * CDDL HEADER END
     22  *
     23  * $FreeBSD: head/sys/cddl/dev/dtrace/dtrace_ioctl.c 313262 2017-02-05 02:39:12Z markj $
     24  *
     25  */
     26 
     /*
      * Flag tested by DTRACE_IOCTL_PRINTF(): a non-zero value makes the ioctl
      * handlers in this file print their trace messages.  It starts out as 0
      * and is registered below as a read/write (CTLFLAG_RW) integer named
      * verbose_ioctl with the description "log DTrace ioctls".
      */
     27 static int dtrace_verbose_ioctl;
     28 SYSCTL_INT(_debug_dtrace, OID_AUTO, verbose_ioctl, CTLFLAG_RW,
     29     &dtrace_verbose_ioctl, 0, "log DTrace ioctls");
     30 
     31 #define pfind(pid) proc_find((pid))
     32 
     33 #define DTRACE_IOCTL_PRINTF(fmt, ...)	if (dtrace_verbose_ioctl) printf(fmt, ## __VA_ARGS__ )
     34 
     /*
      * ioctl handler for the DTrace helper commands.
      *
      * DTRACEHIOC_ADDDOF: addr points at a dof_helper_t.  The DOF it names
      * (dofhp_dof) is copied in -- with dtrace_dof_copyin() when dofhp_pid is
      * the calling process, otherwise with the per-platform routine for
      * another process -- and handed to dtrace_helper_slurp() under
      * dtrace_lock.  A result other than -1 is stored in dofhp_gen and 0 is
      * returned; -1 is reported as EINVAL.  If no DOF could be copied in,
      * whatever the copy-in routine left in rval (initially 0) is returned.
      *
      * DTRACEHIOC_REMOVE: addr points at an int that is passed to
      * dtrace_helper_destroygen() under dtrace_lock; its result is returned.
      *
      * Any other command returns ENOTTY.
      */
     35 #ifdef __FreeBSD__
     36 static int
     37 dtrace_ioctl_helper(struct cdev *dev, u_long cmd, caddr_t addr, int flags,
     38     struct thread *td)
     39 #endif
     40 #ifdef __NetBSD__
     41 static int
     42 dtrace_ioctl_helper(dev_t dev, u_long cmd, caddr_t addr, int flags)
     43 #endif
     44 {
     45 	struct proc *p;
     46 	dof_helper_t *dhp;
     47 	dof_hdr_t *dof;
     48 	int rval;
     49 
     50 	dhp = NULL;
     51 	dof = NULL;
     52 	rval = 0;
     53 	switch (cmd) {
     54 	case DTRACEHIOC_ADDDOF:
     55 		dhp = (dof_helper_t *)addr;
        		/* From here on addr is the user address of the DOF itself. */
     56 		addr = (caddr_t)(uintptr_t)dhp->dofhp_dof;
     57 		p = curproc;
     58 		if (p->p_pid == dhp->dofhp_pid) {
     59 			dof = dtrace_dof_copyin((uintptr_t)addr, &rval);
     60 		} else {
     61 #ifdef __FreeBSD__
     62 			p = pfind(dhp->dofhp_pid);
     63 			if (p == NULL)
     64 				return (EINVAL);
        			/*
        			 * Reject the target unless P_SHOULDSTOP(p) holds,
        			 * P_TRACED is set with P_WEXIT clear, and its parent
        			 * (p_pptr) is the caller.  p is unlocked on both the
        			 * reject and accept paths, so pfind() presumably
        			 * returns it locked -- confirm.
        			 */
     65 			if (!P_SHOULDSTOP(p) ||
     66 			    (p->p_flag & (P_TRACED | P_WEXIT)) != P_TRACED ||
     67 			    p->p_pptr != curproc) {
     68 				PROC_UNLOCK(p);
     69 				return (EINVAL);
     70 			}
        			/* Paired with the PRELE(p) calls further down. */
     71 			_PHOLD(p);
     72 			PROC_UNLOCK(p);
     73 			dof = dtrace_dof_copyin_proc(p, (uintptr_t)addr, &rval);
     74 #endif
     75 #ifdef __NetBSD__
        			/*
        			 * NOTE(review): p is still curproc on this path, so
        			 * dtrace_helper_slurp() below is called with the
        			 * calling process rather than the one named by
        			 * dofhp_pid -- confirm this is intended.
        			 */
     76 			dof = dtrace_dof_copyin_pid(dhp->dofhp_pid, addr, &rval);
     77 #endif
     78 		}
     79 
        		/* Nothing was copied in: drop any hold taken above and bail. */
     80 		if (dof == NULL) {
     81 #ifdef __FreeBSD__
     82 			if (p != curproc)
     83 				PRELE(p);
     84 #endif
     85 			break;
     86 		}
     87 
     88 		mutex_enter(&dtrace_lock);
        		/* rval doubles as the slurp result and the errno to return. */
     89 		if ((rval = dtrace_helper_slurp(dof, dhp, p)) != -1) {
     90 			dhp->dofhp_gen = rval;
     91 			rval = 0;
     92 		} else {
     93 			rval = EINVAL;
     94 		}
     95 		mutex_exit(&dtrace_lock);
     96 #ifdef __FreeBSD__
     97 		if (p != curproc)
     98 			PRELE(p);
     99 #endif
    100 		break;
    101 	case DTRACEHIOC_REMOVE:
    102 		mutex_enter(&dtrace_lock);
    103 		rval = dtrace_helper_destroygen(NULL, *(int *)(uintptr_t)addr);
    104 		mutex_exit(&dtrace_lock);
    105 		break;
    106 	default:
    107 		rval = ENOTTY;
    108 		break;
    109 	}
    110 	return (rval);
    111 }
    112 
    113 /* ARGSUSED */
    114 #ifdef __FreeBSD__
    115 static int
    116 dtrace_ioctl(struct cdev *dev, u_long cmd, caddr_t addr,
    117     int flags __unused, struct thread *td)
    118 #endif
    119 #ifdef __NetBSD__
    120 static int
    121 dtrace_ioctl(struct file *fp, u_long cmd, void *addr)
    122 #endif
    123 {
    124 	dtrace_state_t *state = (dtrace_state_t *)fp->f_data;
    125 	int error = 0;
    126 
    127 	if (state == NULL)
    128 		return (EINVAL);
    129 
    130 	if (state->dts_anon) {
    131 		ASSERT(dtrace_anon.dta_state == NULL);
    132 		state = state->dts_anon;
    133 	}
    134 
    135 	switch (cmd) {
    136 	case DTRACEIOC_AGGDESC: {
    137 		dtrace_aggdesc_t **paggdesc = (dtrace_aggdesc_t **) addr;
    138 		dtrace_aggdesc_t aggdesc;
    139 		dtrace_action_t *act;
    140 		dtrace_aggregation_t *agg;
    141 		int nrecs;
    142 		uint32_t offs;
    143 		dtrace_recdesc_t *lrec;
    144 		void *buf;
    145 		size_t size;
    146 		uintptr_t dest;
    147 
    148 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_AGGDESC\n",__func__,__LINE__);
    149 
    150 		if (copyin((void *) *paggdesc, &aggdesc, sizeof (aggdesc)) != 0)
    151 			return (EFAULT);
    152 
    153 		mutex_enter(&dtrace_lock);
    154 
    155 		if ((agg = dtrace_aggid2agg(state, aggdesc.dtagd_id)) == NULL) {
    156 			mutex_exit(&dtrace_lock);
    157 			return (EINVAL);
    158 		}
    159 
    160 		aggdesc.dtagd_epid = agg->dtag_ecb->dte_epid;
    161 
    162 		nrecs = aggdesc.dtagd_nrecs;
    163 		aggdesc.dtagd_nrecs = 0;
    164 
    165 		offs = agg->dtag_base;
    166 		lrec = &agg->dtag_action.dta_rec;
    167 		aggdesc.dtagd_size = lrec->dtrd_offset + lrec->dtrd_size - offs;
    168 
    169 		for (act = agg->dtag_first; ; act = act->dta_next) {
    170 			ASSERT(act->dta_intuple ||
    171 			    DTRACEACT_ISAGG(act->dta_kind));
    172 
    173 			/*
    174 			 * If this action has a record size of zero, it
    175 			 * denotes an argument to the aggregating action.
    176 			 * Because the presence of this record doesn't (or
    177 			 * shouldn't) affect the way the data is interpreted,
    178 			 * we don't copy it out to save user-level the
    179 			 * confusion of dealing with a zero-length record.
    180 			 */
    181 			if (act->dta_rec.dtrd_size == 0) {
    182 				ASSERT(agg->dtag_hasarg);
    183 				continue;
    184 			}
    185 
    186 			aggdesc.dtagd_nrecs++;
    187 
    188 			if (act == &agg->dtag_action)
    189 				break;
    190 		}
    191 
    192 		/*
    193 		 * Now that we have the size, we need to allocate a temporary
    194 		 * buffer in which to store the complete description.  We need
    195 		 * the temporary buffer to be able to drop dtrace_lock()
    196 		 * across the copyout(), below.
    197 		 */
    198 		size = sizeof (dtrace_aggdesc_t) +
    199 		    (aggdesc.dtagd_nrecs * sizeof (dtrace_recdesc_t));
    200 
    201 		buf = kmem_alloc(size, KM_SLEEP);
    202 		dest = (uintptr_t)buf;
    203 
    204 		bcopy(&aggdesc, (void *)dest, sizeof (aggdesc));
    205 		dest += offsetof(dtrace_aggdesc_t, dtagd_rec[0]);
    206 
    207 		for (act = agg->dtag_first; ; act = act->dta_next) {
    208 			dtrace_recdesc_t rec = act->dta_rec;
    209 
    210 			/*
    211 			 * See the comment in the above loop for why we pass
    212 			 * over zero-length records.
    213 			 */
    214 			if (rec.dtrd_size == 0) {
    215 				ASSERT(agg->dtag_hasarg);
    216 				continue;
    217 			}
    218 
    219 			if (nrecs-- == 0)
    220 				break;
    221 
    222 			rec.dtrd_offset -= offs;
    223 			bcopy(&rec, (void *)dest, sizeof (rec));
    224 			dest += sizeof (dtrace_recdesc_t);
    225 
    226 			if (act == &agg->dtag_action)
    227 				break;
    228 		}
    229 
    230 		mutex_exit(&dtrace_lock);
    231 
    232 		if (copyout(buf, (void *) *paggdesc, dest - (uintptr_t)buf) != 0) {
    233 			kmem_free(buf, size);
    234 			return (EFAULT);
    235 		}
    236 
    237 		kmem_free(buf, size);
    238 		return (0);
    239 	}
    240 	case DTRACEIOC_AGGSNAP:
    241 	case DTRACEIOC_BUFSNAP: {
    242 		dtrace_bufdesc_t **pdesc = (dtrace_bufdesc_t **) addr;
    243 		dtrace_bufdesc_t desc;
    244 		caddr_t cached;
    245 		dtrace_buffer_t *buf;
    246 
    247 		dtrace_debug_output();
    248 
    249 		if (copyin((void *) *pdesc, &desc, sizeof (desc)) != 0)
    250 			return (EFAULT);
    251 
    252 		DTRACE_IOCTL_PRINTF("%s(%d): %s curcpu %d cpu %d\n",
    253 		    __func__,__LINE__,
    254 		    cmd == DTRACEIOC_AGGSNAP ?
    255 		    "DTRACEIOC_AGGSNAP":"DTRACEIOC_BUFSNAP",
    256 		    cpu_number(), desc.dtbd_cpu);
    257 
    258 		if (desc.dtbd_cpu >= ncpu)
    259 			return (ENOENT);
    260 
    261 		mutex_enter(&dtrace_lock);
    262 
    263 		if (cmd == DTRACEIOC_BUFSNAP) {
    264 			buf = &state->dts_buffer[desc.dtbd_cpu];
    265 		} else {
    266 			buf = &state->dts_aggbuffer[desc.dtbd_cpu];
    267 		}
    268 
    269 		if (buf->dtb_flags & (DTRACEBUF_RING | DTRACEBUF_FILL)) {
    270 			size_t sz = buf->dtb_offset;
    271 
    272 			if (state->dts_activity != DTRACE_ACTIVITY_STOPPED) {
    273 				mutex_exit(&dtrace_lock);
    274 				return (EBUSY);
    275 			}
    276 
    277 			/*
    278 			 * If this buffer has already been consumed, we're
    279 			 * going to indicate that there's nothing left here
    280 			 * to consume.
    281 			 */
    282 			if (buf->dtb_flags & DTRACEBUF_CONSUMED) {
    283 				mutex_exit(&dtrace_lock);
    284 
    285 				desc.dtbd_size = 0;
    286 				desc.dtbd_drops = 0;
    287 				desc.dtbd_errors = 0;
    288 				desc.dtbd_oldest = 0;
    289 				sz = sizeof (desc);
    290 
    291 				if (copyout(&desc, (void *) *pdesc, sz) != 0)
    292 					return (EFAULT);
    293 
    294 				return (0);
    295 			}
    296 
    297 			/*
    298 			 * If this is a ring buffer that has wrapped, we want
    299 			 * to copy the whole thing out.
    300 			 */
    301 			if (buf->dtb_flags & DTRACEBUF_WRAPPED) {
    302 				dtrace_buffer_polish(buf);
    303 				sz = buf->dtb_size;
    304 			}
    305 
    306 			if (copyout(buf->dtb_tomax, desc.dtbd_data, sz) != 0) {
    307 				mutex_exit(&dtrace_lock);
    308 				return (EFAULT);
    309 			}
    310 
    311 			desc.dtbd_size = sz;
    312 			desc.dtbd_drops = buf->dtb_drops;
    313 			desc.dtbd_errors = buf->dtb_errors;
    314 			desc.dtbd_oldest = buf->dtb_xamot_offset;
    315 			desc.dtbd_timestamp = dtrace_gethrtime();
    316 
    317 			mutex_exit(&dtrace_lock);
    318 
    319 			if (copyout(&desc, (void *) *pdesc, sizeof (desc)) != 0)
    320 				return (EFAULT);
    321 
    322 			buf->dtb_flags |= DTRACEBUF_CONSUMED;
    323 
    324 			return (0);
    325 		}
    326 
    327 		if (buf->dtb_tomax == NULL) {
    328 			ASSERT(buf->dtb_xamot == NULL);
    329 			mutex_exit(&dtrace_lock);
    330 			return (ENOENT);
    331 		}
    332 
    333 		cached = buf->dtb_tomax;
    334 		ASSERT(!(buf->dtb_flags & DTRACEBUF_NOSWITCH));
    335 
    336 		dtrace_xcall(desc.dtbd_cpu,
    337 		    (dtrace_xcall_t)dtrace_buffer_switch, buf);
    338 
    339 		state->dts_errors += buf->dtb_xamot_errors;
    340 
    341 		/*
    342 		 * If the buffers did not actually switch, then the cross call
    343 		 * did not take place -- presumably because the given CPU is
    344 		 * not in the ready set.  If this is the case, we'll return
    345 		 * ENOENT.
    346 		 */
    347 		if (buf->dtb_tomax == cached) {
    348 			ASSERT(buf->dtb_xamot != cached);
    349 			mutex_exit(&dtrace_lock);
    350 			return (ENOENT);
    351 		}
    352 
    353 		ASSERT(cached == buf->dtb_xamot);
    354 
    355 		DTRACE_IOCTL_PRINTF("%s(%d): copyout the buffer snapshot\n",__func__,__LINE__);
    356 
    357 		/*
    358 		 * We have our snapshot; now copy it out.
    359 		 */
    360 		if (copyout(buf->dtb_xamot, desc.dtbd_data,
    361 		    buf->dtb_xamot_offset) != 0) {
    362 			mutex_exit(&dtrace_lock);
    363 			return (EFAULT);
    364 		}
    365 
    366 		desc.dtbd_size = buf->dtb_xamot_offset;
    367 		desc.dtbd_drops = buf->dtb_xamot_drops;
    368 		desc.dtbd_errors = buf->dtb_xamot_errors;
    369 		desc.dtbd_oldest = 0;
    370 		desc.dtbd_timestamp = buf->dtb_switched;
    371 
    372 		mutex_exit(&dtrace_lock);
    373 
    374 		DTRACE_IOCTL_PRINTF("%s(%d): copyout buffer desc: size %zd drops %lu errors %lu\n",__func__,__LINE__,(size_t) desc.dtbd_size,(u_long) desc.dtbd_drops,(u_long) desc.dtbd_errors);
    375 
    376 		/*
    377 		 * Finally, copy out the buffer description.
    378 		 */
    379 		if (copyout(&desc, (void *) *pdesc, sizeof (desc)) != 0)
    380 			return (EFAULT);
    381 
    382 		return (0);
    383 	}
    384 	case DTRACEIOC_CONF: {
    385 		dtrace_conf_t conf;
    386 
    387 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_CONF\n",__func__,__LINE__);
    388 
    389 		bzero(&conf, sizeof (conf));
    390 		conf.dtc_difversion = DIF_VERSION;
    391 		conf.dtc_difintregs = DIF_DIR_NREGS;
    392 		conf.dtc_diftupregs = DIF_DTR_NREGS;
    393 		conf.dtc_ctfmodel = CTF_MODEL_NATIVE;
    394 
    395 		*((dtrace_conf_t *) addr) = conf;
    396 
    397 		return (0);
    398 	}
    399 	case DTRACEIOC_DOFGET: {
    400 		dof_hdr_t **pdof = (dof_hdr_t **) addr;
    401 		dof_hdr_t hdr, *dof = *pdof;
    402 		int rval;
    403 		uint64_t len;
    404 
    405 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_DOFGET\n",__func__,__LINE__);
    406 
    407 		if (copyin((void *)dof, &hdr, sizeof (hdr)) != 0)
    408 			return (EFAULT);
    409 
    410 		mutex_enter(&dtrace_lock);
    411 		dof = dtrace_dof_create(state);
    412 		mutex_exit(&dtrace_lock);
    413 
    414 		len = MIN(hdr.dofh_loadsz, dof->dofh_loadsz);
    415 		rval = copyout(dof, (void *) *pdof, len);
    416 		dtrace_dof_destroy(dof);
    417 
    418 		return (rval == 0 ? 0 : EFAULT);
    419 	}
    420 	case DTRACEIOC_ENABLE: {
    421 		dof_hdr_t *dof = NULL;
    422 		dtrace_enabling_t *enab = NULL;
    423 		dtrace_vstate_t *vstate;
    424 		int err = 0;
    425 		int rval;
    426 		dtrace_enable_io_t *p = (dtrace_enable_io_t *) addr;
    427 
    428 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_ENABLE\n",__func__,__LINE__);
    429 
    430 		/*
    431 		 * If a NULL argument has been passed, we take this as our
    432 		 * cue to reevaluate our enablings.
    433 		 */
    434 		if (p->dof == NULL) {
    435 			dtrace_enabling_matchall();
    436 
    437 			return (0);
    438 		}
    439 
    440 		if ((dof = dtrace_dof_copyin((uintptr_t) p->dof, &rval)) == NULL)
    441 			return (EINVAL);
    442 
    443 		mutex_enter(&cpu_lock);
    444 		mutex_enter(&dtrace_lock);
    445 		vstate = &state->dts_vstate;
    446 
    447 		if (state->dts_activity != DTRACE_ACTIVITY_INACTIVE) {
    448 			mutex_exit(&dtrace_lock);
    449 			mutex_exit(&cpu_lock);
    450 			dtrace_dof_destroy(dof);
    451 			return (EBUSY);
    452 		}
    453 
    454 		if (dtrace_dof_slurp(dof, vstate, CRED(), &enab, 0, 0,
    455 		    B_TRUE) != 0) {
    456 			mutex_exit(&dtrace_lock);
    457 			mutex_exit(&cpu_lock);
    458 			dtrace_dof_destroy(dof);
    459 			return (EINVAL);
    460 		}
    461 
    462 		if ((rval = dtrace_dof_options(dof, state)) != 0) {
    463 			dtrace_enabling_destroy(enab);
    464 			mutex_exit(&dtrace_lock);
    465 			mutex_exit(&cpu_lock);
    466 			dtrace_dof_destroy(dof);
    467 			return (rval);
    468 		}
    469 
    470 		if ((err = dtrace_enabling_match(enab, &p->n_matched)) == 0) {
    471 			err = dtrace_enabling_retain(enab);
    472 		} else {
    473 			dtrace_enabling_destroy(enab);
    474 		}
    475 
    476 		mutex_exit(&cpu_lock);
    477 		mutex_exit(&dtrace_lock);
    478 		dtrace_dof_destroy(dof);
    479 
    480 		return (err);
    481 	}
    482 	case DTRACEIOC_EPROBE: {
    483 		dtrace_eprobedesc_t **pepdesc = (dtrace_eprobedesc_t **) addr;
    484 		dtrace_eprobedesc_t epdesc;
    485 		dtrace_ecb_t *ecb;
    486 		dtrace_action_t *act;
    487 		void *buf;
    488 		size_t size;
    489 		uintptr_t dest;
    490 		int nrecs;
    491 
    492 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_EPROBE\n",__func__,__LINE__);
    493 
    494 		if (copyin((void *)*pepdesc, &epdesc, sizeof (epdesc)) != 0)
    495 			return (EFAULT);
    496 
    497 		mutex_enter(&dtrace_lock);
    498 
    499 		if ((ecb = dtrace_epid2ecb(state, epdesc.dtepd_epid)) == NULL) {
    500 			mutex_exit(&dtrace_lock);
    501 			return (EINVAL);
    502 		}
    503 
    504 		if (ecb->dte_probe == NULL) {
    505 			mutex_exit(&dtrace_lock);
    506 			return (EINVAL);
    507 		}
    508 
    509 		epdesc.dtepd_probeid = ecb->dte_probe->dtpr_id;
    510 		epdesc.dtepd_uarg = ecb->dte_uarg;
    511 		epdesc.dtepd_size = ecb->dte_size;
    512 
    513 		nrecs = epdesc.dtepd_nrecs;
    514 		epdesc.dtepd_nrecs = 0;
    515 		for (act = ecb->dte_action; act != NULL; act = act->dta_next) {
    516 			if (DTRACEACT_ISAGG(act->dta_kind) || act->dta_intuple)
    517 				continue;
    518 
    519 			epdesc.dtepd_nrecs++;
    520 		}
    521 
    522 		/*
    523 		 * Now that we have the size, we need to allocate a temporary
    524 		 * buffer in which to store the complete description.  We need
    525 		 * the temporary buffer to be able to drop dtrace_lock()
    526 		 * across the copyout(), below.
    527 		 */
    528 		size = sizeof (dtrace_eprobedesc_t) +
    529 		    (epdesc.dtepd_nrecs * sizeof (dtrace_recdesc_t));
    530 
    531 		buf = kmem_alloc(size, KM_SLEEP);
    532 		dest = (uintptr_t)buf;
    533 
    534 		bcopy(&epdesc, (void *)dest, sizeof (epdesc));
    535 		dest += offsetof(dtrace_eprobedesc_t, dtepd_rec[0]);
    536 
    537 		for (act = ecb->dte_action; act != NULL; act = act->dta_next) {
    538 			if (DTRACEACT_ISAGG(act->dta_kind) || act->dta_intuple)
    539 				continue;
    540 
    541 			if (nrecs-- == 0)
    542 				break;
    543 
    544 			bcopy(&act->dta_rec, (void *)dest,
    545 			    sizeof (dtrace_recdesc_t));
    546 			dest += sizeof (dtrace_recdesc_t);
    547 		}
    548 
    549 		mutex_exit(&dtrace_lock);
    550 
    551 		if (copyout(buf, (void *) *pepdesc, dest - (uintptr_t)buf) != 0) {
    552 			kmem_free(buf, size);
    553 			return (EFAULT);
    554 		}
    555 
    556 		kmem_free(buf, size);
    557 		return (0);
    558 	}
    559 	case DTRACEIOC_FORMAT: {
    560 		dtrace_fmtdesc_t *fmt = (dtrace_fmtdesc_t *) addr;
    561 		char *str;
    562 		int len;
    563 
    564 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_FORMAT\n",__func__,__LINE__);
    565 
    566 		mutex_enter(&dtrace_lock);
    567 
    568 		if (fmt->dtfd_format == 0 ||
    569 		    fmt->dtfd_format > state->dts_nformats) {
    570 			mutex_exit(&dtrace_lock);
    571 			return (EINVAL);
    572 		}
    573 
    574 		/*
    575 		 * Format strings are allocated contiguously and they are
    576 		 * never freed; if a format index is less than the number
    577 		 * of formats, we can assert that the format map is non-NULL
    578 		 * and that the format for the specified index is non-NULL.
    579 		 */
    580 		ASSERT(state->dts_formats != NULL);
    581 		str = state->dts_formats[fmt->dtfd_format - 1];
    582 		ASSERT(str != NULL);
    583 
    584 		len = strlen(str) + 1;
    585 
    586 		if (len > fmt->dtfd_length) {
    587 			fmt->dtfd_length = len;
    588 		} else {
    589 			if (copyout(str, fmt->dtfd_string, len) != 0) {
    590 				mutex_exit(&dtrace_lock);
    591 				return (EINVAL);
    592 			}
    593 		}
    594 
    595 		mutex_exit(&dtrace_lock);
    596 		return (0);
    597 	}
    598 	case DTRACEIOC_GO: {
    599 		int rval;
    600 		processorid_t *cpuid = (processorid_t *) addr;
    601 
    602 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_GO\n",__func__,__LINE__);
    603 
    604 		rval = dtrace_state_go(state, cpuid);
    605 
    606 		return (rval);
    607 	}
    608 	case DTRACEIOC_PROBEARG: {
    609 		dtrace_argdesc_t *desc = (dtrace_argdesc_t *) addr;
    610 		dtrace_probe_t *probe;
    611 		dtrace_provider_t *prov;
    612 
    613 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_PROBEARG\n",__func__,__LINE__);
    614 
    615 		if (desc->dtargd_id == DTRACE_IDNONE)
    616 			return (EINVAL);
    617 
    618 		if (desc->dtargd_ndx == DTRACE_ARGNONE)
    619 			return (EINVAL);
    620 
    621 		mutex_enter(&dtrace_provider_lock);
    622 #ifdef illumos
    623 		mutex_enter(&mod_lock);
    624 #endif
    625 		mutex_enter(&dtrace_lock);
    626 
    627 		if (desc->dtargd_id > dtrace_nprobes) {
    628 			mutex_exit(&dtrace_lock);
    629 #ifdef illumos
    630 			mutex_exit(&mod_lock);
    631 #endif
    632 			mutex_exit(&dtrace_provider_lock);
    633 			return (EINVAL);
    634 		}
    635 
    636 		if ((probe = dtrace_probes[desc->dtargd_id - 1]) == NULL) {
    637 			mutex_exit(&dtrace_lock);
    638 #ifdef illumos
    639 			mutex_exit(&mod_lock);
    640 #endif
    641 			mutex_exit(&dtrace_provider_lock);
    642 			return (EINVAL);
    643 		}
    644 
    645 		mutex_exit(&dtrace_lock);
    646 
    647 		prov = probe->dtpr_provider;
    648 
    649 		if (prov->dtpv_pops.dtps_getargdesc == NULL) {
    650 			/*
    651 			 * There isn't any typed information for this probe.
    652 			 * Set the argument number to DTRACE_ARGNONE.
    653 			 */
    654 			desc->dtargd_ndx = DTRACE_ARGNONE;
    655 		} else {
    656 			desc->dtargd_native[0] = '\0';
    657 			desc->dtargd_xlate[0] = '\0';
    658 			desc->dtargd_mapping = desc->dtargd_ndx;
    659 
    660 			prov->dtpv_pops.dtps_getargdesc(prov->dtpv_arg,
    661 			    probe->dtpr_id, probe->dtpr_arg, desc);
    662 		}
    663 
    664 #ifdef illumos
    665 		mutex_exit(&mod_lock);
    666 #endif
    667 		mutex_exit(&dtrace_provider_lock);
    668 
    669 		return (0);
    670 	}
    671 	case DTRACEIOC_PROBEMATCH:
    672 	case DTRACEIOC_PROBES: {
    673 		dtrace_probedesc_t *p_desc = (dtrace_probedesc_t *) addr;
    674 		dtrace_probe_t *probe = NULL;
    675 		dtrace_probekey_t pkey;
    676 		dtrace_id_t i;
    677 		int m = 0;
    678 		uint32_t priv = 0;
    679 		uid_t uid = 0;
    680 		zoneid_t zoneid = 0;
    681 
    682 		DTRACE_IOCTL_PRINTF("%s(%d): %s\n",__func__,__LINE__,
    683 		    cmd == DTRACEIOC_PROBEMATCH ?
    684 		    "DTRACEIOC_PROBEMATCH":"DTRACEIOC_PROBES");
    685 
    686 		p_desc->dtpd_provider[DTRACE_PROVNAMELEN - 1] = '\0';
    687 		p_desc->dtpd_mod[DTRACE_MODNAMELEN - 1] = '\0';
    688 		p_desc->dtpd_func[DTRACE_FUNCNAMELEN - 1] = '\0';
    689 		p_desc->dtpd_name[DTRACE_NAMELEN - 1] = '\0';
    690 
    691 		/*
    692 		 * Before we attempt to match this probe, we want to give
    693 		 * all providers the opportunity to provide it.
    694 		 */
    695 		if (p_desc->dtpd_id == DTRACE_IDNONE) {
    696 			mutex_enter(&dtrace_provider_lock);
    697 			dtrace_probe_provide(p_desc, NULL);
    698 			mutex_exit(&dtrace_provider_lock);
    699 			p_desc->dtpd_id++;
    700 		}
    701 
    702 		if (cmd == DTRACEIOC_PROBEMATCH)  {
    703 			dtrace_probekey(p_desc, &pkey);
    704 			pkey.dtpk_id = DTRACE_IDNONE;
    705 		}
    706 
    707 		dtrace_cred2priv(curlwp->l_cred, &priv, &uid, &zoneid);
    708 
    709 		mutex_enter(&dtrace_lock);
    710 
    711 		if (cmd == DTRACEIOC_PROBEMATCH) {
    712 			for (i = p_desc->dtpd_id; i <= dtrace_nprobes; i++) {
    713 				if ((probe = dtrace_probes[i - 1]) != NULL &&
    714 				    (m = dtrace_match_probe(probe, &pkey,
    715 				    priv, uid, zoneid)) != 0)
    716 					break;
    717 			}
    718 
    719 			if (m < 0) {
    720 				mutex_exit(&dtrace_lock);
    721 				return (EINVAL);
    722 			}
    723 
    724 		} else {
    725 			for (i = p_desc->dtpd_id; i <= dtrace_nprobes; i++) {
    726 				if ((probe = dtrace_probes[i - 1]) != NULL &&
    727 				    dtrace_match_priv(probe, priv, uid, zoneid))
    728 					break;
    729 			}
    730 		}
    731 
    732 		if (probe == NULL) {
    733 			mutex_exit(&dtrace_lock);
    734 			return (ESRCH);
    735 		}
    736 
    737 		dtrace_probe_description(probe, p_desc);
    738 		mutex_exit(&dtrace_lock);
    739 
    740 		return (0);
    741 	}
    742 	case DTRACEIOC_PROVIDER: {
    743 		dtrace_providerdesc_t *pvd = (dtrace_providerdesc_t *) addr;
    744 		dtrace_provider_t *pvp;
    745 
    746 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_PROVIDER\n",__func__,__LINE__);
    747 
    748 		pvd->dtvd_name[DTRACE_PROVNAMELEN - 1] = '\0';
    749 		error = 0;
    750 again:
    751 		mutex_enter(&dtrace_provider_lock);
    752 
    753 		for (pvp = dtrace_provider; pvp != NULL; pvp = pvp->dtpv_next) {
    754 			if (strcmp(pvp->dtpv_name, pvd->dtvd_name) == 0)
    755 				break;
    756 		}
    757 
    758 		mutex_exit(&dtrace_provider_lock);
    759 
    760 		if (pvp == NULL && error == 0) {
    761 			char name[NAME_MAX];
    762 			const char *provider;
    763 			if (strcmp(pvd->dtvd_name, "proc") == 0)
    764 				provider = "sdt";
    765 			else
    766 				provider = pvd->dtvd_name;
    767 
    768 			if (snprintf(name, sizeof name, "dtrace_%s",
    769 			    provider) < sizeof name) {
    770 				error = module_autoload(name,
    771 				    MODULE_CLASS_MISC);
    772 				if (error == 0)
    773 					goto again;
    774 			}
    775 		}
    776 
    777 		if (pvp == NULL)
    778 			return (ESRCH);
    779 
    780 		bcopy(&pvp->dtpv_priv, &pvd->dtvd_priv, sizeof (dtrace_ppriv_t));
    781 		bcopy(&pvp->dtpv_attr, &pvd->dtvd_attr, sizeof (dtrace_pattr_t));
    782 
    783 		return (0);
    784 	}
    785 	case DTRACEIOC_REPLICATE: {
    786 		dtrace_repldesc_t *desc = (dtrace_repldesc_t *) addr;
    787 		dtrace_probedesc_t *match = &desc->dtrpd_match;
    788 		dtrace_probedesc_t *create = &desc->dtrpd_create;
    789 		int err;
    790 
    791 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_REPLICATE\n",__func__,__LINE__);
    792 
    793 		match->dtpd_provider[DTRACE_PROVNAMELEN - 1] = '\0';
    794 		match->dtpd_mod[DTRACE_MODNAMELEN - 1] = '\0';
    795 		match->dtpd_func[DTRACE_FUNCNAMELEN - 1] = '\0';
    796 		match->dtpd_name[DTRACE_NAMELEN - 1] = '\0';
    797 
    798 		create->dtpd_provider[DTRACE_PROVNAMELEN - 1] = '\0';
    799 		create->dtpd_mod[DTRACE_MODNAMELEN - 1] = '\0';
    800 		create->dtpd_func[DTRACE_FUNCNAMELEN - 1] = '\0';
    801 		create->dtpd_name[DTRACE_NAMELEN - 1] = '\0';
    802 
    803 		mutex_enter(&dtrace_lock);
    804 		err = dtrace_enabling_replicate(state, match, create);
    805 		mutex_exit(&dtrace_lock);
    806 
    807 		return (err);
    808 	}
    809 	case DTRACEIOC_STATUS: {
    810 		dtrace_status_t *stat = (dtrace_status_t *) addr;
    811 		dtrace_dstate_t *dstate;
    812 		int i, j;
    813 		uint64_t nerrs;
    814 		CPU_INFO_ITERATOR cpuind;
    815 		struct cpu_info *cinfo;
    816 
    817 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_STATUS\n",__func__,__LINE__);
    818 
    819 		/*
    820 		 * See the comment in dtrace_state_deadman() for the reason
    821 		 * for setting dts_laststatus to INT64_MAX before setting
    822 		 * it to the correct value.
    823 		 */
    824 		state->dts_laststatus = INT64_MAX;
    825 		dtrace_membar_producer();
    826 		state->dts_laststatus = dtrace_gethrtime();
    827 
    828 		bzero(stat, sizeof (*stat));
    829 
    830 		mutex_enter(&dtrace_lock);
    831 
    832 		if (state->dts_activity == DTRACE_ACTIVITY_INACTIVE) {
    833 			mutex_exit(&dtrace_lock);
    834 			return (ENOENT);
    835 		}
    836 
    837 		if (state->dts_activity == DTRACE_ACTIVITY_DRAINING)
    838 			stat->dtst_exiting = 1;
    839 
    840 		nerrs = state->dts_errors;
    841 		dstate = &state->dts_vstate.dtvs_dynvars;
    842 
    843 		for (CPU_INFO_FOREACH(cpuind, cinfo)) {
    844 		    	i = cpu_index(cinfo);
    845 
    846 			dtrace_dstate_percpu_t *dcpu = &dstate->dtds_percpu[i];
    847 
    848 			stat->dtst_dyndrops += dcpu->dtdsc_drops;
    849 			stat->dtst_dyndrops_dirty += dcpu->dtdsc_dirty_drops;
    850 			stat->dtst_dyndrops_rinsing += dcpu->dtdsc_rinsing_drops;
    851 
    852 			if (state->dts_buffer[i].dtb_flags & DTRACEBUF_FULL)
    853 				stat->dtst_filled++;
    854 
    855 			nerrs += state->dts_buffer[i].dtb_errors;
    856 
    857 			for (j = 0; j < state->dts_nspeculations; j++) {
    858 				dtrace_speculation_t *spec;
    859 				dtrace_buffer_t *buf;
    860 
    861 				spec = &state->dts_speculations[j];
    862 				buf = &spec->dtsp_buffer[i];
    863 				stat->dtst_specdrops += buf->dtb_xamot_drops;
    864 			}
    865 		}
    866 
    867 		stat->dtst_specdrops_busy = state->dts_speculations_busy;
    868 		stat->dtst_specdrops_unavail = state->dts_speculations_unavail;
    869 		stat->dtst_stkstroverflows = state->dts_stkstroverflows;
    870 		stat->dtst_dblerrors = state->dts_dblerrors;
    871 		stat->dtst_killed =
    872 		    (state->dts_activity == DTRACE_ACTIVITY_KILLED);
    873 		stat->dtst_errors = nerrs;
    874 
    875 		mutex_exit(&dtrace_lock);
    876 
    877 		return (0);
    878 	}
    879 	case DTRACEIOC_STOP: {
    880 		int rval;
    881 		processorid_t *cpuid = (processorid_t *) addr;
    882 
    883 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_STOP\n",__func__,__LINE__);
    884 
    885 		mutex_enter(&dtrace_lock);
    886 		rval = dtrace_state_stop(state, cpuid);
    887 		mutex_exit(&dtrace_lock);
    888 
    889 		return (rval);
    890 	}
    891 	default:
    892 		error = ENOTTY;
    893 	}
    894 	return (error);
    895 }
    896