xref: /netbsd-src/external/cddl/osnet/dev/dtrace/dtrace_ioctl.c (revision ba2539a9805a0544ff82c0003cc02fe1eee5603d)
1 /*	$NetBSD: dtrace_ioctl.c,v 1.7 2018/05/28 21:05:03 chs Exp $	*/
2 
3 /*
4  * CDDL HEADER START
5  *
6  * The contents of this file are subject to the terms of the
7  * Common Development and Distribution License (the "License").
8  * You may not use this file except in compliance with the License.
9  *
10  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
11  * or http://www.opensolaris.org/os/licensing.
12  * See the License for the specific language governing permissions
13  * and limitations under the License.
14  *
15  * When distributing Covered Code, include this CDDL HEADER in each
16  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
17  * If applicable, add the following below this CDDL HEADER, with the
18  * fields enclosed by brackets "[]" replaced with your own identifying
19  * information: Portions Copyright [yyyy] [name of copyright owner]
20  *
21  * CDDL HEADER END
22  *
23  * $FreeBSD: head/sys/cddl/dev/dtrace/dtrace_ioctl.c 313262 2017-02-05 02:39:12Z markj $
24  *
25  */
26 
27 static int dtrace_verbose_ioctl;
28 SYSCTL_INT(_debug_dtrace, OID_AUTO, verbose_ioctl, CTLFLAG_RW,
29     &dtrace_verbose_ioctl, 0, "log DTrace ioctls");
30 
31 #define pfind(pid) proc_find((pid))
32 
33 #define DTRACE_IOCTL_PRINTF(fmt, ...)	if (dtrace_verbose_ioctl) printf(fmt, ## __VA_ARGS__ )
34 
35 #ifdef __FreeBSD__
36 static int
dtrace_ioctl_helper(struct cdev * dev,u_long cmd,caddr_t addr,int flags,struct thread * td)37 dtrace_ioctl_helper(struct cdev *dev, u_long cmd, caddr_t addr, int flags,
38     struct thread *td)
39 #endif
40 #ifdef __NetBSD__
41 static int
42 dtrace_ioctl_helper(dev_t dev, u_long cmd, caddr_t addr, int flags)
43 #endif
44 {
45 	struct proc *p;
46 	dof_helper_t *dhp;
47 	dof_hdr_t *dof;
48 	int rval;
49 
50 	dhp = NULL;
51 	dof = NULL;
52 	rval = 0;
53 	switch (cmd) {
54 	case DTRACEHIOC_ADDDOF:
55 		dhp = (dof_helper_t *)addr;
56 		addr = (caddr_t)(uintptr_t)dhp->dofhp_dof;
57 		p = curproc;
58 		if (p->p_pid == dhp->dofhp_pid) {
59 			dof = dtrace_dof_copyin((uintptr_t)addr, &rval);
60 		} else {
61 #ifdef __FreeBSD__
62 			p = pfind(dhp->dofhp_pid);
63 			if (p == NULL)
64 				return (EINVAL);
65 			if (!P_SHOULDSTOP(p) ||
66 			    (p->p_flag & (P_TRACED | P_WEXIT)) != P_TRACED ||
67 			    p->p_pptr != curproc) {
68 				PROC_UNLOCK(p);
69 				return (EINVAL);
70 			}
71 			_PHOLD(p);
72 			PROC_UNLOCK(p);
73 			dof = dtrace_dof_copyin_proc(p, (uintptr_t)addr, &rval);
74 #endif
75 #ifdef __NetBSD__
76 			dof = dtrace_dof_copyin_pid(dhp->dofhp_pid, addr, &rval);
77 #endif
78 		}
79 
80 		if (dof == NULL) {
81 #ifdef __FreeBSD__
82 			if (p != curproc)
83 				PRELE(p);
84 #endif
85 			break;
86 		}
87 
88 		mutex_enter(&dtrace_lock);
89 		if ((rval = dtrace_helper_slurp(dof, dhp, p)) != -1) {
90 			dhp->dofhp_gen = rval;
91 			rval = 0;
92 		} else {
93 			rval = EINVAL;
94 		}
95 		mutex_exit(&dtrace_lock);
96 #ifdef __FreeBSD__
97 		if (p != curproc)
98 			PRELE(p);
99 #endif
100 		break;
101 	case DTRACEHIOC_REMOVE:
102 		mutex_enter(&dtrace_lock);
103 		rval = dtrace_helper_destroygen(NULL, *(int *)(uintptr_t)addr);
104 		mutex_exit(&dtrace_lock);
105 		break;
106 	default:
107 		rval = ENOTTY;
108 		break;
109 	}
110 	return (rval);
111 }
112 
113 /* ARGSUSED */
114 #ifdef __FreeBSD__
115 static int
dtrace_ioctl(struct cdev * dev,u_long cmd,caddr_t addr,int flags __unused,struct thread * td)116 dtrace_ioctl(struct cdev *dev, u_long cmd, caddr_t addr,
117     int flags __unused, struct thread *td)
118 #endif
119 #ifdef __NetBSD__
120 static int
121 dtrace_ioctl(struct file *fp, u_long cmd, void *addr)
122 #endif
123 {
124 	dtrace_state_t *state = (dtrace_state_t *)fp->f_data;
125 	int error = 0;
126 
127 	if (state == NULL)
128 		return (EINVAL);
129 
130 	if (state->dts_anon) {
131 		ASSERT(dtrace_anon.dta_state == NULL);
132 		state = state->dts_anon;
133 	}
134 
135 	switch (cmd) {
136 	case DTRACEIOC_AGGDESC: {
137 		dtrace_aggdesc_t **paggdesc = (dtrace_aggdesc_t **) addr;
138 		dtrace_aggdesc_t aggdesc;
139 		dtrace_action_t *act;
140 		dtrace_aggregation_t *agg;
141 		int nrecs;
142 		uint32_t offs;
143 		dtrace_recdesc_t *lrec;
144 		void *buf;
145 		size_t size;
146 		uintptr_t dest;
147 
148 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_AGGDESC\n",__func__,__LINE__);
149 
150 		if (copyin((void *) *paggdesc, &aggdesc, sizeof (aggdesc)) != 0)
151 			return (EFAULT);
152 
153 		mutex_enter(&dtrace_lock);
154 
155 		if ((agg = dtrace_aggid2agg(state, aggdesc.dtagd_id)) == NULL) {
156 			mutex_exit(&dtrace_lock);
157 			return (EINVAL);
158 		}
159 
160 		aggdesc.dtagd_epid = agg->dtag_ecb->dte_epid;
161 
162 		nrecs = aggdesc.dtagd_nrecs;
163 		aggdesc.dtagd_nrecs = 0;
164 
165 		offs = agg->dtag_base;
166 		lrec = &agg->dtag_action.dta_rec;
167 		aggdesc.dtagd_size = lrec->dtrd_offset + lrec->dtrd_size - offs;
168 
169 		for (act = agg->dtag_first; ; act = act->dta_next) {
170 			ASSERT(act->dta_intuple ||
171 			    DTRACEACT_ISAGG(act->dta_kind));
172 
173 			/*
174 			 * If this action has a record size of zero, it
175 			 * denotes an argument to the aggregating action.
176 			 * Because the presence of this record doesn't (or
177 			 * shouldn't) affect the way the data is interpreted,
178 			 * we don't copy it out to save user-level the
179 			 * confusion of dealing with a zero-length record.
180 			 */
181 			if (act->dta_rec.dtrd_size == 0) {
182 				ASSERT(agg->dtag_hasarg);
183 				continue;
184 			}
185 
186 			aggdesc.dtagd_nrecs++;
187 
188 			if (act == &agg->dtag_action)
189 				break;
190 		}
191 
192 		/*
193 		 * Now that we have the size, we need to allocate a temporary
194 		 * buffer in which to store the complete description.  We need
195 		 * the temporary buffer to be able to drop dtrace_lock()
196 		 * across the copyout(), below.
197 		 */
198 		size = sizeof (dtrace_aggdesc_t) +
199 		    (aggdesc.dtagd_nrecs * sizeof (dtrace_recdesc_t));
200 
201 		buf = kmem_alloc(size, KM_SLEEP);
202 		dest = (uintptr_t)buf;
203 
204 		bcopy(&aggdesc, (void *)dest, sizeof (aggdesc));
205 		dest += offsetof(dtrace_aggdesc_t, dtagd_rec[0]);
206 
207 		for (act = agg->dtag_first; ; act = act->dta_next) {
208 			dtrace_recdesc_t rec = act->dta_rec;
209 
210 			/*
211 			 * See the comment in the above loop for why we pass
212 			 * over zero-length records.
213 			 */
214 			if (rec.dtrd_size == 0) {
215 				ASSERT(agg->dtag_hasarg);
216 				continue;
217 			}
218 
219 			if (nrecs-- == 0)
220 				break;
221 
222 			rec.dtrd_offset -= offs;
223 			bcopy(&rec, (void *)dest, sizeof (rec));
224 			dest += sizeof (dtrace_recdesc_t);
225 
226 			if (act == &agg->dtag_action)
227 				break;
228 		}
229 
230 		mutex_exit(&dtrace_lock);
231 
232 		if (copyout(buf, (void *) *paggdesc, dest - (uintptr_t)buf) != 0) {
233 			kmem_free(buf, size);
234 			return (EFAULT);
235 		}
236 
237 		kmem_free(buf, size);
238 		return (0);
239 	}
240 	case DTRACEIOC_AGGSNAP:
241 	case DTRACEIOC_BUFSNAP: {
242 		dtrace_bufdesc_t **pdesc = (dtrace_bufdesc_t **) addr;
243 		dtrace_bufdesc_t desc;
244 		caddr_t cached;
245 		dtrace_buffer_t *buf;
246 
247 		dtrace_debug_output();
248 
249 		if (copyin((void *) *pdesc, &desc, sizeof (desc)) != 0)
250 			return (EFAULT);
251 
252 		DTRACE_IOCTL_PRINTF("%s(%d): %s curcpu %d cpu %d\n",
253 		    __func__,__LINE__,
254 		    cmd == DTRACEIOC_AGGSNAP ?
255 		    "DTRACEIOC_AGGSNAP":"DTRACEIOC_BUFSNAP",
256 		    cpu_number(), desc.dtbd_cpu);
257 
258 		if (desc.dtbd_cpu >= ncpu)
259 			return (ENOENT);
260 
261 		mutex_enter(&dtrace_lock);
262 
263 		if (cmd == DTRACEIOC_BUFSNAP) {
264 			buf = &state->dts_buffer[desc.dtbd_cpu];
265 		} else {
266 			buf = &state->dts_aggbuffer[desc.dtbd_cpu];
267 		}
268 
269 		if (buf->dtb_flags & (DTRACEBUF_RING | DTRACEBUF_FILL)) {
270 			size_t sz = buf->dtb_offset;
271 
272 			if (state->dts_activity != DTRACE_ACTIVITY_STOPPED) {
273 				mutex_exit(&dtrace_lock);
274 				return (EBUSY);
275 			}
276 
277 			/*
278 			 * If this buffer has already been consumed, we're
279 			 * going to indicate that there's nothing left here
280 			 * to consume.
281 			 */
282 			if (buf->dtb_flags & DTRACEBUF_CONSUMED) {
283 				mutex_exit(&dtrace_lock);
284 
285 				desc.dtbd_size = 0;
286 				desc.dtbd_drops = 0;
287 				desc.dtbd_errors = 0;
288 				desc.dtbd_oldest = 0;
289 				sz = sizeof (desc);
290 
291 				if (copyout(&desc, (void *) *pdesc, sz) != 0)
292 					return (EFAULT);
293 
294 				return (0);
295 			}
296 
297 			/*
298 			 * If this is a ring buffer that has wrapped, we want
299 			 * to copy the whole thing out.
300 			 */
301 			if (buf->dtb_flags & DTRACEBUF_WRAPPED) {
302 				dtrace_buffer_polish(buf);
303 				sz = buf->dtb_size;
304 			}
305 
306 			if (copyout(buf->dtb_tomax, desc.dtbd_data, sz) != 0) {
307 				mutex_exit(&dtrace_lock);
308 				return (EFAULT);
309 			}
310 
311 			desc.dtbd_size = sz;
312 			desc.dtbd_drops = buf->dtb_drops;
313 			desc.dtbd_errors = buf->dtb_errors;
314 			desc.dtbd_oldest = buf->dtb_xamot_offset;
315 			desc.dtbd_timestamp = dtrace_gethrtime();
316 
317 			mutex_exit(&dtrace_lock);
318 
319 			if (copyout(&desc, (void *) *pdesc, sizeof (desc)) != 0)
320 				return (EFAULT);
321 
322 			buf->dtb_flags |= DTRACEBUF_CONSUMED;
323 
324 			return (0);
325 		}
326 
327 		if (buf->dtb_tomax == NULL) {
328 			ASSERT(buf->dtb_xamot == NULL);
329 			mutex_exit(&dtrace_lock);
330 			return (ENOENT);
331 		}
332 
333 		cached = buf->dtb_tomax;
334 		ASSERT(!(buf->dtb_flags & DTRACEBUF_NOSWITCH));
335 
336 		dtrace_xcall(desc.dtbd_cpu,
337 		    (dtrace_xcall_t)dtrace_buffer_switch, buf);
338 
339 		state->dts_errors += buf->dtb_xamot_errors;
340 
341 		/*
342 		 * If the buffers did not actually switch, then the cross call
343 		 * did not take place -- presumably because the given CPU is
344 		 * not in the ready set.  If this is the case, we'll return
345 		 * ENOENT.
346 		 */
347 		if (buf->dtb_tomax == cached) {
348 			ASSERT(buf->dtb_xamot != cached);
349 			mutex_exit(&dtrace_lock);
350 			return (ENOENT);
351 		}
352 
353 		ASSERT(cached == buf->dtb_xamot);
354 
355 		DTRACE_IOCTL_PRINTF("%s(%d): copyout the buffer snapshot\n",__func__,__LINE__);
356 
357 		/*
358 		 * We have our snapshot; now copy it out.
359 		 */
360 		if (copyout(buf->dtb_xamot, desc.dtbd_data,
361 		    buf->dtb_xamot_offset) != 0) {
362 			mutex_exit(&dtrace_lock);
363 			return (EFAULT);
364 		}
365 
366 		desc.dtbd_size = buf->dtb_xamot_offset;
367 		desc.dtbd_drops = buf->dtb_xamot_drops;
368 		desc.dtbd_errors = buf->dtb_xamot_errors;
369 		desc.dtbd_oldest = 0;
370 		desc.dtbd_timestamp = buf->dtb_switched;
371 
372 		mutex_exit(&dtrace_lock);
373 
374 		DTRACE_IOCTL_PRINTF("%s(%d): copyout buffer desc: size %zd drops %lu errors %lu\n",__func__,__LINE__,(size_t) desc.dtbd_size,(u_long) desc.dtbd_drops,(u_long) desc.dtbd_errors);
375 
376 		/*
377 		 * Finally, copy out the buffer description.
378 		 */
379 		if (copyout(&desc, (void *) *pdesc, sizeof (desc)) != 0)
380 			return (EFAULT);
381 
382 		return (0);
383 	}
384 	case DTRACEIOC_CONF: {
385 		dtrace_conf_t conf;
386 
387 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_CONF\n",__func__,__LINE__);
388 
389 		bzero(&conf, sizeof (conf));
390 		conf.dtc_difversion = DIF_VERSION;
391 		conf.dtc_difintregs = DIF_DIR_NREGS;
392 		conf.dtc_diftupregs = DIF_DTR_NREGS;
393 		conf.dtc_ctfmodel = CTF_MODEL_NATIVE;
394 
395 		*((dtrace_conf_t *) addr) = conf;
396 
397 		return (0);
398 	}
399 	case DTRACEIOC_DOFGET: {
400 		dof_hdr_t **pdof = (dof_hdr_t **) addr;
401 		dof_hdr_t hdr, *dof = *pdof;
402 		int rval;
403 		uint64_t len;
404 
405 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_DOFGET\n",__func__,__LINE__);
406 
407 		if (copyin((void *)dof, &hdr, sizeof (hdr)) != 0)
408 			return (EFAULT);
409 
410 		mutex_enter(&dtrace_lock);
411 		dof = dtrace_dof_create(state);
412 		mutex_exit(&dtrace_lock);
413 
414 		len = MIN(hdr.dofh_loadsz, dof->dofh_loadsz);
415 		rval = copyout(dof, (void *) *pdof, len);
416 		dtrace_dof_destroy(dof);
417 
418 		return (rval == 0 ? 0 : EFAULT);
419 	}
420 	case DTRACEIOC_ENABLE: {
421 		dof_hdr_t *dof = NULL;
422 		dtrace_enabling_t *enab = NULL;
423 		dtrace_vstate_t *vstate;
424 		int err = 0;
425 		int rval;
426 		dtrace_enable_io_t *p = (dtrace_enable_io_t *) addr;
427 
428 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_ENABLE\n",__func__,__LINE__);
429 
430 		/*
431 		 * If a NULL argument has been passed, we take this as our
432 		 * cue to reevaluate our enablings.
433 		 */
434 		if (p->dof == NULL) {
435 			dtrace_enabling_matchall();
436 
437 			return (0);
438 		}
439 
440 		if ((dof = dtrace_dof_copyin((uintptr_t) p->dof, &rval)) == NULL)
441 			return (EINVAL);
442 
443 		mutex_enter(&cpu_lock);
444 		mutex_enter(&dtrace_lock);
445 		vstate = &state->dts_vstate;
446 
447 		if (state->dts_activity != DTRACE_ACTIVITY_INACTIVE) {
448 			mutex_exit(&dtrace_lock);
449 			mutex_exit(&cpu_lock);
450 			dtrace_dof_destroy(dof);
451 			return (EBUSY);
452 		}
453 
454 		if (dtrace_dof_slurp(dof, vstate, CRED(), &enab, 0, 0,
455 		    B_TRUE) != 0) {
456 			mutex_exit(&dtrace_lock);
457 			mutex_exit(&cpu_lock);
458 			dtrace_dof_destroy(dof);
459 			return (EINVAL);
460 		}
461 
462 		if ((rval = dtrace_dof_options(dof, state)) != 0) {
463 			dtrace_enabling_destroy(enab);
464 			mutex_exit(&dtrace_lock);
465 			mutex_exit(&cpu_lock);
466 			dtrace_dof_destroy(dof);
467 			return (rval);
468 		}
469 
470 		if ((err = dtrace_enabling_match(enab, &p->n_matched)) == 0) {
471 			err = dtrace_enabling_retain(enab);
472 		} else {
473 			dtrace_enabling_destroy(enab);
474 		}
475 
476 		mutex_exit(&cpu_lock);
477 		mutex_exit(&dtrace_lock);
478 		dtrace_dof_destroy(dof);
479 
480 		return (err);
481 	}
482 	case DTRACEIOC_EPROBE: {
483 		dtrace_eprobedesc_t **pepdesc = (dtrace_eprobedesc_t **) addr;
484 		dtrace_eprobedesc_t epdesc;
485 		dtrace_ecb_t *ecb;
486 		dtrace_action_t *act;
487 		void *buf;
488 		size_t size;
489 		uintptr_t dest;
490 		int nrecs;
491 
492 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_EPROBE\n",__func__,__LINE__);
493 
494 		if (copyin((void *)*pepdesc, &epdesc, sizeof (epdesc)) != 0)
495 			return (EFAULT);
496 
497 		mutex_enter(&dtrace_lock);
498 
499 		if ((ecb = dtrace_epid2ecb(state, epdesc.dtepd_epid)) == NULL) {
500 			mutex_exit(&dtrace_lock);
501 			return (EINVAL);
502 		}
503 
504 		if (ecb->dte_probe == NULL) {
505 			mutex_exit(&dtrace_lock);
506 			return (EINVAL);
507 		}
508 
509 		epdesc.dtepd_probeid = ecb->dte_probe->dtpr_id;
510 		epdesc.dtepd_uarg = ecb->dte_uarg;
511 		epdesc.dtepd_size = ecb->dte_size;
512 
513 		nrecs = epdesc.dtepd_nrecs;
514 		epdesc.dtepd_nrecs = 0;
515 		for (act = ecb->dte_action; act != NULL; act = act->dta_next) {
516 			if (DTRACEACT_ISAGG(act->dta_kind) || act->dta_intuple)
517 				continue;
518 
519 			epdesc.dtepd_nrecs++;
520 		}
521 
522 		/*
523 		 * Now that we have the size, we need to allocate a temporary
524 		 * buffer in which to store the complete description.  We need
525 		 * the temporary buffer to be able to drop dtrace_lock()
526 		 * across the copyout(), below.
527 		 */
528 		size = sizeof (dtrace_eprobedesc_t) +
529 		    (epdesc.dtepd_nrecs * sizeof (dtrace_recdesc_t));
530 
531 		buf = kmem_alloc(size, KM_SLEEP);
532 		dest = (uintptr_t)buf;
533 
534 		bcopy(&epdesc, (void *)dest, sizeof (epdesc));
535 		dest += offsetof(dtrace_eprobedesc_t, dtepd_rec[0]);
536 
537 		for (act = ecb->dte_action; act != NULL; act = act->dta_next) {
538 			if (DTRACEACT_ISAGG(act->dta_kind) || act->dta_intuple)
539 				continue;
540 
541 			if (nrecs-- == 0)
542 				break;
543 
544 			bcopy(&act->dta_rec, (void *)dest,
545 			    sizeof (dtrace_recdesc_t));
546 			dest += sizeof (dtrace_recdesc_t);
547 		}
548 
549 		mutex_exit(&dtrace_lock);
550 
551 		if (copyout(buf, (void *) *pepdesc, dest - (uintptr_t)buf) != 0) {
552 			kmem_free(buf, size);
553 			return (EFAULT);
554 		}
555 
556 		kmem_free(buf, size);
557 		return (0);
558 	}
559 	case DTRACEIOC_FORMAT: {
560 		dtrace_fmtdesc_t *fmt = (dtrace_fmtdesc_t *) addr;
561 		char *str;
562 		int len;
563 
564 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_FORMAT\n",__func__,__LINE__);
565 
566 		mutex_enter(&dtrace_lock);
567 
568 		if (fmt->dtfd_format == 0 ||
569 		    fmt->dtfd_format > state->dts_nformats) {
570 			mutex_exit(&dtrace_lock);
571 			return (EINVAL);
572 		}
573 
574 		/*
575 		 * Format strings are allocated contiguously and they are
576 		 * never freed; if a format index is less than the number
577 		 * of formats, we can assert that the format map is non-NULL
578 		 * and that the format for the specified index is non-NULL.
579 		 */
580 		ASSERT(state->dts_formats != NULL);
581 		str = state->dts_formats[fmt->dtfd_format - 1];
582 		ASSERT(str != NULL);
583 
584 		len = strlen(str) + 1;
585 
586 		if (len > fmt->dtfd_length) {
587 			fmt->dtfd_length = len;
588 		} else {
589 			if (copyout(str, fmt->dtfd_string, len) != 0) {
590 				mutex_exit(&dtrace_lock);
591 				return (EINVAL);
592 			}
593 		}
594 
595 		mutex_exit(&dtrace_lock);
596 		return (0);
597 	}
598 	case DTRACEIOC_GO: {
599 		int rval;
600 		processorid_t *cpuid = (processorid_t *) addr;
601 
602 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_GO\n",__func__,__LINE__);
603 
604 		rval = dtrace_state_go(state, cpuid);
605 
606 		return (rval);
607 	}
608 	case DTRACEIOC_PROBEARG: {
609 		dtrace_argdesc_t *desc = (dtrace_argdesc_t *) addr;
610 		dtrace_probe_t *probe;
611 		dtrace_provider_t *prov;
612 
613 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_PROBEARG\n",__func__,__LINE__);
614 
615 		if (desc->dtargd_id == DTRACE_IDNONE)
616 			return (EINVAL);
617 
618 		if (desc->dtargd_ndx == DTRACE_ARGNONE)
619 			return (EINVAL);
620 
621 		mutex_enter(&dtrace_provider_lock);
622 #ifdef illumos
623 		mutex_enter(&mod_lock);
624 #endif
625 		mutex_enter(&dtrace_lock);
626 
627 		if (desc->dtargd_id > dtrace_nprobes) {
628 			mutex_exit(&dtrace_lock);
629 #ifdef illumos
630 			mutex_exit(&mod_lock);
631 #endif
632 			mutex_exit(&dtrace_provider_lock);
633 			return (EINVAL);
634 		}
635 
636 		if ((probe = dtrace_probes[desc->dtargd_id - 1]) == NULL) {
637 			mutex_exit(&dtrace_lock);
638 #ifdef illumos
639 			mutex_exit(&mod_lock);
640 #endif
641 			mutex_exit(&dtrace_provider_lock);
642 			return (EINVAL);
643 		}
644 
645 		mutex_exit(&dtrace_lock);
646 
647 		prov = probe->dtpr_provider;
648 
649 		if (prov->dtpv_pops.dtps_getargdesc == NULL) {
650 			/*
651 			 * There isn't any typed information for this probe.
652 			 * Set the argument number to DTRACE_ARGNONE.
653 			 */
654 			desc->dtargd_ndx = DTRACE_ARGNONE;
655 		} else {
656 			desc->dtargd_native[0] = '\0';
657 			desc->dtargd_xlate[0] = '\0';
658 			desc->dtargd_mapping = desc->dtargd_ndx;
659 
660 			prov->dtpv_pops.dtps_getargdesc(prov->dtpv_arg,
661 			    probe->dtpr_id, probe->dtpr_arg, desc);
662 		}
663 
664 #ifdef illumos
665 		mutex_exit(&mod_lock);
666 #endif
667 		mutex_exit(&dtrace_provider_lock);
668 
669 		return (0);
670 	}
671 	case DTRACEIOC_PROBEMATCH:
672 	case DTRACEIOC_PROBES: {
673 		dtrace_probedesc_t *p_desc = (dtrace_probedesc_t *) addr;
674 		dtrace_probe_t *probe = NULL;
675 		dtrace_probekey_t pkey;
676 		dtrace_id_t i;
677 		int m = 0;
678 		uint32_t priv = 0;
679 		uid_t uid = 0;
680 		zoneid_t zoneid = 0;
681 
682 		DTRACE_IOCTL_PRINTF("%s(%d): %s\n",__func__,__LINE__,
683 		    cmd == DTRACEIOC_PROBEMATCH ?
684 		    "DTRACEIOC_PROBEMATCH":"DTRACEIOC_PROBES");
685 
686 		p_desc->dtpd_provider[DTRACE_PROVNAMELEN - 1] = '\0';
687 		p_desc->dtpd_mod[DTRACE_MODNAMELEN - 1] = '\0';
688 		p_desc->dtpd_func[DTRACE_FUNCNAMELEN - 1] = '\0';
689 		p_desc->dtpd_name[DTRACE_NAMELEN - 1] = '\0';
690 
691 		/*
692 		 * Before we attempt to match this probe, we want to give
693 		 * all providers the opportunity to provide it.
694 		 */
695 		if (p_desc->dtpd_id == DTRACE_IDNONE) {
696 			mutex_enter(&dtrace_provider_lock);
697 			dtrace_probe_provide(p_desc, NULL);
698 			mutex_exit(&dtrace_provider_lock);
699 			p_desc->dtpd_id++;
700 		}
701 
702 		if (cmd == DTRACEIOC_PROBEMATCH)  {
703 			dtrace_probekey(p_desc, &pkey);
704 			pkey.dtpk_id = DTRACE_IDNONE;
705 		}
706 
707 		dtrace_cred2priv(curlwp->l_cred, &priv, &uid, &zoneid);
708 
709 		mutex_enter(&dtrace_lock);
710 
711 		if (cmd == DTRACEIOC_PROBEMATCH) {
712 			for (i = p_desc->dtpd_id; i <= dtrace_nprobes; i++) {
713 				if ((probe = dtrace_probes[i - 1]) != NULL &&
714 				    (m = dtrace_match_probe(probe, &pkey,
715 				    priv, uid, zoneid)) != 0)
716 					break;
717 			}
718 
719 			if (m < 0) {
720 				mutex_exit(&dtrace_lock);
721 				return (EINVAL);
722 			}
723 
724 		} else {
725 			for (i = p_desc->dtpd_id; i <= dtrace_nprobes; i++) {
726 				if ((probe = dtrace_probes[i - 1]) != NULL &&
727 				    dtrace_match_priv(probe, priv, uid, zoneid))
728 					break;
729 			}
730 		}
731 
732 		if (probe == NULL) {
733 			mutex_exit(&dtrace_lock);
734 			return (ESRCH);
735 		}
736 
737 		dtrace_probe_description(probe, p_desc);
738 		mutex_exit(&dtrace_lock);
739 
740 		return (0);
741 	}
742 	case DTRACEIOC_PROVIDER: {
743 		dtrace_providerdesc_t *pvd = (dtrace_providerdesc_t *) addr;
744 		dtrace_provider_t *pvp;
745 
746 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_PROVIDER\n",__func__,__LINE__);
747 
748 		pvd->dtvd_name[DTRACE_PROVNAMELEN - 1] = '\0';
749 		error = 0;
750 again:
751 		mutex_enter(&dtrace_provider_lock);
752 
753 		for (pvp = dtrace_provider; pvp != NULL; pvp = pvp->dtpv_next) {
754 			if (strcmp(pvp->dtpv_name, pvd->dtvd_name) == 0)
755 				break;
756 		}
757 
758 		mutex_exit(&dtrace_provider_lock);
759 
760 		if (pvp == NULL && error == 0) {
761 			char name[NAME_MAX];
762 			const char *provider;
763 			if (strcmp(pvd->dtvd_name, "proc") == 0)
764 				provider = "sdt";
765 			else
766 				provider = pvd->dtvd_name;
767 
768 			if (snprintf(name, sizeof name, "dtrace_%s",
769 			    provider) < sizeof name) {
770 				error = module_autoload(name,
771 				    MODULE_CLASS_MISC);
772 				if (error == 0)
773 					goto again;
774 			}
775 		}
776 
777 		if (pvp == NULL)
778 			return (ESRCH);
779 
780 		bcopy(&pvp->dtpv_priv, &pvd->dtvd_priv, sizeof (dtrace_ppriv_t));
781 		bcopy(&pvp->dtpv_attr, &pvd->dtvd_attr, sizeof (dtrace_pattr_t));
782 
783 		return (0);
784 	}
785 	case DTRACEIOC_REPLICATE: {
786 		dtrace_repldesc_t *desc = (dtrace_repldesc_t *) addr;
787 		dtrace_probedesc_t *match = &desc->dtrpd_match;
788 		dtrace_probedesc_t *create = &desc->dtrpd_create;
789 		int err;
790 
791 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_REPLICATE\n",__func__,__LINE__);
792 
793 		match->dtpd_provider[DTRACE_PROVNAMELEN - 1] = '\0';
794 		match->dtpd_mod[DTRACE_MODNAMELEN - 1] = '\0';
795 		match->dtpd_func[DTRACE_FUNCNAMELEN - 1] = '\0';
796 		match->dtpd_name[DTRACE_NAMELEN - 1] = '\0';
797 
798 		create->dtpd_provider[DTRACE_PROVNAMELEN - 1] = '\0';
799 		create->dtpd_mod[DTRACE_MODNAMELEN - 1] = '\0';
800 		create->dtpd_func[DTRACE_FUNCNAMELEN - 1] = '\0';
801 		create->dtpd_name[DTRACE_NAMELEN - 1] = '\0';
802 
803 		mutex_enter(&dtrace_lock);
804 		err = dtrace_enabling_replicate(state, match, create);
805 		mutex_exit(&dtrace_lock);
806 
807 		return (err);
808 	}
809 	case DTRACEIOC_STATUS: {
810 		dtrace_status_t *stat = (dtrace_status_t *) addr;
811 		dtrace_dstate_t *dstate;
812 		int i, j;
813 		uint64_t nerrs;
814 		CPU_INFO_ITERATOR cpuind;
815 		struct cpu_info *cinfo;
816 
817 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_STATUS\n",__func__,__LINE__);
818 
819 		/*
820 		 * See the comment in dtrace_state_deadman() for the reason
821 		 * for setting dts_laststatus to INT64_MAX before setting
822 		 * it to the correct value.
823 		 */
824 		state->dts_laststatus = INT64_MAX;
825 		dtrace_membar_producer();
826 		state->dts_laststatus = dtrace_gethrtime();
827 
828 		bzero(stat, sizeof (*stat));
829 
830 		mutex_enter(&dtrace_lock);
831 
832 		if (state->dts_activity == DTRACE_ACTIVITY_INACTIVE) {
833 			mutex_exit(&dtrace_lock);
834 			return (ENOENT);
835 		}
836 
837 		if (state->dts_activity == DTRACE_ACTIVITY_DRAINING)
838 			stat->dtst_exiting = 1;
839 
840 		nerrs = state->dts_errors;
841 		dstate = &state->dts_vstate.dtvs_dynvars;
842 
843 		for (CPU_INFO_FOREACH(cpuind, cinfo)) {
844 		    	i = cpu_index(cinfo);
845 
846 			dtrace_dstate_percpu_t *dcpu = &dstate->dtds_percpu[i];
847 
848 			stat->dtst_dyndrops += dcpu->dtdsc_drops;
849 			stat->dtst_dyndrops_dirty += dcpu->dtdsc_dirty_drops;
850 			stat->dtst_dyndrops_rinsing += dcpu->dtdsc_rinsing_drops;
851 
852 			if (state->dts_buffer[i].dtb_flags & DTRACEBUF_FULL)
853 				stat->dtst_filled++;
854 
855 			nerrs += state->dts_buffer[i].dtb_errors;
856 
857 			for (j = 0; j < state->dts_nspeculations; j++) {
858 				dtrace_speculation_t *spec;
859 				dtrace_buffer_t *buf;
860 
861 				spec = &state->dts_speculations[j];
862 				buf = &spec->dtsp_buffer[i];
863 				stat->dtst_specdrops += buf->dtb_xamot_drops;
864 			}
865 		}
866 
867 		stat->dtst_specdrops_busy = state->dts_speculations_busy;
868 		stat->dtst_specdrops_unavail = state->dts_speculations_unavail;
869 		stat->dtst_stkstroverflows = state->dts_stkstroverflows;
870 		stat->dtst_dblerrors = state->dts_dblerrors;
871 		stat->dtst_killed =
872 		    (state->dts_activity == DTRACE_ACTIVITY_KILLED);
873 		stat->dtst_errors = nerrs;
874 
875 		mutex_exit(&dtrace_lock);
876 
877 		return (0);
878 	}
879 	case DTRACEIOC_STOP: {
880 		int rval;
881 		processorid_t *cpuid = (processorid_t *) addr;
882 
883 		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_STOP\n",__func__,__LINE__);
884 
885 		mutex_enter(&dtrace_lock);
886 		rval = dtrace_state_stop(state, cpuid);
887 		mutex_exit(&dtrace_lock);
888 
889 		return (rval);
890 	}
891 	default:
892 		error = ENOTTY;
893 	}
894 	return (error);
895 }
896