1179237Sjb/*
2179237Sjb * CDDL HEADER START
3179237Sjb *
4179237Sjb * The contents of this file are subject to the terms of the
5179237Sjb * Common Development and Distribution License (the "License").
6179237Sjb * You may not use this file except in compliance with the License.
7179237Sjb *
8179237Sjb * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9179237Sjb * or http://www.opensolaris.org/os/licensing.
10179237Sjb * See the License for the specific language governing permissions
11179237Sjb * and limitations under the License.
12179237Sjb *
13179237Sjb * When distributing Covered Code, include this CDDL HEADER in each
14179237Sjb * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15179237Sjb * If applicable, add the following below this CDDL HEADER, with the
16179237Sjb * fields enclosed by brackets "[]" replaced with your own identifying
17179237Sjb * information: Portions Copyright [yyyy] [name of copyright owner]
18179237Sjb *
19179237Sjb * CDDL HEADER END
20179237Sjb *
21179237Sjb * $FreeBSD$
22179237Sjb *
23179237Sjb */
24179237Sjb
25179237Sjbstatic int dtrace_verbose_ioctl;
26266101SmarkjSYSCTL_INT(_debug_dtrace, OID_AUTO, verbose_ioctl, CTLFLAG_RW,
27266101Smarkj    &dtrace_verbose_ioctl, 0, "log DTrace ioctls");
28179237Sjb
29179237Sjb#define DTRACE_IOCTL_PRINTF(fmt, ...)	if (dtrace_verbose_ioctl) printf(fmt, ## __VA_ARGS__ )
30179237Sjb
31211608Srpaulostatic int
32211608Srpaulodtrace_ioctl_helper(struct cdev *dev, u_long cmd, caddr_t addr, int flags,
33211608Srpaulo    struct thread *td)
34211608Srpaulo{
35211608Srpaulo	int rval;
36211608Srpaulo	dof_helper_t *dhp = NULL;
37211608Srpaulo	dof_hdr_t *dof = NULL;
38211608Srpaulo
39211608Srpaulo	switch (cmd) {
40211608Srpaulo	case DTRACEHIOC_ADDDOF:
41211608Srpaulo		dhp = (dof_helper_t *)addr;
42211608Srpaulo		/* XXX all because dofhp_dof is 64 bit */
43211608Srpaulo#ifdef __i386
44211608Srpaulo		addr = (caddr_t)(uint32_t)dhp->dofhp_dof;
45211608Srpaulo#else
46211608Srpaulo		addr = (caddr_t)dhp->dofhp_dof;
47211608Srpaulo#endif
48211608Srpaulo		/* FALLTHROUGH */
49211608Srpaulo	case DTRACEHIOC_ADD:
50211608Srpaulo		dof = dtrace_dof_copyin((intptr_t)addr, &rval);
51211608Srpaulo
52211608Srpaulo		if (dof == NULL)
53211608Srpaulo			return (rval);
54211608Srpaulo
55211608Srpaulo		mutex_enter(&dtrace_lock);
56211608Srpaulo		if ((rval = dtrace_helper_slurp((dof_hdr_t *)dof, dhp)) != -1) {
57211608Srpaulo			if (dhp) {
58211608Srpaulo				dhp->gen = rval;
59211608Srpaulo				copyout(dhp, addr, sizeof(*dhp));
60211608Srpaulo			}
61211608Srpaulo			rval = 0;
62211608Srpaulo		} else {
63211608Srpaulo			rval = EINVAL;
64211608Srpaulo		}
65211608Srpaulo		mutex_exit(&dtrace_lock);
66211608Srpaulo		return (rval);
67211608Srpaulo	case DTRACEHIOC_REMOVE:
68211608Srpaulo		mutex_enter(&dtrace_lock);
69211608Srpaulo		rval = dtrace_helper_destroygen((int)*addr);
70211608Srpaulo		mutex_exit(&dtrace_lock);
71211608Srpaulo
72211608Srpaulo		return (rval);
73211608Srpaulo	default:
74211608Srpaulo		break;
75211608Srpaulo	}
76211608Srpaulo
77211608Srpaulo	return (ENOTTY);
78211608Srpaulo}
79211608Srpaulo
80179237Sjb/* ARGSUSED */
81179237Sjbstatic int
82179237Sjbdtrace_ioctl(struct cdev *dev, u_long cmd, caddr_t addr,
83179237Sjb    int flags __unused, struct thread *td)
84179237Sjb{
85184698Srodrigc#if __FreeBSD_version < 800039
86179237Sjb	dtrace_state_t *state = dev->si_drv1;
87184698Srodrigc#else
88184698Srodrigc	dtrace_state_t *state;
89184698Srodrigc	devfs_get_cdevpriv((void **) &state);
90184698Srodrigc#endif
91179237Sjb	int error = 0;
92179237Sjb	if (state == NULL)
93179237Sjb		return (EINVAL);
94179237Sjb
95179237Sjb	if (state->dts_anon) {
96179237Sjb		ASSERT(dtrace_anon.dta_state == NULL);
97179237Sjb		state = state->dts_anon;
98179237Sjb	}
99179237Sjb
100179237Sjb	switch (cmd) {
101179237Sjb	case DTRACEIOC_AGGDESC: {
102179237Sjb		dtrace_aggdesc_t **paggdesc = (dtrace_aggdesc_t **) addr;
103179237Sjb		dtrace_aggdesc_t aggdesc;
104179237Sjb		dtrace_action_t *act;
105179237Sjb		dtrace_aggregation_t *agg;
106179237Sjb		int nrecs;
107179237Sjb		uint32_t offs;
108179237Sjb		dtrace_recdesc_t *lrec;
109179237Sjb		void *buf;
110179237Sjb		size_t size;
111179237Sjb		uintptr_t dest;
112179237Sjb
113179237Sjb		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_AGGDESC\n",__func__,__LINE__);
114179237Sjb
115179237Sjb		if (copyin((void *) *paggdesc, &aggdesc, sizeof (aggdesc)) != 0)
116179237Sjb			return (EFAULT);
117179237Sjb
118179237Sjb		mutex_enter(&dtrace_lock);
119179237Sjb
120179237Sjb		if ((agg = dtrace_aggid2agg(state, aggdesc.dtagd_id)) == NULL) {
121179237Sjb			mutex_exit(&dtrace_lock);
122179237Sjb			return (EINVAL);
123179237Sjb		}
124179237Sjb
125179237Sjb		aggdesc.dtagd_epid = agg->dtag_ecb->dte_epid;
126179237Sjb
127179237Sjb		nrecs = aggdesc.dtagd_nrecs;
128179237Sjb		aggdesc.dtagd_nrecs = 0;
129179237Sjb
130179237Sjb		offs = agg->dtag_base;
131179237Sjb		lrec = &agg->dtag_action.dta_rec;
132179237Sjb		aggdesc.dtagd_size = lrec->dtrd_offset + lrec->dtrd_size - offs;
133179237Sjb
134179237Sjb		for (act = agg->dtag_first; ; act = act->dta_next) {
135179237Sjb			ASSERT(act->dta_intuple ||
136179237Sjb			    DTRACEACT_ISAGG(act->dta_kind));
137179237Sjb
138179237Sjb			/*
139179237Sjb			 * If this action has a record size of zero, it
140179237Sjb			 * denotes an argument to the aggregating action.
141179237Sjb			 * Because the presence of this record doesn't (or
142179237Sjb			 * shouldn't) affect the way the data is interpreted,
143179237Sjb			 * we don't copy it out to save user-level the
144179237Sjb			 * confusion of dealing with a zero-length record.
145179237Sjb			 */
146179237Sjb			if (act->dta_rec.dtrd_size == 0) {
147179237Sjb				ASSERT(agg->dtag_hasarg);
148179237Sjb				continue;
149179237Sjb			}
150179237Sjb
151179237Sjb			aggdesc.dtagd_nrecs++;
152179237Sjb
153179237Sjb			if (act == &agg->dtag_action)
154179237Sjb				break;
155179237Sjb		}
156179237Sjb
157179237Sjb		/*
158179237Sjb		 * Now that we have the size, we need to allocate a temporary
159179237Sjb		 * buffer in which to store the complete description.  We need
160179237Sjb		 * the temporary buffer to be able to drop dtrace_lock()
161179237Sjb		 * across the copyout(), below.
162179237Sjb		 */
163179237Sjb		size = sizeof (dtrace_aggdesc_t) +
164179237Sjb		    (aggdesc.dtagd_nrecs * sizeof (dtrace_recdesc_t));
165179237Sjb
166179237Sjb		buf = kmem_alloc(size, KM_SLEEP);
167179237Sjb		dest = (uintptr_t)buf;
168179237Sjb
169179237Sjb		bcopy(&aggdesc, (void *)dest, sizeof (aggdesc));
170179237Sjb		dest += offsetof(dtrace_aggdesc_t, dtagd_rec[0]);
171179237Sjb
172179237Sjb		for (act = agg->dtag_first; ; act = act->dta_next) {
173179237Sjb			dtrace_recdesc_t rec = act->dta_rec;
174179237Sjb
175179237Sjb			/*
176179237Sjb			 * See the comment in the above loop for why we pass
177179237Sjb			 * over zero-length records.
178179237Sjb			 */
179179237Sjb			if (rec.dtrd_size == 0) {
180179237Sjb				ASSERT(agg->dtag_hasarg);
181179237Sjb				continue;
182179237Sjb			}
183179237Sjb
184179237Sjb			if (nrecs-- == 0)
185179237Sjb				break;
186179237Sjb
187179237Sjb			rec.dtrd_offset -= offs;
188179237Sjb			bcopy(&rec, (void *)dest, sizeof (rec));
189179237Sjb			dest += sizeof (dtrace_recdesc_t);
190179237Sjb
191179237Sjb			if (act == &agg->dtag_action)
192179237Sjb				break;
193179237Sjb		}
194179237Sjb
195179237Sjb		mutex_exit(&dtrace_lock);
196179237Sjb
197179237Sjb		if (copyout(buf, (void *) *paggdesc, dest - (uintptr_t)buf) != 0) {
198179237Sjb			kmem_free(buf, size);
199179237Sjb			return (EFAULT);
200179237Sjb		}
201179237Sjb
202179237Sjb		kmem_free(buf, size);
203179237Sjb		return (0);
204179237Sjb	}
205179237Sjb	case DTRACEIOC_AGGSNAP:
206179237Sjb	case DTRACEIOC_BUFSNAP: {
207179237Sjb		dtrace_bufdesc_t **pdesc = (dtrace_bufdesc_t **) addr;
208179237Sjb		dtrace_bufdesc_t desc;
209179237Sjb		caddr_t cached;
210179237Sjb		dtrace_buffer_t *buf;
211179237Sjb
212179237Sjb		dtrace_debug_output();
213179237Sjb
214179237Sjb		if (copyin((void *) *pdesc, &desc, sizeof (desc)) != 0)
215179237Sjb			return (EFAULT);
216179237Sjb
217179237Sjb		DTRACE_IOCTL_PRINTF("%s(%d): %s curcpu %d cpu %d\n",
218179237Sjb		    __func__,__LINE__,
219179237Sjb		    cmd == DTRACEIOC_AGGSNAP ?
220179237Sjb		    "DTRACEIOC_AGGSNAP":"DTRACEIOC_BUFSNAP",
221179237Sjb		    curcpu, desc.dtbd_cpu);
222179237Sjb
223179237Sjb		if (desc.dtbd_cpu < 0 || desc.dtbd_cpu >= NCPU)
224179237Sjb			return (ENOENT);
225179237Sjb		if (pcpu_find(desc.dtbd_cpu) == NULL)
226179237Sjb			return (ENOENT);
227179237Sjb
228179237Sjb		mutex_enter(&dtrace_lock);
229179237Sjb
230179237Sjb		if (cmd == DTRACEIOC_BUFSNAP) {
231179237Sjb			buf = &state->dts_buffer[desc.dtbd_cpu];
232179237Sjb		} else {
233179237Sjb			buf = &state->dts_aggbuffer[desc.dtbd_cpu];
234179237Sjb		}
235179237Sjb
236179237Sjb		if (buf->dtb_flags & (DTRACEBUF_RING | DTRACEBUF_FILL)) {
237179237Sjb			size_t sz = buf->dtb_offset;
238179237Sjb
239179237Sjb			if (state->dts_activity != DTRACE_ACTIVITY_STOPPED) {
240179237Sjb				mutex_exit(&dtrace_lock);
241179237Sjb				return (EBUSY);
242179237Sjb			}
243179237Sjb
244179237Sjb			/*
245179237Sjb			 * If this buffer has already been consumed, we're
246179237Sjb			 * going to indicate that there's nothing left here
247179237Sjb			 * to consume.
248179237Sjb			 */
249179237Sjb			if (buf->dtb_flags & DTRACEBUF_CONSUMED) {
250179237Sjb				mutex_exit(&dtrace_lock);
251179237Sjb
252179237Sjb				desc.dtbd_size = 0;
253179237Sjb				desc.dtbd_drops = 0;
254179237Sjb				desc.dtbd_errors = 0;
255179237Sjb				desc.dtbd_oldest = 0;
256179237Sjb				sz = sizeof (desc);
257179237Sjb
258179237Sjb				if (copyout(&desc, (void *) *pdesc, sz) != 0)
259179237Sjb					return (EFAULT);
260179237Sjb
261179237Sjb				return (0);
262179237Sjb			}
263179237Sjb
264179237Sjb			/*
265179237Sjb			 * If this is a ring buffer that has wrapped, we want
266179237Sjb			 * to copy the whole thing out.
267179237Sjb			 */
268179237Sjb			if (buf->dtb_flags & DTRACEBUF_WRAPPED) {
269179237Sjb				dtrace_buffer_polish(buf);
270179237Sjb				sz = buf->dtb_size;
271179237Sjb			}
272179237Sjb
273179237Sjb			if (copyout(buf->dtb_tomax, desc.dtbd_data, sz) != 0) {
274179237Sjb				mutex_exit(&dtrace_lock);
275179237Sjb				return (EFAULT);
276179237Sjb			}
277179237Sjb
278179237Sjb			desc.dtbd_size = sz;
279179237Sjb			desc.dtbd_drops = buf->dtb_drops;
280179237Sjb			desc.dtbd_errors = buf->dtb_errors;
281179237Sjb			desc.dtbd_oldest = buf->dtb_xamot_offset;
282256002Spfg			desc.dtbd_timestamp = dtrace_gethrtime();
283179237Sjb
284179237Sjb			mutex_exit(&dtrace_lock);
285179237Sjb
286179237Sjb			if (copyout(&desc, (void *) *pdesc, sizeof (desc)) != 0)
287179237Sjb				return (EFAULT);
288179237Sjb
289179237Sjb			buf->dtb_flags |= DTRACEBUF_CONSUMED;
290179237Sjb
291179237Sjb			return (0);
292179237Sjb		}
293179237Sjb
294179237Sjb		if (buf->dtb_tomax == NULL) {
295179237Sjb			ASSERT(buf->dtb_xamot == NULL);
296179237Sjb			mutex_exit(&dtrace_lock);
297179237Sjb			return (ENOENT);
298179237Sjb		}
299179237Sjb
300179237Sjb		cached = buf->dtb_tomax;
301179237Sjb		ASSERT(!(buf->dtb_flags & DTRACEBUF_NOSWITCH));
302179237Sjb
303179237Sjb		dtrace_xcall(desc.dtbd_cpu,
304179237Sjb		    (dtrace_xcall_t)dtrace_buffer_switch, buf);
305179237Sjb
306179237Sjb		state->dts_errors += buf->dtb_xamot_errors;
307179237Sjb
308179237Sjb		/*
309179237Sjb		 * If the buffers did not actually switch, then the cross call
310179237Sjb		 * did not take place -- presumably because the given CPU is
311179237Sjb		 * not in the ready set.  If this is the case, we'll return
312179237Sjb		 * ENOENT.
313179237Sjb		 */
314179237Sjb		if (buf->dtb_tomax == cached) {
315179237Sjb			ASSERT(buf->dtb_xamot != cached);
316179237Sjb			mutex_exit(&dtrace_lock);
317179237Sjb			return (ENOENT);
318179237Sjb		}
319179237Sjb
320179237Sjb		ASSERT(cached == buf->dtb_xamot);
321179237Sjb
322179237Sjb		DTRACE_IOCTL_PRINTF("%s(%d): copyout the buffer snapshot\n",__func__,__LINE__);
323179237Sjb
324179237Sjb		/*
325179237Sjb		 * We have our snapshot; now copy it out.
326179237Sjb		 */
327179237Sjb		if (copyout(buf->dtb_xamot, desc.dtbd_data,
328179237Sjb		    buf->dtb_xamot_offset) != 0) {
329179237Sjb			mutex_exit(&dtrace_lock);
330179237Sjb			return (EFAULT);
331179237Sjb		}
332179237Sjb
333179237Sjb		desc.dtbd_size = buf->dtb_xamot_offset;
334179237Sjb		desc.dtbd_drops = buf->dtb_xamot_drops;
335179237Sjb		desc.dtbd_errors = buf->dtb_xamot_errors;
336179237Sjb		desc.dtbd_oldest = 0;
337256002Spfg		desc.dtbd_timestamp = buf->dtb_switched;
338179237Sjb
339179237Sjb		mutex_exit(&dtrace_lock);
340179237Sjb
341179237Sjb		DTRACE_IOCTL_PRINTF("%s(%d): copyout buffer desc: size %zd drops %lu errors %lu\n",__func__,__LINE__,(size_t) desc.dtbd_size,(u_long) desc.dtbd_drops,(u_long) desc.dtbd_errors);
342179237Sjb
343179237Sjb		/*
344179237Sjb		 * Finally, copy out the buffer description.
345179237Sjb		 */
346179237Sjb		if (copyout(&desc, (void *) *pdesc, sizeof (desc)) != 0)
347179237Sjb			return (EFAULT);
348179237Sjb
349179237Sjb		return (0);
350179237Sjb	}
351179237Sjb	case DTRACEIOC_CONF: {
352179237Sjb		dtrace_conf_t conf;
353179237Sjb
354179237Sjb		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_CONF\n",__func__,__LINE__);
355179237Sjb
356179237Sjb		bzero(&conf, sizeof (conf));
357179237Sjb		conf.dtc_difversion = DIF_VERSION;
358179237Sjb		conf.dtc_difintregs = DIF_DIR_NREGS;
359179237Sjb		conf.dtc_diftupregs = DIF_DTR_NREGS;
360179237Sjb		conf.dtc_ctfmodel = CTF_MODEL_NATIVE;
361179237Sjb
362179237Sjb		*((dtrace_conf_t *) addr) = conf;
363179237Sjb
364179237Sjb		return (0);
365179237Sjb	}
366179237Sjb	case DTRACEIOC_DOFGET: {
367179237Sjb		dof_hdr_t **pdof = (dof_hdr_t **) addr;
368179237Sjb		dof_hdr_t hdr, *dof = *pdof;
369179237Sjb		int rval;
370179237Sjb		uint64_t len;
371179237Sjb
372179237Sjb		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_DOFGET\n",__func__,__LINE__);
373179237Sjb
374179237Sjb		if (copyin((void *)dof, &hdr, sizeof (hdr)) != 0)
375179237Sjb			return (EFAULT);
376179237Sjb
377179237Sjb		mutex_enter(&dtrace_lock);
378179237Sjb		dof = dtrace_dof_create(state);
379179237Sjb		mutex_exit(&dtrace_lock);
380179237Sjb
381179237Sjb		len = MIN(hdr.dofh_loadsz, dof->dofh_loadsz);
382179237Sjb		rval = copyout(dof, (void *) *pdof, len);
383179237Sjb		dtrace_dof_destroy(dof);
384179237Sjb
385179237Sjb		return (rval == 0 ? 0 : EFAULT);
386179237Sjb	}
387179237Sjb	case DTRACEIOC_ENABLE: {
388179237Sjb		dof_hdr_t *dof = NULL;
389179237Sjb		dtrace_enabling_t *enab = NULL;
390179237Sjb		dtrace_vstate_t *vstate;
391179237Sjb		int err = 0;
392179237Sjb		int rval;
393179237Sjb		dtrace_enable_io_t *p = (dtrace_enable_io_t *) addr;
394179237Sjb
395179237Sjb		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_ENABLE\n",__func__,__LINE__);
396179237Sjb
397179237Sjb		/*
398179237Sjb		 * If a NULL argument has been passed, we take this as our
399179237Sjb		 * cue to reevaluate our enablings.
400179237Sjb		 */
401179237Sjb		if (p->dof == NULL) {
402179237Sjb			dtrace_enabling_matchall();
403179237Sjb
404179237Sjb			return (0);
405179237Sjb		}
406179237Sjb
407179237Sjb		if ((dof = dtrace_dof_copyin((uintptr_t) p->dof, &rval)) == NULL)
408179237Sjb			return (EINVAL);
409179237Sjb
410179237Sjb		mutex_enter(&cpu_lock);
411179237Sjb		mutex_enter(&dtrace_lock);
412179237Sjb		vstate = &state->dts_vstate;
413179237Sjb
414179237Sjb		if (state->dts_activity != DTRACE_ACTIVITY_INACTIVE) {
415179237Sjb			mutex_exit(&dtrace_lock);
416179237Sjb			mutex_exit(&cpu_lock);
417179237Sjb			dtrace_dof_destroy(dof);
418179237Sjb			return (EBUSY);
419179237Sjb		}
420179237Sjb
421179237Sjb		if (dtrace_dof_slurp(dof, vstate, td->td_ucred, &enab, 0, B_TRUE) != 0) {
422179237Sjb			mutex_exit(&dtrace_lock);
423179237Sjb			mutex_exit(&cpu_lock);
424179237Sjb			dtrace_dof_destroy(dof);
425179237Sjb			return (EINVAL);
426179237Sjb		}
427179237Sjb
428179237Sjb		if ((rval = dtrace_dof_options(dof, state)) != 0) {
429179237Sjb			dtrace_enabling_destroy(enab);
430179237Sjb			mutex_exit(&dtrace_lock);
431179237Sjb			mutex_exit(&cpu_lock);
432179237Sjb			dtrace_dof_destroy(dof);
433179237Sjb			return (rval);
434179237Sjb		}
435179237Sjb
436179237Sjb		if ((err = dtrace_enabling_match(enab, &p->n_matched)) == 0) {
437179237Sjb			err = dtrace_enabling_retain(enab);
438179237Sjb		} else {
439179237Sjb			dtrace_enabling_destroy(enab);
440179237Sjb		}
441179237Sjb
442179237Sjb		mutex_exit(&cpu_lock);
443179237Sjb		mutex_exit(&dtrace_lock);
444179237Sjb		dtrace_dof_destroy(dof);
445179237Sjb
446179237Sjb		return (err);
447179237Sjb	}
448179237Sjb	case DTRACEIOC_EPROBE: {
449179237Sjb		dtrace_eprobedesc_t **pepdesc = (dtrace_eprobedesc_t **) addr;
450179237Sjb		dtrace_eprobedesc_t epdesc;
451179237Sjb		dtrace_ecb_t *ecb;
452179237Sjb		dtrace_action_t *act;
453179237Sjb		void *buf;
454179237Sjb		size_t size;
455179237Sjb		uintptr_t dest;
456179237Sjb		int nrecs;
457179237Sjb
458179237Sjb		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_EPROBE\n",__func__,__LINE__);
459179237Sjb
460179237Sjb		if (copyin((void *)*pepdesc, &epdesc, sizeof (epdesc)) != 0)
461179237Sjb			return (EFAULT);
462179237Sjb
463179237Sjb		mutex_enter(&dtrace_lock);
464179237Sjb
465179237Sjb		if ((ecb = dtrace_epid2ecb(state, epdesc.dtepd_epid)) == NULL) {
466179237Sjb			mutex_exit(&dtrace_lock);
467179237Sjb			return (EINVAL);
468179237Sjb		}
469179237Sjb
470179237Sjb		if (ecb->dte_probe == NULL) {
471179237Sjb			mutex_exit(&dtrace_lock);
472179237Sjb			return (EINVAL);
473179237Sjb		}
474179237Sjb
475179237Sjb		epdesc.dtepd_probeid = ecb->dte_probe->dtpr_id;
476179237Sjb		epdesc.dtepd_uarg = ecb->dte_uarg;
477179237Sjb		epdesc.dtepd_size = ecb->dte_size;
478179237Sjb
479179237Sjb		nrecs = epdesc.dtepd_nrecs;
480179237Sjb		epdesc.dtepd_nrecs = 0;
481179237Sjb		for (act = ecb->dte_action; act != NULL; act = act->dta_next) {
482179237Sjb			if (DTRACEACT_ISAGG(act->dta_kind) || act->dta_intuple)
483179237Sjb				continue;
484179237Sjb
485179237Sjb			epdesc.dtepd_nrecs++;
486179237Sjb		}
487179237Sjb
488179237Sjb		/*
489179237Sjb		 * Now that we have the size, we need to allocate a temporary
490179237Sjb		 * buffer in which to store the complete description.  We need
491179237Sjb		 * the temporary buffer to be able to drop dtrace_lock()
492179237Sjb		 * across the copyout(), below.
493179237Sjb		 */
494179237Sjb		size = sizeof (dtrace_eprobedesc_t) +
495179237Sjb		    (epdesc.dtepd_nrecs * sizeof (dtrace_recdesc_t));
496179237Sjb
497179237Sjb		buf = kmem_alloc(size, KM_SLEEP);
498179237Sjb		dest = (uintptr_t)buf;
499179237Sjb
500179237Sjb		bcopy(&epdesc, (void *)dest, sizeof (epdesc));
501179237Sjb		dest += offsetof(dtrace_eprobedesc_t, dtepd_rec[0]);
502179237Sjb
503179237Sjb		for (act = ecb->dte_action; act != NULL; act = act->dta_next) {
504179237Sjb			if (DTRACEACT_ISAGG(act->dta_kind) || act->dta_intuple)
505179237Sjb				continue;
506179237Sjb
507179237Sjb			if (nrecs-- == 0)
508179237Sjb				break;
509179237Sjb
510179237Sjb			bcopy(&act->dta_rec, (void *)dest,
511179237Sjb			    sizeof (dtrace_recdesc_t));
512179237Sjb			dest += sizeof (dtrace_recdesc_t);
513179237Sjb		}
514179237Sjb
515179237Sjb		mutex_exit(&dtrace_lock);
516179237Sjb
517179237Sjb		if (copyout(buf, (void *) *pepdesc, dest - (uintptr_t)buf) != 0) {
518179237Sjb			kmem_free(buf, size);
519179237Sjb			return (EFAULT);
520179237Sjb		}
521179237Sjb
522179237Sjb		kmem_free(buf, size);
523179237Sjb		return (0);
524179237Sjb	}
525179237Sjb	case DTRACEIOC_FORMAT: {
526179237Sjb		dtrace_fmtdesc_t *fmt = (dtrace_fmtdesc_t *) addr;
527179237Sjb		char *str;
528179237Sjb		int len;
529179237Sjb
530179237Sjb		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_FORMAT\n",__func__,__LINE__);
531179237Sjb
532179237Sjb		mutex_enter(&dtrace_lock);
533179237Sjb
534179237Sjb		if (fmt->dtfd_format == 0 ||
535179237Sjb		    fmt->dtfd_format > state->dts_nformats) {
536179237Sjb			mutex_exit(&dtrace_lock);
537179237Sjb			return (EINVAL);
538179237Sjb		}
539179237Sjb
540179237Sjb		/*
541179237Sjb		 * Format strings are allocated contiguously and they are
542179237Sjb		 * never freed; if a format index is less than the number
543179237Sjb		 * of formats, we can assert that the format map is non-NULL
544179237Sjb		 * and that the format for the specified index is non-NULL.
545179237Sjb		 */
546179237Sjb		ASSERT(state->dts_formats != NULL);
547179237Sjb		str = state->dts_formats[fmt->dtfd_format - 1];
548179237Sjb		ASSERT(str != NULL);
549179237Sjb
550179237Sjb		len = strlen(str) + 1;
551179237Sjb
552179237Sjb		if (len > fmt->dtfd_length) {
553179237Sjb			fmt->dtfd_length = len;
554179237Sjb		} else {
555179237Sjb			if (copyout(str, fmt->dtfd_string, len) != 0) {
556179237Sjb				mutex_exit(&dtrace_lock);
557179237Sjb				return (EINVAL);
558179237Sjb			}
559179237Sjb		}
560179237Sjb
561179237Sjb		mutex_exit(&dtrace_lock);
562179237Sjb		return (0);
563179237Sjb	}
564179237Sjb	case DTRACEIOC_GO: {
565179237Sjb		int rval;
566179237Sjb		processorid_t *cpuid = (processorid_t *) addr;
567179237Sjb
568179237Sjb		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_GO\n",__func__,__LINE__);
569179237Sjb
570179237Sjb		rval = dtrace_state_go(state, cpuid);
571179237Sjb
572179237Sjb		return (rval);
573179237Sjb	}
574179237Sjb	case DTRACEIOC_PROBEARG: {
575179237Sjb		dtrace_argdesc_t *desc = (dtrace_argdesc_t *) addr;
576179237Sjb		dtrace_probe_t *probe;
577179237Sjb		dtrace_provider_t *prov;
578179237Sjb
579179237Sjb		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_PROBEARG\n",__func__,__LINE__);
580179237Sjb
581179237Sjb		if (desc->dtargd_id == DTRACE_IDNONE)
582179237Sjb			return (EINVAL);
583179237Sjb
584179237Sjb		if (desc->dtargd_ndx == DTRACE_ARGNONE)
585179237Sjb			return (EINVAL);
586179237Sjb
587179237Sjb		mutex_enter(&dtrace_provider_lock);
588262052Savg#if defined(sun)
589179237Sjb		mutex_enter(&mod_lock);
590262052Savg#endif
591179237Sjb		mutex_enter(&dtrace_lock);
592179237Sjb
593179237Sjb		if (desc->dtargd_id > dtrace_nprobes) {
594179237Sjb			mutex_exit(&dtrace_lock);
595262052Savg#if defined(sun)
596179237Sjb			mutex_exit(&mod_lock);
597262052Savg#endif
598179237Sjb			mutex_exit(&dtrace_provider_lock);
599179237Sjb			return (EINVAL);
600179237Sjb		}
601179237Sjb
602179237Sjb		if ((probe = dtrace_probes[desc->dtargd_id - 1]) == NULL) {
603179237Sjb			mutex_exit(&dtrace_lock);
604262052Savg#if defined(sun)
605179237Sjb			mutex_exit(&mod_lock);
606262052Savg#endif
607179237Sjb			mutex_exit(&dtrace_provider_lock);
608179237Sjb			return (EINVAL);
609179237Sjb		}
610179237Sjb
611179237Sjb		mutex_exit(&dtrace_lock);
612179237Sjb
613179237Sjb		prov = probe->dtpr_provider;
614179237Sjb
615179237Sjb		if (prov->dtpv_pops.dtps_getargdesc == NULL) {
616179237Sjb			/*
617179237Sjb			 * There isn't any typed information for this probe.
618179237Sjb			 * Set the argument number to DTRACE_ARGNONE.
619179237Sjb			 */
620179237Sjb			desc->dtargd_ndx = DTRACE_ARGNONE;
621179237Sjb		} else {
622179237Sjb			desc->dtargd_native[0] = '\0';
623179237Sjb			desc->dtargd_xlate[0] = '\0';
624179237Sjb			desc->dtargd_mapping = desc->dtargd_ndx;
625179237Sjb
626179237Sjb			prov->dtpv_pops.dtps_getargdesc(prov->dtpv_arg,
627179237Sjb			    probe->dtpr_id, probe->dtpr_arg, desc);
628179237Sjb		}
629179237Sjb
630262052Savg#if defined(sun)
631179237Sjb		mutex_exit(&mod_lock);
632262052Savg#endif
633179237Sjb		mutex_exit(&dtrace_provider_lock);
634179237Sjb
635179237Sjb		return (0);
636179237Sjb	}
637179237Sjb	case DTRACEIOC_PROBEMATCH:
638179237Sjb	case DTRACEIOC_PROBES: {
639179237Sjb		dtrace_probedesc_t *p_desc = (dtrace_probedesc_t *) addr;
640179237Sjb		dtrace_probe_t *probe = NULL;
641179237Sjb		dtrace_probekey_t pkey;
642179237Sjb		dtrace_id_t i;
643179237Sjb		int m = 0;
644179237Sjb		uint32_t priv = 0;
645179237Sjb		uid_t uid = 0;
646179237Sjb		zoneid_t zoneid = 0;
647179237Sjb
648179237Sjb		DTRACE_IOCTL_PRINTF("%s(%d): %s\n",__func__,__LINE__,
649179237Sjb		    cmd == DTRACEIOC_PROBEMATCH ?
650179237Sjb		    "DTRACEIOC_PROBEMATCH":"DTRACEIOC_PROBES");
651179237Sjb
652179237Sjb		p_desc->dtpd_provider[DTRACE_PROVNAMELEN - 1] = '\0';
653179237Sjb		p_desc->dtpd_mod[DTRACE_MODNAMELEN - 1] = '\0';
654179237Sjb		p_desc->dtpd_func[DTRACE_FUNCNAMELEN - 1] = '\0';
655179237Sjb		p_desc->dtpd_name[DTRACE_NAMELEN - 1] = '\0';
656179237Sjb
657179237Sjb		/*
658179237Sjb		 * Before we attempt to match this probe, we want to give
659179237Sjb		 * all providers the opportunity to provide it.
660179237Sjb		 */
661179237Sjb		if (p_desc->dtpd_id == DTRACE_IDNONE) {
662179237Sjb			mutex_enter(&dtrace_provider_lock);
663179237Sjb			dtrace_probe_provide(p_desc, NULL);
664179237Sjb			mutex_exit(&dtrace_provider_lock);
665179237Sjb			p_desc->dtpd_id++;
666179237Sjb		}
667179237Sjb
668179237Sjb		if (cmd == DTRACEIOC_PROBEMATCH)  {
669179237Sjb			dtrace_probekey(p_desc, &pkey);
670179237Sjb			pkey.dtpk_id = DTRACE_IDNONE;
671179237Sjb		}
672179237Sjb
673179237Sjb		dtrace_cred2priv(td->td_ucred, &priv, &uid, &zoneid);
674179237Sjb
675179237Sjb		mutex_enter(&dtrace_lock);
676179237Sjb
677179237Sjb		if (cmd == DTRACEIOC_PROBEMATCH) {
678179237Sjb			for (i = p_desc->dtpd_id; i <= dtrace_nprobes; i++) {
679179237Sjb				if ((probe = dtrace_probes[i - 1]) != NULL &&
680179237Sjb				    (m = dtrace_match_probe(probe, &pkey,
681179237Sjb				    priv, uid, zoneid)) != 0)
682179237Sjb					break;
683179237Sjb			}
684179237Sjb
685179237Sjb			if (m < 0) {
686179237Sjb				mutex_exit(&dtrace_lock);
687179237Sjb				return (EINVAL);
688179237Sjb			}
689179237Sjb
690179237Sjb		} else {
691179237Sjb			for (i = p_desc->dtpd_id; i <= dtrace_nprobes; i++) {
692179237Sjb				if ((probe = dtrace_probes[i - 1]) != NULL &&
693179237Sjb				    dtrace_match_priv(probe, priv, uid, zoneid))
694179237Sjb					break;
695179237Sjb			}
696179237Sjb		}
697179237Sjb
698179237Sjb		if (probe == NULL) {
699179237Sjb			mutex_exit(&dtrace_lock);
700179237Sjb			return (ESRCH);
701179237Sjb		}
702179237Sjb
703179237Sjb		dtrace_probe_description(probe, p_desc);
704179237Sjb		mutex_exit(&dtrace_lock);
705179237Sjb
706179237Sjb		return (0);
707179237Sjb	}
708179237Sjb	case DTRACEIOC_PROVIDER: {
709179237Sjb		dtrace_providerdesc_t *pvd = (dtrace_providerdesc_t *) addr;
710179237Sjb		dtrace_provider_t *pvp;
711179237Sjb
712179237Sjb		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_PROVIDER\n",__func__,__LINE__);
713179237Sjb
714179237Sjb		pvd->dtvd_name[DTRACE_PROVNAMELEN - 1] = '\0';
715179237Sjb		mutex_enter(&dtrace_provider_lock);
716179237Sjb
717179237Sjb		for (pvp = dtrace_provider; pvp != NULL; pvp = pvp->dtpv_next) {
718179237Sjb			if (strcmp(pvp->dtpv_name, pvd->dtvd_name) == 0)
719179237Sjb				break;
720179237Sjb		}
721179237Sjb
722179237Sjb		mutex_exit(&dtrace_provider_lock);
723179237Sjb
724179237Sjb		if (pvp == NULL)
725179237Sjb			return (ESRCH);
726179237Sjb
727179237Sjb		bcopy(&pvp->dtpv_priv, &pvd->dtvd_priv, sizeof (dtrace_ppriv_t));
728179237Sjb		bcopy(&pvp->dtpv_attr, &pvd->dtvd_attr, sizeof (dtrace_pattr_t));
729179237Sjb
730179237Sjb		return (0);
731179237Sjb	}
732179237Sjb	case DTRACEIOC_REPLICATE: {
733179237Sjb		dtrace_repldesc_t *desc = (dtrace_repldesc_t *) addr;
734179237Sjb		dtrace_probedesc_t *match = &desc->dtrpd_match;
735179237Sjb		dtrace_probedesc_t *create = &desc->dtrpd_create;
736179237Sjb		int err;
737179237Sjb
738179237Sjb		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_REPLICATE\n",__func__,__LINE__);
739179237Sjb
740179237Sjb		match->dtpd_provider[DTRACE_PROVNAMELEN - 1] = '\0';
741179237Sjb		match->dtpd_mod[DTRACE_MODNAMELEN - 1] = '\0';
742179237Sjb		match->dtpd_func[DTRACE_FUNCNAMELEN - 1] = '\0';
743179237Sjb		match->dtpd_name[DTRACE_NAMELEN - 1] = '\0';
744179237Sjb
745179237Sjb		create->dtpd_provider[DTRACE_PROVNAMELEN - 1] = '\0';
746179237Sjb		create->dtpd_mod[DTRACE_MODNAMELEN - 1] = '\0';
747179237Sjb		create->dtpd_func[DTRACE_FUNCNAMELEN - 1] = '\0';
748179237Sjb		create->dtpd_name[DTRACE_NAMELEN - 1] = '\0';
749179237Sjb
750179237Sjb		mutex_enter(&dtrace_lock);
751179237Sjb		err = dtrace_enabling_replicate(state, match, create);
752179237Sjb		mutex_exit(&dtrace_lock);
753179237Sjb
754179237Sjb		return (err);
755179237Sjb	}
756179237Sjb	case DTRACEIOC_STATUS: {
757179237Sjb		dtrace_status_t *stat = (dtrace_status_t *) addr;
758179237Sjb		dtrace_dstate_t *dstate;
759179237Sjb		int i, j;
760179237Sjb		uint64_t nerrs;
761179237Sjb
762179237Sjb		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_STATUS\n",__func__,__LINE__);
763179237Sjb
764179237Sjb		/*
765179237Sjb		 * See the comment in dtrace_state_deadman() for the reason
766179237Sjb		 * for setting dts_laststatus to INT64_MAX before setting
767179237Sjb		 * it to the correct value.
768179237Sjb		 */
769179237Sjb		state->dts_laststatus = INT64_MAX;
770179237Sjb		dtrace_membar_producer();
771179237Sjb		state->dts_laststatus = dtrace_gethrtime();
772179237Sjb
773179237Sjb		bzero(stat, sizeof (*stat));
774179237Sjb
775179237Sjb		mutex_enter(&dtrace_lock);
776179237Sjb
777179237Sjb		if (state->dts_activity == DTRACE_ACTIVITY_INACTIVE) {
778179237Sjb			mutex_exit(&dtrace_lock);
779179237Sjb			return (ENOENT);
780179237Sjb		}
781179237Sjb
782179237Sjb		if (state->dts_activity == DTRACE_ACTIVITY_DRAINING)
783179237Sjb			stat->dtst_exiting = 1;
784179237Sjb
785179237Sjb		nerrs = state->dts_errors;
786179237Sjb		dstate = &state->dts_vstate.dtvs_dynvars;
787179237Sjb
788179237Sjb		for (i = 0; i < NCPU; i++) {
789179237Sjb#if !defined(sun)
790179237Sjb			if (pcpu_find(i) == NULL)
791179237Sjb				continue;
792179237Sjb#endif
793179237Sjb			dtrace_dstate_percpu_t *dcpu = &dstate->dtds_percpu[i];
794179237Sjb
795179237Sjb			stat->dtst_dyndrops += dcpu->dtdsc_drops;
796179237Sjb			stat->dtst_dyndrops_dirty += dcpu->dtdsc_dirty_drops;
797179237Sjb			stat->dtst_dyndrops_rinsing += dcpu->dtdsc_rinsing_drops;
798179237Sjb
799179237Sjb			if (state->dts_buffer[i].dtb_flags & DTRACEBUF_FULL)
800179237Sjb				stat->dtst_filled++;
801179237Sjb
802179237Sjb			nerrs += state->dts_buffer[i].dtb_errors;
803179237Sjb
804179237Sjb			for (j = 0; j < state->dts_nspeculations; j++) {
805179237Sjb				dtrace_speculation_t *spec;
806179237Sjb				dtrace_buffer_t *buf;
807179237Sjb
808179237Sjb				spec = &state->dts_speculations[j];
809179237Sjb				buf = &spec->dtsp_buffer[i];
810179237Sjb				stat->dtst_specdrops += buf->dtb_xamot_drops;
811179237Sjb			}
812179237Sjb		}
813179237Sjb
814179237Sjb		stat->dtst_specdrops_busy = state->dts_speculations_busy;
815179237Sjb		stat->dtst_specdrops_unavail = state->dts_speculations_unavail;
816179237Sjb		stat->dtst_stkstroverflows = state->dts_stkstroverflows;
817179237Sjb		stat->dtst_dblerrors = state->dts_dblerrors;
818179237Sjb		stat->dtst_killed =
819179237Sjb		    (state->dts_activity == DTRACE_ACTIVITY_KILLED);
820179237Sjb		stat->dtst_errors = nerrs;
821179237Sjb
822179237Sjb		mutex_exit(&dtrace_lock);
823179237Sjb
824179237Sjb		return (0);
825179237Sjb	}
826179237Sjb	case DTRACEIOC_STOP: {
827179237Sjb		int rval;
828179237Sjb		processorid_t *cpuid = (processorid_t *) addr;
829179237Sjb
830179237Sjb		DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_STOP\n",__func__,__LINE__);
831179237Sjb
832179237Sjb		mutex_enter(&dtrace_lock);
833179237Sjb		rval = dtrace_state_stop(state, cpuid);
834179237Sjb		mutex_exit(&dtrace_lock);
835179237Sjb
836179237Sjb		return (rval);
837179237Sjb	}
838179237Sjb	default:
839179237Sjb		error = ENOTTY;
840179237Sjb	}
841179237Sjb	return (error);
842179237Sjb}
843