1179237Sjb/* 2179237Sjb * CDDL HEADER START 3179237Sjb * 4179237Sjb * The contents of this file are subject to the terms of the 5179237Sjb * Common Development and Distribution License (the "License"). 6179237Sjb * You may not use this file except in compliance with the License. 7179237Sjb * 8179237Sjb * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9179237Sjb * or http://www.opensolaris.org/os/licensing. 10179237Sjb * See the License for the specific language governing permissions 11179237Sjb * and limitations under the License. 12179237Sjb * 13179237Sjb * When distributing Covered Code, include this CDDL HEADER in each 14179237Sjb * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15179237Sjb * If applicable, add the following below this CDDL HEADER, with the 16179237Sjb * fields enclosed by brackets "[]" replaced with your own identifying 17179237Sjb * information: Portions Copyright [yyyy] [name of copyright owner] 18179237Sjb * 19179237Sjb * CDDL HEADER END 20179237Sjb * 21179237Sjb * $FreeBSD$ 22179237Sjb * 23179237Sjb */ 24179237Sjb 25179237Sjbstatic int dtrace_verbose_ioctl; 26266101SmarkjSYSCTL_INT(_debug_dtrace, OID_AUTO, verbose_ioctl, CTLFLAG_RW, 27266101Smarkj &dtrace_verbose_ioctl, 0, "log DTrace ioctls"); 28179237Sjb 29179237Sjb#define DTRACE_IOCTL_PRINTF(fmt, ...) if (dtrace_verbose_ioctl) printf(fmt, ## __VA_ARGS__ ) 30179237Sjb 31211608Srpaulostatic int 32211608Srpaulodtrace_ioctl_helper(struct cdev *dev, u_long cmd, caddr_t addr, int flags, 33211608Srpaulo struct thread *td) 34211608Srpaulo{ 35211608Srpaulo int rval; 36211608Srpaulo dof_helper_t *dhp = NULL; 37211608Srpaulo dof_hdr_t *dof = NULL; 38211608Srpaulo 39211608Srpaulo switch (cmd) { 40211608Srpaulo case DTRACEHIOC_ADDDOF: 41211608Srpaulo dhp = (dof_helper_t *)addr; 42211608Srpaulo /* XXX all because dofhp_dof is 64 bit */ 43211608Srpaulo#ifdef __i386 44211608Srpaulo addr = (caddr_t)(uint32_t)dhp->dofhp_dof; 45211608Srpaulo#else 46211608Srpaulo addr = (caddr_t)dhp->dofhp_dof; 47211608Srpaulo#endif 48211608Srpaulo /* FALLTHROUGH */ 49211608Srpaulo case DTRACEHIOC_ADD: 50211608Srpaulo dof = dtrace_dof_copyin((intptr_t)addr, &rval); 51211608Srpaulo 52211608Srpaulo if (dof == NULL) 53211608Srpaulo return (rval); 54211608Srpaulo 55211608Srpaulo mutex_enter(&dtrace_lock); 56211608Srpaulo if ((rval = dtrace_helper_slurp((dof_hdr_t *)dof, dhp)) != -1) { 57211608Srpaulo if (dhp) { 58211608Srpaulo dhp->gen = rval; 59211608Srpaulo copyout(dhp, addr, sizeof(*dhp)); 60211608Srpaulo } 61211608Srpaulo rval = 0; 62211608Srpaulo } else { 63211608Srpaulo rval = EINVAL; 64211608Srpaulo } 65211608Srpaulo mutex_exit(&dtrace_lock); 66211608Srpaulo return (rval); 67211608Srpaulo case DTRACEHIOC_REMOVE: 68211608Srpaulo mutex_enter(&dtrace_lock); 69211608Srpaulo rval = dtrace_helper_destroygen((int)*addr); 70211608Srpaulo mutex_exit(&dtrace_lock); 71211608Srpaulo 72211608Srpaulo return (rval); 73211608Srpaulo default: 74211608Srpaulo break; 75211608Srpaulo } 76211608Srpaulo 77211608Srpaulo return (ENOTTY); 78211608Srpaulo} 79211608Srpaulo 80179237Sjb/* ARGSUSED */ 81179237Sjbstatic int 82179237Sjbdtrace_ioctl(struct cdev *dev, u_long cmd, caddr_t addr, 83179237Sjb int flags __unused, struct thread *td) 84179237Sjb{ 85184698Srodrigc#if __FreeBSD_version < 800039 86179237Sjb dtrace_state_t *state = dev->si_drv1; 87184698Srodrigc#else 88184698Srodrigc dtrace_state_t *state; 89184698Srodrigc devfs_get_cdevpriv((void **) &state); 90184698Srodrigc#endif 91179237Sjb int error = 0; 92179237Sjb if (state == NULL) 93179237Sjb return (EINVAL); 94179237Sjb 95179237Sjb if (state->dts_anon) { 96179237Sjb ASSERT(dtrace_anon.dta_state == NULL); 97179237Sjb state = state->dts_anon; 98179237Sjb } 99179237Sjb 100179237Sjb switch (cmd) { 101179237Sjb case DTRACEIOC_AGGDESC: { 102179237Sjb dtrace_aggdesc_t **paggdesc = (dtrace_aggdesc_t **) addr; 103179237Sjb dtrace_aggdesc_t aggdesc; 104179237Sjb dtrace_action_t *act; 105179237Sjb dtrace_aggregation_t *agg; 106179237Sjb int nrecs; 107179237Sjb uint32_t offs; 108179237Sjb dtrace_recdesc_t *lrec; 109179237Sjb void *buf; 110179237Sjb size_t size; 111179237Sjb uintptr_t dest; 112179237Sjb 113179237Sjb DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_AGGDESC\n",__func__,__LINE__); 114179237Sjb 115179237Sjb if (copyin((void *) *paggdesc, &aggdesc, sizeof (aggdesc)) != 0) 116179237Sjb return (EFAULT); 117179237Sjb 118179237Sjb mutex_enter(&dtrace_lock); 119179237Sjb 120179237Sjb if ((agg = dtrace_aggid2agg(state, aggdesc.dtagd_id)) == NULL) { 121179237Sjb mutex_exit(&dtrace_lock); 122179237Sjb return (EINVAL); 123179237Sjb } 124179237Sjb 125179237Sjb aggdesc.dtagd_epid = agg->dtag_ecb->dte_epid; 126179237Sjb 127179237Sjb nrecs = aggdesc.dtagd_nrecs; 128179237Sjb aggdesc.dtagd_nrecs = 0; 129179237Sjb 130179237Sjb offs = agg->dtag_base; 131179237Sjb lrec = &agg->dtag_action.dta_rec; 132179237Sjb aggdesc.dtagd_size = lrec->dtrd_offset + lrec->dtrd_size - offs; 133179237Sjb 134179237Sjb for (act = agg->dtag_first; ; act = act->dta_next) { 135179237Sjb ASSERT(act->dta_intuple || 136179237Sjb DTRACEACT_ISAGG(act->dta_kind)); 137179237Sjb 138179237Sjb /* 139179237Sjb * If this action has a record size of zero, it 140179237Sjb * denotes an argument to the aggregating action. 141179237Sjb * Because the presence of this record doesn't (or 142179237Sjb * shouldn't) affect the way the data is interpreted, 143179237Sjb * we don't copy it out to save user-level the 144179237Sjb * confusion of dealing with a zero-length record. 145179237Sjb */ 146179237Sjb if (act->dta_rec.dtrd_size == 0) { 147179237Sjb ASSERT(agg->dtag_hasarg); 148179237Sjb continue; 149179237Sjb } 150179237Sjb 151179237Sjb aggdesc.dtagd_nrecs++; 152179237Sjb 153179237Sjb if (act == &agg->dtag_action) 154179237Sjb break; 155179237Sjb } 156179237Sjb 157179237Sjb /* 158179237Sjb * Now that we have the size, we need to allocate a temporary 159179237Sjb * buffer in which to store the complete description. We need 160179237Sjb * the temporary buffer to be able to drop dtrace_lock() 161179237Sjb * across the copyout(), below. 162179237Sjb */ 163179237Sjb size = sizeof (dtrace_aggdesc_t) + 164179237Sjb (aggdesc.dtagd_nrecs * sizeof (dtrace_recdesc_t)); 165179237Sjb 166179237Sjb buf = kmem_alloc(size, KM_SLEEP); 167179237Sjb dest = (uintptr_t)buf; 168179237Sjb 169179237Sjb bcopy(&aggdesc, (void *)dest, sizeof (aggdesc)); 170179237Sjb dest += offsetof(dtrace_aggdesc_t, dtagd_rec[0]); 171179237Sjb 172179237Sjb for (act = agg->dtag_first; ; act = act->dta_next) { 173179237Sjb dtrace_recdesc_t rec = act->dta_rec; 174179237Sjb 175179237Sjb /* 176179237Sjb * See the comment in the above loop for why we pass 177179237Sjb * over zero-length records. 178179237Sjb */ 179179237Sjb if (rec.dtrd_size == 0) { 180179237Sjb ASSERT(agg->dtag_hasarg); 181179237Sjb continue; 182179237Sjb } 183179237Sjb 184179237Sjb if (nrecs-- == 0) 185179237Sjb break; 186179237Sjb 187179237Sjb rec.dtrd_offset -= offs; 188179237Sjb bcopy(&rec, (void *)dest, sizeof (rec)); 189179237Sjb dest += sizeof (dtrace_recdesc_t); 190179237Sjb 191179237Sjb if (act == &agg->dtag_action) 192179237Sjb break; 193179237Sjb } 194179237Sjb 195179237Sjb mutex_exit(&dtrace_lock); 196179237Sjb 197179237Sjb if (copyout(buf, (void *) *paggdesc, dest - (uintptr_t)buf) != 0) { 198179237Sjb kmem_free(buf, size); 199179237Sjb return (EFAULT); 200179237Sjb } 201179237Sjb 202179237Sjb kmem_free(buf, size); 203179237Sjb return (0); 204179237Sjb } 205179237Sjb case DTRACEIOC_AGGSNAP: 206179237Sjb case DTRACEIOC_BUFSNAP: { 207179237Sjb dtrace_bufdesc_t **pdesc = (dtrace_bufdesc_t **) addr; 208179237Sjb dtrace_bufdesc_t desc; 209179237Sjb caddr_t cached; 210179237Sjb dtrace_buffer_t *buf; 211179237Sjb 212179237Sjb dtrace_debug_output(); 213179237Sjb 214179237Sjb if (copyin((void *) *pdesc, &desc, sizeof (desc)) != 0) 215179237Sjb return (EFAULT); 216179237Sjb 217179237Sjb DTRACE_IOCTL_PRINTF("%s(%d): %s curcpu %d cpu %d\n", 218179237Sjb __func__,__LINE__, 219179237Sjb cmd == DTRACEIOC_AGGSNAP ? 220179237Sjb "DTRACEIOC_AGGSNAP":"DTRACEIOC_BUFSNAP", 221179237Sjb curcpu, desc.dtbd_cpu); 222179237Sjb 223179237Sjb if (desc.dtbd_cpu < 0 || desc.dtbd_cpu >= NCPU) 224179237Sjb return (ENOENT); 225179237Sjb if (pcpu_find(desc.dtbd_cpu) == NULL) 226179237Sjb return (ENOENT); 227179237Sjb 228179237Sjb mutex_enter(&dtrace_lock); 229179237Sjb 230179237Sjb if (cmd == DTRACEIOC_BUFSNAP) { 231179237Sjb buf = &state->dts_buffer[desc.dtbd_cpu]; 232179237Sjb } else { 233179237Sjb buf = &state->dts_aggbuffer[desc.dtbd_cpu]; 234179237Sjb } 235179237Sjb 236179237Sjb if (buf->dtb_flags & (DTRACEBUF_RING | DTRACEBUF_FILL)) { 237179237Sjb size_t sz = buf->dtb_offset; 238179237Sjb 239179237Sjb if (state->dts_activity != DTRACE_ACTIVITY_STOPPED) { 240179237Sjb mutex_exit(&dtrace_lock); 241179237Sjb return (EBUSY); 242179237Sjb } 243179237Sjb 244179237Sjb /* 245179237Sjb * If this buffer has already been consumed, we're 246179237Sjb * going to indicate that there's nothing left here 247179237Sjb * to consume. 248179237Sjb */ 249179237Sjb if (buf->dtb_flags & DTRACEBUF_CONSUMED) { 250179237Sjb mutex_exit(&dtrace_lock); 251179237Sjb 252179237Sjb desc.dtbd_size = 0; 253179237Sjb desc.dtbd_drops = 0; 254179237Sjb desc.dtbd_errors = 0; 255179237Sjb desc.dtbd_oldest = 0; 256179237Sjb sz = sizeof (desc); 257179237Sjb 258179237Sjb if (copyout(&desc, (void *) *pdesc, sz) != 0) 259179237Sjb return (EFAULT); 260179237Sjb 261179237Sjb return (0); 262179237Sjb } 263179237Sjb 264179237Sjb /* 265179237Sjb * If this is a ring buffer that has wrapped, we want 266179237Sjb * to copy the whole thing out. 267179237Sjb */ 268179237Sjb if (buf->dtb_flags & DTRACEBUF_WRAPPED) { 269179237Sjb dtrace_buffer_polish(buf); 270179237Sjb sz = buf->dtb_size; 271179237Sjb } 272179237Sjb 273179237Sjb if (copyout(buf->dtb_tomax, desc.dtbd_data, sz) != 0) { 274179237Sjb mutex_exit(&dtrace_lock); 275179237Sjb return (EFAULT); 276179237Sjb } 277179237Sjb 278179237Sjb desc.dtbd_size = sz; 279179237Sjb desc.dtbd_drops = buf->dtb_drops; 280179237Sjb desc.dtbd_errors = buf->dtb_errors; 281179237Sjb desc.dtbd_oldest = buf->dtb_xamot_offset; 282256002Spfg desc.dtbd_timestamp = dtrace_gethrtime(); 283179237Sjb 284179237Sjb mutex_exit(&dtrace_lock); 285179237Sjb 286179237Sjb if (copyout(&desc, (void *) *pdesc, sizeof (desc)) != 0) 287179237Sjb return (EFAULT); 288179237Sjb 289179237Sjb buf->dtb_flags |= DTRACEBUF_CONSUMED; 290179237Sjb 291179237Sjb return (0); 292179237Sjb } 293179237Sjb 294179237Sjb if (buf->dtb_tomax == NULL) { 295179237Sjb ASSERT(buf->dtb_xamot == NULL); 296179237Sjb mutex_exit(&dtrace_lock); 297179237Sjb return (ENOENT); 298179237Sjb } 299179237Sjb 300179237Sjb cached = buf->dtb_tomax; 301179237Sjb ASSERT(!(buf->dtb_flags & DTRACEBUF_NOSWITCH)); 302179237Sjb 303179237Sjb dtrace_xcall(desc.dtbd_cpu, 304179237Sjb (dtrace_xcall_t)dtrace_buffer_switch, buf); 305179237Sjb 306179237Sjb state->dts_errors += buf->dtb_xamot_errors; 307179237Sjb 308179237Sjb /* 309179237Sjb * If the buffers did not actually switch, then the cross call 310179237Sjb * did not take place -- presumably because the given CPU is 311179237Sjb * not in the ready set. If this is the case, we'll return 312179237Sjb * ENOENT. 313179237Sjb */ 314179237Sjb if (buf->dtb_tomax == cached) { 315179237Sjb ASSERT(buf->dtb_xamot != cached); 316179237Sjb mutex_exit(&dtrace_lock); 317179237Sjb return (ENOENT); 318179237Sjb } 319179237Sjb 320179237Sjb ASSERT(cached == buf->dtb_xamot); 321179237Sjb 322179237Sjb DTRACE_IOCTL_PRINTF("%s(%d): copyout the buffer snapshot\n",__func__,__LINE__); 323179237Sjb 324179237Sjb /* 325179237Sjb * We have our snapshot; now copy it out. 326179237Sjb */ 327179237Sjb if (copyout(buf->dtb_xamot, desc.dtbd_data, 328179237Sjb buf->dtb_xamot_offset) != 0) { 329179237Sjb mutex_exit(&dtrace_lock); 330179237Sjb return (EFAULT); 331179237Sjb } 332179237Sjb 333179237Sjb desc.dtbd_size = buf->dtb_xamot_offset; 334179237Sjb desc.dtbd_drops = buf->dtb_xamot_drops; 335179237Sjb desc.dtbd_errors = buf->dtb_xamot_errors; 336179237Sjb desc.dtbd_oldest = 0; 337256002Spfg desc.dtbd_timestamp = buf->dtb_switched; 338179237Sjb 339179237Sjb mutex_exit(&dtrace_lock); 340179237Sjb 341179237Sjb DTRACE_IOCTL_PRINTF("%s(%d): copyout buffer desc: size %zd drops %lu errors %lu\n",__func__,__LINE__,(size_t) desc.dtbd_size,(u_long) desc.dtbd_drops,(u_long) desc.dtbd_errors); 342179237Sjb 343179237Sjb /* 344179237Sjb * Finally, copy out the buffer description. 345179237Sjb */ 346179237Sjb if (copyout(&desc, (void *) *pdesc, sizeof (desc)) != 0) 347179237Sjb return (EFAULT); 348179237Sjb 349179237Sjb return (0); 350179237Sjb } 351179237Sjb case DTRACEIOC_CONF: { 352179237Sjb dtrace_conf_t conf; 353179237Sjb 354179237Sjb DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_CONF\n",__func__,__LINE__); 355179237Sjb 356179237Sjb bzero(&conf, sizeof (conf)); 357179237Sjb conf.dtc_difversion = DIF_VERSION; 358179237Sjb conf.dtc_difintregs = DIF_DIR_NREGS; 359179237Sjb conf.dtc_diftupregs = DIF_DTR_NREGS; 360179237Sjb conf.dtc_ctfmodel = CTF_MODEL_NATIVE; 361179237Sjb 362179237Sjb *((dtrace_conf_t *) addr) = conf; 363179237Sjb 364179237Sjb return (0); 365179237Sjb } 366179237Sjb case DTRACEIOC_DOFGET: { 367179237Sjb dof_hdr_t **pdof = (dof_hdr_t **) addr; 368179237Sjb dof_hdr_t hdr, *dof = *pdof; 369179237Sjb int rval; 370179237Sjb uint64_t len; 371179237Sjb 372179237Sjb DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_DOFGET\n",__func__,__LINE__); 373179237Sjb 374179237Sjb if (copyin((void *)dof, &hdr, sizeof (hdr)) != 0) 375179237Sjb return (EFAULT); 376179237Sjb 377179237Sjb mutex_enter(&dtrace_lock); 378179237Sjb dof = dtrace_dof_create(state); 379179237Sjb mutex_exit(&dtrace_lock); 380179237Sjb 381179237Sjb len = MIN(hdr.dofh_loadsz, dof->dofh_loadsz); 382179237Sjb rval = copyout(dof, (void *) *pdof, len); 383179237Sjb dtrace_dof_destroy(dof); 384179237Sjb 385179237Sjb return (rval == 0 ? 0 : EFAULT); 386179237Sjb } 387179237Sjb case DTRACEIOC_ENABLE: { 388179237Sjb dof_hdr_t *dof = NULL; 389179237Sjb dtrace_enabling_t *enab = NULL; 390179237Sjb dtrace_vstate_t *vstate; 391179237Sjb int err = 0; 392179237Sjb int rval; 393179237Sjb dtrace_enable_io_t *p = (dtrace_enable_io_t *) addr; 394179237Sjb 395179237Sjb DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_ENABLE\n",__func__,__LINE__); 396179237Sjb 397179237Sjb /* 398179237Sjb * If a NULL argument has been passed, we take this as our 399179237Sjb * cue to reevaluate our enablings. 400179237Sjb */ 401179237Sjb if (p->dof == NULL) { 402179237Sjb dtrace_enabling_matchall(); 403179237Sjb 404179237Sjb return (0); 405179237Sjb } 406179237Sjb 407179237Sjb if ((dof = dtrace_dof_copyin((uintptr_t) p->dof, &rval)) == NULL) 408179237Sjb return (EINVAL); 409179237Sjb 410179237Sjb mutex_enter(&cpu_lock); 411179237Sjb mutex_enter(&dtrace_lock); 412179237Sjb vstate = &state->dts_vstate; 413179237Sjb 414179237Sjb if (state->dts_activity != DTRACE_ACTIVITY_INACTIVE) { 415179237Sjb mutex_exit(&dtrace_lock); 416179237Sjb mutex_exit(&cpu_lock); 417179237Sjb dtrace_dof_destroy(dof); 418179237Sjb return (EBUSY); 419179237Sjb } 420179237Sjb 421179237Sjb if (dtrace_dof_slurp(dof, vstate, td->td_ucred, &enab, 0, B_TRUE) != 0) { 422179237Sjb mutex_exit(&dtrace_lock); 423179237Sjb mutex_exit(&cpu_lock); 424179237Sjb dtrace_dof_destroy(dof); 425179237Sjb return (EINVAL); 426179237Sjb } 427179237Sjb 428179237Sjb if ((rval = dtrace_dof_options(dof, state)) != 0) { 429179237Sjb dtrace_enabling_destroy(enab); 430179237Sjb mutex_exit(&dtrace_lock); 431179237Sjb mutex_exit(&cpu_lock); 432179237Sjb dtrace_dof_destroy(dof); 433179237Sjb return (rval); 434179237Sjb } 435179237Sjb 436179237Sjb if ((err = dtrace_enabling_match(enab, &p->n_matched)) == 0) { 437179237Sjb err = dtrace_enabling_retain(enab); 438179237Sjb } else { 439179237Sjb dtrace_enabling_destroy(enab); 440179237Sjb } 441179237Sjb 442179237Sjb mutex_exit(&cpu_lock); 443179237Sjb mutex_exit(&dtrace_lock); 444179237Sjb dtrace_dof_destroy(dof); 445179237Sjb 446179237Sjb return (err); 447179237Sjb } 448179237Sjb case DTRACEIOC_EPROBE: { 449179237Sjb dtrace_eprobedesc_t **pepdesc = (dtrace_eprobedesc_t **) addr; 450179237Sjb dtrace_eprobedesc_t epdesc; 451179237Sjb dtrace_ecb_t *ecb; 452179237Sjb dtrace_action_t *act; 453179237Sjb void *buf; 454179237Sjb size_t size; 455179237Sjb uintptr_t dest; 456179237Sjb int nrecs; 457179237Sjb 458179237Sjb DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_EPROBE\n",__func__,__LINE__); 459179237Sjb 460179237Sjb if (copyin((void *)*pepdesc, &epdesc, sizeof (epdesc)) != 0) 461179237Sjb return (EFAULT); 462179237Sjb 463179237Sjb mutex_enter(&dtrace_lock); 464179237Sjb 465179237Sjb if ((ecb = dtrace_epid2ecb(state, epdesc.dtepd_epid)) == NULL) { 466179237Sjb mutex_exit(&dtrace_lock); 467179237Sjb return (EINVAL); 468179237Sjb } 469179237Sjb 470179237Sjb if (ecb->dte_probe == NULL) { 471179237Sjb mutex_exit(&dtrace_lock); 472179237Sjb return (EINVAL); 473179237Sjb } 474179237Sjb 475179237Sjb epdesc.dtepd_probeid = ecb->dte_probe->dtpr_id; 476179237Sjb epdesc.dtepd_uarg = ecb->dte_uarg; 477179237Sjb epdesc.dtepd_size = ecb->dte_size; 478179237Sjb 479179237Sjb nrecs = epdesc.dtepd_nrecs; 480179237Sjb epdesc.dtepd_nrecs = 0; 481179237Sjb for (act = ecb->dte_action; act != NULL; act = act->dta_next) { 482179237Sjb if (DTRACEACT_ISAGG(act->dta_kind) || act->dta_intuple) 483179237Sjb continue; 484179237Sjb 485179237Sjb epdesc.dtepd_nrecs++; 486179237Sjb } 487179237Sjb 488179237Sjb /* 489179237Sjb * Now that we have the size, we need to allocate a temporary 490179237Sjb * buffer in which to store the complete description. We need 491179237Sjb * the temporary buffer to be able to drop dtrace_lock() 492179237Sjb * across the copyout(), below. 493179237Sjb */ 494179237Sjb size = sizeof (dtrace_eprobedesc_t) + 495179237Sjb (epdesc.dtepd_nrecs * sizeof (dtrace_recdesc_t)); 496179237Sjb 497179237Sjb buf = kmem_alloc(size, KM_SLEEP); 498179237Sjb dest = (uintptr_t)buf; 499179237Sjb 500179237Sjb bcopy(&epdesc, (void *)dest, sizeof (epdesc)); 501179237Sjb dest += offsetof(dtrace_eprobedesc_t, dtepd_rec[0]); 502179237Sjb 503179237Sjb for (act = ecb->dte_action; act != NULL; act = act->dta_next) { 504179237Sjb if (DTRACEACT_ISAGG(act->dta_kind) || act->dta_intuple) 505179237Sjb continue; 506179237Sjb 507179237Sjb if (nrecs-- == 0) 508179237Sjb break; 509179237Sjb 510179237Sjb bcopy(&act->dta_rec, (void *)dest, 511179237Sjb sizeof (dtrace_recdesc_t)); 512179237Sjb dest += sizeof (dtrace_recdesc_t); 513179237Sjb } 514179237Sjb 515179237Sjb mutex_exit(&dtrace_lock); 516179237Sjb 517179237Sjb if (copyout(buf, (void *) *pepdesc, dest - (uintptr_t)buf) != 0) { 518179237Sjb kmem_free(buf, size); 519179237Sjb return (EFAULT); 520179237Sjb } 521179237Sjb 522179237Sjb kmem_free(buf, size); 523179237Sjb return (0); 524179237Sjb } 525179237Sjb case DTRACEIOC_FORMAT: { 526179237Sjb dtrace_fmtdesc_t *fmt = (dtrace_fmtdesc_t *) addr; 527179237Sjb char *str; 528179237Sjb int len; 529179237Sjb 530179237Sjb DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_FORMAT\n",__func__,__LINE__); 531179237Sjb 532179237Sjb mutex_enter(&dtrace_lock); 533179237Sjb 534179237Sjb if (fmt->dtfd_format == 0 || 535179237Sjb fmt->dtfd_format > state->dts_nformats) { 536179237Sjb mutex_exit(&dtrace_lock); 537179237Sjb return (EINVAL); 538179237Sjb } 539179237Sjb 540179237Sjb /* 541179237Sjb * Format strings are allocated contiguously and they are 542179237Sjb * never freed; if a format index is less than the number 543179237Sjb * of formats, we can assert that the format map is non-NULL 544179237Sjb * and that the format for the specified index is non-NULL. 545179237Sjb */ 546179237Sjb ASSERT(state->dts_formats != NULL); 547179237Sjb str = state->dts_formats[fmt->dtfd_format - 1]; 548179237Sjb ASSERT(str != NULL); 549179237Sjb 550179237Sjb len = strlen(str) + 1; 551179237Sjb 552179237Sjb if (len > fmt->dtfd_length) { 553179237Sjb fmt->dtfd_length = len; 554179237Sjb } else { 555179237Sjb if (copyout(str, fmt->dtfd_string, len) != 0) { 556179237Sjb mutex_exit(&dtrace_lock); 557179237Sjb return (EINVAL); 558179237Sjb } 559179237Sjb } 560179237Sjb 561179237Sjb mutex_exit(&dtrace_lock); 562179237Sjb return (0); 563179237Sjb } 564179237Sjb case DTRACEIOC_GO: { 565179237Sjb int rval; 566179237Sjb processorid_t *cpuid = (processorid_t *) addr; 567179237Sjb 568179237Sjb DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_GO\n",__func__,__LINE__); 569179237Sjb 570179237Sjb rval = dtrace_state_go(state, cpuid); 571179237Sjb 572179237Sjb return (rval); 573179237Sjb } 574179237Sjb case DTRACEIOC_PROBEARG: { 575179237Sjb dtrace_argdesc_t *desc = (dtrace_argdesc_t *) addr; 576179237Sjb dtrace_probe_t *probe; 577179237Sjb dtrace_provider_t *prov; 578179237Sjb 579179237Sjb DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_PROBEARG\n",__func__,__LINE__); 580179237Sjb 581179237Sjb if (desc->dtargd_id == DTRACE_IDNONE) 582179237Sjb return (EINVAL); 583179237Sjb 584179237Sjb if (desc->dtargd_ndx == DTRACE_ARGNONE) 585179237Sjb return (EINVAL); 586179237Sjb 587179237Sjb mutex_enter(&dtrace_provider_lock); 588262052Savg#if defined(sun) 589179237Sjb mutex_enter(&mod_lock); 590262052Savg#endif 591179237Sjb mutex_enter(&dtrace_lock); 592179237Sjb 593179237Sjb if (desc->dtargd_id > dtrace_nprobes) { 594179237Sjb mutex_exit(&dtrace_lock); 595262052Savg#if defined(sun) 596179237Sjb mutex_exit(&mod_lock); 597262052Savg#endif 598179237Sjb mutex_exit(&dtrace_provider_lock); 599179237Sjb return (EINVAL); 600179237Sjb } 601179237Sjb 602179237Sjb if ((probe = dtrace_probes[desc->dtargd_id - 1]) == NULL) { 603179237Sjb mutex_exit(&dtrace_lock); 604262052Savg#if defined(sun) 605179237Sjb mutex_exit(&mod_lock); 606262052Savg#endif 607179237Sjb mutex_exit(&dtrace_provider_lock); 608179237Sjb return (EINVAL); 609179237Sjb } 610179237Sjb 611179237Sjb mutex_exit(&dtrace_lock); 612179237Sjb 613179237Sjb prov = probe->dtpr_provider; 614179237Sjb 615179237Sjb if (prov->dtpv_pops.dtps_getargdesc == NULL) { 616179237Sjb /* 617179237Sjb * There isn't any typed information for this probe. 618179237Sjb * Set the argument number to DTRACE_ARGNONE. 619179237Sjb */ 620179237Sjb desc->dtargd_ndx = DTRACE_ARGNONE; 621179237Sjb } else { 622179237Sjb desc->dtargd_native[0] = '\0'; 623179237Sjb desc->dtargd_xlate[0] = '\0'; 624179237Sjb desc->dtargd_mapping = desc->dtargd_ndx; 625179237Sjb 626179237Sjb prov->dtpv_pops.dtps_getargdesc(prov->dtpv_arg, 627179237Sjb probe->dtpr_id, probe->dtpr_arg, desc); 628179237Sjb } 629179237Sjb 630262052Savg#if defined(sun) 631179237Sjb mutex_exit(&mod_lock); 632262052Savg#endif 633179237Sjb mutex_exit(&dtrace_provider_lock); 634179237Sjb 635179237Sjb return (0); 636179237Sjb } 637179237Sjb case DTRACEIOC_PROBEMATCH: 638179237Sjb case DTRACEIOC_PROBES: { 639179237Sjb dtrace_probedesc_t *p_desc = (dtrace_probedesc_t *) addr; 640179237Sjb dtrace_probe_t *probe = NULL; 641179237Sjb dtrace_probekey_t pkey; 642179237Sjb dtrace_id_t i; 643179237Sjb int m = 0; 644179237Sjb uint32_t priv = 0; 645179237Sjb uid_t uid = 0; 646179237Sjb zoneid_t zoneid = 0; 647179237Sjb 648179237Sjb DTRACE_IOCTL_PRINTF("%s(%d): %s\n",__func__,__LINE__, 649179237Sjb cmd == DTRACEIOC_PROBEMATCH ? 650179237Sjb "DTRACEIOC_PROBEMATCH":"DTRACEIOC_PROBES"); 651179237Sjb 652179237Sjb p_desc->dtpd_provider[DTRACE_PROVNAMELEN - 1] = '\0'; 653179237Sjb p_desc->dtpd_mod[DTRACE_MODNAMELEN - 1] = '\0'; 654179237Sjb p_desc->dtpd_func[DTRACE_FUNCNAMELEN - 1] = '\0'; 655179237Sjb p_desc->dtpd_name[DTRACE_NAMELEN - 1] = '\0'; 656179237Sjb 657179237Sjb /* 658179237Sjb * Before we attempt to match this probe, we want to give 659179237Sjb * all providers the opportunity to provide it. 660179237Sjb */ 661179237Sjb if (p_desc->dtpd_id == DTRACE_IDNONE) { 662179237Sjb mutex_enter(&dtrace_provider_lock); 663179237Sjb dtrace_probe_provide(p_desc, NULL); 664179237Sjb mutex_exit(&dtrace_provider_lock); 665179237Sjb p_desc->dtpd_id++; 666179237Sjb } 667179237Sjb 668179237Sjb if (cmd == DTRACEIOC_PROBEMATCH) { 669179237Sjb dtrace_probekey(p_desc, &pkey); 670179237Sjb pkey.dtpk_id = DTRACE_IDNONE; 671179237Sjb } 672179237Sjb 673179237Sjb dtrace_cred2priv(td->td_ucred, &priv, &uid, &zoneid); 674179237Sjb 675179237Sjb mutex_enter(&dtrace_lock); 676179237Sjb 677179237Sjb if (cmd == DTRACEIOC_PROBEMATCH) { 678179237Sjb for (i = p_desc->dtpd_id; i <= dtrace_nprobes; i++) { 679179237Sjb if ((probe = dtrace_probes[i - 1]) != NULL && 680179237Sjb (m = dtrace_match_probe(probe, &pkey, 681179237Sjb priv, uid, zoneid)) != 0) 682179237Sjb break; 683179237Sjb } 684179237Sjb 685179237Sjb if (m < 0) { 686179237Sjb mutex_exit(&dtrace_lock); 687179237Sjb return (EINVAL); 688179237Sjb } 689179237Sjb 690179237Sjb } else { 691179237Sjb for (i = p_desc->dtpd_id; i <= dtrace_nprobes; i++) { 692179237Sjb if ((probe = dtrace_probes[i - 1]) != NULL && 693179237Sjb dtrace_match_priv(probe, priv, uid, zoneid)) 694179237Sjb break; 695179237Sjb } 696179237Sjb } 697179237Sjb 698179237Sjb if (probe == NULL) { 699179237Sjb mutex_exit(&dtrace_lock); 700179237Sjb return (ESRCH); 701179237Sjb } 702179237Sjb 703179237Sjb dtrace_probe_description(probe, p_desc); 704179237Sjb mutex_exit(&dtrace_lock); 705179237Sjb 706179237Sjb return (0); 707179237Sjb } 708179237Sjb case DTRACEIOC_PROVIDER: { 709179237Sjb dtrace_providerdesc_t *pvd = (dtrace_providerdesc_t *) addr; 710179237Sjb dtrace_provider_t *pvp; 711179237Sjb 712179237Sjb DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_PROVIDER\n",__func__,__LINE__); 713179237Sjb 714179237Sjb pvd->dtvd_name[DTRACE_PROVNAMELEN - 1] = '\0'; 715179237Sjb mutex_enter(&dtrace_provider_lock); 716179237Sjb 717179237Sjb for (pvp = dtrace_provider; pvp != NULL; pvp = pvp->dtpv_next) { 718179237Sjb if (strcmp(pvp->dtpv_name, pvd->dtvd_name) == 0) 719179237Sjb break; 720179237Sjb } 721179237Sjb 722179237Sjb mutex_exit(&dtrace_provider_lock); 723179237Sjb 724179237Sjb if (pvp == NULL) 725179237Sjb return (ESRCH); 726179237Sjb 727179237Sjb bcopy(&pvp->dtpv_priv, &pvd->dtvd_priv, sizeof (dtrace_ppriv_t)); 728179237Sjb bcopy(&pvp->dtpv_attr, &pvd->dtvd_attr, sizeof (dtrace_pattr_t)); 729179237Sjb 730179237Sjb return (0); 731179237Sjb } 732179237Sjb case DTRACEIOC_REPLICATE: { 733179237Sjb dtrace_repldesc_t *desc = (dtrace_repldesc_t *) addr; 734179237Sjb dtrace_probedesc_t *match = &desc->dtrpd_match; 735179237Sjb dtrace_probedesc_t *create = &desc->dtrpd_create; 736179237Sjb int err; 737179237Sjb 738179237Sjb DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_REPLICATE\n",__func__,__LINE__); 739179237Sjb 740179237Sjb match->dtpd_provider[DTRACE_PROVNAMELEN - 1] = '\0'; 741179237Sjb match->dtpd_mod[DTRACE_MODNAMELEN - 1] = '\0'; 742179237Sjb match->dtpd_func[DTRACE_FUNCNAMELEN - 1] = '\0'; 743179237Sjb match->dtpd_name[DTRACE_NAMELEN - 1] = '\0'; 744179237Sjb 745179237Sjb create->dtpd_provider[DTRACE_PROVNAMELEN - 1] = '\0'; 746179237Sjb create->dtpd_mod[DTRACE_MODNAMELEN - 1] = '\0'; 747179237Sjb create->dtpd_func[DTRACE_FUNCNAMELEN - 1] = '\0'; 748179237Sjb create->dtpd_name[DTRACE_NAMELEN - 1] = '\0'; 749179237Sjb 750179237Sjb mutex_enter(&dtrace_lock); 751179237Sjb err = dtrace_enabling_replicate(state, match, create); 752179237Sjb mutex_exit(&dtrace_lock); 753179237Sjb 754179237Sjb return (err); 755179237Sjb } 756179237Sjb case DTRACEIOC_STATUS: { 757179237Sjb dtrace_status_t *stat = (dtrace_status_t *) addr; 758179237Sjb dtrace_dstate_t *dstate; 759179237Sjb int i, j; 760179237Sjb uint64_t nerrs; 761179237Sjb 762179237Sjb DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_STATUS\n",__func__,__LINE__); 763179237Sjb 764179237Sjb /* 765179237Sjb * See the comment in dtrace_state_deadman() for the reason 766179237Sjb * for setting dts_laststatus to INT64_MAX before setting 767179237Sjb * it to the correct value. 768179237Sjb */ 769179237Sjb state->dts_laststatus = INT64_MAX; 770179237Sjb dtrace_membar_producer(); 771179237Sjb state->dts_laststatus = dtrace_gethrtime(); 772179237Sjb 773179237Sjb bzero(stat, sizeof (*stat)); 774179237Sjb 775179237Sjb mutex_enter(&dtrace_lock); 776179237Sjb 777179237Sjb if (state->dts_activity == DTRACE_ACTIVITY_INACTIVE) { 778179237Sjb mutex_exit(&dtrace_lock); 779179237Sjb return (ENOENT); 780179237Sjb } 781179237Sjb 782179237Sjb if (state->dts_activity == DTRACE_ACTIVITY_DRAINING) 783179237Sjb stat->dtst_exiting = 1; 784179237Sjb 785179237Sjb nerrs = state->dts_errors; 786179237Sjb dstate = &state->dts_vstate.dtvs_dynvars; 787179237Sjb 788179237Sjb for (i = 0; i < NCPU; i++) { 789179237Sjb#if !defined(sun) 790179237Sjb if (pcpu_find(i) == NULL) 791179237Sjb continue; 792179237Sjb#endif 793179237Sjb dtrace_dstate_percpu_t *dcpu = &dstate->dtds_percpu[i]; 794179237Sjb 795179237Sjb stat->dtst_dyndrops += dcpu->dtdsc_drops; 796179237Sjb stat->dtst_dyndrops_dirty += dcpu->dtdsc_dirty_drops; 797179237Sjb stat->dtst_dyndrops_rinsing += dcpu->dtdsc_rinsing_drops; 798179237Sjb 799179237Sjb if (state->dts_buffer[i].dtb_flags & DTRACEBUF_FULL) 800179237Sjb stat->dtst_filled++; 801179237Sjb 802179237Sjb nerrs += state->dts_buffer[i].dtb_errors; 803179237Sjb 804179237Sjb for (j = 0; j < state->dts_nspeculations; j++) { 805179237Sjb dtrace_speculation_t *spec; 806179237Sjb dtrace_buffer_t *buf; 807179237Sjb 808179237Sjb spec = &state->dts_speculations[j]; 809179237Sjb buf = &spec->dtsp_buffer[i]; 810179237Sjb stat->dtst_specdrops += buf->dtb_xamot_drops; 811179237Sjb } 812179237Sjb } 813179237Sjb 814179237Sjb stat->dtst_specdrops_busy = state->dts_speculations_busy; 815179237Sjb stat->dtst_specdrops_unavail = state->dts_speculations_unavail; 816179237Sjb stat->dtst_stkstroverflows = state->dts_stkstroverflows; 817179237Sjb stat->dtst_dblerrors = state->dts_dblerrors; 818179237Sjb stat->dtst_killed = 819179237Sjb (state->dts_activity == DTRACE_ACTIVITY_KILLED); 820179237Sjb stat->dtst_errors = nerrs; 821179237Sjb 822179237Sjb mutex_exit(&dtrace_lock); 823179237Sjb 824179237Sjb return (0); 825179237Sjb } 826179237Sjb case DTRACEIOC_STOP: { 827179237Sjb int rval; 828179237Sjb processorid_t *cpuid = (processorid_t *) addr; 829179237Sjb 830179237Sjb DTRACE_IOCTL_PRINTF("%s(%d): DTRACEIOC_STOP\n",__func__,__LINE__); 831179237Sjb 832179237Sjb mutex_enter(&dtrace_lock); 833179237Sjb rval = dtrace_state_stop(state, cpuid); 834179237Sjb mutex_exit(&dtrace_lock); 835179237Sjb 836179237Sjb return (rval); 837179237Sjb } 838179237Sjb default: 839179237Sjb error = ENOTTY; 840179237Sjb } 841179237Sjb return (error); 842179237Sjb} 843