plockstat.c revision 210236
1/* 2 * CDDL HEADER START 3 * 4 * The contents of this file are subject to the terms of the 5 * Common Development and Distribution License (the "License"). 6 * You may not use this file except in compliance with the License. 7 * 8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9 * or http://www.opensolaris.org/os/licensing. 10 * See the License for the specific language governing permissions 11 * and limitations under the License. 12 * 13 * When distributing Covered Code, include this CDDL HEADER in each 14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15 * If applicable, add the following below this CDDL HEADER, with the 16 * fields enclosed by brackets "[]" replaced with your own identifying 17 * information: Portions Copyright [yyyy] [name of copyright owner] 18 * 19 * CDDL HEADER END 20 */ 21 22/* 23 * Copyright 2006 Sun Microsystems, Inc. All rights reserved. 24 * Use is subject to license terms. 25 */ 26 27#pragma ident "%Z%%M% %I% %E% SMI" 28 29#include <assert.h> 30#include <dtrace.h> 31#include <limits.h> 32#include <link.h> 33#include <priv.h> 34#include <signal.h> 35#include <stdlib.h> 36#include <stdarg.h> 37#include <stdio.h> 38#include <string.h> 39#include <strings.h> 40#include <errno.h> 41#include <sys/wait.h> 42#include <libgen.h> 43#include <libproc.h> 44 45static char *g_pname; 46static dtrace_hdl_t *g_dtp; 47struct ps_prochandle *g_pr; 48 49#define E_SUCCESS 0 50#define E_ERROR 1 51#define E_USAGE 2 52 53/* 54 * For hold times we use a global associative array since for mutexes, in 55 * user-land, it's not invalid to release a sychonization primitive that 56 * another thread acquired; rwlocks require a thread-local associative array 57 * since multiple thread can hold the same lock for reading. Note that we 58 * ignore recursive mutex acquisitions and releases as they don't truly 59 * affect lock contention. 60 */ 61static const char *g_hold_init = 62"plockstat$target:::rw-acquire\n" 63"{\n" 64" self->rwhold[arg0] = timestamp;\n" 65"}\n" 66"plockstat$target:::mutex-acquire\n" 67"/arg1 == 0/\n" 68"{\n" 69" mtxhold[arg0] = timestamp;\n" 70"}\n"; 71 72static const char *g_hold_histogram = 73"plockstat$target:::rw-release\n" 74"/self->rwhold[arg0] && arg1 == 1/\n" 75"{\n" 76" @rw_w_hold[arg0, ustack()] =\n" 77" quantize(timestamp - self->rwhold[arg0]);\n" 78" self->rwhold[arg0] = 0;\n" 79" rw_w_hold_found = 1;\n" 80"}\n" 81"plockstat$target:::rw-release\n" 82"/self->rwhold[arg0]/\n" 83"{\n" 84" @rw_r_hold[arg0, ustack()] =\n" 85" quantize(timestamp - self->rwhold[arg0]);\n" 86" self->rwhold[arg0] = 0;\n" 87" rw_r_hold_found = 1;\n" 88"}\n" 89"plockstat$target:::mutex-release\n" 90"/mtxhold[arg0] && arg1 == 0/\n" 91"{\n" 92" @mtx_hold[arg0, ustack()] = quantize(timestamp - mtxhold[arg0]);\n" 93" mtxhold[arg0] = 0;\n" 94" mtx_hold_found = 1;\n" 95"}\n" 96"\n" 97"END\n" 98"/mtx_hold_found/\n" 99"{\n" 100" trace(\"Mutex hold\");\n" 101" printa(@mtx_hold);\n" 102"}\n" 103"END\n" 104"/rw_r_hold_found/\n" 105"{\n" 106" trace(\"R/W reader hold\");\n" 107" printa(@rw_r_hold);\n" 108"}\n" 109"END\n" 110"/rw_w_hold_found/\n" 111"{\n" 112" trace(\"R/W writer hold\");\n" 113" printa(@rw_w_hold);\n" 114"}\n"; 115 116static const char *g_hold_times = 117"plockstat$target:::rw-release\n" 118"/self->rwhold[arg0] && arg1 == 1/\n" 119"{\n" 120" @rw_w_hold[arg0, ustack(5)] = sum(timestamp - self->rwhold[arg0]);\n" 121" @rw_w_hold_count[arg0, ustack(5)] = count();\n" 122" self->rwhold[arg0] = 0;\n" 123" rw_w_hold_found = 1;\n" 124"}\n" 125"plockstat$target:::rw-release\n" 126"/self->rwhold[arg0]/\n" 127"{\n" 128" @rw_r_hold[arg0, ustack(5)] = sum(timestamp - self->rwhold[arg0]);\n" 129" @rw_r_hold_count[arg0, ustack(5)] = count();\n" 130" self->rwhold[arg0] = 0;\n" 131" rw_r_hold_found = 1;\n" 132"}\n" 133"plockstat$target:::mutex-release\n" 134"/mtxhold[arg0] && arg1 == 0/\n" 135"{\n" 136" @mtx_hold[arg0, ustack(5)] = sum(timestamp - mtxhold[arg0]);\n" 137" @mtx_hold_count[arg0, ustack(5)] = count();\n" 138" mtxhold[arg0] = 0;\n" 139" mtx_hold_found = 1;\n" 140"}\n" 141"\n" 142"END\n" 143"/mtx_hold_found/\n" 144"{\n" 145" trace(\"Mutex hold\");\n" 146" printa(@mtx_hold, @mtx_hold_count);\n" 147"}\n" 148"END\n" 149"/rw_r_hold_found/\n" 150"{\n" 151" trace(\"R/W reader hold\");\n" 152" printa(@rw_r_hold, @rw_r_hold_count);\n" 153"}\n" 154"END\n" 155"/rw_w_hold_found/\n" 156"{\n" 157" trace(\"R/W writer hold\");\n" 158" printa(@rw_w_hold, @rw_w_hold_count);\n" 159"}\n"; 160 161 162/* 163 * For contention, we use thread-local associative arrays since we're tracing 164 * a single thread's activity in libc and multiple threads can be blocking or 165 * spinning on the same sychonization primitive. 166 */ 167static const char *g_ctnd_init = 168"plockstat$target:::rw-block\n" 169"{\n" 170" self->rwblock[arg0] = timestamp;\n" 171"}\n" 172"plockstat$target:::mutex-block\n" 173"{\n" 174" self->mtxblock[arg0] = timestamp;\n" 175"}\n" 176"plockstat$target:::mutex-spin\n" 177"{\n" 178" self->mtxspin[arg0] = timestamp;\n" 179"}\n"; 180 181static const char *g_ctnd_histogram = 182"plockstat$target:::rw-blocked\n" 183"/self->rwblock[arg0] && arg1 == 1 && arg2 != 0/\n" 184"{\n" 185" @rw_w_block[arg0, ustack()] =\n" 186" quantize(timestamp - self->rwblock[arg0]);\n" 187" self->rwblock[arg0] = 0;\n" 188" rw_w_block_found = 1;\n" 189"}\n" 190"plockstat$target:::rw-blocked\n" 191"/self->rwblock[arg0] && arg2 != 0/\n" 192"{\n" 193" @rw_r_block[arg0, ustack()] =\n" 194" quantize(timestamp - self->rwblock[arg0]);\n" 195" self->rwblock[arg0] = 0;\n" 196" rw_r_block_found = 1;\n" 197"}\n" 198"plockstat$target:::rw-blocked\n" 199"/self->rwblock[arg0]/\n" 200"{\n" 201" self->rwblock[arg0] = 0;\n" 202"}\n" 203"plockstat$target:::mutex-spun\n" 204"/self->mtxspin[arg0] && arg1 != 0/\n" 205"{\n" 206" @mtx_spin[arg0, ustack()] =\n" 207" quantize(timestamp - self->mtxspin[arg0]);\n" 208" self->mtxspin[arg0] = 0;\n" 209" mtx_spin_found = 1;\n" 210"}\n" 211"plockstat$target:::mutex-spun\n" 212"/self->mtxspin[arg0]/\n" 213"{\n" 214" @mtx_vain_spin[arg0, ustack()] =\n" 215" quantize(timestamp - self->mtxspin[arg0]);\n" 216" self->mtxspin[arg0] = 0;\n" 217" mtx_vain_spin_found = 1;\n" 218"}\n" 219"plockstat$target:::mutex-blocked\n" 220"/self->mtxblock[arg0] && arg1 != 0/\n" 221"{\n" 222" @mtx_block[arg0, ustack()] =\n" 223" quantize(timestamp - self->mtxblock[arg0]);\n" 224" self->mtxblock[arg0] = 0;\n" 225" mtx_block_found = 1;\n" 226"}\n" 227"plockstat$target:::mutex-blocked\n" 228"/self->mtxblock[arg0]/\n" 229"{\n" 230" self->mtxblock[arg0] = 0;\n" 231"}\n" 232"\n" 233"END\n" 234"/mtx_block_found/\n" 235"{\n" 236" trace(\"Mutex block\");\n" 237" printa(@mtx_block);\n" 238"}\n" 239"END\n" 240"/mtx_spin_found/\n" 241"{\n" 242" trace(\"Mutex spin\");\n" 243" printa(@mtx_spin);\n" 244"}\n" 245"END\n" 246"/mtx_vain_spin_found/\n" 247"{\n" 248" trace(\"Mutex unsuccessful spin\");\n" 249" printa(@mtx_vain_spin);\n" 250"}\n" 251"END\n" 252"/rw_r_block_found/\n" 253"{\n" 254" trace(\"R/W reader block\");\n" 255" printa(@rw_r_block);\n" 256"}\n" 257"END\n" 258"/rw_w_block_found/\n" 259"{\n" 260" trace(\"R/W writer block\");\n" 261" printa(@rw_w_block);\n" 262"}\n"; 263 264 265static const char *g_ctnd_times = 266"plockstat$target:::rw-blocked\n" 267"/self->rwblock[arg0] && arg1 == 1 && arg2 != 0/\n" 268"{\n" 269" @rw_w_block[arg0, ustack(5)] =\n" 270" sum(timestamp - self->rwblock[arg0]);\n" 271" @rw_w_block_count[arg0, ustack(5)] = count();\n" 272" self->rwblock[arg0] = 0;\n" 273" rw_w_block_found = 1;\n" 274"}\n" 275"plockstat$target:::rw-blocked\n" 276"/self->rwblock[arg0] && arg2 != 0/\n" 277"{\n" 278" @rw_r_block[arg0, ustack(5)] =\n" 279" sum(timestamp - self->rwblock[arg0]);\n" 280" @rw_r_block_count[arg0, ustack(5)] = count();\n" 281" self->rwblock[arg0] = 0;\n" 282" rw_r_block_found = 1;\n" 283"}\n" 284"plockstat$target:::rw-blocked\n" 285"/self->rwblock[arg0]/\n" 286"{\n" 287" self->rwblock[arg0] = 0;\n" 288"}\n" 289"plockstat$target:::mutex-spun\n" 290"/self->mtxspin[arg0] && arg1 != 0/\n" 291"{\n" 292" @mtx_spin[arg0, ustack(5)] =\n" 293" sum(timestamp - self->mtxspin[arg0]);\n" 294" @mtx_spin_count[arg0, ustack(5)] = count();\n" 295" self->mtxspin[arg0] = 0;\n" 296" mtx_spin_found = 1;\n" 297"}\n" 298"plockstat$target:::mutex-spun\n" 299"/self->mtxspin[arg0]/\n" 300"{\n" 301" @mtx_vain_spin[arg0, ustack(5)] =\n" 302" sum(timestamp - self->mtxspin[arg0]);\n" 303" @mtx_vain_spin_count[arg0, ustack(5)] = count();\n" 304" self->mtxspin[arg0] = 0;\n" 305" mtx_vain_spin_found = 1;\n" 306"}\n" 307"plockstat$target:::mutex-blocked\n" 308"/self->mtxblock[arg0] && arg1 != 0/\n" 309"{\n" 310" @mtx_block[arg0, ustack(5)] =\n" 311" sum(timestamp - self->mtxblock[arg0]);\n" 312" @mtx_block_count[arg0, ustack(5)] = count();\n" 313" self->mtxblock[arg0] = 0;\n" 314" mtx_block_found = 1;\n" 315"}\n" 316"plockstat$target:::mutex-blocked\n" 317"/self->mtxblock[arg0]/\n" 318"{\n" 319" self->mtxblock[arg0] = 0;\n" 320"}\n" 321"\n" 322"END\n" 323"/mtx_block_found/\n" 324"{\n" 325" trace(\"Mutex block\");\n" 326" printa(@mtx_block, @mtx_block_count);\n" 327"}\n" 328"END\n" 329"/mtx_spin_found/\n" 330"{\n" 331" trace(\"Mutex spin\");\n" 332" printa(@mtx_spin, @mtx_spin_count);\n" 333"}\n" 334"END\n" 335"/mtx_vain_spin_found/\n" 336"{\n" 337" trace(\"Mutex unsuccessful spin\");\n" 338" printa(@mtx_vain_spin, @mtx_vain_spin_count);\n" 339"}\n" 340"END\n" 341"/rw_r_block_found/\n" 342"{\n" 343" trace(\"R/W reader block\");\n" 344" printa(@rw_r_block, @rw_r_block_count);\n" 345"}\n" 346"END\n" 347"/rw_w_block_found/\n" 348"{\n" 349" trace(\"R/W writer block\");\n" 350" printa(@rw_w_block, @rw_w_block_count);\n" 351"}\n"; 352 353static char g_prog[4096]; 354static size_t g_proglen; 355static int g_opt_V, g_opt_s; 356static int g_intr; 357static int g_exited; 358static dtrace_optval_t g_nframes; 359static ulong_t g_nent = ULONG_MAX; 360 361#define PLOCKSTAT_OPTSTR "n:ps:e:vx:ACHV" 362 363static void 364usage(void) 365{ 366 (void) fprintf(stderr, "Usage:\n" 367 "\t%s [-vACHV] [-n count] [-s depth] [-e secs] [-x opt[=val]]\n" 368 "\t command [arg...]\n" 369 "\t%s [-vACHV] [-n count] [-s depth] [-e secs] [-x opt[=val]]\n" 370 "\t -p pid\n", g_pname, g_pname); 371 372 exit(E_USAGE); 373} 374 375static void 376verror(const char *fmt, va_list ap) 377{ 378 int error = errno; 379 380 (void) fprintf(stderr, "%s: ", g_pname); 381 (void) vfprintf(stderr, fmt, ap); 382 383 if (fmt[strlen(fmt) - 1] != '\n') 384 (void) fprintf(stderr, ": %s\n", strerror(error)); 385} 386 387/*PRINTFLIKE1*/ 388static void 389fatal(const char *fmt, ...) 390{ 391 va_list ap; 392 393 va_start(ap, fmt); 394 verror(fmt, ap); 395 va_end(ap); 396 397 if (g_pr != NULL && g_dtp != NULL) 398 dtrace_proc_release(g_dtp, g_pr); 399 400 exit(E_ERROR); 401} 402 403/*PRINTFLIKE1*/ 404static void 405dfatal(const char *fmt, ...) 406{ 407 va_list ap; 408 409 va_start(ap, fmt); 410 411 (void) fprintf(stderr, "%s: ", g_pname); 412 if (fmt != NULL) 413 (void) vfprintf(stderr, fmt, ap); 414 415 va_end(ap); 416 417 if (fmt != NULL && fmt[strlen(fmt) - 1] != '\n') { 418 (void) fprintf(stderr, ": %s\n", 419 dtrace_errmsg(g_dtp, dtrace_errno(g_dtp))); 420 } else if (fmt == NULL) { 421 (void) fprintf(stderr, "%s\n", 422 dtrace_errmsg(g_dtp, dtrace_errno(g_dtp))); 423 } 424 425 if (g_pr != NULL) { 426 dtrace_proc_continue(g_dtp, g_pr); 427 dtrace_proc_release(g_dtp, g_pr); 428 } 429 430 exit(E_ERROR); 431} 432 433/*PRINTFLIKE1*/ 434static void 435notice(const char *fmt, ...) 436{ 437 va_list ap; 438 439 va_start(ap, fmt); 440 verror(fmt, ap); 441 va_end(ap); 442} 443 444static void 445dprog_add(const char *prog) 446{ 447 size_t len = strlen(prog); 448 bcopy(prog, g_prog + g_proglen, len + 1); 449 g_proglen += len; 450 assert(g_proglen < sizeof (g_prog)); 451} 452 453static void 454dprog_compile(void) 455{ 456 dtrace_prog_t *prog; 457 dtrace_proginfo_t info; 458 459 if (g_opt_V) { 460 (void) fprintf(stderr, "%s: vvvv D program vvvv\n", g_pname); 461 (void) fputs(g_prog, stderr); 462 (void) fprintf(stderr, "%s: ^^^^ D program ^^^^\n", g_pname); 463 } 464 465 if ((prog = dtrace_program_strcompile(g_dtp, g_prog, 466 DTRACE_PROBESPEC_NAME, 0, 0, NULL)) == NULL) 467 dfatal("failed to compile program"); 468 469 if (dtrace_program_exec(g_dtp, prog, &info) == -1) 470 dfatal("failed to enable probes"); 471} 472 473void 474print_legend(void) 475{ 476 (void) printf("%5s %8s %-28s %s\n", "Count", "nsec", "Lock", "Caller"); 477} 478 479void 480print_bar(void) 481{ 482 (void) printf("---------------------------------------" 483 "----------------------------------------\n"); 484} 485 486void 487print_histogram_header(void) 488{ 489 (void) printf("\n%10s ---- Time Distribution --- %5s %s\n", 490 "nsec", "count", "Stack"); 491} 492 493/* 494 * Convert an address to a symbolic string or a numeric string. If nolocks 495 * is set, we return an error code if this symbol appears to be a mutex- or 496 * rwlock-related symbol in libc so the caller has a chance to find a more 497 * helpful symbol. 498 */ 499static int 500getsym(struct ps_prochandle *P, uintptr_t addr, char *buf, size_t size, 501 int nolocks) 502{ 503 char name[256]; 504 GElf_Sym sym; 505 prsyminfo_t info; 506 size_t len; 507 508 if (P == NULL || Pxlookup_by_addr(P, addr, name, sizeof (name), 509 &sym, &info) != 0) { 510 (void) snprintf(buf, size, "%#lx", addr); 511 return (0); 512 } 513 if (info.prs_object == NULL) 514 info.prs_object = "<unknown>"; 515 516 if (info.prs_lmid != LM_ID_BASE) { 517 len = snprintf(buf, size, "LM%lu`", info.prs_lmid); 518 buf += len; 519 size -= len; 520 } 521 522 len = snprintf(buf, size, "%s`%s", info.prs_object, info.prs_name); 523 buf += len; 524 size -= len; 525 526 if (sym.st_value != addr) 527 len = snprintf(buf, size, "+%#lx", addr - sym.st_value); 528 529 if (nolocks && strcmp("libc.so.1", info.prs_object) == 0 && 530 (strstr("mutex", info.prs_name) == 0 || 531 strstr("rw", info.prs_name) == 0)) 532 return (-1); 533 534 return (0); 535} 536 537/*ARGSUSED*/ 538static int 539process_aggregate(const dtrace_aggdata_t **aggsdata, int naggvars, void *arg) 540{ 541 const dtrace_recdesc_t *rec; 542 uintptr_t lock; 543 uint64_t *stack; 544 caddr_t data; 545 pid_t pid; 546 struct ps_prochandle *P; 547 char buf[256]; 548 int i, j; 549 uint64_t sum, count, avg; 550 551 if ((*(uint_t *)arg)++ >= g_nent) 552 return (DTRACE_AGGWALK_NEXT); 553 554 rec = aggsdata[0]->dtada_desc->dtagd_rec; 555 data = aggsdata[0]->dtada_data; 556 557 /*LINTED - alignment*/ 558 lock = (uintptr_t)*(uint64_t *)(data + rec[1].dtrd_offset); 559 /*LINTED - alignment*/ 560 stack = (uint64_t *)(data + rec[2].dtrd_offset); 561 562 if (!g_opt_s) { 563 /*LINTED - alignment*/ 564 sum = *(uint64_t *)(aggsdata[1]->dtada_data + 565 aggsdata[1]->dtada_desc->dtagd_rec[3].dtrd_offset); 566 /*LINTED - alignment*/ 567 count = *(uint64_t *)(aggsdata[2]->dtada_data + 568 aggsdata[2]->dtada_desc->dtagd_rec[3].dtrd_offset); 569 } else { 570 uint64_t *a; 571 572 /*LINTED - alignment*/ 573 a = (uint64_t *)(aggsdata[1]->dtada_data + 574 aggsdata[1]->dtada_desc->dtagd_rec[3].dtrd_offset); 575 576 print_bar(); 577 print_legend(); 578 579 for (count = sum = 0, i = DTRACE_QUANTIZE_ZEROBUCKET, j = 0; 580 i < DTRACE_QUANTIZE_NBUCKETS; i++, j++) { 581 count += a[i]; 582 sum += a[i] << (j - 64); 583 } 584 } 585 586 avg = sum / count; 587 (void) printf("%5llu %8llu ", (u_longlong_t)count, (u_longlong_t)avg); 588 589 pid = stack[0]; 590 P = dtrace_proc_grab(g_dtp, pid, PGRAB_RDONLY); 591 592 (void) getsym(P, lock, buf, sizeof (buf), 0); 593 (void) printf("%-28s ", buf); 594 595 for (i = 2; i <= 5; i++) { 596 if (getsym(P, stack[i], buf, sizeof (buf), 1) == 0) 597 break; 598 } 599 (void) printf("%s\n", buf); 600 601 if (g_opt_s) { 602 int stack_done = 0; 603 int quant_done = 0; 604 int first_bin, last_bin; 605 uint64_t bin_size, *a; 606 607 /*LINTED - alignment*/ 608 a = (uint64_t *)(aggsdata[1]->dtada_data + 609 aggsdata[1]->dtada_desc->dtagd_rec[3].dtrd_offset); 610 611 print_histogram_header(); 612 613 for (first_bin = DTRACE_QUANTIZE_ZEROBUCKET; 614 a[first_bin] == 0; first_bin++) 615 continue; 616 for (last_bin = DTRACE_QUANTIZE_ZEROBUCKET + 63; 617 a[last_bin] == 0; last_bin--) 618 continue; 619 620 for (i = 0; !stack_done || !quant_done; i++) { 621 if (!stack_done) { 622 (void) getsym(P, stack[i + 2], buf, 623 sizeof (buf), 0); 624 } else { 625 buf[0] = '\0'; 626 } 627 628 if (!quant_done) { 629 bin_size = a[first_bin]; 630 631 (void) printf("%10llu |%-24.*s| %5llu %s\n", 632 1ULL << 633 (first_bin - DTRACE_QUANTIZE_ZEROBUCKET), 634 (int)(24.0 * bin_size / count), 635 "@@@@@@@@@@@@@@@@@@@@@@@@@@", 636 (u_longlong_t)bin_size, buf); 637 } else { 638 (void) printf("%43s %s\n", "", buf); 639 } 640 641 if (i + 1 >= g_nframes || stack[i + 3] == 0) 642 stack_done = 1; 643 644 if (first_bin++ == last_bin) 645 quant_done = 1; 646 } 647 } 648 649 dtrace_proc_release(g_dtp, P); 650 651 return (DTRACE_AGGWALK_NEXT); 652} 653 654/*ARGSUSED*/ 655static void 656prochandler(struct ps_prochandle *P, const char *msg, void *arg) 657{ 658 const psinfo_t *prp = Ppsinfo(P); 659 int pid = Pstatus(P)->pr_pid; 660 char name[SIG2STR_MAX]; 661 662 if (msg != NULL) { 663 notice("pid %d: %s\n", pid, msg); 664 return; 665 } 666 667 switch (Pstate(P)) { 668 case PS_UNDEAD: 669 /* 670 * Ideally we would like to always report pr_wstat here, but it 671 * isn't possible given current /proc semantics. If we grabbed 672 * the process, Ppsinfo() will either fail or return a zeroed 673 * psinfo_t depending on how far the parent is in reaping it. 674 * When /proc provides a stable pr_wstat in the status file, 675 * this code can be improved by examining this new pr_wstat. 676 */ 677 if (prp != NULL && WIFSIGNALED(prp->pr_wstat)) { 678 notice("pid %d terminated by %s\n", pid, 679 proc_signame(WTERMSIG(prp->pr_wstat), 680 name, sizeof (name))); 681 } else if (prp != NULL && WEXITSTATUS(prp->pr_wstat) != 0) { 682 notice("pid %d exited with status %d\n", 683 pid, WEXITSTATUS(prp->pr_wstat)); 684 } else { 685 notice("pid %d has exited\n", pid); 686 } 687 g_exited = 1; 688 break; 689 690 case PS_LOST: 691 notice("pid %d exec'd a set-id or unobservable program\n", pid); 692 g_exited = 1; 693 break; 694 } 695} 696 697/*ARGSUSED*/ 698static int 699chewrec(const dtrace_probedata_t *data, const dtrace_recdesc_t *rec, void *arg) 700{ 701 dtrace_eprobedesc_t *epd = data->dtpda_edesc; 702 dtrace_aggvarid_t aggvars[2]; 703 const void *buf; 704 int i, nagv; 705 706 /* 707 * A NULL rec indicates that we've processed the last record. 708 */ 709 if (rec == NULL) 710 return (DTRACE_CONSUME_NEXT); 711 712 buf = data->dtpda_data - rec->dtrd_offset; 713 714 switch (rec->dtrd_action) { 715 case DTRACEACT_DIFEXPR: 716 (void) printf("\n%s\n\n", (char *)buf + rec->dtrd_offset); 717 if (!g_opt_s) { 718 print_legend(); 719 print_bar(); 720 } 721 return (DTRACE_CONSUME_NEXT); 722 723 case DTRACEACT_PRINTA: 724 for (nagv = 0, i = 0; i < epd->dtepd_nrecs - 1; i++) { 725 const dtrace_recdesc_t *nrec = &rec[i]; 726 727 if (nrec->dtrd_uarg != rec->dtrd_uarg) 728 break; 729 730 /*LINTED - alignment*/ 731 aggvars[nagv++] = *(dtrace_aggvarid_t *)((caddr_t)buf + 732 nrec->dtrd_offset); 733 } 734 735 if (nagv == (g_opt_s ? 1 : 2)) { 736 uint_t nent = 0; 737 if (dtrace_aggregate_walk_joined(g_dtp, aggvars, nagv, 738 process_aggregate, &nent) != 0) 739 dfatal("failed to walk aggregate"); 740 } 741 742 return (DTRACE_CONSUME_NEXT); 743 } 744 745 return (DTRACE_CONSUME_THIS); 746} 747 748/*ARGSUSED*/ 749static void 750intr(int signo) 751{ 752 g_intr = 1; 753} 754 755int 756main(int argc, char **argv) 757{ 758 ucred_t *ucp; 759 int err; 760 int opt_C = 0, opt_H = 0, opt_p = 0, opt_v = 0; 761 char c, *p, *end; 762 struct sigaction act; 763 int done = 0; 764 765 g_pname = basename(argv[0]); 766 argv[0] = g_pname; /* rewrite argv[0] for getopt errors */ 767 768 /* 769 * Make sure we have the required dtrace_proc privilege. 770 */ 771 if ((ucp = ucred_get(getpid())) != NULL) { 772 const priv_set_t *psp; 773 if ((psp = ucred_getprivset(ucp, PRIV_EFFECTIVE)) != NULL && 774 !priv_ismember(psp, PRIV_DTRACE_PROC)) { 775 fatal("dtrace_proc privilege required\n"); 776 } 777 778 ucred_free(ucp); 779 } 780 781 while ((c = getopt(argc, argv, PLOCKSTAT_OPTSTR)) != EOF) { 782 switch (c) { 783 case 'n': 784 errno = 0; 785 g_nent = strtoul(optarg, &end, 10); 786 if (*end != '\0' || errno != 0) { 787 (void) fprintf(stderr, "%s: invalid count " 788 "'%s'\n", g_pname, optarg); 789 usage(); 790 } 791 break; 792 793 case 'p': 794 opt_p = 1; 795 break; 796 797 case 'v': 798 opt_v = 1; 799 break; 800 801 case 'A': 802 opt_C = opt_H = 1; 803 break; 804 805 case 'C': 806 opt_C = 1; 807 break; 808 809 case 'H': 810 opt_H = 1; 811 break; 812 813 case 'V': 814 g_opt_V = 1; 815 break; 816 817 default: 818 if (strchr(PLOCKSTAT_OPTSTR, c) == NULL) 819 usage(); 820 } 821 } 822 823 /* 824 * We need a command or at least one pid. 825 */ 826 if (argc == optind) 827 usage(); 828 829 if (opt_C == 0 && opt_H == 0) 830 opt_C = 1; 831 832 if ((g_dtp = dtrace_open(DTRACE_VERSION, 0, &err)) == NULL) 833 fatal("failed to initialize dtrace: %s\n", 834 dtrace_errmsg(NULL, err)); 835 836 /* 837 * The longest string we trace is 23 bytes long -- so 32 is plenty. 838 */ 839 if (dtrace_setopt(g_dtp, "strsize", "32") == -1) 840 dfatal("failed to set 'strsize'"); 841 842 /* 843 * 1k should be more than enough for all trace() and printa() actions. 844 */ 845 if (dtrace_setopt(g_dtp, "bufsize", "1k") == -1) 846 dfatal("failed to set 'bufsize'"); 847 848 /* 849 * The table we produce has the hottest locks at the top. 850 */ 851 if (dtrace_setopt(g_dtp, "aggsortrev", NULL) == -1) 852 dfatal("failed to set 'aggsortrev'"); 853 854 /* 855 * These are two reasonable defaults which should suffice. 856 */ 857 if (dtrace_setopt(g_dtp, "aggsize", "256k") == -1) 858 dfatal("failed to set 'aggsize'"); 859 if (dtrace_setopt(g_dtp, "aggrate", "1sec") == -1) 860 dfatal("failed to set 'aggrate'"); 861 862 /* 863 * Take a second pass through to look for options that set options now 864 * that we have an open dtrace handle. 865 */ 866 optind = 1; 867 while ((c = getopt(argc, argv, PLOCKSTAT_OPTSTR)) != EOF) { 868 switch (c) { 869 case 's': 870 g_opt_s = 1; 871 if (dtrace_setopt(g_dtp, "ustackframes", optarg) == -1) 872 dfatal("failed to set 'ustackframes'"); 873 break; 874 875 case 'x': 876 if ((p = strchr(optarg, '=')) != NULL) 877 *p++ = '\0'; 878 879 if (dtrace_setopt(g_dtp, optarg, p) != 0) 880 dfatal("failed to set -x %s", optarg); 881 break; 882 883 case 'e': 884 errno = 0; 885 (void) strtoul(optarg, &end, 10); 886 if (*optarg == '-' || *end != '\0' || errno != 0) { 887 (void) fprintf(stderr, "%s: invalid timeout " 888 "'%s'\n", g_pname, optarg); 889 usage(); 890 } 891 892 /* 893 * Construct a DTrace enabling that will exit after 894 * the specified number of seconds. 895 */ 896 dprog_add("BEGIN\n{\n\tend = timestamp + "); 897 dprog_add(optarg); 898 dprog_add(" * 1000000000;\n}\n"); 899 dprog_add("tick-10hz\n/timestamp >= end/\n"); 900 dprog_add("{\n\texit(0);\n}\n"); 901 break; 902 } 903 } 904 905 argc -= optind; 906 argv += optind; 907 908 if (opt_H) { 909 dprog_add(g_hold_init); 910 if (g_opt_s == NULL) 911 dprog_add(g_hold_times); 912 else 913 dprog_add(g_hold_histogram); 914 } 915 916 if (opt_C) { 917 dprog_add(g_ctnd_init); 918 if (g_opt_s == NULL) 919 dprog_add(g_ctnd_times); 920 else 921 dprog_add(g_ctnd_histogram); 922 } 923 924 if (opt_p) { 925 ulong_t pid; 926 927 if (argc > 1) { 928 (void) fprintf(stderr, "%s: only one pid is allowed\n", 929 g_pname); 930 usage(); 931 } 932 933 errno = 0; 934 pid = strtoul(argv[0], &end, 10); 935 if (*end != '\0' || errno != 0 || (pid_t)pid != pid) { 936 (void) fprintf(stderr, "%s: invalid pid '%s'\n", 937 g_pname, argv[0]); 938 usage(); 939 } 940 941 if ((g_pr = dtrace_proc_grab(g_dtp, (pid_t)pid, 0)) == NULL) 942 dfatal(NULL); 943 } else { 944 if ((g_pr = dtrace_proc_create(g_dtp, argv[0], argv)) == NULL) 945 dfatal(NULL); 946 } 947 948 dprog_compile(); 949 950 if (dtrace_handle_proc(g_dtp, &prochandler, NULL) == -1) 951 dfatal("failed to establish proc handler"); 952 953 (void) sigemptyset(&act.sa_mask); 954 act.sa_flags = 0; 955 act.sa_handler = intr; 956 (void) sigaction(SIGINT, &act, NULL); 957 (void) sigaction(SIGTERM, &act, NULL); 958 959 if (dtrace_go(g_dtp) != 0) 960 dfatal("dtrace_go()"); 961 962 if (dtrace_getopt(g_dtp, "ustackframes", &g_nframes) != 0) 963 dfatal("failed to get 'ustackframes'"); 964 965 dtrace_proc_continue(g_dtp, g_pr); 966 967 if (opt_v) 968 (void) printf("%s: tracing enabled for pid %d\n", g_pname, 969 (int)Pstatus(g_pr)->pr_pid); 970 971 do { 972 if (!g_intr && !done) 973 dtrace_sleep(g_dtp); 974 975 if (done || g_intr || g_exited) { 976 done = 1; 977 if (dtrace_stop(g_dtp) == -1) 978 dfatal("couldn't stop tracing"); 979 } 980 981 switch (dtrace_work(g_dtp, stdout, NULL, chewrec, NULL)) { 982 case DTRACE_WORKSTATUS_DONE: 983 done = 1; 984 break; 985 case DTRACE_WORKSTATUS_OKAY: 986 break; 987 default: 988 dfatal("processing aborted"); 989 } 990 991 } while (!done); 992 993 dtrace_close(g_dtp); 994 995 return (0); 996} 997