pmcstat_log.c revision 210794
168349Sobrien/*-
268349Sobrien * Copyright (c) 2005-2007, Joseph Koshy
3354939Sdelphij * Copyright (c) 2007 The FreeBSD Foundation
468349Sobrien * All rights reserved.
568349Sobrien *
668349Sobrien * Portions of this software were developed by A. Joseph Koshy under
768349Sobrien * sponsorship from the FreeBSD Foundation and Google, Inc.
8328874Seadler *
9298192Sdelphij * Redistribution and use in source and binary forms, with or without
10298192Sdelphij * modification, are permitted provided that the following conditions
11298192Sdelphij * are met:
12298192Sdelphij * 1. Redistributions of source code must retain the above copyright
13298192Sdelphij *    notice, this list of conditions and the following disclaimer.
14328874Seadler * 2. Redistributions in binary form must reproduce the above copyright
15354939Sdelphij *    notice, this list of conditions and the following disclaimer in the
16298192Sdelphij *    documentation and/or other materials provided with the distribution.
17298192Sdelphij *
18328874Seadler * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
19328874Seadler * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20298192Sdelphij * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21298192Sdelphij * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
22298192Sdelphij * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
23298192Sdelphij * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
24328874Seadler * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
25298192Sdelphij * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
26298192Sdelphij * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
27298192Sdelphij * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
28298192Sdelphij * SUCH DAMAGE.
29103373Sobrien */
30103373Sobrien
31103373Sobrien/*
32103373Sobrien * Transform a hwpmc(4) log into human readable form, and into
33103373Sobrien * gprof(1) compatible profiles.
34103373Sobrien */
35103373Sobrien
36103373Sobrien#include <sys/cdefs.h>
37103373Sobrien__FBSDID("$FreeBSD: head/usr.sbin/pmcstat/pmcstat_log.c 210794 2010-08-03 09:23:53Z fabient $");
38
39#include <sys/param.h>
40#include <sys/endian.h>
41#include <sys/gmon.h>
42#include <sys/imgact_aout.h>
43#include <sys/imgact_elf.h>
44#include <sys/mman.h>
45#include <sys/pmc.h>
46#include <sys/queue.h>
47#include <sys/socket.h>
48#include <sys/stat.h>
49#include <sys/wait.h>
50
51#include <netinet/in.h>
52
53#include <assert.h>
54#include <curses.h>
55#include <err.h>
56#include <errno.h>
57#include <fcntl.h>
58#include <gelf.h>
59#include <libgen.h>
60#include <limits.h>
61#include <netdb.h>
62#include <pmc.h>
63#include <pmclog.h>
64#include <sysexits.h>
65#include <stdint.h>
66#include <stdio.h>
67#include <stdlib.h>
68#include <string.h>
69#include <unistd.h>
70
71#include "pmcstat.h"
72#include "pmcstat_log.h"
73#include "pmcstat_top.h"
74
75#define	PMCSTAT_ALLOCATE		1
76
77/*
78 * PUBLIC INTERFACES
79 *
80 * pmcstat_initialize_logging()	initialize this module, called first
81 * pmcstat_shutdown_logging()		orderly shutdown, called last
82 * pmcstat_open_log()			open an eventlog for processing
83 * pmcstat_process_log()		print/convert an event log
84 * pmcstat_display_log()		top mode display for the log
85 * pmcstat_close_log()			finish processing an event log
86 *
87 * IMPLEMENTATION NOTES
88 *
89 * We correlate each 'callchain' or 'sample' entry seen in the event
90 * log back to an executable object in the system. Executable objects
91 * include:
92 * 	- program executables,
93 *	- shared libraries loaded by the runtime loader,
94 *	- dlopen()'ed objects loaded by the program,
95 *	- the runtime loader itself,
96 *	- the kernel and kernel modules.
97 *
98 * Each process that we know about is treated as a set of regions that
99 * map to executable objects.  Processes are described by
100 * 'pmcstat_process' structures.  Executable objects are tracked by
101 * 'pmcstat_image' structures.  The kernel and kernel modules are
102 * common to all processes (they reside at the same virtual addresses
103 * for all processes).  Individual processes can have their text
104 * segments and shared libraries loaded at process-specific locations.
105 *
106 * A given executable object can be in use by multiple processes
107 * (e.g., libc.so) and loaded at a different address in each.
108 * pmcstat_pcmap structures track per-image mappings.
109 *
110 * The sample log could have samples from multiple PMCs; we
111 * generate one 'gmon.out' profile per PMC.
112 *
113 * IMPLEMENTATION OF GMON OUTPUT
114 *
115 * Each executable object gets one 'gmon.out' profile, per PMC in
116 * use.  Creation of 'gmon.out' profiles is done lazily.  The
117 * 'gmon.out' profiles generated for a given sampling PMC are
118 * aggregates of all the samples for that particular executable
119 * object.
120 *
121 * IMPLEMENTATION OF SYSTEM-WIDE CALLGRAPH OUTPUT
122 *
123 * Each active pmcid has its own callgraph structure, described by a
124 * 'struct pmcstat_callgraph'.  Given a process id and a list of pc
125 * values, we map each pc value to a tuple (image, symbol), where
126 * 'image' denotes an executable object and 'symbol' is the closest
127 * symbol that precedes the pc value.  Each pc value in the list is
128 * also given a 'rank' that reflects its depth in the call stack.
129 */
130
/*
 * List of all known PMC records; entries are added by
 * pmcstat_pmcid_add() and linked through 'pr_next'.
 */
struct pmcstat_pmcs pmcstat_pmcs = LIST_HEAD_INITIALIZER(pmcstat_pmcs);

/*
 * All image descriptors are kept in a hash table.  The bucket is
 * selected by the hash of the image's interned executable path.
 */
struct pmcstat_image_hash_list pmcstat_image_hash[PMCSTAT_NHASH];

/*
 * All process descriptors are kept in a hash table.
 */
struct pmcstat_process_hash_list pmcstat_process_hash[PMCSTAT_NHASH];

struct pmcstat_stats pmcstat_stats; /* statistics */
int ps_samples_period; /* samples count between top refresh. */

struct pmcstat_process *pmcstat_kernproc; /* kernel 'process' */
147
148#include "pmcpl_gprof.h"
149#include "pmcpl_callgraph.h"
150#include "pmcpl_annotate.h"
151#include "pmcpl_calltree.h"
152
/*
 * Descriptor for a post-processing plugin.  Every hook is optional:
 * the callers visible in this file test a hook against NULL before
 * invoking it.  The 'plugins' table is indexed by args.pa_plugin and
 * args.pa_pplugin and is terminated by an entry whose 'pl_name' is
 * NULL.
 */
struct pmc_plugins  {
	const char 	*pl_name;	/* name */

	/* configure */
	int (*pl_configure)(char *opt);

	/* init and shutdown */
	int (*pl_init)(void);
	void (*pl_shutdown)(FILE *mf);

	/* sample processing */
	void (*pl_process)(struct pmcstat_process *pp,
	    struct pmcstat_pmcrecord *pmcr, uint32_t nsamples,
	    uintfptr_t *cc, int usermode, uint32_t cpu);

	/* image: called when an image descriptor is created/destroyed */
	void (*pl_initimage)(struct pmcstat_image *pi);
	void (*pl_shutdownimage)(struct pmcstat_image *pi);

	/* pmc: called when a new PMC record has been allocated */
	void (*pl_newpmc)(pmcstat_interned_string ps,
		struct pmcstat_pmcrecord *pr);

	/* top display */
	void (*pl_topdisplay)(void);

	/* top keypress */
	int (*pl_topkeypress)(int c, WINDOW *w);

} plugins[] = {
	{
		/* Placeholder entry that provides no hooks at all. */
		.pl_name		= "none",
	},
	{
		.pl_name		= "callgraph",
		.pl_init		= pmcpl_cg_init,
		.pl_shutdown		= pmcpl_cg_shutdown,
		.pl_process		= pmcpl_cg_process,
		.pl_topkeypress		= pmcpl_cg_topkeypress,
		.pl_topdisplay		= pmcpl_cg_topdisplay
	},
	{
		.pl_name		= "gprof",
		.pl_shutdown		= pmcpl_gmon_shutdown,
		.pl_process		= pmcpl_gmon_process,
		.pl_initimage		= pmcpl_gmon_initimage,
		.pl_shutdownimage	= pmcpl_gmon_shutdownimage,
		.pl_newpmc		= pmcpl_gmon_newpmc
	},
	{
		.pl_name		= "annotate",
		.pl_process		= pmcpl_annotate_process
	},
	{
		.pl_name		= "calltree",
		.pl_configure		= pmcpl_ct_configure,
		.pl_init		= pmcpl_ct_init,
		.pl_shutdown		= pmcpl_ct_shutdown,
		.pl_process		= pmcpl_ct_process,
		.pl_topkeypress		= pmcpl_ct_topkeypress,
		.pl_topdisplay		= pmcpl_ct_topdisplay
	},
	{
		/* End-of-table marker. */
		.pl_name		= NULL
	}
};
219
/*
 * When non-zero, pmcstat_lookup_pmcid() returns the 'pr_merge' record
 * of a PMC instead of the PMC's own record.
 */
int pmcstat_mergepmc;

int pmcstat_pmcinfilter = 0; /* PMC filter for top mode. */
float pmcstat_threshold = 0.5; /* Cost filter for top mode. */
224
/*
 * Prototypes
 *
 * Forward declarations of the file-local (static) helpers.
 */

/* Image descriptors. */
static struct pmcstat_image *pmcstat_image_from_path(pmcstat_interned_string
    _path, int _iskernelmodule);
static void pmcstat_image_get_aout_params(struct pmcstat_image *_image);
static void pmcstat_image_get_elf_params(struct pmcstat_image *_image);
static void	pmcstat_image_link(struct pmcstat_process *_pp,
    struct pmcstat_image *_i, uintfptr_t _lpc);

/* PMC id to name mapping. */
static void	pmcstat_pmcid_add(pmc_id_t _pmcid,
    pmcstat_interned_string _name);

/* Process descriptors. */
static void	pmcstat_process_aout_exec(struct pmcstat_process *_pp,
    struct pmcstat_image *_image, uintfptr_t _entryaddr);
static void	pmcstat_process_elf_exec(struct pmcstat_process *_pp,
    struct pmcstat_image *_image, uintfptr_t _entryaddr);
static void	pmcstat_process_exec(struct pmcstat_process *_pp,
    pmcstat_interned_string _path, uintfptr_t _entryaddr);
static struct pmcstat_process *pmcstat_process_lookup(pid_t _pid,
    int _allocate);

/* Interned strings and statistics. */
static int	pmcstat_string_compute_hash(const char *_string);
static void pmcstat_string_initialize(void);
static int	pmcstat_string_lookup_hash(pmcstat_interned_string _is);
static void pmcstat_string_shutdown(void);
static void pmcstat_stats_reset(int _reset_global);
252
/*
 * A simple implementation of interned strings.  Each interned string
 * is assigned a unique address, so that subsequent string compares
 * can be done by a simple pointer comparison instead of using
 * strcmp().  This speeds up hash table lookups and saves memory if
 * duplicate strings are the norm.
 */
struct pmcstat_string {
	LIST_ENTRY(pmcstat_string)	ps_next;	/* hash link */
	int		ps_len;		/* strlen() of ps_string */
	int		ps_hash;	/* hash bucket of ps_string */
	char		*ps_string;	/* strdup()'ed copy of the text */
};

/* Hash buckets holding every interned string. */
static LIST_HEAD(,pmcstat_string)	pmcstat_string_hash[PMCSTAT_NHASH];
268
/*
 * PMC count.  Incremented by pmcstat_pmcid_add() each time a new PMC
 * record is allocated; the pre-increment value becomes the record's
 * index ('pr_pmcin').
 */
int pmcstat_npmcs;

/*
 * PMC Top mode pause state.
 */
int pmcstat_pause;
278
279static void
280pmcstat_stats_reset(int reset_global)
281{
282	struct pmcstat_pmcrecord *pr;
283
284	/* Flush PMCs stats. */
285	LIST_FOREACH(pr, &pmcstat_pmcs, pr_next) {
286		pr->pr_samples = 0;
287		pr->pr_dubious_frames = 0;
288	}
289	ps_samples_period = 0;
290
291	/* Flush global stats. */
292	if (reset_global)
293		bzero(&pmcstat_stats, sizeof(struct pmcstat_stats));
294}
295
296/*
297 * Compute a 'hash' value for a string.
298 */
299
300static int
301pmcstat_string_compute_hash(const char *s)
302{
303	int hash;
304
305	for (hash = 0; *s; s++)
306		hash ^= *s;
307
308	return (hash & PMCSTAT_HASH_MASK);
309}
310
311/*
312 * Intern a copy of string 's', and return a pointer to the
313 * interned structure.
314 */
315
316pmcstat_interned_string
317pmcstat_string_intern(const char *s)
318{
319	struct pmcstat_string *ps;
320	const struct pmcstat_string *cps;
321	int hash, len;
322
323	if ((cps = pmcstat_string_lookup(s)) != NULL)
324		return (cps);
325
326	hash = pmcstat_string_compute_hash(s);
327	len  = strlen(s);
328
329	if ((ps = malloc(sizeof(*ps))) == NULL)
330		err(EX_OSERR, "ERROR: Could not intern string");
331	ps->ps_len = len;
332	ps->ps_hash = hash;
333	ps->ps_string = strdup(s);
334	LIST_INSERT_HEAD(&pmcstat_string_hash[hash], ps, ps_next);
335	return ((pmcstat_interned_string) ps);
336}
337
338const char *
339pmcstat_string_unintern(pmcstat_interned_string str)
340{
341	const char *s;
342
343	s = ((const struct pmcstat_string *) str)->ps_string;
344	return (s);
345}
346
347pmcstat_interned_string
348pmcstat_string_lookup(const char *s)
349{
350	struct pmcstat_string *ps;
351	int hash, len;
352
353	hash = pmcstat_string_compute_hash(s);
354	len = strlen(s);
355
356	LIST_FOREACH(ps, &pmcstat_string_hash[hash], ps_next)
357	    if (ps->ps_len == len && ps->ps_hash == hash &&
358		strcmp(ps->ps_string, s) == 0)
359		    return (ps);
360	return (NULL);
361}
362
363static int
364pmcstat_string_lookup_hash(pmcstat_interned_string s)
365{
366	const struct pmcstat_string *ps;
367
368	ps = (const struct pmcstat_string *) s;
369	return (ps->ps_hash);
370}
371
372/*
373 * Initialize the string interning facility.
374 */
375
376static void
377pmcstat_string_initialize(void)
378{
379	int i;
380
381	for (i = 0; i < PMCSTAT_NHASH; i++)
382		LIST_INIT(&pmcstat_string_hash[i]);
383}
384
385/*
386 * Destroy the string table, free'ing up space.
387 */
388
389static void
390pmcstat_string_shutdown(void)
391{
392	int i;
393	struct pmcstat_string *ps, *pstmp;
394
395	for (i = 0; i < PMCSTAT_NHASH; i++)
396		LIST_FOREACH_SAFE(ps, &pmcstat_string_hash[i], ps_next,
397		    pstmp) {
398			LIST_REMOVE(ps, ps_next);
399			free(ps->ps_string);
400			free(ps);
401		}
402}
403
404/*
405 * Determine whether a given executable image is an A.OUT object, and
406 * if so, fill in its parameters from the text file.
407 * Sets image->pi_type.
408 */
409
410static void
411pmcstat_image_get_aout_params(struct pmcstat_image *image)
412{
413	int fd;
414	ssize_t nbytes;
415	struct exec ex;
416	const char *path;
417	char buffer[PATH_MAX];
418
419	path = pmcstat_string_unintern(image->pi_execpath);
420	assert(path != NULL);
421
422	if (image->pi_iskernelmodule)
423		errx(EX_SOFTWARE, "ERROR: a.out kernel modules are "
424		    "unsupported \"%s\"", path);
425
426	(void) snprintf(buffer, sizeof(buffer), "%s%s",
427	    args.pa_fsroot, path);
428
429	if ((fd = open(buffer, O_RDONLY, 0)) < 0 ||
430	    (nbytes = read(fd, &ex, sizeof(ex))) < 0) {
431		warn("WARNING: Cannot determine type of \"%s\"", path);
432		image->pi_type = PMCSTAT_IMAGE_INDETERMINABLE;
433		if (fd != -1)
434			(void) close(fd);
435		return;
436	}
437
438	(void) close(fd);
439
440	if ((unsigned) nbytes != sizeof(ex) ||
441	    N_BADMAG(ex))
442		return;
443
444	image->pi_type = PMCSTAT_IMAGE_AOUT;
445
446	/* TODO: the rest of a.out processing */
447
448	return;
449}
450
451/*
452 * Helper function.
453 */
454
455static int
456pmcstat_symbol_compare(const void *a, const void *b)
457{
458	const struct pmcstat_symbol *sym1, *sym2;
459
460	sym1 = (const struct pmcstat_symbol *) a;
461	sym2 = (const struct pmcstat_symbol *) b;
462
463	if (sym1->ps_end <= sym2->ps_start)
464		return (-1);
465	if (sym1->ps_start >= sym2->ps_end)
466		return (1);
467	return (0);
468}
469
470/*
471 * Map an address to a symbol in an image.
472 */
473
474struct pmcstat_symbol *
475pmcstat_symbol_search(struct pmcstat_image *image, uintfptr_t addr)
476{
477	struct pmcstat_symbol sym;
478
479	if (image->pi_symbols == NULL)
480		return (NULL);
481
482	sym.ps_name  = NULL;
483	sym.ps_start = addr;
484	sym.ps_end   = addr + 1;
485
486	return (bsearch((void *) &sym, image->pi_symbols,
487		    image->pi_symcount, sizeof(struct pmcstat_symbol),
488		    pmcstat_symbol_compare));
489}
490
491/*
492 * Add the list of symbols in the given section to the list associated
493 * with the object.
494 */
495static void
496pmcstat_image_add_symbols(struct pmcstat_image *image, Elf *e,
497    Elf_Scn *scn, GElf_Shdr *sh)
498{
499	int firsttime;
500	size_t n, newsyms, nshsyms, nfuncsyms;
501	struct pmcstat_symbol *symptr;
502	char *fnname;
503	GElf_Sym sym;
504	Elf_Data *data;
505
506	if ((data = elf_getdata(scn, NULL)) == NULL)
507		return;
508
509	/*
510	 * Determine the number of functions named in this
511	 * section.
512	 */
513
514	nshsyms = sh->sh_size / sh->sh_entsize;
515	for (n = nfuncsyms = 0; n < nshsyms; n++) {
516		if (gelf_getsym(data, (int) n, &sym) != &sym)
517			return;
518		if (GELF_ST_TYPE(sym.st_info) == STT_FUNC)
519			nfuncsyms++;
520	}
521
522	if (nfuncsyms == 0)
523		return;
524
525	/*
526	 * Allocate space for the new entries.
527	 */
528	firsttime = image->pi_symbols == NULL;
529	symptr = realloc(image->pi_symbols,
530	    sizeof(*symptr) * (image->pi_symcount + nfuncsyms));
531	if (symptr == image->pi_symbols) /* realloc() failed. */
532		return;
533	image->pi_symbols = symptr;
534
535	/*
536	 * Append new symbols to the end of the current table.
537	 */
538	symptr += image->pi_symcount;
539
540	for (n = newsyms = 0; n < nshsyms; n++) {
541		if (gelf_getsym(data, (int) n, &sym) != &sym)
542			return;
543		if (GELF_ST_TYPE(sym.st_info) != STT_FUNC)
544			continue;
545		if (sym.st_shndx == STN_UNDEF)
546			continue;
547
548		if (!firsttime && pmcstat_symbol_search(image, sym.st_value))
549			continue; /* We've seen this symbol already. */
550
551		if ((fnname = elf_strptr(e, sh->sh_link, sym.st_name))
552		    == NULL)
553			continue;
554
555		symptr->ps_name  = pmcstat_string_intern(fnname);
556		symptr->ps_start = sym.st_value - image->pi_vaddr;
557		symptr->ps_end   = symptr->ps_start + sym.st_size;
558		symptr++;
559
560		newsyms++;
561	}
562
563	image->pi_symcount += newsyms;
564
565	assert(newsyms <= nfuncsyms);
566
567	/*
568	 * Return space to the system if there were duplicates.
569	 */
570	if (newsyms < nfuncsyms)
571		image->pi_symbols = realloc(image->pi_symbols,
572		    sizeof(*symptr) * image->pi_symcount);
573
574	/*
575	 * Keep the list of symbols sorted.
576	 */
577	qsort(image->pi_symbols, image->pi_symcount, sizeof(*symptr),
578	    pmcstat_symbol_compare);
579
580	/*
581	 * Deal with function symbols that have a size of 'zero' by
582	 * making them extend to the next higher address.  These
583	 * symbols are usually defined in assembly code.
584	 */
585	for (symptr = image->pi_symbols;
586	     symptr < image->pi_symbols + (image->pi_symcount - 1);
587	     symptr++)
588		if (symptr->ps_start == symptr->ps_end)
589			symptr->ps_end = (symptr+1)->ps_start;
590}
591
592/*
593 * Examine an ELF file to determine the size of its text segment.
594 * Sets image->pi_type if anything conclusive can be determined about
595 * this image.
596 */
597
598static void
599pmcstat_image_get_elf_params(struct pmcstat_image *image)
600{
601	int fd;
602	size_t i, nph, nsh;
603	const char *path, *elfbase;
604	char *p, *endp;
605	uintfptr_t minva, maxva;
606	Elf *e;
607	Elf_Scn *scn;
608	GElf_Ehdr eh;
609	GElf_Phdr ph;
610	GElf_Shdr sh;
611	enum pmcstat_image_type image_type;
612	char buffer[PATH_MAX], rtldpath[PATH_MAX];
613
614	assert(image->pi_type == PMCSTAT_IMAGE_UNKNOWN);
615
616	image->pi_start = minva = ~(uintfptr_t) 0;
617	image->pi_end = maxva = (uintfptr_t) 0;
618	image->pi_type = image_type = PMCSTAT_IMAGE_INDETERMINABLE;
619	image->pi_isdynamic = 0;
620	image->pi_dynlinkerpath = NULL;
621	image->pi_vaddr = 0;
622
623	path = pmcstat_string_unintern(image->pi_execpath);
624	assert(path != NULL);
625
626	/*
627	 * Look for kernel modules under FSROOT/KERNELPATH/NAME,
628	 * and user mode executable objects under FSROOT/PATHNAME.
629	 */
630	if (image->pi_iskernelmodule)
631		(void) snprintf(buffer, sizeof(buffer), "%s%s/%s",
632		    args.pa_fsroot, args.pa_kernel, path);
633	else
634		(void) snprintf(buffer, sizeof(buffer), "%s%s",
635		    args.pa_fsroot, path);
636
637	e = NULL;
638	if ((fd = open(buffer, O_RDONLY, 0)) < 0 ||
639	    (e = elf_begin(fd, ELF_C_READ, NULL)) == NULL ||
640	    (elf_kind(e) != ELF_K_ELF)) {
641		warnx("WARNING: Cannot determine the type of \"%s\".",
642		    buffer);
643		goto done;
644	}
645
646	if (gelf_getehdr(e, &eh) != &eh) {
647		warnx("WARNING: Cannot retrieve the ELF Header for "
648		    "\"%s\": %s.", buffer, elf_errmsg(-1));
649		goto done;
650	}
651
652	if (eh.e_type != ET_EXEC && eh.e_type != ET_DYN &&
653	    !(image->pi_iskernelmodule && eh.e_type == ET_REL)) {
654		warnx("WARNING: \"%s\" is of an unsupported ELF type.",
655		    buffer);
656		goto done;
657	}
658
659	image_type = eh.e_ident[EI_CLASS] == ELFCLASS32 ?
660	    PMCSTAT_IMAGE_ELF32 : PMCSTAT_IMAGE_ELF64;
661
662	/*
663	 * Determine the virtual address where an executable would be
664	 * loaded.  Additionally, for dynamically linked executables,
665	 * save the pathname to the runtime linker.
666	 */
667	if (eh.e_type == ET_EXEC) {
668		if (elf_getphnum(e, &nph) == 0) {
669			warnx("WARNING: Could not determine the number of "
670			    "program headers in \"%s\": %s.", buffer,
671			    elf_errmsg(-1));
672			goto done;
673		}
674		for (i = 0; i < eh.e_phnum; i++) {
675			if (gelf_getphdr(e, i, &ph) != &ph) {
676				warnx("WARNING: Retrieval of PHDR entry #%ju "
677				    "in \"%s\" failed: %s.", (uintmax_t) i,
678				    buffer, elf_errmsg(-1));
679				goto done;
680			}
681			switch (ph.p_type) {
682			case PT_DYNAMIC:
683				image->pi_isdynamic = 1;
684				break;
685			case PT_INTERP:
686				if ((elfbase = elf_rawfile(e, NULL)) == NULL) {
687					warnx("WARNING: Cannot retrieve the "
688					    "interpreter for \"%s\": %s.",
689					    buffer, elf_errmsg(-1));
690					goto done;
691				}
692				snprintf(rtldpath, sizeof(rtldpath), "%s%s",
693				    args.pa_fsroot, elfbase + ph.p_offset);
694				image->pi_dynlinkerpath =
695				    pmcstat_string_intern(rtldpath);
696				break;
697			case PT_LOAD:
698				if (ph.p_offset == 0)
699					image->pi_vaddr = ph.p_vaddr;
700				break;
701			}
702		}
703	}
704
705	/*
706	 * Get the min and max VA associated with this ELF object.
707	 */
708	if (elf_getshnum(e, &nsh) == 0) {
709		warnx("WARNING: Could not determine the number of sections "
710		    "for \"%s\": %s.", buffer, elf_errmsg(-1));
711		goto done;
712	}
713
714	for (i = 0; i < nsh; i++) {
715		if ((scn = elf_getscn(e, i)) == NULL ||
716		    gelf_getshdr(scn, &sh) != &sh) {
717			warnx("WARNING: Could not retrieve section header "
718			    "#%ju in \"%s\": %s.", (uintmax_t) i, buffer,
719			    elf_errmsg(-1));
720			goto done;
721		}
722		if (sh.sh_flags & SHF_EXECINSTR) {
723			minva = min(minva, sh.sh_addr);
724			maxva = max(maxva, sh.sh_addr + sh.sh_size);
725		}
726		if (sh.sh_type == SHT_SYMTAB || sh.sh_type == SHT_DYNSYM)
727			pmcstat_image_add_symbols(image, e, scn, &sh);
728	}
729
730	image->pi_start = minva;
731	image->pi_end   = maxva;
732	image->pi_type  = image_type;
733	image->pi_fullpath = pmcstat_string_intern(buffer);
734
735	/* Build display name
736	 */
737	endp = buffer;
738	for (p = buffer; *p; p++)
739		if (*p == '/')
740			endp = p+1;
741	image->pi_name = pmcstat_string_intern(endp);
742
743 done:
744	(void) elf_end(e);
745	if (fd >= 0)
746		(void) close(fd);
747	return;
748}
749
750/*
751 * Given an image descriptor, determine whether it is an ELF, or AOUT.
752 * If no handler claims the image, set its type to 'INDETERMINABLE'.
753 */
754
755void
756pmcstat_image_determine_type(struct pmcstat_image *image)
757{
758	assert(image->pi_type == PMCSTAT_IMAGE_UNKNOWN);
759
760	/* Try each kind of handler in turn */
761	if (image->pi_type == PMCSTAT_IMAGE_UNKNOWN)
762		pmcstat_image_get_elf_params(image);
763	if (image->pi_type == PMCSTAT_IMAGE_UNKNOWN)
764		pmcstat_image_get_aout_params(image);
765
766	/*
767	 * Otherwise, remember that we tried to determine
768	 * the object's type and had failed.
769	 */
770	if (image->pi_type == PMCSTAT_IMAGE_UNKNOWN)
771		image->pi_type = PMCSTAT_IMAGE_INDETERMINABLE;
772}
773
774/*
775 * Locate an image descriptor given an interned path, adding a fresh
776 * descriptor to the cache if necessary.  This function also finds a
777 * suitable name for this image's sample file.
778 *
779 * We defer filling in the file format specific parts of the image
780 * structure till the time we actually see a sample that would fall
781 * into this image.
782 */
783
784static struct pmcstat_image *
785pmcstat_image_from_path(pmcstat_interned_string internedpath,
786    int iskernelmodule)
787{
788	int hash;
789	struct pmcstat_image *pi;
790
791	hash = pmcstat_string_lookup_hash(internedpath);
792
793	/* First, look for an existing entry. */
794	LIST_FOREACH(pi, &pmcstat_image_hash[hash], pi_next)
795	    if (pi->pi_execpath == internedpath &&
796		  pi->pi_iskernelmodule == iskernelmodule)
797		    return (pi);
798
799	/*
800	 * Allocate a new entry and place it at the head of the hash
801	 * and LRU lists.
802	 */
803	pi = malloc(sizeof(*pi));
804	if (pi == NULL)
805		return (NULL);
806
807	pi->pi_type = PMCSTAT_IMAGE_UNKNOWN;
808	pi->pi_execpath = internedpath;
809	pi->pi_start = ~0;
810	pi->pi_end = 0;
811	pi->pi_entry = 0;
812	pi->pi_vaddr = 0;
813	pi->pi_isdynamic = 0;
814	pi->pi_iskernelmodule = iskernelmodule;
815	pi->pi_dynlinkerpath = NULL;
816	pi->pi_symbols = NULL;
817	pi->pi_symcount = 0;
818	pi->pi_addr2line = NULL;
819
820	if (plugins[args.pa_pplugin].pl_initimage != NULL)
821		plugins[args.pa_pplugin].pl_initimage(pi);
822	if (plugins[args.pa_plugin].pl_initimage != NULL)
823		plugins[args.pa_plugin].pl_initimage(pi);
824
825	LIST_INSERT_HEAD(&pmcstat_image_hash[hash], pi, pi_next);
826
827	return (pi);
828}
829
830/*
831 * Record the fact that PC values from 'start' to 'end' come from
832 * image 'image'.
833 */
834
835static void
836pmcstat_image_link(struct pmcstat_process *pp, struct pmcstat_image *image,
837    uintfptr_t start)
838{
839	struct pmcstat_pcmap *pcm, *pcmnew;
840	uintfptr_t offset;
841
842	assert(image->pi_type != PMCSTAT_IMAGE_UNKNOWN &&
843	    image->pi_type != PMCSTAT_IMAGE_INDETERMINABLE);
844
845	if ((pcmnew = malloc(sizeof(*pcmnew))) == NULL)
846		err(EX_OSERR, "ERROR: Cannot create a map entry");
847
848	/*
849	 * Adjust the map entry to only cover the text portion
850	 * of the object.
851	 */
852
853	offset = start - image->pi_vaddr;
854	pcmnew->ppm_lowpc  = image->pi_start + offset;
855	pcmnew->ppm_highpc = image->pi_end + offset;
856	pcmnew->ppm_image  = image;
857
858	assert(pcmnew->ppm_lowpc < pcmnew->ppm_highpc);
859
860	/* Overlapped mmap()'s are assumed to never occur. */
861	TAILQ_FOREACH(pcm, &pp->pp_map, ppm_next)
862	    if (pcm->ppm_lowpc >= pcmnew->ppm_highpc)
863		    break;
864
865	if (pcm == NULL)
866		TAILQ_INSERT_TAIL(&pp->pp_map, pcmnew, ppm_next);
867	else
868		TAILQ_INSERT_BEFORE(pcm, pcmnew, ppm_next);
869}
870
871/*
872 * Unmap images in the range [start..end) associated with process
873 * 'pp'.
874 */
875
876static void
877pmcstat_image_unmap(struct pmcstat_process *pp, uintfptr_t start,
878    uintfptr_t end)
879{
880	struct pmcstat_pcmap *pcm, *pcmtmp, *pcmnew;
881
882	assert(pp != NULL);
883	assert(start < end);
884
885	/*
886	 * Cases:
887	 * - we could have the range completely in the middle of an
888	 *   existing pcmap; in this case we have to split the pcmap
889	 *   structure into two (i.e., generate a 'hole').
890	 * - we could have the range covering multiple pcmaps; these
891	 *   will have to be removed.
892	 * - we could have either 'start' or 'end' falling in the
893	 *   middle of a pcmap; in this case shorten the entry.
894	 */
895	TAILQ_FOREACH_SAFE(pcm, &pp->pp_map, ppm_next, pcmtmp) {
896		assert(pcm->ppm_lowpc < pcm->ppm_highpc);
897		if (pcm->ppm_highpc <= start)
898			continue;
899		if (pcm->ppm_lowpc >= end)
900			return;
901		if (pcm->ppm_lowpc >= start && pcm->ppm_highpc <= end) {
902			/*
903			 * The current pcmap is completely inside the
904			 * unmapped range: remove it entirely.
905			 */
906			TAILQ_REMOVE(&pp->pp_map, pcm, ppm_next);
907			free(pcm);
908		} else if (pcm->ppm_lowpc < start && pcm->ppm_highpc > end) {
909			/*
910			 * Split this pcmap into two; curtail the
911			 * current map to end at [start-1], and start
912			 * the new one at [end].
913			 */
914			if ((pcmnew = malloc(sizeof(*pcmnew))) == NULL)
915				err(EX_OSERR, "ERROR: Cannot split a map "
916				    "entry");
917
918			pcmnew->ppm_image = pcm->ppm_image;
919
920			pcmnew->ppm_lowpc = end;
921			pcmnew->ppm_highpc = pcm->ppm_highpc;
922
923			pcm->ppm_highpc = start;
924
925			TAILQ_INSERT_AFTER(&pp->pp_map, pcm, pcmnew, ppm_next);
926
927			return;
928		} else if (pcm->ppm_lowpc < start && pcm->ppm_highpc <= end)
929			pcm->ppm_highpc = start;
930		else if (pcm->ppm_lowpc >= start && pcm->ppm_highpc > end)
931			pcm->ppm_lowpc = end;
932		else
933			assert(0);
934	}
935}
936
937/*
938 * Resolve file name and line number for the given address.
939 */
940int
941pmcstat_image_addr2line(struct pmcstat_image *image, uintfptr_t addr,
942    char *sourcefile, size_t sourcefile_len, unsigned *sourceline,
943    char *funcname, size_t funcname_len)
944{
945	static int addr2line_warn = 0;
946
947	char *sep, cmdline[PATH_MAX], imagepath[PATH_MAX];
948	int fd;
949
950	if (image->pi_addr2line == NULL) {
951		snprintf(imagepath, sizeof(imagepath), "%s%s.symbols",
952		    args.pa_fsroot,
953		    pmcstat_string_unintern(image->pi_fullpath));
954		fd = open(imagepath, O_RDONLY);
955		if (fd < 0) {
956			snprintf(imagepath, sizeof(imagepath), "%s%s",
957			    args.pa_fsroot,
958			    pmcstat_string_unintern(image->pi_fullpath));
959		} else
960			close(fd);
961		snprintf(cmdline, sizeof(cmdline), "addr2line -Cfe \"%s\"",
962		    imagepath);
963		image->pi_addr2line = popen(cmdline, "r+");
964		if (image->pi_addr2line == NULL) {
965			if (!addr2line_warn) {
966				addr2line_warn = 1;
967				warnx("WARNING: addr2line is needed"
968				    "for source code information.");
969			}
970			return (0);
971		}
972	}
973
974	if (feof(image->pi_addr2line) || ferror(image->pi_addr2line)) {
975		warnx("WARNING: addr2line pipe error");
976		pclose(image->pi_addr2line);
977		image->pi_addr2line = NULL;
978		return (0);
979	}
980
981	fprintf(image->pi_addr2line, "%p\n", (void *)addr);
982
983	if (fgets(funcname, funcname_len, image->pi_addr2line) == NULL) {
984		warnx("WARNING: addr2line function name read error");
985		return (0);
986	}
987	sep = strchr(funcname, '\n');
988	if (sep != NULL)
989		*sep = '\0';
990
991	if (fgets(sourcefile, sourcefile_len, image->pi_addr2line) == NULL) {
992		warnx("WARNING: addr2line source file read error");
993		return (0);
994	}
995	sep = strchr(sourcefile, ':');
996	if (sep == NULL) {
997		warnx("WARNING: addr2line source line separator missing");
998		return (0);
999	}
1000	*sep = '\0';
1001	*sourceline = atoi(sep+1);
1002	if (*sourceline == 0)
1003		return (0);
1004
1005	return (1);
1006}
1007
1008/*
1009 * Add a {pmcid,name} mapping.
1010 */
1011
1012static void
1013pmcstat_pmcid_add(pmc_id_t pmcid, pmcstat_interned_string ps)
1014{
1015	struct pmcstat_pmcrecord *pr, *prm;
1016
1017	/* Replace an existing name for the PMC. */
1018	prm = NULL;
1019	LIST_FOREACH(pr, &pmcstat_pmcs, pr_next)
1020		if (pr->pr_pmcid == pmcid) {
1021			pr->pr_pmcname = ps;
1022			return;
1023		} else if (pr->pr_pmcname == ps)
1024			prm = pr;
1025
1026	/*
1027	 * Otherwise, allocate a new descriptor and call the
1028	 * plugins hook.
1029	 */
1030	if ((pr = malloc(sizeof(*pr))) == NULL)
1031		err(EX_OSERR, "ERROR: Cannot allocate pmc record");
1032
1033	pr->pr_pmcid = pmcid;
1034	pr->pr_pmcname = ps;
1035	pr->pr_pmcin = pmcstat_npmcs++;
1036	pr->pr_samples = 0;
1037	pr->pr_dubious_frames = 0;
1038	pr->pr_merge = prm == NULL ? pr : prm;
1039
1040	LIST_INSERT_HEAD(&pmcstat_pmcs, pr, pr_next);
1041
1042	if (plugins[args.pa_pplugin].pl_newpmc != NULL)
1043		plugins[args.pa_pplugin].pl_newpmc(ps, pr);
1044	if (plugins[args.pa_plugin].pl_newpmc != NULL)
1045		plugins[args.pa_plugin].pl_newpmc(ps, pr);
1046}
1047
1048/*
1049 * Given a pmcid in use, find its human-readable name.
1050 */
1051
1052const char *
1053pmcstat_pmcid_to_name(pmc_id_t pmcid)
1054{
1055	struct pmcstat_pmcrecord *pr;
1056
1057	LIST_FOREACH(pr, &pmcstat_pmcs, pr_next)
1058	    if (pr->pr_pmcid == pmcid)
1059		    return (pmcstat_string_unintern(pr->pr_pmcname));
1060
1061	return NULL;
1062}
1063
1064/*
1065 * Convert PMC index to name.
1066 */
1067
1068const char *
1069pmcstat_pmcindex_to_name(int pmcin)
1070{
1071	struct pmcstat_pmcrecord *pr;
1072
1073	LIST_FOREACH(pr, &pmcstat_pmcs, pr_next)
1074		if (pr->pr_pmcin == pmcin)
1075			return pmcstat_string_unintern(pr->pr_pmcname);
1076
1077	return NULL;
1078}
1079
1080/*
1081 * Return PMC record with given index.
1082 */
1083
1084struct pmcstat_pmcrecord *
1085pmcstat_pmcindex_to_pmcr(int pmcin)
1086{
1087	struct pmcstat_pmcrecord *pr;
1088
1089	LIST_FOREACH(pr, &pmcstat_pmcs, pr_next)
1090		if (pr->pr_pmcin == pmcin)
1091			return pr;
1092
1093	return NULL;
1094}
1095
1096/*
1097 * Get PMC record by id, apply merge policy.
1098 */
1099
1100static struct pmcstat_pmcrecord *
1101pmcstat_lookup_pmcid(pmc_id_t pmcid)
1102{
1103	struct pmcstat_pmcrecord *pr;
1104
1105	LIST_FOREACH(pr, &pmcstat_pmcs, pr_next) {
1106		if (pr->pr_pmcid == pmcid) {
1107			if (pmcstat_mergepmc)
1108				return pr->pr_merge;
1109			return pr;
1110		}
1111	}
1112
1113	return NULL;
1114}
1115
1116/*
1117 * Associate an AOUT image with a process.
1118 */
1119
1120static void
1121pmcstat_process_aout_exec(struct pmcstat_process *pp,
1122    struct pmcstat_image *image, uintfptr_t entryaddr)
1123{
1124	(void) pp;
1125	(void) image;
1126	(void) entryaddr;
1127	/* TODO Implement a.out handling */
1128}
1129
1130/*
1131 * Associate an ELF image with a process.
1132 */
1133
1134static void
1135pmcstat_process_elf_exec(struct pmcstat_process *pp,
1136    struct pmcstat_image *image, uintfptr_t entryaddr)
1137{
1138	uintmax_t libstart;
1139	struct pmcstat_image *rtldimage;
1140
1141	assert(image->pi_type == PMCSTAT_IMAGE_ELF32 ||
1142	    image->pi_type == PMCSTAT_IMAGE_ELF64);
1143
1144	/* Create a map entry for the base executable. */
1145	pmcstat_image_link(pp, image, image->pi_vaddr);
1146
1147	/*
1148	 * For dynamically linked executables we need to determine
1149	 * where the dynamic linker was mapped to for this process,
1150	 * Subsequent executable objects that are mapped in by the
1151	 * dynamic linker will be tracked by log events of type
1152	 * PMCLOG_TYPE_MAP_IN.
1153	 */
1154
1155	if (image->pi_isdynamic) {
1156
1157		/*
1158		 * The runtime loader gets loaded just after the maximum
1159		 * possible heap address.  Like so:
1160		 *
1161		 * [  TEXT DATA BSS HEAP -->*RTLD  SHLIBS   <--STACK]
1162		 * ^					            ^
1163		 * 0				   VM_MAXUSER_ADDRESS
1164
1165		 *
1166		 * The exact address where the loader gets mapped in
1167		 * will vary according to the size of the executable
1168		 * and the limits on the size of the process'es data
1169		 * segment at the time of exec().  The entry address
1170		 * recorded at process exec time corresponds to the
1171		 * 'start' address inside the dynamic linker.  From
1172		 * this we can figure out the address where the
1173		 * runtime loader's file object had been mapped to.
1174		 */
1175		rtldimage = pmcstat_image_from_path(image->pi_dynlinkerpath, 0);
1176		if (rtldimage == NULL) {
1177			warnx("WARNING: Cannot find image for \"%s\".",
1178			    pmcstat_string_unintern(image->pi_dynlinkerpath));
1179			pmcstat_stats.ps_exec_errors++;
1180			return;
1181		}
1182
1183		if (rtldimage->pi_type == PMCSTAT_IMAGE_UNKNOWN)
1184			pmcstat_image_get_elf_params(rtldimage);
1185
1186		if (rtldimage->pi_type != PMCSTAT_IMAGE_ELF32 &&
1187		    rtldimage->pi_type != PMCSTAT_IMAGE_ELF64) {
1188			warnx("WARNING: rtld not an ELF object \"%s\".",
1189			    pmcstat_string_unintern(image->pi_dynlinkerpath));
1190			return;
1191		}
1192
1193		libstart = entryaddr - rtldimage->pi_entry;
1194		pmcstat_image_link(pp, rtldimage, libstart);
1195	}
1196}
1197
1198/*
1199 * Find the process descriptor corresponding to a PID.  If 'allocate'
1200 * is zero, we return a NULL if a pid descriptor could not be found or
1201 * a process descriptor process.  If 'allocate' is non-zero, then we
1202 * will attempt to allocate a fresh process descriptor.  Zombie
1203 * process descriptors are only removed if a fresh allocation for the
1204 * same PID is requested.
1205 */
1206
1207static struct pmcstat_process *
1208pmcstat_process_lookup(pid_t pid, int allocate)
1209{
1210	uint32_t hash;
1211	struct pmcstat_pcmap *ppm, *ppmtmp;
1212	struct pmcstat_process *pp, *pptmp;
1213
1214	hash = (uint32_t) pid & PMCSTAT_HASH_MASK;	/* simplicity wins */
1215
1216	LIST_FOREACH_SAFE(pp, &pmcstat_process_hash[hash], pp_next, pptmp)
1217	    if (pp->pp_pid == pid) {
1218		    /* Found a descriptor, check and process zombies */
1219		    if (allocate && pp->pp_isactive == 0) {
1220			    /* remove maps */
1221			    TAILQ_FOREACH_SAFE(ppm, &pp->pp_map, ppm_next,
1222				ppmtmp) {
1223				    TAILQ_REMOVE(&pp->pp_map, ppm, ppm_next);
1224				    free(ppm);
1225			    }
1226			    /* remove process entry */
1227			    LIST_REMOVE(pp, pp_next);
1228			    free(pp);
1229			    break;
1230		    }
1231		    return (pp);
1232	    }
1233
1234	if (!allocate)
1235		return (NULL);
1236
1237	if ((pp = malloc(sizeof(*pp))) == NULL)
1238		err(EX_OSERR, "ERROR: Cannot allocate pid descriptor");
1239
1240	pp->pp_pid = pid;
1241	pp->pp_isactive = 1;
1242
1243	TAILQ_INIT(&pp->pp_map);
1244
1245	LIST_INSERT_HEAD(&pmcstat_process_hash[hash], pp, pp_next);
1246	return (pp);
1247}
1248
1249/*
1250 * Associate an image and a process.
1251 */
1252
1253static void
1254pmcstat_process_exec(struct pmcstat_process *pp,
1255    pmcstat_interned_string path, uintfptr_t entryaddr)
1256{
1257	struct pmcstat_image *image;
1258
1259	if ((image = pmcstat_image_from_path(path, 0)) == NULL) {
1260		pmcstat_stats.ps_exec_errors++;
1261		return;
1262	}
1263
1264	if (image->pi_type == PMCSTAT_IMAGE_UNKNOWN)
1265		pmcstat_image_determine_type(image);
1266
1267	assert(image->pi_type != PMCSTAT_IMAGE_UNKNOWN);
1268
1269	switch (image->pi_type) {
1270	case PMCSTAT_IMAGE_ELF32:
1271	case PMCSTAT_IMAGE_ELF64:
1272		pmcstat_stats.ps_exec_elf++;
1273		pmcstat_process_elf_exec(pp, image, entryaddr);
1274		break;
1275
1276	case PMCSTAT_IMAGE_AOUT:
1277		pmcstat_stats.ps_exec_aout++;
1278		pmcstat_process_aout_exec(pp, image, entryaddr);
1279		break;
1280
1281	case PMCSTAT_IMAGE_INDETERMINABLE:
1282		pmcstat_stats.ps_exec_indeterminable++;
1283		break;
1284
1285	default:
1286		err(EX_SOFTWARE, "ERROR: Unsupported executable type for "
1287		    "\"%s\"", pmcstat_string_unintern(path));
1288	}
1289}
1290
1291
1292/*
1293 * Find the map entry associated with process 'p' at PC value 'pc'.
1294 */
1295
1296struct pmcstat_pcmap *
1297pmcstat_process_find_map(struct pmcstat_process *p, uintfptr_t pc)
1298{
1299	struct pmcstat_pcmap *ppm;
1300
1301	TAILQ_FOREACH(ppm, &p->pp_map, ppm_next) {
1302		if (pc >= ppm->ppm_lowpc && pc < ppm->ppm_highpc)
1303			return (ppm);
1304		if (pc < ppm->ppm_lowpc)
1305			return (NULL);
1306	}
1307
1308	return (NULL);
1309}
1310
1311/*
1312 * Convert a hwpmc(4) log to profile information.  A system-wide
1313 * callgraph is generated if FLAG_DO_CALLGRAPHS is set.  gmon.out
1314 * files usable by gprof(1) are created if FLAG_DO_GPROF is set.
1315 */
1316static int
1317pmcstat_analyze_log(void)
1318{
1319	uint32_t cpu, cpuflags;
1320	uintfptr_t pc;
1321	pid_t pid;
1322	struct pmcstat_image *image;
1323	struct pmcstat_process *pp, *ppnew;
1324	struct pmcstat_pcmap *ppm, *ppmtmp;
1325	struct pmclog_ev ev;
1326	struct pmcstat_pmcrecord *pmcr;
1327	pmcstat_interned_string image_path;
1328
1329	assert(args.pa_flags & FLAG_DO_ANALYSIS);
1330
1331	if (elf_version(EV_CURRENT) == EV_NONE)
1332		err(EX_UNAVAILABLE, "Elf library intialization failed");
1333
1334	while (pmclog_read(args.pa_logparser, &ev) == 0) {
1335		assert(ev.pl_state == PMCLOG_OK);
1336
1337		switch (ev.pl_type) {
1338		case PMCLOG_TYPE_INITIALIZE:
1339			if ((ev.pl_u.pl_i.pl_version & 0xFF000000) !=
1340			    PMC_VERSION_MAJOR << 24 && args.pa_verbosity > 0)
1341				warnx("WARNING: Log version 0x%x does not "
1342				    "match compiled version 0x%x.",
1343				    ev.pl_u.pl_i.pl_version,
1344				    PMC_VERSION_MAJOR);
1345			break;
1346
1347		case PMCLOG_TYPE_MAP_IN:
1348			/*
1349			 * Introduce an address range mapping for a
1350			 * userland process or the kernel (pid == -1).
1351			 *
1352			 * We always allocate a process descriptor so
1353			 * that subsequent samples seen for this
1354			 * address range are mapped to the current
1355			 * object being mapped in.
1356			 */
1357			pid = ev.pl_u.pl_mi.pl_pid;
1358			if (pid == -1)
1359				pp = pmcstat_kernproc;
1360			else
1361				pp = pmcstat_process_lookup(pid,
1362				    PMCSTAT_ALLOCATE);
1363
1364			assert(pp != NULL);
1365
1366			image_path = pmcstat_string_intern(ev.pl_u.pl_mi.
1367			    pl_pathname);
1368			image = pmcstat_image_from_path(image_path, pid == -1);
1369			if (image->pi_type == PMCSTAT_IMAGE_UNKNOWN)
1370				pmcstat_image_determine_type(image);
1371			if (image->pi_type != PMCSTAT_IMAGE_INDETERMINABLE)
1372				pmcstat_image_link(pp, image,
1373				    ev.pl_u.pl_mi.pl_start);
1374			break;
1375
1376		case PMCLOG_TYPE_MAP_OUT:
1377			/*
1378			 * Remove an address map.
1379			 */
1380			pid = ev.pl_u.pl_mo.pl_pid;
1381			if (pid == -1)
1382				pp = pmcstat_kernproc;
1383			else
1384				pp = pmcstat_process_lookup(pid, 0);
1385
1386			if (pp == NULL)	/* unknown process */
1387				break;
1388
1389			pmcstat_image_unmap(pp, ev.pl_u.pl_mo.pl_start,
1390			    ev.pl_u.pl_mo.pl_end);
1391			break;
1392
1393		case PMCLOG_TYPE_PCSAMPLE:
1394			/*
1395			 * Note: the `PCSAMPLE' log entry is not
1396			 * generated by hpwmc(4) after version 2.
1397			 */
1398
1399			/*
1400			 * We bring in the gmon file for the image
1401			 * currently associated with the PMC & pid
1402			 * pair and increment the appropriate entry
1403			 * bin inside this.
1404			 */
1405			pmcstat_stats.ps_samples_total++;
1406			ps_samples_period++;
1407
1408			pc = ev.pl_u.pl_s.pl_pc;
1409			pp = pmcstat_process_lookup(ev.pl_u.pl_s.pl_pid,
1410			    PMCSTAT_ALLOCATE);
1411
1412			/* Get PMC record. */
1413			pmcr = pmcstat_lookup_pmcid(ev.pl_u.pl_s.pl_pmcid);
1414			assert(pmcr != NULL);
1415			pmcr->pr_samples++;
1416
1417			/*
1418			 * Call the plugins processing
1419			 * TODO: move pmcstat_process_find_map inside plugins
1420			 */
1421
1422			if (plugins[args.pa_pplugin].pl_process != NULL)
1423				plugins[args.pa_pplugin].pl_process(
1424				    pp, pmcr, 1, &pc,
1425				    pmcstat_process_find_map(pp, pc) != NULL, 0);
1426			plugins[args.pa_plugin].pl_process(
1427			    pp, pmcr, 1, &pc,
1428			    pmcstat_process_find_map(pp, pc) != NULL, 0);
1429			break;
1430
1431		case PMCLOG_TYPE_CALLCHAIN:
1432			pmcstat_stats.ps_samples_total++;
1433			ps_samples_period++;
1434
1435			cpuflags = ev.pl_u.pl_cc.pl_cpuflags;
1436			cpu = PMC_CALLCHAIN_CPUFLAGS_TO_CPU(cpuflags);
1437
1438			/* Filter on the CPU id. */
1439			if ((args.pa_cpumask & (1 << cpu)) == 0) {
1440				pmcstat_stats.ps_samples_skipped++;
1441				break;
1442			}
1443
1444			pp = pmcstat_process_lookup(ev.pl_u.pl_cc.pl_pid,
1445			    PMCSTAT_ALLOCATE);
1446
1447			/* Get PMC record. */
1448			pmcr = pmcstat_lookup_pmcid(ev.pl_u.pl_cc.pl_pmcid);
1449			assert(pmcr != NULL);
1450			pmcr->pr_samples++;
1451
1452			/*
1453			 * Call the plugins processing
1454			 */
1455
1456			if (plugins[args.pa_pplugin].pl_process != NULL)
1457				plugins[args.pa_pplugin].pl_process(
1458				    pp, pmcr,
1459				    ev.pl_u.pl_cc.pl_npc,
1460				    ev.pl_u.pl_cc.pl_pc,
1461				    PMC_CALLCHAIN_CPUFLAGS_TO_USERMODE(cpuflags),
1462				    cpu);
1463			plugins[args.pa_plugin].pl_process(
1464			    pp, pmcr,
1465			    ev.pl_u.pl_cc.pl_npc,
1466			    ev.pl_u.pl_cc.pl_pc,
1467			    PMC_CALLCHAIN_CPUFLAGS_TO_USERMODE(cpuflags),
1468			    cpu);
1469			break;
1470
1471		case PMCLOG_TYPE_PMCALLOCATE:
1472			/*
1473			 * Record the association pmc id between this
1474			 * PMC and its name.
1475			 */
1476			pmcstat_pmcid_add(ev.pl_u.pl_a.pl_pmcid,
1477			    pmcstat_string_intern(ev.pl_u.pl_a.pl_evname));
1478			break;
1479
1480		case PMCLOG_TYPE_PROCEXEC:
1481
1482			/*
1483			 * Change the executable image associated with
1484			 * a process.
1485			 */
1486			pp = pmcstat_process_lookup(ev.pl_u.pl_x.pl_pid,
1487			    PMCSTAT_ALLOCATE);
1488
1489			/* delete the current process map */
1490			TAILQ_FOREACH_SAFE(ppm, &pp->pp_map, ppm_next, ppmtmp) {
1491				TAILQ_REMOVE(&pp->pp_map, ppm, ppm_next);
1492				free(ppm);
1493			}
1494
1495			/* associate this process  image */
1496			image_path = pmcstat_string_intern(
1497				ev.pl_u.pl_x.pl_pathname);
1498			assert(image_path != NULL);
1499			pmcstat_process_exec(pp, image_path,
1500			    ev.pl_u.pl_x.pl_entryaddr);
1501			break;
1502
1503		case PMCLOG_TYPE_PROCEXIT:
1504
1505			/*
1506			 * Due to the way the log is generated, the
1507			 * last few samples corresponding to a process
1508			 * may appear in the log after the process
1509			 * exit event is recorded.  Thus we keep the
1510			 * process' descriptor and associated data
1511			 * structures around, but mark the process as
1512			 * having exited.
1513			 */
1514			pp = pmcstat_process_lookup(ev.pl_u.pl_e.pl_pid, 0);
1515			if (pp == NULL)
1516				break;
1517			pp->pp_isactive = 0;	/* mark as a zombie */
1518			break;
1519
1520		case PMCLOG_TYPE_SYSEXIT:
1521			pp = pmcstat_process_lookup(ev.pl_u.pl_se.pl_pid, 0);
1522			if (pp == NULL)
1523				break;
1524			pp->pp_isactive = 0;	/* make a zombie */
1525			break;
1526
1527		case PMCLOG_TYPE_PROCFORK:
1528
1529			/*
1530			 * Allocate a process descriptor for the new
1531			 * (child) process.
1532			 */
1533			ppnew =
1534			    pmcstat_process_lookup(ev.pl_u.pl_f.pl_newpid,
1535				PMCSTAT_ALLOCATE);
1536
1537			/*
1538			 * If we had been tracking the parent, clone
1539			 * its address maps.
1540			 */
1541			pp = pmcstat_process_lookup(ev.pl_u.pl_f.pl_oldpid, 0);
1542			if (pp == NULL)
1543				break;
1544			TAILQ_FOREACH(ppm, &pp->pp_map, ppm_next)
1545			    pmcstat_image_link(ppnew, ppm->ppm_image,
1546				ppm->ppm_lowpc);
1547			break;
1548
1549		default:	/* other types of entries are not relevant */
1550			break;
1551		}
1552	}
1553
1554	if (ev.pl_state == PMCLOG_EOF)
1555		return (PMCSTAT_FINISHED);
1556	else if (ev.pl_state == PMCLOG_REQUIRE_DATA)
1557		return (PMCSTAT_RUNNING);
1558
1559	err(EX_DATAERR, "ERROR: event parsing failed (record %jd, "
1560	    "offset 0x%jx)", (uintmax_t) ev.pl_count + 1, ev.pl_offset);
1561}
1562
1563/*
1564 * Print log entries as text.
1565 */
1566
1567static int
1568pmcstat_print_log(void)
1569{
1570	struct pmclog_ev ev;
1571	uint32_t npc;
1572
1573	while (pmclog_read(args.pa_logparser, &ev) == 0) {
1574		assert(ev.pl_state == PMCLOG_OK);
1575		switch (ev.pl_type) {
1576		case PMCLOG_TYPE_CALLCHAIN:
1577			PMCSTAT_PRINT_ENTRY("callchain",
1578			    "%d 0x%x %d %d %c", ev.pl_u.pl_cc.pl_pid,
1579			    ev.pl_u.pl_cc.pl_pmcid,
1580			    PMC_CALLCHAIN_CPUFLAGS_TO_CPU(ev.pl_u.pl_cc. \
1581				pl_cpuflags), ev.pl_u.pl_cc.pl_npc,
1582			    PMC_CALLCHAIN_CPUFLAGS_TO_USERMODE(ev.pl_u.pl_cc.\
1583			        pl_cpuflags) ? 'u' : 's');
1584			for (npc = 0; npc < ev.pl_u.pl_cc.pl_npc; npc++)
1585				PMCSTAT_PRINT_ENTRY("...", "%p",
1586				    (void *) ev.pl_u.pl_cc.pl_pc[npc]);
1587			break;
1588		case PMCLOG_TYPE_CLOSELOG:
1589			PMCSTAT_PRINT_ENTRY("closelog",);
1590			break;
1591		case PMCLOG_TYPE_DROPNOTIFY:
1592			PMCSTAT_PRINT_ENTRY("drop",);
1593			break;
1594		case PMCLOG_TYPE_INITIALIZE:
1595			PMCSTAT_PRINT_ENTRY("initlog","0x%x \"%s\"",
1596			    ev.pl_u.pl_i.pl_version,
1597			    pmc_name_of_cputype(ev.pl_u.pl_i.pl_arch));
1598			if ((ev.pl_u.pl_i.pl_version & 0xFF000000) !=
1599			    PMC_VERSION_MAJOR << 24 && args.pa_verbosity > 0)
1600				warnx("WARNING: Log version 0x%x != expected "
1601				    "version 0x%x.", ev.pl_u.pl_i.pl_version,
1602				    PMC_VERSION);
1603			break;
1604		case PMCLOG_TYPE_MAP_IN:
1605			PMCSTAT_PRINT_ENTRY("map-in","%d %p \"%s\"",
1606			    ev.pl_u.pl_mi.pl_pid,
1607			    (void *) ev.pl_u.pl_mi.pl_start,
1608			    ev.pl_u.pl_mi.pl_pathname);
1609			break;
1610		case PMCLOG_TYPE_MAP_OUT:
1611			PMCSTAT_PRINT_ENTRY("map-out","%d %p %p",
1612			    ev.pl_u.pl_mo.pl_pid,
1613			    (void *) ev.pl_u.pl_mo.pl_start,
1614			    (void *) ev.pl_u.pl_mo.pl_end);
1615			break;
1616		case PMCLOG_TYPE_PCSAMPLE:
1617			PMCSTAT_PRINT_ENTRY("sample","0x%x %d %p %c",
1618			    ev.pl_u.pl_s.pl_pmcid,
1619			    ev.pl_u.pl_s.pl_pid,
1620			    (void *) ev.pl_u.pl_s.pl_pc,
1621			    ev.pl_u.pl_s.pl_usermode ? 'u' : 's');
1622			break;
1623		case PMCLOG_TYPE_PMCALLOCATE:
1624			PMCSTAT_PRINT_ENTRY("allocate","0x%x \"%s\" 0x%x",
1625			    ev.pl_u.pl_a.pl_pmcid,
1626			    ev.pl_u.pl_a.pl_evname,
1627			    ev.pl_u.pl_a.pl_flags);
1628			break;
1629		case PMCLOG_TYPE_PMCATTACH:
1630			PMCSTAT_PRINT_ENTRY("attach","0x%x %d \"%s\"",
1631			    ev.pl_u.pl_t.pl_pmcid,
1632			    ev.pl_u.pl_t.pl_pid,
1633			    ev.pl_u.pl_t.pl_pathname);
1634			break;
1635		case PMCLOG_TYPE_PMCDETACH:
1636			PMCSTAT_PRINT_ENTRY("detach","0x%x %d",
1637			    ev.pl_u.pl_d.pl_pmcid,
1638			    ev.pl_u.pl_d.pl_pid);
1639			break;
1640		case PMCLOG_TYPE_PROCCSW:
1641			PMCSTAT_PRINT_ENTRY("cswval","0x%x %d %jd",
1642			    ev.pl_u.pl_c.pl_pmcid,
1643			    ev.pl_u.pl_c.pl_pid,
1644			    ev.pl_u.pl_c.pl_value);
1645			break;
1646		case PMCLOG_TYPE_PROCEXEC:
1647			PMCSTAT_PRINT_ENTRY("exec","0x%x %d %p \"%s\"",
1648			    ev.pl_u.pl_x.pl_pmcid,
1649			    ev.pl_u.pl_x.pl_pid,
1650			    (void *) ev.pl_u.pl_x.pl_entryaddr,
1651			    ev.pl_u.pl_x.pl_pathname);
1652			break;
1653		case PMCLOG_TYPE_PROCEXIT:
1654			PMCSTAT_PRINT_ENTRY("exitval","0x%x %d %jd",
1655			    ev.pl_u.pl_e.pl_pmcid,
1656			    ev.pl_u.pl_e.pl_pid,
1657			    ev.pl_u.pl_e.pl_value);
1658			break;
1659		case PMCLOG_TYPE_PROCFORK:
1660			PMCSTAT_PRINT_ENTRY("fork","%d %d",
1661			    ev.pl_u.pl_f.pl_oldpid,
1662			    ev.pl_u.pl_f.pl_newpid);
1663			break;
1664		case PMCLOG_TYPE_USERDATA:
1665			PMCSTAT_PRINT_ENTRY("userdata","0x%x",
1666			    ev.pl_u.pl_u.pl_userdata);
1667			break;
1668		case PMCLOG_TYPE_SYSEXIT:
1669			PMCSTAT_PRINT_ENTRY("exit","%d",
1670			    ev.pl_u.pl_se.pl_pid);
1671			break;
1672		default:
1673			fprintf(args.pa_printfile, "unknown event (type %d).\n",
1674			    ev.pl_type);
1675		}
1676	}
1677
1678	if (ev.pl_state == PMCLOG_EOF)
1679		return (PMCSTAT_FINISHED);
1680	else if (ev.pl_state ==  PMCLOG_REQUIRE_DATA)
1681		return (PMCSTAT_RUNNING);
1682
1683	errx(EX_DATAERR, "ERROR: event parsing failed "
1684	    "(record %jd, offset 0x%jx).",
1685	    (uintmax_t) ev.pl_count + 1, ev.pl_offset);
1686	/*NOTREACHED*/
1687}
1688
1689/*
1690 * Public Interfaces.
1691 */
1692
1693/*
1694 * Close a logfile, after first flushing all in-module queued data.
1695 */
1696
1697int
1698pmcstat_close_log(void)
1699{
1700	/* If a local logfile is configured ask the kernel to stop
1701	 * and flush data. Kernel will close the file when data is flushed
1702	 * so keep the status to EXITING.
1703	 */
1704	if (args.pa_logfd != -1) {
1705		if (pmc_flush_logfile() < 0)
1706			err(EX_OSERR, "ERROR: logging failed");
1707	}
1708
1709	return (args.pa_flags & FLAG_HAS_PIPE ? PMCSTAT_EXITING :
1710	    PMCSTAT_FINISHED);
1711}
1712
1713
1714
/*
 * Open a log file, for reading or writing.
 *
 * 'path' selects the kind of log:
 *   "-"        standard input (reading) or standard output (writing);
 *   host:port  a TCP socket, when 'path' contains a ':' and does not
 *              start with '/' or '.'.  For reading, the address is
 *              bound and a single connection is accepted; for
 *              writing, a connection is made to it;
 *   otherwise  a regular file, truncated or created when writing.
 *
 * Returns the descriptor of the opened log.  Any failure that
 * produces an error description terminates the program via errx().
 */

int
pmcstat_open_log(const char *path, int mode)
{
	int error, fd, cfd;
	size_t hlen;
	const char *p, *errstr;
	struct addrinfo hints, *res, *res0;
	char hostname[MAXHOSTNAMELEN];

	errstr = NULL;
	fd = -1;

	if (path[0] == '-' && path[1] == '\0')
		fd = (mode == PMCSTAT_OPEN_FOR_READ) ? 0 : 1;
	else if (path[0] != '/' &&
	    path[0] != '.' && strchr(path, ':') != NULL) {

		/* Split at the last ':' into host name and service. */
		p = strrchr(path, ':');
		hlen = p - path;
		if (p == path || hlen >= sizeof(hostname)) {
			errstr = strerror(EINVAL);
			goto done;
		}

		assert(hlen < sizeof(hostname));
		/* Length is known and bounded: copy and terminate. */
		(void) memcpy(hostname, path, hlen);
		hostname[hlen] = '\0';

		(void) memset(&hints, 0, sizeof(hints));
		hints.ai_family = AF_UNSPEC;
		hints.ai_socktype = SOCK_STREAM;
		if ((error = getaddrinfo(hostname, p+1, &hints, &res0)) != 0) {
			errstr = gai_strerror(error);
			goto done;
		}

		/* Try each returned address until one works. */
		fd = -1;
		for (res = res0; res; res = res->ai_next) {
			if ((fd = socket(res->ai_family, res->ai_socktype,
			    res->ai_protocol)) < 0) {
				errstr = strerror(errno);
				continue;
			}
			if (mode == PMCSTAT_OPEN_FOR_READ) {
				/*
				 * A failed listen() is handled like a
				 * failed bind(): try the next address.
				 */
				if (bind(fd, res->ai_addr,
				    res->ai_addrlen) < 0 ||
				    listen(fd, 1) < 0) {
					errstr = strerror(errno);
					(void) close(fd);
					fd = -1;
					continue;
				}
				cfd = accept(fd, NULL, NULL);
				/*
				 * Capture the accept() error before
				 * close() gets a chance to overwrite
				 * errno.
				 */
				if (cfd < 0)
					errstr = strerror(errno);
				(void) close(fd);
				if (cfd < 0) {
					fd = -1;
					break;
				}
				fd = cfd;
			} else {
				if (connect(fd, res->ai_addr,
				    res->ai_addrlen) < 0) {
					errstr = strerror(errno);
					(void) close(fd);
					fd = -1;
					continue;
				}
			}
			/* Success: forget errors from earlier addresses. */
			errstr = NULL;
			break;
		}
		freeaddrinfo(res0);

	} else if ((fd = open(path, mode == PMCSTAT_OPEN_FOR_READ ?
		    O_RDONLY : (O_WRONLY|O_CREAT|O_TRUNC),
		    S_IRUSR|S_IWUSR|S_IRGRP|S_IROTH)) < 0)
			errstr = strerror(errno);

  done:
	if (errstr)
		errx(EX_OSERR, "ERROR: Cannot open \"%s\" for %s: %s.", path,
		    (mode == PMCSTAT_OPEN_FOR_READ ? "reading" : "writing"),
		    errstr);

	return (fd);
}
1817
1818/*
1819 * Process a log file in offline analysis mode.
1820 */
1821
1822int
1823pmcstat_process_log(void)
1824{
1825
1826	/*
1827	 * If analysis has not been asked for, just print the log to
1828	 * the current output file.
1829	 */
1830	if (args.pa_flags & FLAG_DO_PRINT)
1831		return (pmcstat_print_log());
1832	else
1833		return (pmcstat_analyze_log());
1834}
1835
1836/*
1837 * Refresh top display.
1838 */
1839
1840static void
1841pmcstat_refresh_top(void)
1842{
1843	int v_attrs;
1844	float v;
1845	char pmcname[40];
1846	struct pmcstat_pmcrecord *pmcpr;
1847
1848	/* If in pause mode do not refresh display. */
1849	if (pmcstat_pause)
1850		return;
1851
1852	/* Wait until PMC pop in the log. */
1853	pmcpr = pmcstat_pmcindex_to_pmcr(pmcstat_pmcinfilter);
1854	if (pmcpr == NULL)
1855		return;
1856
1857	/* Format PMC name. */
1858	if (pmcstat_mergepmc)
1859		snprintf(pmcname, sizeof(pmcname), "[%s]",
1860		    pmcstat_string_unintern(pmcpr->pr_pmcname));
1861	else
1862		snprintf(pmcname, sizeof(pmcname), "%s.%d",
1863		    pmcstat_string_unintern(pmcpr->pr_pmcname),
1864		    pmcstat_pmcinfilter);
1865
1866	/* Format samples count. */
1867	if (ps_samples_period > 0)
1868		v = (pmcpr->pr_samples * 100.0) / ps_samples_period;
1869	else
1870		v = 0.;
1871	v_attrs = PMCSTAT_ATTRPERCENT(v);
1872
1873	PMCSTAT_PRINTBEGIN();
1874	PMCSTAT_PRINTW("PMC: %s Samples: %u ",
1875	    pmcname,
1876	    pmcpr->pr_samples);
1877	PMCSTAT_ATTRON(v_attrs);
1878	PMCSTAT_PRINTW("(%.1f%%) ", v);
1879	PMCSTAT_ATTROFF(v_attrs);
1880	PMCSTAT_PRINTW(", %u unresolved\n\n",
1881	    pmcpr->pr_dubious_frames);
1882	if (plugins[args.pa_plugin].pl_topdisplay != NULL)
1883		plugins[args.pa_plugin].pl_topdisplay();
1884	PMCSTAT_PRINTEND();
1885}
1886
1887/*
1888 * Find the next pmc index to display.
1889 */
1890
1891static void
1892pmcstat_changefilter(void)
1893{
1894	int pmcin;
1895	struct pmcstat_pmcrecord *pmcr;
1896
1897	/*
1898	 * Find the next merge target.
1899	 */
1900	if (pmcstat_mergepmc) {
1901		pmcin = pmcstat_pmcinfilter;
1902
1903		do {
1904			pmcr = pmcstat_pmcindex_to_pmcr(pmcstat_pmcinfilter);
1905			if (pmcr == NULL || pmcr == pmcr->pr_merge)
1906				break;
1907
1908			pmcstat_pmcinfilter++;
1909			if (pmcstat_pmcinfilter >= pmcstat_npmcs)
1910				pmcstat_pmcinfilter = 0;
1911
1912		} while (pmcstat_pmcinfilter != pmcin);
1913	}
1914}
1915
1916/*
1917 * Top mode keypress.
1918 */
1919
1920int
1921pmcstat_keypress_log(void)
1922{
1923	int c, ret = 0;
1924	WINDOW *w;
1925
1926	w = newwin(1, 0, 1, 0);
1927	c = wgetch(w);
1928	wprintw(w, "Key: %c => ", c);
1929	switch (c) {
1930	case 'c':
1931		wprintw(w, "enter mode 'd' or 'a' => ");
1932		c = wgetch(w);
1933		if (c == 'd') {
1934			args.pa_topmode = PMCSTAT_TOP_DELTA;
1935			wprintw(w, "switching to delta mode");
1936		} else {
1937			args.pa_topmode = PMCSTAT_TOP_ACCUM;
1938			wprintw(w, "switching to accumulation mode");
1939		}
1940		break;
1941	case 'm':
1942		pmcstat_mergepmc = !pmcstat_mergepmc;
1943		/*
1944		 * Changing merge state require data reset.
1945		 */
1946		if (plugins[args.pa_plugin].pl_shutdown != NULL)
1947			plugins[args.pa_plugin].pl_shutdown(NULL);
1948		pmcstat_stats_reset(0);
1949		if (plugins[args.pa_plugin].pl_init != NULL)
1950			plugins[args.pa_plugin].pl_init();
1951
1952		/* Update filter to be on a merge target. */
1953		pmcstat_changefilter();
1954		wprintw(w, "merge PMC %s", pmcstat_mergepmc ? "on" : "off");
1955		break;
1956	case 'n':
1957		/* Close current plugin. */
1958		if (plugins[args.pa_plugin].pl_shutdown != NULL)
1959			plugins[args.pa_plugin].pl_shutdown(NULL);
1960
1961		/* Find next top display available. */
1962		do {
1963			args.pa_plugin++;
1964			if (plugins[args.pa_plugin].pl_name == NULL)
1965				args.pa_plugin = 0;
1966		} while (plugins[args.pa_plugin].pl_topdisplay == NULL);
1967
1968		/* Open new plugin. */
1969		pmcstat_stats_reset(0);
1970		if (plugins[args.pa_plugin].pl_init != NULL)
1971			plugins[args.pa_plugin].pl_init();
1972		wprintw(w, "switching to plugin %s",
1973		    plugins[args.pa_plugin].pl_name);
1974		break;
1975	case 'p':
1976		pmcstat_pmcinfilter++;
1977		if (pmcstat_pmcinfilter >= pmcstat_npmcs)
1978			pmcstat_pmcinfilter = 0;
1979		pmcstat_changefilter();
1980		wprintw(w, "switching to PMC %s.%d",
1981		    pmcstat_pmcindex_to_name(pmcstat_pmcinfilter),
1982		    pmcstat_pmcinfilter);
1983		break;
1984	case ' ':
1985		pmcstat_pause = !pmcstat_pause;
1986		if (pmcstat_pause)
1987			wprintw(w, "pause => press space again to continue");
1988		break;
1989	case 'q':
1990		wprintw(w, "exiting...");
1991		ret = 1;
1992		break;
1993	default:
1994		if (plugins[args.pa_plugin].pl_topkeypress != NULL)
1995			if (plugins[args.pa_plugin].pl_topkeypress(c, w))
1996				ret = 1;
1997	}
1998
1999	wrefresh(w);
2000	delwin(w);
2001	return ret;
2002}
2003
2004
2005/*
2006 * Top mode display.
2007 */
2008
2009void
2010pmcstat_display_log(void)
2011{
2012
2013	pmcstat_refresh_top();
2014
2015	/* Reset everythings if delta mode. */
2016	if (args.pa_topmode == PMCSTAT_TOP_DELTA) {
2017		if (plugins[args.pa_plugin].pl_shutdown != NULL)
2018			plugins[args.pa_plugin].pl_shutdown(NULL);
2019		pmcstat_stats_reset(0);
2020		if (plugins[args.pa_plugin].pl_init != NULL)
2021			plugins[args.pa_plugin].pl_init();
2022	}
2023
2024}
2025
2026/*
2027 * Configure a plugins.
2028 */
2029
2030void
2031pmcstat_pluginconfigure_log(char *opt)
2032{
2033
2034	if (strncmp(opt, "threshold=", 10) == 0) {
2035		pmcstat_threshold = atof(opt+10);
2036	} else {
2037		if (plugins[args.pa_plugin].pl_configure != NULL) {
2038			if (!plugins[args.pa_plugin].pl_configure(opt))
2039				err(EX_USAGE,
2040				    "ERROR: unknown option <%s>.", opt);
2041		}
2042	}
2043}
2044
2045/*
2046 * Initialize module.
2047 */
2048
2049void
2050pmcstat_initialize_logging(void)
2051{
2052	int i;
2053
2054	/* use a convenient format for 'ldd' output */
2055	if (setenv("LD_TRACE_LOADED_OBJECTS_FMT1","%o \"%p\" %x\n",1) != 0)
2056		err(EX_OSERR, "ERROR: Cannot setenv");
2057
2058	/* Initialize hash tables */
2059	pmcstat_string_initialize();
2060	for (i = 0; i < PMCSTAT_NHASH; i++) {
2061		LIST_INIT(&pmcstat_image_hash[i]);
2062		LIST_INIT(&pmcstat_process_hash[i]);
2063	}
2064
2065	/*
2066	 * Create a fake 'process' entry for the kernel with pid -1.
2067	 * hwpmc(4) will subsequently inform us about where the kernel
2068	 * and any loaded kernel modules are mapped.
2069	 */
2070	if ((pmcstat_kernproc = pmcstat_process_lookup((pid_t) -1,
2071		 PMCSTAT_ALLOCATE)) == NULL)
2072		err(EX_OSERR, "ERROR: Cannot initialize logging");
2073
2074	/* PMC count. */
2075	pmcstat_npmcs = 0;
2076
2077	/* Merge PMC with same name. */
2078	pmcstat_mergepmc = args.pa_mergepmc;
2079
2080	/*
2081	 * Initialize plugins
2082	 */
2083
2084	if (plugins[args.pa_pplugin].pl_init != NULL)
2085		plugins[args.pa_pplugin].pl_init();
2086	if (plugins[args.pa_plugin].pl_init != NULL)
2087		plugins[args.pa_plugin].pl_init();
2088}
2089
2090/*
2091 * Shutdown module.
2092 */
2093
2094void
2095pmcstat_shutdown_logging(void)
2096{
2097	int i;
2098	FILE *mf;
2099	struct pmcstat_image *pi, *pitmp;
2100	struct pmcstat_process *pp, *pptmp;
2101	struct pmcstat_pcmap *ppm, *ppmtmp;
2102
2103	/* determine where to send the map file */
2104	mf = NULL;
2105	if (args.pa_mapfilename != NULL)
2106		mf = (strcmp(args.pa_mapfilename, "-") == 0) ?
2107		    args.pa_printfile : fopen(args.pa_mapfilename, "w");
2108
2109	if (mf == NULL && args.pa_flags & FLAG_DO_GPROF &&
2110	    args.pa_verbosity >= 2)
2111		mf = args.pa_printfile;
2112
2113	if (mf)
2114		(void) fprintf(mf, "MAP:\n");
2115
2116	/*
2117	 * Shutdown the plugins
2118	 */
2119
2120	if (plugins[args.pa_plugin].pl_shutdown != NULL)
2121		plugins[args.pa_plugin].pl_shutdown(mf);
2122	if (plugins[args.pa_pplugin].pl_shutdown != NULL)
2123		plugins[args.pa_pplugin].pl_shutdown(mf);
2124
2125	for (i = 0; i < PMCSTAT_NHASH; i++) {
2126		LIST_FOREACH_SAFE(pi, &pmcstat_image_hash[i], pi_next,
2127		    pitmp) {
2128			if (plugins[args.pa_plugin].pl_shutdownimage != NULL)
2129				plugins[args.pa_plugin].pl_shutdownimage(pi);
2130			if (plugins[args.pa_pplugin].pl_shutdownimage != NULL)
2131				plugins[args.pa_pplugin].pl_shutdownimage(pi);
2132
2133			free(pi->pi_symbols);
2134			if (pi->pi_addr2line != NULL)
2135				pclose(pi->pi_addr2line);
2136			LIST_REMOVE(pi, pi_next);
2137			free(pi);
2138		}
2139
2140		LIST_FOREACH_SAFE(pp, &pmcstat_process_hash[i], pp_next,
2141		    pptmp) {
2142			TAILQ_FOREACH_SAFE(ppm, &pp->pp_map, ppm_next, ppmtmp) {
2143				TAILQ_REMOVE(&pp->pp_map, ppm, ppm_next);
2144				free(ppm);
2145			}
2146			LIST_REMOVE(pp, pp_next);
2147			free(pp);
2148		}
2149	}
2150
2151	pmcstat_string_shutdown();
2152
2153	/*
2154	 * Print errors unless -q was specified.  Print all statistics
2155	 * if verbosity > 1.
2156	 */
2157#define	PRINT(N,V) do {							\
2158		if (pmcstat_stats.ps_##V || args.pa_verbosity >= 2)	\
2159			(void) fprintf(args.pa_printfile, " %-40s %d\n",\
2160			    N, pmcstat_stats.ps_##V);			\
2161	} while (0)
2162
2163	if (args.pa_verbosity >= 1 && (args.pa_flags & FLAG_DO_ANALYSIS)) {
2164		(void) fprintf(args.pa_printfile, "CONVERSION STATISTICS:\n");
2165		PRINT("#exec/a.out", exec_aout);
2166		PRINT("#exec/elf", exec_elf);
2167		PRINT("#exec/unknown", exec_indeterminable);
2168		PRINT("#exec handling errors", exec_errors);
2169		PRINT("#samples/total", samples_total);
2170		PRINT("#samples/unclaimed", samples_unknown_offset);
2171		PRINT("#samples/unknown-object", samples_indeterminable);
2172		PRINT("#callchain/dubious-frames", callchain_dubious_frames);
2173	}
2174
2175	if (mf)
2176		(void) fclose(mf);
2177}
2178