diff options
Diffstat (limited to 'usr.sbin/pmcstat/pmcpl_callgraph.c')
| -rw-r--r-- | usr.sbin/pmcstat/pmcpl_callgraph.c | 708 | 
1 files changed, 708 insertions, 0 deletions
diff --git a/usr.sbin/pmcstat/pmcpl_callgraph.c b/usr.sbin/pmcstat/pmcpl_callgraph.c new file mode 100644 index 000000000000..63684f800bdc --- /dev/null +++ b/usr.sbin/pmcstat/pmcpl_callgraph.c @@ -0,0 +1,708 @@ +/*- + * SPDX-License-Identifier: BSD-2-Clause + * + * Copyright (c) 2005-2007, Joseph Koshy + * Copyright (c) 2007 The FreeBSD Foundation + * All rights reserved. + * + * Portions of this software were developed by A. Joseph Koshy under + * sponsorship from the FreeBSD Foundation and Google, Inc. + * + * Redistribution and use in source and binary forms, with or without + * modification, are permitted provided that the following conditions + * are met: + * 1. Redistributions of source code must retain the above copyright + *    notice, this list of conditions and the following disclaimer. + * 2. Redistributions in binary form must reproduce the above copyright + *    notice, this list of conditions and the following disclaimer in the + *    documentation and/or other materials provided with the distribution. + * + * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND + * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE + * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE + * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE + * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL + * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS + * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) + * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT + * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY + * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF + * SUCH DAMAGE. + */ + +/* + * Transform a hwpmc(4) log into human readable form, and into + * gprof(1) compatible profiles. + */ + +#include <sys/param.h> +#include <sys/endian.h> +#include <sys/gmon.h> +#include <sys/imgact_aout.h> +#include <sys/imgact_elf.h> +#include <sys/mman.h> +#include <sys/pmc.h> +#include <sys/queue.h> +#include <sys/socket.h> +#include <sys/stat.h> +#include <sys/wait.h> + +#include <netinet/in.h> + +#include <assert.h> +#include <curses.h> +#include <err.h> +#include <errno.h> +#include <fcntl.h> +#include <gelf.h> +#include <inttypes.h> +#include <libgen.h> +#include <limits.h> +#include <netdb.h> +#include <pmc.h> +#include <pmclog.h> +#include <sysexits.h> +#include <stdint.h> +#include <stdio.h> +#include <stdlib.h> +#include <string.h> +#include <unistd.h> + +#include "pmcstat.h" +#include "pmcstat_log.h" +#include "pmcstat_top.h" +#include "pmcpl_callgraph.h" + +#define	min(A,B)		((A) < (B) ? (A) : (B)) +#define	max(A,B)		((A) > (B) ? (A) : (B)) + +/* Get the sample value in percent related to nsamples. */ +#define PMCPL_CG_COUNTP(a) \ +	((a)->pcg_count * 100.0 / nsamples) + +/* + * The toplevel CG nodes (i.e., with rank == 0) are placed in a hash table. + */ + +struct pmcstat_cgnode_hash_list pmcstat_cgnode_hash[PMCSTAT_NHASH]; +int pmcstat_cgnode_hash_count; + +static pmcstat_interned_string pmcstat_previous_filename_printed; + +static struct pmcstat_cgnode * +pmcstat_cgnode_allocate(struct pmcstat_image *image, uintfptr_t pc) +{ +	struct pmcstat_cgnode *cg; + +	if ((cg = malloc(sizeof(*cg))) == NULL) +		err(EX_OSERR, "ERROR: Cannot allocate callgraph node"); + +	cg->pcg_image = image; +	cg->pcg_func = pc; + +	cg->pcg_count = 0; +	cg->pcg_nchildren = 0; +	LIST_INIT(&cg->pcg_children); + +	return (cg); +} + +/* + * Free a node and its children. + */ +static void +pmcstat_cgnode_free(struct pmcstat_cgnode *cg) +{ +	struct pmcstat_cgnode *cgc, *cgtmp; + +	LIST_FOREACH_SAFE(cgc, &cg->pcg_children, pcg_sibling, cgtmp) +		pmcstat_cgnode_free(cgc); +	free(cg); +} + +/* + * Look for a callgraph node associated with pmc `pmcid' in the global + * hash table that corresponds to the given `pc' value in the process + * `pp'. + */ +static struct pmcstat_cgnode * +pmcstat_cgnode_hash_lookup_pc(struct pmcstat_process *pp, pmc_id_t pmcid, +    uintfptr_t pc, int usermode) +{ +	struct pmcstat_pcmap *ppm; +	struct pmcstat_symbol *sym; +	struct pmcstat_image *image; +	struct pmcstat_cgnode *cg; +	struct pmcstat_cgnode_hash *h; +	uintfptr_t loadaddress; +	unsigned int i, hash; + +	ppm = pmcstat_process_find_map(usermode ? pp : pmcstat_kernproc, pc); +	if (ppm == NULL) +		return (NULL); + +	image = ppm->ppm_image; + +	loadaddress = ppm->ppm_lowpc + image->pi_vaddr - image->pi_start; +	pc -= loadaddress;	/* Convert to an offset in the image. */ + +	/* +	 * Try determine the function at this offset.  If we can't +	 * find a function round leave the `pc' value alone. +	 */ +	if (!(args.pa_flags & (FLAG_SKIP_TOP_FN_RES | FLAG_SHOW_OFFSET))) { +		if ((sym = pmcstat_symbol_search(image, pc)) != NULL) +			pc = sym->ps_start; +		else +			pmcstat_stats.ps_samples_unknown_function++; +	} + +	for (hash = i = 0; i < sizeof(uintfptr_t); i++) +		hash += (pc >> i) & 0xFF; + +	hash &= PMCSTAT_HASH_MASK; + +	cg = NULL; +	LIST_FOREACH(h, &pmcstat_cgnode_hash[hash], pch_next) +	{ +		if (h->pch_pmcid != pmcid) +			continue; + +		cg = h->pch_cgnode; + +		assert(cg != NULL); + +		if (cg->pcg_image == image && cg->pcg_func == pc) +			return (cg); +	} + +	/* +	 * We haven't seen this (pmcid, pc) tuple yet, so allocate a +	 * new callgraph node and a new hash table entry for it. +	 */ +	cg = pmcstat_cgnode_allocate(image, pc); +	if ((h = malloc(sizeof(*h))) == NULL) +		err(EX_OSERR, "ERROR: Could not allocate callgraph node"); + +	h->pch_pmcid = pmcid; +	h->pch_cgnode = cg; +	LIST_INSERT_HEAD(&pmcstat_cgnode_hash[hash], h, pch_next); + +	pmcstat_cgnode_hash_count++; + +	return (cg); +} + +/* + * Compare two callgraph nodes for sorting. + */ +static int +pmcstat_cgnode_compare(const void *a, const void *b) +{ +	const struct pmcstat_cgnode *const *pcg1, *const *pcg2, *cg1, *cg2; + +	pcg1 = (const struct pmcstat_cgnode *const *) a; +	cg1 = *pcg1; +	pcg2 = (const struct pmcstat_cgnode *const *) b; +	cg2 = *pcg2; + +	/* Sort in reverse order */ +	if (cg1->pcg_count < cg2->pcg_count) +		return (1); +	if (cg1->pcg_count > cg2->pcg_count) +		return (-1); +	return (0); +} + +/* + * Find (allocating if a needed) a callgraph node in the given + * parent with the same (image, pcoffset) pair. + */ + +static struct pmcstat_cgnode * +pmcstat_cgnode_find(struct pmcstat_cgnode *parent, struct pmcstat_image *image, +    uintfptr_t pcoffset) +{ +	struct pmcstat_cgnode *child; + +	LIST_FOREACH(child, &parent->pcg_children, pcg_sibling) { +		if (child->pcg_image == image && +		    child->pcg_func == pcoffset) +			return (child); +	} + +	/* +	 * Allocate a new structure. +	 */ + +	child = pmcstat_cgnode_allocate(image, pcoffset); + +	/* +	 * Link it into the parent. +	 */ +	LIST_INSERT_HEAD(&parent->pcg_children, child, pcg_sibling); +	parent->pcg_nchildren++; + +	return (child); +} + +/* + * Print one callgraph node.  The output format is: + * + * indentation %(parent's samples) #nsamples function@object + */ +static void +pmcstat_cgnode_print(struct pmcstat_cgnode *cg, int depth, uint32_t total) +{ +	uint32_t n; +	const char *space; +	struct pmcstat_symbol *sym; +	struct pmcstat_cgnode **sortbuffer, **cgn, *pcg; + +	space = " "; + +	if (depth > 0) +		(void) fprintf(args.pa_graphfile, "%*s", depth, space); + +	if (cg->pcg_count == total) +		(void) fprintf(args.pa_graphfile, "100.0%% "); +	else +		(void) fprintf(args.pa_graphfile, "%05.2f%% ", +		    100.0 * cg->pcg_count / total); + +	n = fprintf(args.pa_graphfile, " [%u] ", cg->pcg_count); + +	/* #samples is a 12 character wide field. */ +	if (n < 12) +		(void) fprintf(args.pa_graphfile, "%*s", 12 - n, space); + +	if (depth > 0) +		(void) fprintf(args.pa_graphfile, "%*s", depth, space); + +	sym = pmcstat_symbol_search(cg->pcg_image, cg->pcg_func); +	if (sym) +		(void) fprintf(args.pa_graphfile, "%s", +		    pmcstat_string_unintern(sym->ps_name)); +	else +		(void) fprintf(args.pa_graphfile, "%p", +		    (void *) (cg->pcg_image->pi_vaddr + cg->pcg_func)); + +	if (pmcstat_previous_filename_printed != +	    cg->pcg_image->pi_fullpath) { +		pmcstat_previous_filename_printed = cg->pcg_image->pi_fullpath; +		(void) fprintf(args.pa_graphfile, " @ %s\n", +		    pmcstat_string_unintern( +		    pmcstat_previous_filename_printed)); +	} else +		(void) fprintf(args.pa_graphfile, "\n"); + +	if (cg->pcg_nchildren == 0) +		return; + +	if ((sortbuffer = (struct pmcstat_cgnode **) +		malloc(sizeof(struct pmcstat_cgnode *) * +		    cg->pcg_nchildren)) == NULL) +		err(EX_OSERR, "ERROR: Cannot print callgraph"); +	cgn = sortbuffer; + +	LIST_FOREACH(pcg, &cg->pcg_children, pcg_sibling) +	    *cgn++ = pcg; + +	assert(cgn - sortbuffer == (int) cg->pcg_nchildren); + +	qsort(sortbuffer, cg->pcg_nchildren, sizeof(struct pmcstat_cgnode *), +	    pmcstat_cgnode_compare); + +	for (cgn = sortbuffer, n = 0; n < cg->pcg_nchildren; n++, cgn++) +		pmcstat_cgnode_print(*cgn, depth+1, cg->pcg_count); + +	free(sortbuffer); +} + +/* + * Record a callchain. + */ + +void +pmcpl_cg_process(struct pmcstat_process *pp, struct pmcstat_pmcrecord *pmcr, +    uint32_t nsamples, uintfptr_t *cc, int usermode, uint32_t cpu) +{ +	uintfptr_t pc, loadaddress; +	uint32_t n; +	struct pmcstat_image *image; +	struct pmcstat_pcmap *ppm; +	struct pmcstat_symbol *sym; +	struct pmcstat_cgnode *parent, *child; +	struct pmcstat_process *km; +	pmc_id_t pmcid; + +	(void) cpu; + +	/* +	 * Find the callgraph node recorded in the global hash table +	 * for this (pmcid, pc). +	 */ + +	pc = cc[0]; +	pmcid = pmcr->pr_pmcid; +	child = parent = pmcstat_cgnode_hash_lookup_pc(pp, pmcid, pc, usermode); +	if (parent == NULL) { +		pmcstat_stats.ps_callchain_dubious_frames++; +		pmcr->pr_dubious_frames++; +		return; +	} + +	parent->pcg_count++; + +	/* +	 * For each return address in the call chain record, subject +	 * to the maximum depth desired. +	 * - Find the image associated with the sample.  Stop if there +	 *   is no valid image at that address. +	 * - Find the function that overlaps the return address. +	 * - If found: use the start address of the function. +	 *   If not found (say an object's symbol table is not present or +	 *   is incomplete), round down to the gprof bucket granularity. +	 * - Convert return virtual address to an offset in the image. +	 * - Look for a child with the same {offset,image} tuple, +	 *   inserting one if needed. +	 * - Increment the count of occurrences of the child. +	 */ +	km = pmcstat_kernproc; + +	for (n = 1; n < (uint32_t) args.pa_graphdepth && n < nsamples; n++, +	    parent = child) { +		pc = cc[n]; + +		ppm = pmcstat_process_find_map(usermode ? pp : km, pc); +		if (ppm == NULL) { +			/* Detect full frame capture (kernel + user). */ +			if (!usermode) { +				ppm = pmcstat_process_find_map(pp, pc); +				if (ppm != NULL) +					km = pp; +			} +		} +		if (ppm == NULL) +			continue; + +		image = ppm->ppm_image; +		loadaddress = ppm->ppm_lowpc + image->pi_vaddr - +		    image->pi_start; +		pc -= loadaddress; + +		if ((sym = pmcstat_symbol_search(image, pc)) != NULL) +			pc = sym->ps_start; + +		child = pmcstat_cgnode_find(parent, image, pc); +		child->pcg_count++; +	} +} + +/* + * Printing a callgraph for a PMC. + */ +static void +pmcstat_callgraph_print_for_pmcid(struct pmcstat_pmcrecord *pmcr) +{ +	int n, nentries; +	uint32_t nsamples; +	pmc_id_t pmcid; +	struct pmcstat_cgnode **sortbuffer, **cgn; +	struct pmcstat_cgnode_hash *pch; + +	/* +	 * We pull out all callgraph nodes in the top-level hash table +	 * with a matching PMC id.  We then sort these based on the +	 * frequency of occurrence.  Each callgraph node is then +	 * printed. +	 */ + +	nsamples = 0; +	pmcid = pmcr->pr_pmcid; +	if ((sortbuffer = (struct pmcstat_cgnode **) +	    malloc(sizeof(struct pmcstat_cgnode *) * +	    pmcstat_cgnode_hash_count)) == NULL) +		err(EX_OSERR, "ERROR: Cannot sort callgraph"); +	cgn = sortbuffer; + +	for (n = 0; n < PMCSTAT_NHASH; n++) +		LIST_FOREACH(pch, &pmcstat_cgnode_hash[n], pch_next) +		    if (pch->pch_pmcid == pmcid) { +			    nsamples += pch->pch_cgnode->pcg_count; +			    *cgn++ = pch->pch_cgnode; +		    } + +	nentries = cgn - sortbuffer; +	assert(nentries <= pmcstat_cgnode_hash_count); + +	if (nentries == 0) { +		free(sortbuffer); +		return; +	} + +	qsort(sortbuffer, nentries, sizeof(struct pmcstat_cgnode *), +	    pmcstat_cgnode_compare); + +	(void) fprintf(args.pa_graphfile, +	    "@ %s [%u samples]\n\n", +	    pmcstat_string_unintern(pmcr->pr_pmcname), +	    nsamples); + +	for (cgn = sortbuffer, n = 0; n < nentries; n++, cgn++) { +		pmcstat_previous_filename_printed = NULL; +		pmcstat_cgnode_print(*cgn, 0, nsamples); +		(void) fprintf(args.pa_graphfile, "\n"); +	} + +	free(sortbuffer); +} + +/* + * Print out callgraphs. + */ + +static void +pmcstat_callgraph_print(void) +{ +	struct pmcstat_pmcrecord *pmcr; + +	LIST_FOREACH(pmcr, &pmcstat_pmcs, pr_next) +	    pmcstat_callgraph_print_for_pmcid(pmcr); +} + +static void +pmcstat_cgnode_topprint(struct pmcstat_cgnode *cg, +    int depth __unused, uint32_t nsamples) +{ +	int v_attrs, vs_len, ns_len, width, len, n, nchildren; +	float v; +	char ns[30], vs[10]; +	struct pmcstat_symbol *sym; +	struct pmcstat_cgnode **sortbuffer, **cgn, *pcg; + +	/* Format value. */ +	v = PMCPL_CG_COUNTP(cg); +	snprintf(vs, sizeof(vs), "%.1f", v); +	v_attrs = PMCSTAT_ATTRPERCENT(v); + +	/* Format name. */ +	sym = pmcstat_symbol_search(cg->pcg_image, cg->pcg_func); +	if (sym == NULL) { +		snprintf(ns, sizeof(ns), "%p", +		    (void *)(cg->pcg_image->pi_vaddr + cg->pcg_func)); +	} else { +		switch (args.pa_flags & (FLAG_SKIP_TOP_FN_RES | FLAG_SHOW_OFFSET)) { +		case FLAG_SKIP_TOP_FN_RES | FLAG_SHOW_OFFSET: +		case FLAG_SKIP_TOP_FN_RES: +			snprintf(ns, sizeof(ns), "%p", +			    (void *)(cg->pcg_image->pi_vaddr + cg->pcg_func)); +			break; +		case FLAG_SHOW_OFFSET: +			snprintf(ns, sizeof(ns), "%s+%#0" PRIx64, +			    pmcstat_string_unintern(sym->ps_name), +			    cg->pcg_func - sym->ps_start); +			break; +		default: +			snprintf(ns, sizeof(ns), "%s", +			    pmcstat_string_unintern(sym->ps_name)); +			break; +		} +	} + +	PMCSTAT_ATTRON(v_attrs); +	PMCSTAT_PRINTW("%5.5s", vs); +	PMCSTAT_ATTROFF(v_attrs); +	PMCSTAT_PRINTW(" %-10.10s %-30.30s", +	    pmcstat_string_unintern(cg->pcg_image->pi_name), +	    ns); + +	nchildren = cg->pcg_nchildren; +	if (nchildren == 0) { +		PMCSTAT_PRINTW("\n"); +		return; +	} + +	width = pmcstat_displaywidth - 40; + +	if ((sortbuffer = (struct pmcstat_cgnode **) +		malloc(sizeof(struct pmcstat_cgnode *) * +		    nchildren)) == NULL) +		err(EX_OSERR, "ERROR: Cannot print callgraph"); +	cgn = sortbuffer; + +	LIST_FOREACH(pcg, &cg->pcg_children, pcg_sibling) +	    *cgn++ = pcg; + +	assert(cgn - sortbuffer == (int)nchildren); + +	qsort(sortbuffer, nchildren, sizeof(struct pmcstat_cgnode *), +	    pmcstat_cgnode_compare); + +	/* Count how many callers. */ +	for (cgn = sortbuffer, n = 0; n < nchildren; n++, cgn++) { +		pcg = *cgn; + +		v = PMCPL_CG_COUNTP(pcg); +		if (v < pmcstat_threshold) +			break; +	} +	nchildren = n; + +	for (cgn = sortbuffer, n = 0; n < nchildren; n++, cgn++) { +		pcg = *cgn; + +		/* Format value. */ +		if (nchildren > 1) { +			v = PMCPL_CG_COUNTP(pcg); +			vs_len = snprintf(vs, sizeof(vs), ":%.1f", v); +			v_attrs = PMCSTAT_ATTRPERCENT(v); +		} else +			vs_len = 0; + +		/* Format name. */ +		sym = pmcstat_symbol_search(pcg->pcg_image, pcg->pcg_func); +		if (sym != NULL) { +			ns_len = snprintf(ns, sizeof(ns), "%s", +			    pmcstat_string_unintern(sym->ps_name)); +		} else +			ns_len = snprintf(ns, sizeof(ns), "%p", +			    (void *)pcg->pcg_func); + +		len = ns_len + vs_len + 1; +		if (width - len < 0) { +			PMCSTAT_PRINTW(" ..."); +			break; +		} +		width -= len; + +		PMCSTAT_PRINTW(" %s", ns); +		if (nchildren > 1) { +			PMCSTAT_ATTRON(v_attrs); +			PMCSTAT_PRINTW("%s", vs); +			PMCSTAT_ATTROFF(v_attrs); +		} +	} +	PMCSTAT_PRINTW("\n"); +	free(sortbuffer); +} + +/* + * Top mode display. + */ + +void +pmcpl_cg_topdisplay(void) +{ +	int n, nentries; +	uint32_t nsamples; +	struct pmcstat_cgnode **sortbuffer, **cgn; +	struct pmcstat_cgnode_hash *pch; +	struct pmcstat_pmcrecord *pmcr; + +	pmcr = pmcstat_pmcindex_to_pmcr(pmcstat_pmcinfilter); +	if (!pmcr) +		err(EX_SOFTWARE, "ERROR: invalid pmcindex"); + +	/* +	 * We pull out all callgraph nodes in the top-level hash table +	 * with a matching PMC index.  We then sort these based on the +	 * frequency of occurrence.  Each callgraph node is then +	 * printed. +	 */ + +	nsamples = 0; + +	if ((sortbuffer = (struct pmcstat_cgnode **) +	    malloc(sizeof(struct pmcstat_cgnode *) * +	    pmcstat_cgnode_hash_count)) == NULL) +		err(EX_OSERR, "ERROR: Cannot sort callgraph"); +	cgn = sortbuffer; + +	for (n = 0; n < PMCSTAT_NHASH; n++) +		LIST_FOREACH(pch, &pmcstat_cgnode_hash[n], pch_next) +		    if (pmcr == NULL || pch->pch_pmcid == pmcr->pr_pmcid) { +			    nsamples += pch->pch_cgnode->pcg_count; +			    *cgn++ = pch->pch_cgnode; +		    } + +	nentries = cgn - sortbuffer; +	assert(nentries <= pmcstat_cgnode_hash_count); + +	if (nentries == 0) { +		free(sortbuffer); +		return; +	} + +	qsort(sortbuffer, nentries, sizeof(struct pmcstat_cgnode *), +	    pmcstat_cgnode_compare); + +	PMCSTAT_PRINTW("%5.5s %-10.10s %-30.30s %s\n", +	    "%SAMP", "IMAGE", "FUNCTION", "CALLERS"); + +	nentries = min(pmcstat_displayheight - 2, nentries); + +	for (cgn = sortbuffer, n = 0; n < nentries; n++, cgn++) { +		if (PMCPL_CG_COUNTP(*cgn) < pmcstat_threshold) +			break; +		pmcstat_cgnode_topprint(*cgn, 0, nsamples); +	} + +	free(sortbuffer); +} + +/* + * Handle top mode keypress. + */ + +int +pmcpl_cg_topkeypress(int c, void *arg) +{ +	WINDOW *w; + +	w = (WINDOW *)arg; + +	(void) c; (void) w; + +	return 0; +} + +int +pmcpl_cg_init(void) +{ +	int i; + +	pmcstat_cgnode_hash_count = 0; +	pmcstat_previous_filename_printed = NULL; + +	for (i = 0; i < PMCSTAT_NHASH; i++) { +		LIST_INIT(&pmcstat_cgnode_hash[i]); +	} + +	return (0); +} + +void +pmcpl_cg_shutdown(FILE *mf) +{ +	int i; +	struct pmcstat_cgnode_hash *pch, *pchtmp; + +	(void) mf; + +	if (args.pa_flags & FLAG_DO_CALLGRAPHS) +		pmcstat_callgraph_print(); + +	/* +	 * Free memory. +	 */ +	for (i = 0; i < PMCSTAT_NHASH; i++) { +		LIST_FOREACH_SAFE(pch, &pmcstat_cgnode_hash[i], pch_next, +		    pchtmp) { +			pmcstat_cgnode_free(pch->pch_cgnode); +			LIST_REMOVE(pch, pch_next); +			free(pch); +		} +	} +} +  | 
