Home | History | Annotate | Line # | Download | only in tprof
tprof_analyze.c revision 1.8.4.1
      1  1.8.4.1  perseant /*	$NetBSD: tprof_analyze.c,v 1.8.4.1 2025/08/02 05:59:00 perseant Exp $	*/
      2      1.1      maxv 
      3      1.1      maxv /*
      4      1.1      maxv  * Copyright (c) 2010,2011,2012 YAMAMOTO Takashi,
      5      1.1      maxv  * All rights reserved.
      6      1.1      maxv  *
      7      1.1      maxv  * Redistribution and use in source and binary forms, with or without
      8      1.1      maxv  * modification, are permitted provided that the following conditions
      9      1.1      maxv  * are met:
     10      1.1      maxv  * 1. Redistributions of source code must retain the above copyright
     11      1.1      maxv  *    notice, this list of conditions and the following disclaimer.
     12      1.1      maxv  * 2. Redistributions in binary form must reproduce the above copyright
     13      1.1      maxv  *    notice, this list of conditions and the following disclaimer in the
     14      1.1      maxv  *    documentation and/or other materials provided with the distribution.
     15      1.1      maxv  *
     16      1.1      maxv  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
     17      1.1      maxv  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     18      1.1      maxv  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     19      1.1      maxv  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     20      1.1      maxv  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     21      1.1      maxv  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     22      1.1      maxv  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     23      1.1      maxv  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     24      1.1      maxv  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     25      1.1      maxv  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     26      1.1      maxv  * SUCH DAMAGE.
     27      1.1      maxv  */
     28      1.1      maxv 
     29      1.1      maxv #include <sys/cdefs.h>
     30      1.1      maxv #ifndef lint
     31  1.8.4.1  perseant __RCSID("$NetBSD: tprof_analyze.c,v 1.8.4.1 2025/08/02 05:59:00 perseant Exp $");
     32      1.1      maxv #endif /* not lint */
     33      1.1      maxv 
     34      1.1      maxv #include <assert.h>
     35      1.1      maxv #include <err.h>
     36      1.1      maxv #include <errno.h>
     37      1.1      maxv #include <fcntl.h>
     38      1.1      maxv #include <gelf.h>
     39      1.1      maxv #include <inttypes.h>
     40      1.1      maxv #include <libelf.h>
     41      1.1      maxv #include <stdbool.h>
     42      1.1      maxv #include <stdlib.h>
     43      1.1      maxv #include <stdio.h>
     44      1.1      maxv #include <unistd.h>
     45      1.1      maxv #include <string.h>
     46      1.1      maxv #include <util.h>
     47      1.1      maxv #include <dev/tprof/tprof_ioctl.h>
     48      1.1      maxv #include "tprof.h"
     49      1.7       ryo #include "ksyms.h"
     50      1.1      maxv 
     51      1.1      maxv #include <sys/rbtree.h>
     52      1.1      maxv 
     53      1.1      maxv static bool filter_by_pid;
     54      1.1      maxv static pid_t target_pid;
     55      1.1      maxv static bool per_symbol;
     56      1.1      maxv 
     57      1.1      maxv struct addr {
     58      1.1      maxv 	struct rb_node node;
     59      1.1      maxv 	uint64_t addr;		/* address */
     60      1.1      maxv 	uint32_t pid;		/* process id */
     61      1.1      maxv 	uint32_t lwpid;		/* lwp id */
     62      1.1      maxv 	uint32_t cpuid;		/* cpu id */
     63      1.1      maxv 	bool in_kernel;		/* if addr is in the kernel address space */
     64      1.1      maxv 	unsigned int nsamples;	/* number of samples taken for the address */
     65      1.6       ryo 	unsigned int ncount[TPROF_MAXCOUNTERS];	/* count per event */
     66      1.1      maxv };
     67      1.1      maxv 
     68      1.1      maxv static rb_tree_t addrtree;
     69      1.1      maxv 
     70      1.1      maxv static signed int
     71      1.1      maxv addrtree_compare_key(void *ctx, const void *n1, const void *keyp)
     72      1.1      maxv {
     73      1.1      maxv 	const struct addr *a1 = n1;
     74      1.1      maxv 	const struct addr *a2 = (const struct addr *)keyp;
     75      1.1      maxv 
     76      1.1      maxv 	if (a1->addr > a2->addr) {
     77      1.1      maxv 		return 1;
     78      1.1      maxv 	} else if (a1->addr < a2->addr) {
     79      1.1      maxv 		return -1;
     80      1.1      maxv 	}
     81      1.1      maxv 	if (a1->pid > a2->pid) {
     82      1.1      maxv 		return -1;
     83      1.1      maxv 	} else if (a1->pid < a2->pid) {
     84      1.1      maxv 		return 1;
     85      1.1      maxv 	}
     86      1.1      maxv 	if (a1->lwpid > a2->lwpid) {
     87      1.1      maxv 		return -1;
     88      1.1      maxv 	} else if (a1->lwpid < a2->lwpid) {
     89      1.1      maxv 		return 1;
     90      1.1      maxv 	}
     91      1.1      maxv 	if (a1->cpuid > a2->cpuid) {
     92      1.1      maxv 		return -1;
     93      1.1      maxv 	} else if (a1->cpuid < a2->cpuid) {
     94      1.1      maxv 		return 1;
     95      1.1      maxv 	}
     96      1.1      maxv 	if (a1->in_kernel > a2->in_kernel) {
     97      1.1      maxv 		return -1;
     98      1.1      maxv 	} else if (a1->in_kernel < a2->in_kernel) {
     99      1.1      maxv 		return 1;
    100      1.1      maxv 	}
    101      1.1      maxv 	return 0;
    102      1.1      maxv }
    103      1.1      maxv 
    104      1.1      maxv static signed int
    105      1.1      maxv addrtree_compare_nodes(void *ctx, const void *n1, const void *n2)
    106      1.1      maxv {
    107      1.1      maxv 	const struct addr *a2 = n2;
    108      1.1      maxv 
    109      1.1      maxv 	return addrtree_compare_key(ctx, n1, a2);
    110      1.1      maxv }
    111      1.1      maxv 
    112      1.1      maxv static const rb_tree_ops_t addrtree_ops = {
    113      1.1      maxv 	.rbto_compare_nodes = addrtree_compare_nodes,
    114      1.1      maxv 	.rbto_compare_key = addrtree_compare_key,
    115      1.1      maxv };
    116      1.1      maxv 
    117      1.1      maxv static int
    118      1.1      maxv compare_nsamples(const void *p1, const void *p2)
    119      1.1      maxv {
    120      1.1      maxv 	const struct addr *a1 = *(const struct addr * const *)p1;
    121      1.1      maxv 	const struct addr *a2 = *(const struct addr * const *)p2;
    122      1.1      maxv 
    123      1.1      maxv 	if (a1->nsamples > a2->nsamples) {
    124      1.1      maxv 		return -1;
    125      1.1      maxv 	} else if (a1->nsamples < a2->nsamples) {
    126      1.1      maxv 		return 1;
    127      1.1      maxv 	}
    128      1.1      maxv 	return 0;
    129      1.1      maxv }
    130      1.1      maxv 
    131      1.1      maxv void
    132      1.1      maxv tprof_analyze(int argc, char **argv)
    133      1.1      maxv {
    134      1.1      maxv 	struct addr *a;
    135      1.1      maxv 	struct addr **l;
    136      1.1      maxv 	struct addr **p;
    137      1.3      maxv 	size_t naddrs, nsamples, i;
    138      1.3      maxv 	float perc;
    139      1.1      maxv 	int ch;
    140      1.6       ryo 	u_int c, maxevent = 0;
    141      1.1      maxv 	bool distinguish_processes = true;
    142      1.1      maxv 	bool distinguish_cpus = true;
    143      1.1      maxv 	bool distinguish_lwps = true;
    144      1.1      maxv 	bool kernel_only = false;
    145      1.2      maxv 	FILE *f;
    146      1.1      maxv 
    147      1.1      maxv 	while ((ch = getopt(argc, argv, "CkLPp:s")) != -1) {
    148      1.1      maxv 		uintmax_t val;
    149      1.1      maxv 		char *ep;
    150      1.1      maxv 
    151      1.1      maxv 		switch (ch) {
    152      1.1      maxv 		case 'C':	/* don't distinguish cpus */
    153      1.1      maxv 			distinguish_cpus = false;
    154      1.1      maxv 			break;
    155      1.1      maxv 		case 'k':	/* kernel only */
    156      1.1      maxv 			kernel_only = true;
    157      1.1      maxv 			break;
    158      1.1      maxv 		case 'L':	/* don't distinguish lwps */
    159      1.1      maxv 			distinguish_lwps = false;
    160      1.1      maxv 			break;
    161      1.1      maxv 		case 'p':	/* only for the process for the given pid */
    162      1.1      maxv 			errno = 0;
    163      1.1      maxv 			val = strtoumax(optarg, &ep, 10);
    164      1.1      maxv 			if (optarg[0] == 0 || *ep != 0 ||
    165      1.1      maxv 			    val > INT32_MAX) {
    166      1.1      maxv 				errx(EXIT_FAILURE, "invalid p option");
    167      1.1      maxv 			}
    168      1.1      maxv 			target_pid = val;
    169      1.1      maxv 			filter_by_pid = true;
    170      1.1      maxv 			break;
    171      1.1      maxv 		case 'P':	/* don't distinguish processes */
    172      1.1      maxv 			distinguish_processes = false;
    173      1.1      maxv 			break;
    174      1.1      maxv 		case 's':	/* per symbol */
    175      1.1      maxv 			per_symbol = true;
    176      1.1      maxv 			break;
    177      1.1      maxv 		default:
    178      1.1      maxv 			exit(EXIT_FAILURE);
    179      1.1      maxv 		}
    180      1.1      maxv 	}
    181      1.1      maxv 	argc -= optind;
    182      1.1      maxv 	argv += optind;
    183      1.1      maxv 
    184      1.2      maxv 	if (argc == 0) {
    185      1.2      maxv 		errx(EXIT_FAILURE, "missing file name");
    186      1.2      maxv 	}
    187      1.2      maxv 
    188      1.2      maxv 	f = fopen(argv[0], "rb");
    189      1.2      maxv 	if (f == NULL) {
    190      1.2      maxv 		errx(EXIT_FAILURE, "fopen");
    191      1.2      maxv 	}
    192      1.2      maxv 
    193      1.8       ryo 	ksymload(NULL);
    194      1.1      maxv 	rb_tree_init(&addrtree, &addrtree_ops);
    195      1.1      maxv 
    196      1.1      maxv 	/*
    197      1.1      maxv 	 * read and count samples.
    198      1.1      maxv 	 */
    199      1.1      maxv 
    200      1.1      maxv 	naddrs = 0;
    201      1.3      maxv 	nsamples = 0;
    202      1.1      maxv 	while (/*CONSTCOND*/true) {
    203      1.1      maxv 		struct addr *o;
    204      1.1      maxv 		tprof_sample_t sample;
    205      1.2      maxv 		size_t n = fread(&sample, sizeof(sample), 1, f);
    206      1.1      maxv 		bool in_kernel;
    207      1.1      maxv 
    208      1.1      maxv 		if (n == 0) {
    209      1.2      maxv 			if (feof(f)) {
    210      1.1      maxv 				break;
    211      1.1      maxv 			}
    212      1.2      maxv 			if (ferror(f)) {
    213      1.1      maxv 				err(EXIT_FAILURE, "fread");
    214      1.1      maxv 			}
    215      1.1      maxv 		}
    216      1.1      maxv 		if (filter_by_pid && (pid_t)sample.s_pid != target_pid) {
    217      1.1      maxv 			continue;
    218      1.1      maxv 		}
    219      1.1      maxv 		in_kernel = (sample.s_flags & TPROF_SAMPLE_INKERNEL) != 0;
    220      1.1      maxv 		if (kernel_only && !in_kernel) {
    221      1.1      maxv 			continue;
    222      1.1      maxv 		}
    223      1.1      maxv 		a = emalloc(sizeof(*a));
    224      1.6       ryo 		memset(a, 0, sizeof(*a));
    225      1.1      maxv 		a->addr = (uint64_t)sample.s_pc;
    226      1.1      maxv 		if (distinguish_processes) {
    227      1.1      maxv 			a->pid = sample.s_pid;
    228      1.1      maxv 		} else {
    229      1.1      maxv 			a->pid = 0;
    230      1.1      maxv 		}
    231      1.1      maxv 		if (distinguish_lwps) {
    232      1.1      maxv 			a->lwpid = sample.s_lwpid;
    233      1.1      maxv 		} else {
    234      1.1      maxv 			a->lwpid = 0;
    235      1.1      maxv 		}
    236      1.1      maxv 		if (distinguish_cpus) {
    237      1.1      maxv 			a->cpuid = sample.s_cpuid;
    238      1.1      maxv 		} else {
    239      1.1      maxv 			a->cpuid = 0;
    240      1.1      maxv 		}
    241      1.1      maxv 		a->in_kernel = in_kernel;
    242      1.1      maxv 		if (per_symbol) {
    243      1.1      maxv 			const char *name;
    244      1.1      maxv 			uint64_t offset;
    245      1.1      maxv 
    246      1.8       ryo 			name = ksymlookup(a->addr, &offset, NULL);
    247      1.1      maxv 			if (name != NULL) {
    248      1.1      maxv 				a->addr -= offset;
    249      1.1      maxv 			}
    250      1.1      maxv 		}
    251      1.6       ryo 		c = __SHIFTOUT(sample.s_flags, TPROF_SAMPLE_COUNTER_MASK);
    252      1.6       ryo 		assert(c < TPROF_MAXCOUNTERS);
    253      1.6       ryo 		if (maxevent < c)
    254      1.6       ryo 			maxevent = c;
    255      1.6       ryo 
    256      1.1      maxv 		a->nsamples = 1;
    257      1.6       ryo 		a->ncount[c] = 1;
    258      1.1      maxv 		o = rb_tree_insert_node(&addrtree, a);
    259      1.1      maxv 		if (o != a) {
    260      1.1      maxv 			assert(a->addr == o->addr);
    261      1.1      maxv 			assert(a->pid == o->pid);
    262      1.1      maxv 			assert(a->lwpid == o->lwpid);
    263      1.1      maxv 			assert(a->cpuid == o->cpuid);
    264      1.1      maxv 			assert(a->in_kernel == o->in_kernel);
    265      1.1      maxv 			free(a);
    266      1.6       ryo 
    267      1.1      maxv 			o->nsamples++;
    268      1.6       ryo 			o->ncount[c]++;
    269      1.1      maxv 		} else {
    270      1.1      maxv 			naddrs++;
    271      1.1      maxv 		}
    272      1.3      maxv 		nsamples++;
    273      1.1      maxv 	}
    274      1.1      maxv 
    275      1.1      maxv 	/*
    276      1.1      maxv 	 * sort samples by addresses.
    277      1.1      maxv 	 */
    278      1.1      maxv 
    279      1.1      maxv 	l = emalloc(naddrs * sizeof(*l));
    280      1.1      maxv 	p = l;
    281      1.1      maxv 	RB_TREE_FOREACH(a, &addrtree) {
    282      1.1      maxv 		*p++ = a;
    283      1.1      maxv 	}
    284      1.1      maxv 	assert(l + naddrs == p);
    285      1.1      maxv 	qsort(l, naddrs, sizeof(*l), compare_nsamples);
    286      1.1      maxv 
    287      1.1      maxv 	/*
    288      1.1      maxv 	 * print addresses and number of samples, preferably with
    289      1.1      maxv 	 * resolved symbol names.
    290      1.1      maxv 	 */
    291      1.3      maxv 	printf("File: %s\n", argv[0]);
    292      1.3      maxv 	printf("Number of samples: %zu\n\n", nsamples);
    293      1.6       ryo 
    294      1.6       ryo 	printf("percentage   nsamples ");
    295      1.6       ryo 	for (c = 0; c <= maxevent; c++)
    296      1.6       ryo 		printf("event#%02u ", c);
    297      1.6       ryo 	printf("pid    lwp    cpu  k address          symbol\n");
    298      1.6       ryo 
    299      1.6       ryo 	printf("------------ -------- ");
    300      1.6       ryo 	for (c = 0; c <= maxevent; c++)
    301      1.6       ryo 		printf("-------- ");
    302      1.6       ryo 
    303      1.6       ryo 	printf("------ ------ ---- - ---------------- ------\n");
    304      1.1      maxv 	for (i = 0; i < naddrs; i++) {
    305      1.1      maxv 		const char *name;
    306      1.1      maxv 		char buf[100];
    307      1.1      maxv 		uint64_t offset;
    308      1.1      maxv 
    309      1.1      maxv 		a = l[i];
    310      1.1      maxv 		if (a->in_kernel) {
    311      1.8       ryo 			name = ksymlookup(a->addr, &offset, NULL);
    312      1.1      maxv 		} else {
    313      1.1      maxv 			name = NULL;
    314      1.1      maxv 		}
    315      1.1      maxv 		if (name == NULL) {
    316      1.1      maxv 			(void)snprintf(buf, sizeof(buf), "<%016" PRIx64 ">",
    317      1.1      maxv 			    a->addr);
    318      1.1      maxv 			name = buf;
    319      1.1      maxv 		} else if (offset != 0) {
    320      1.1      maxv 			(void)snprintf(buf, sizeof(buf), "%s+0x%" PRIx64, name,
    321      1.1      maxv 			    offset);
    322      1.1      maxv 			name = buf;
    323      1.1      maxv 		}
    324      1.3      maxv 
    325      1.3      maxv 		perc = ((float)a->nsamples / (float)nsamples) * 100.0;
    326      1.3      maxv 
    327      1.6       ryo 		printf("%11f%% %8u", perc, a->nsamples);
    328      1.6       ryo 
    329      1.6       ryo 		for (c = 0; c <= maxevent; c++)
    330      1.6       ryo 			printf(" %8u", a->ncount[c]);
    331      1.6       ryo 
    332      1.6       ryo 		printf(" %6" PRIu32 " %6" PRIu32 " %4" PRIu32 " %u %016"
    333      1.6       ryo 		    PRIx64" %s",
    334      1.6       ryo 		    a->pid, a->lwpid, a->cpuid, a->in_kernel, a->addr, name);
    335      1.6       ryo 
    336      1.6       ryo 
    337      1.6       ryo 		printf("\n");
    338      1.1      maxv 	}
    339      1.2      maxv 
    340      1.2      maxv 	fclose(f);
    341      1.1      maxv }
    342