builtin-annotate.c 17.3 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12
/*
 * builtin-annotate.c
 *
 * Builtin annotate command: Analyze the perf.data input file,
 * look up and read DSOs and symbol information and display
 * a histogram of results, along various sorting keys.
 */
#include "builtin.h"

#include "util/util.h"

#include "util/color.h"
13
#include <linux/list.h>
14
#include "util/cache.h"
15
#include <linux/rbtree.h>
16 17 18 19
#include "util/symbol.h"
#include "util/string.h"

#include "perf.h"
20
#include "util/debug.h"
21 22 23

#include "util/parse-options.h"
#include "util/parse-events.h"
24
#include "util/thread.h"
25
#include "util/sort.h"
26
#include "util/hist.h"
27 28 29

static char		const *input_name = "perf.data";

30
static int		force;
31 32
static int		input;

33 34
static int		full_paths;

35 36
static int		print_line;

37 38 39
static unsigned long	page_size;
static unsigned long	mmap_window = 32;

40 41 42 43 44
struct sym_hist {
	u64		sum;
	u64		ip[0];
};

45
struct sym_ext {
46
	struct rb_node	node;
47 48 49 50
	double		percent;
	char		*path;
};

51 52 53 54 55 56 57
struct sym_priv {
	struct sym_hist	*hist;
	struct sym_ext	*ext;
};

static const char *sym_hist_filter;

58
static int symbol_filter(struct map *map __used, struct symbol *sym)
59
{
60 61
	if (sym_hist_filter == NULL ||
	    strcmp(sym->name, sym_hist_filter) == 0) {
62
		struct sym_priv *priv = symbol__priv(sym);
63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78
		const int size = (sizeof(*priv->hist) +
				  (sym->end - sym->start) * sizeof(u64));

		priv->hist = malloc(size);
		if (priv->hist)
			memset(priv->hist, 0, size);
		return 0;
	}
	/*
	 * FIXME: We should really filter it out, as we don't want to go thru symbols
	 * we're not interested, and if a DSO ends up with no symbols, delete it too,
	 * but right now the kernel loading routines in symbol.c bail out if no symbols
	 * are found, fix it later.
	 */
	return 0;
}
79

80 81 82
/*
 * collect histogram counts
 */
83
static void hist_hit(struct hist_entry *he, u64 ip)
84
{
85 86
	unsigned int sym_size, offset;
	struct symbol *sym = he->sym;
87 88
	struct sym_priv *priv;
	struct sym_hist *h;
89

90
	he->count++;
91

92 93 94
	if (!sym || !he->map)
		return;

95
	priv = symbol__priv(sym);
96
	if (!priv->hist)
97
		return;
98

99 100
	sym_size = sym->end - sym->start;
	offset = ip - sym->start;
101

102 103 104 105
	if (verbose)
		fprintf(stderr, "%s: ip=%Lx\n", __func__,
			he->map->unmap_ip(he->map, ip));

106 107
	if (offset >= sym_size)
		return;
108

109 110 111
	h = priv->hist;
	h->sum++;
	h->ip[offset]++;
112

113 114
	if (verbose >= 3)
		printf("%p %s: count++ [ip: %p, %08Lx] => %Ld\n",
115
			(void *)(unsigned long)he->sym->start,
116
			he->sym->name,
117
			(void *)(unsigned long)ip, ip - he->sym->start,
118
			h->ip[offset]);
119 120
}

121 122
static int hist_entry__add(struct thread *thread, struct map *map,
			   struct symbol *sym, u64 ip, u64 count, char level)
123
{
124 125 126 127
	bool hit;
	struct hist_entry *he = __hist_entry__add(thread, map, sym, NULL, ip,
						  count, level, &hit);
	if (he == NULL)
128
		return -ENOMEM;
129
	hist_hit(he, ip);
130 131 132 133
	return 0;
}

static int
134
process_sample_event(event_t *event, unsigned long offset, unsigned long head)
135 136
{
	char level;
137
	u64 ip = event->ip.ip;
138
	struct map *map = NULL;
139
	struct symbol *sym = NULL;
140
	struct thread *thread = threads__findnew(event->ip.pid);
141

142
	dump_printf("%p [%p]: PERF_EVENT (IP, %d): %d: %p\n",
143 144 145 146 147 148 149 150 151 152 153 154
		(void *)(offset + head),
		(void *)(long)(event->header.size),
		event->header.misc,
		event->ip.pid,
		(void *)(long)ip);

	if (thread == NULL) {
		fprintf(stderr, "problem processing %d event, skipping it.\n",
			event->header.type);
		return -1;
	}

155 156
	dump_printf(" ... thread: %s:%d\n", thread->comm, thread->pid);

157
	if (event->header.misc & PERF_RECORD_MISC_KERNEL) {
158
		level = 'k';
159 160 161
		sym = kernel_maps__find_symbol(ip, &map);
		dump_printf(" ...... dso: %s\n",
			    map ? map->dso->long_name : "<not found>");
162
	} else if (event->header.misc & PERF_RECORD_MISC_USER) {
163 164 165
		level = '.';
		map = thread__find_map(thread, ip);
		if (map != NULL) {
166
got_map:
167
			ip = map->map_ip(map, ip);
168
			sym = map__find_symbol(map, ip, symbol_filter);
169 170 171 172 173
		} else {
			/*
			 * If this is outside of all known maps,
			 * and is a negative address, try to look it
			 * up in the kernel dso, as it might be a
174 175 176 177 178
			 * vsyscall or vdso (which executes in user-mode).
			 *
			 * XXX This is nasty, we should have a symbol list in
			 * the "[vdso]" dso, but for now lets use the old
			 * trick of looking in the whole kernel symbol list.
179
			 */
180 181 182 183
			if ((long long)ip < 0) {
				map = kernel_map;
				goto got_map;
			}
184
		}
185 186
		dump_printf(" ...... dso: %s\n",
			    map ? map->dso->long_name : "<not found>");
187 188
	} else {
		level = 'H';
189
		dump_printf(" ...... dso: [hypervisor]\n");
190 191
	}

192 193 194 195
	if (hist_entry__add(thread, map, sym, ip, 1, level)) {
		fprintf(stderr, "problem incrementing symbol count, "
				"skipping event\n");
		return -1;
196 197 198 199 200 201 202 203 204
	}
	total++;

	return 0;
}

static int
process_mmap_event(event_t *event, unsigned long offset, unsigned long head)
{
205
	struct map *map = map__new(&event->mmap, NULL, 0);
206
	struct thread *thread = threads__findnew(event->mmap.pid);
207

208
	dump_printf("%p [%p]: PERF_RECORD_MMAP %d: [%p(%p) @ %p]: %s\n",
209 210 211 212 213 214 215 216 217
		(void *)(offset + head),
		(void *)(long)(event->header.size),
		event->mmap.pid,
		(void *)(long)event->mmap.start,
		(void *)(long)event->mmap.len,
		(void *)(long)event->mmap.pgoff,
		event->mmap.filename);

	if (thread == NULL || map == NULL) {
218
		dump_printf("problem processing PERF_RECORD_MMAP, skipping event.\n");
219 220 221 222 223 224 225 226 227 228 229 230
		return 0;
	}

	thread__insert_map(thread, map);
	total_mmap++;

	return 0;
}

static int
process_comm_event(event_t *event, unsigned long offset, unsigned long head)
{
231
	struct thread *thread = threads__findnew(event->comm.pid);
232

233
	dump_printf("%p [%p]: PERF_RECORD_COMM: %s:%d\n",
234 235 236 237 238 239
		(void *)(offset + head),
		(void *)(long)(event->header.size),
		event->comm.comm, event->comm.pid);

	if (thread == NULL ||
	    thread__set_comm(thread, event->comm.comm)) {
240
		dump_printf("problem processing PERF_RECORD_COMM, skipping event.\n");
241 242 243 244 245 246 247 248 249 250
		return -1;
	}
	total_comm++;

	return 0;
}

static int
process_fork_event(event_t *event, unsigned long offset, unsigned long head)
{
251 252
	struct thread *thread = threads__findnew(event->fork.pid);
	struct thread *parent = threads__findnew(event->fork.ppid);
253

254
	dump_printf("%p [%p]: PERF_RECORD_FORK: %d:%d\n",
255 256 257 258
		(void *)(offset + head),
		(void *)(long)(event->header.size),
		event->fork.pid, event->fork.ppid);

259 260 261 262 263 264 265
	/*
	 * A thread clone will have the same PID for both
	 * parent and child.
	 */
	if (thread == parent)
		return 0;

266
	if (!thread || !parent || thread__fork(thread, parent)) {
267
		dump_printf("problem processing PERF_RECORD_FORK, skipping event.\n");
268 269 270 271 272 273 274 275 276 277 278
		return -1;
	}
	total_fork++;

	return 0;
}

static int
process_event(event_t *event, unsigned long offset, unsigned long head)
{
	switch (event->header.type) {
279
	case PERF_RECORD_SAMPLE:
280 281
		return process_sample_event(event, offset, head);

282
	case PERF_RECORD_MMAP:
283 284
		return process_mmap_event(event, offset, head);

285
	case PERF_RECORD_COMM:
286 287
		return process_comm_event(event, offset, head);

288
	case PERF_RECORD_FORK:
289 290 291 292 293
		return process_fork_event(event, offset, head);
	/*
	 * We dont process them right now but they are fine:
	 */

294 295
	case PERF_RECORD_THROTTLE:
	case PERF_RECORD_UNTHROTTLE:
296 297 298 299 300 301 302 303 304
		return 0;

	default:
		return -1;
	}

	return 0;
}

305
static int parse_line(FILE *file, struct hist_entry *he, u64 len)
306
{
307
	struct symbol *sym = he->sym;
308
	char *line = NULL, *tmp, *tmp2;
309 310
	static const char *prev_line;
	static const char *prev_color;
311 312
	unsigned int offset;
	size_t line_len;
313
	u64 start;
314
	s64 line_ip;
315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349
	int ret;
	char *c;

	if (getline(&line, &line_len, file) < 0)
		return -1;
	if (!line)
		return -1;

	c = strchr(line, '\n');
	if (c)
		*c = 0;

	line_ip = -1;
	offset = 0;
	ret = -2;

	/*
	 * Strip leading spaces:
	 */
	tmp = line;
	while (*tmp) {
		if (*tmp != ' ')
			break;
		tmp++;
	}

	if (*tmp) {
		/*
		 * Parse hexa addresses followed by ':'
		 */
		line_ip = strtoull(tmp, &tmp2, 16);
		if (*tmp2 != ':')
			line_ip = -1;
	}

350 351
	start = he->map->unmap_ip(he->map, sym->start);

352
	if (line_ip != -1) {
353
		const char *path = NULL;
354 355
		unsigned int hits = 0;
		double percent = 0.0;
356
		const char *color;
357
		struct sym_priv *priv = symbol__priv(sym);
358 359
		struct sym_ext *sym_ext = priv->ext;
		struct sym_hist *h = priv->hist;
360

361
		offset = line_ip - start;
362
		if (offset < len)
363
			hits = h->ip[offset];
364

365
		if (offset < len && sym_ext) {
366 367
			path = sym_ext[offset].path;
			percent = sym_ext[offset].percent;
368 369
		} else if (h->sum)
			percent = 100.0 * hits / h->sum;
370

371
		color = get_percent_color(percent);
372

373 374 375 376 377 378 379 380 381 382 383 384 385 386
		/*
		 * Also color the filename and line if needed, with
		 * the same color than the percentage. Don't print it
		 * twice for close colored ip with the same filename:line
		 */
		if (path) {
			if (!prev_line || strcmp(prev_line, path)
				       || color != prev_color) {
				color_fprintf(stdout, color, " %s", path);
				prev_line = path;
				prev_color = color;
			}
		}

387 388 389 390 391 392 393 394 395 396 397 398 399
		color_fprintf(stdout, color, " %7.2f", percent);
		printf(" :	");
		color_fprintf(stdout, PERF_COLOR_BLUE, "%s\n", line);
	} else {
		if (!*line)
			printf("         :\n");
		else
			printf("         :	%s\n", line);
	}

	return 0;
}

400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421
static struct rb_root root_sym_ext;

static void insert_source_line(struct sym_ext *sym_ext)
{
	struct sym_ext *iter;
	struct rb_node **p = &root_sym_ext.rb_node;
	struct rb_node *parent = NULL;

	while (*p != NULL) {
		parent = *p;
		iter = rb_entry(parent, struct sym_ext, node);

		if (sym_ext->percent > iter->percent)
			p = &(*p)->rb_left;
		else
			p = &(*p)->rb_right;
	}

	rb_link_node(&sym_ext->node, parent, p);
	rb_insert_color(&sym_ext->node, &root_sym_ext);
}

422
static void free_source_line(struct hist_entry *he, int len)
423
{
424
	struct sym_priv *priv = symbol__priv(he->sym);
425
	struct sym_ext *sym_ext = priv->ext;
426 427 428 429 430 431 432 433 434
	int i;

	if (!sym_ext)
		return;

	for (i = 0; i < len; i++)
		free(sym_ext[i].path);
	free(sym_ext);

435
	priv->ext = NULL;
436
	root_sym_ext = RB_ROOT;
437 438 439
}

/* Get the filename:line for the colored entries */
440
static void
441
get_source_line(struct hist_entry *he, int len, const char *filename)
442
{
443 444
	struct symbol *sym = he->sym;
	u64 start;
445 446 447
	int i;
	char cmd[PATH_MAX * 2];
	struct sym_ext *sym_ext;
448
	struct sym_priv *priv = symbol__priv(sym);
449
	struct sym_hist *h = priv->hist;
450

451
	if (!h->sum)
452 453
		return;

454 455
	sym_ext = priv->ext = calloc(len, sizeof(struct sym_ext));
	if (!priv->ext)
456 457
		return;

458
	start = he->map->unmap_ip(he->map, sym->start);
459 460 461 462

	for (i = 0; i < len; i++) {
		char *path = NULL;
		size_t line_len;
463
		u64 offset;
464 465
		FILE *fp;

466
		sym_ext[i].percent = 100.0 * h->ip[i] / h->sum;
467 468 469
		if (sym_ext[i].percent <= 0.5)
			continue;

470
		offset = start + i;
471
		sprintf(cmd, "addr2line -e %s %016llx", filename, offset);
472 473 474 475 476 477 478
		fp = popen(cmd, "r");
		if (!fp)
			continue;

		if (getline(&path, &line_len, fp) < 0 || !line_len)
			goto next;

479
		sym_ext[i].path = malloc(sizeof(char) * line_len + 1);
480 481 482 483
		if (!sym_ext[i].path)
			goto next;

		strcpy(sym_ext[i].path, path);
484
		insert_source_line(&sym_ext[i]);
485 486 487 488 489 490

	next:
		pclose(fp);
	}
}

491
static void print_summary(const char *filename)
492 493 494 495 496 497 498 499 500 501 502 503 504 505 506
{
	struct sym_ext *sym_ext;
	struct rb_node *node;

	printf("\nSorted summary for file %s\n", filename);
	printf("----------------------------------------------\n\n");

	if (RB_EMPTY_ROOT(&root_sym_ext)) {
		printf(" Nothing higher than %1.1f%%\n", MIN_GREEN);
		return;
	}

	node = rb_first(&root_sym_ext);
	while (node) {
		double percent;
507
		const char *color;
508 509 510 511
		char *path;

		sym_ext = rb_entry(node, struct sym_ext, node);
		percent = sym_ext->percent;
512
		color = get_percent_color(percent);
513 514 515 516 517 518 519
		path = sym_ext->path;

		color_fprintf(stdout, color, " %7.2f %s", percent, path);
		node = rb_next(node);
	}
}

520
static void annotate_sym(struct hist_entry *he)
521
{
522 523 524
	struct map *map = he->map;
	struct dso *dso = map->dso;
	struct symbol *sym = he->sym;
525 526
	const char *filename = dso->long_name, *d_filename;
	u64 len;
527 528 529 530 531
	char command[PATH_MAX*2];
	FILE *file;

	if (!filename)
		return;
532

533 534 535 536 537 538
	if (verbose)
		fprintf(stderr, "%s: filename=%s, sym=%s, start=%Lx, end=%Lx\n",
			__func__, filename, sym->name,
			map->unmap_ip(map, sym->start),
			map->unmap_ip(map, sym->end));

539 540 541 542
	if (full_paths)
		d_filename = filename;
	else
		d_filename = basename(filename);
543 544 545

	len = sym->end - sym->start;

546
	if (print_line) {
547
		get_source_line(he, len, filename);
548 549 550 551
		print_summary(filename);
	}

	printf("\n\n------------------------------------------------\n");
552
	printf(" Percent |	Source code & Disassembly of %s\n", d_filename);
553 554 555
	printf("------------------------------------------------\n");

	if (verbose >= 2)
556 557
		printf("annotating [%p] %30s : [%p] %30s\n",
		       dso, dso->long_name, sym, sym->name);
558

559
	sprintf(command, "objdump --start-address=0x%016Lx --stop-address=0x%016Lx -dS %s|grep -v %s",
560 561
		map->unmap_ip(map, sym->start), map->unmap_ip(map, sym->end),
		filename, filename);
562 563 564 565 566 567 568 569 570

	if (verbose >= 3)
		printf("doing: %s\n", command);

	file = popen(command, "r");
	if (!file)
		return;

	while (!feof(file)) {
571
		if (parse_line(file, he, len) < 0)
572 573 574 575
			break;
	}

	pclose(file);
576
	if (print_line)
577
		free_source_line(he, len);
578 579 580 581 582 583
}

static void find_annotations(void)
{
	struct rb_node *nd;

584 585
	for (nd = rb_first(&output_hists); nd; nd = rb_next(nd)) {
		struct hist_entry *he = rb_entry(nd, struct hist_entry, rb_node);
586
		struct sym_priv *priv;
587

588 589
		if (he->sym == NULL)
			continue;
590

591
		priv = symbol__priv(he->sym);
592 593 594 595 596 597 598 599 600 601
		if (priv->hist == NULL)
			continue;

		annotate_sym(he);
		/*
		 * Since we have a hist_entry per IP for the same symbol, free
		 * he->sym->hist to signal we already processed this symbol.
		 */
		free(priv->hist);
		priv->hist = NULL;
602 603 604
	}
}

605 606 607 608 609
static int __cmd_annotate(void)
{
	int ret, rc = EXIT_FAILURE;
	unsigned long offset = 0;
	unsigned long head = 0;
610
	struct stat input_stat;
611 612 613 614
	event_t *event;
	uint32_t size;
	char *buf;

615
	register_idle_thread();
616 617 618 619 620 621 622

	input = open(input_name, O_RDONLY);
	if (input < 0) {
		perror("failed to open file");
		exit(-1);
	}

623
	ret = fstat(input, &input_stat);
624 625 626 627 628
	if (ret < 0) {
		perror("failed to stat file");
		exit(-1);
	}

629 630
	if (!force && input_stat.st_uid && (input_stat.st_uid != geteuid())) {
		fprintf(stderr, "file: %s not owned by current user or root\n", input_name);
631 632 633
		exit(-1);
	}

634
	if (!input_stat.st_size) {
635 636 637 638
		fprintf(stderr, "zero-sized file, nothing to do!\n");
		exit(0);
	}

639
	if (load_kernel(symbol_filter) < 0) {
640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660
		perror("failed to load kernel symbols");
		return EXIT_FAILURE;
	}

remap:
	buf = (char *)mmap(NULL, page_size * mmap_window, PROT_READ,
			   MAP_SHARED, input, offset);
	if (buf == MAP_FAILED) {
		perror("failed to mmap file");
		exit(-1);
	}

more:
	event = (event_t *)(buf + head);

	size = event->header.size;
	if (!size)
		size = 8;

	if (head + event->header.size >= page_size * mmap_window) {
		unsigned long shift = page_size * (head / page_size);
661
		int munmap_ret;
662

663 664
		munmap_ret = munmap(buf, page_size * mmap_window);
		assert(munmap_ret == 0);
665 666 667 668 669 670 671 672

		offset += shift;
		head -= shift;
		goto remap;
	}

	size = event->header.size;

673
	dump_printf("%p [%p]: event: %d\n",
674 675 676 677 678 679
			(void *)(offset + head),
			(void *)(long)event->header.size,
			event->header.type);

	if (!size || process_event(event, offset, head) < 0) {

680
		dump_printf("%p [%p]: skipping unknown header type: %d\n",
681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699
			(void *)(offset + head),
			(void *)(long)(event->header.size),
			event->header.type);

		total_unknown++;

		/*
		 * assume we lost track of the stream, check alignment, and
		 * increment a single u64 in the hope to catch on again 'soon'.
		 */

		if (unlikely(head & 7))
			head &= ~7ULL;

		size = 8;
	}

	head += size;

700
	if (offset + head < (unsigned long)input_stat.st_size)
701 702 703 704 705
		goto more;

	rc = EXIT_SUCCESS;
	close(input);

706 707 708 709 710
	dump_printf("      IP events: %10ld\n", total);
	dump_printf("    mmap events: %10ld\n", total_mmap);
	dump_printf("    comm events: %10ld\n", total_comm);
	dump_printf("    fork events: %10ld\n", total_fork);
	dump_printf(" unknown events: %10ld\n", total_unknown);
711 712 713 714

	if (dump_trace)
		return 0;

715
	if (verbose > 3)
716
		threads__fprintf(stdout);
717

718
	if (verbose > 2)
719 720 721
		dsos__fprintf(stdout);

	collapse__resort();
722
	output__resort(total);
723 724

	find_annotations();
725 726 727 728 729 730 731 732 733 734 735 736

	return rc;
}

static const char * const annotate_usage[] = {
	"perf annotate [<options>] <command>",
	NULL
};

static const struct option options[] = {
	OPT_STRING('i', "input", &input_name, "file",
		    "input file name"),
737
	OPT_STRING('s', "symbol", &sym_hist_filter, "symbol",
738
		    "symbol to annotate"),
739
	OPT_BOOLEAN('f', "force", &force, "don't complain, do it"),
740 741 742 743
	OPT_BOOLEAN('v', "verbose", &verbose,
		    "be more verbose (show symbol address, etc)"),
	OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
		    "dump raw trace in ASCII"),
744
	OPT_STRING('k', "vmlinux", &vmlinux_name, "file", "vmlinux pathname"),
745 746
	OPT_BOOLEAN('m', "modules", &modules,
		    "load module symbols - WARNING: use only with -k and LIVE kernel"),
747 748
	OPT_BOOLEAN('l', "print-line", &print_line,
		    "print matching source lines (may be slow)"),
749 750
	OPT_BOOLEAN('P', "full-paths", &full_paths,
		    "Don't shorten the displayed pathnames"),
751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768
	OPT_END()
};

static void setup_sorting(void)
{
	char *tmp, *tok, *str = strdup(sort_order);

	for (tok = strtok_r(str, ", ", &tmp);
			tok; tok = strtok_r(NULL, ", ", &tmp)) {
		if (sort_dimension__add(tok) < 0) {
			error("Unknown --sort key: `%s'", tok);
			usage_with_options(annotate_usage, options);
		}
	}

	free(str);
}

769
int cmd_annotate(int argc, const char **argv, const char *prefix __used)
770
{
771
	symbol__init(sizeof(struct sym_priv));
772 773 774 775 776 777 778

	page_size = getpagesize();

	argc = parse_options(argc, argv, options, annotate_usage, 0);

	setup_sorting();

779 780 781 782 783 784 785 786 787 788 789
	if (argc) {
		/*
		 * Special case: if there's an argument left then assume tha
		 * it's a symbol filter:
		 */
		if (argc > 1)
			usage_with_options(annotate_usage, options);

		sym_hist_filter = argv[0];
	}

790 791
	setup_pager();

792 793 794 795 796 797
	if (field_sep && *field_sep == '.') {
		fputs("'.' is the only non valid --field-separator argument\n",
				stderr);
		exit(129);
	}

798 799
	return __cmd_annotate();
}