builtin-annotate.c 13.9 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12
/*
 * builtin-annotate.c
 *
 * Builtin annotate command: Analyze the perf.data input file,
 * look up and read DSOs and symbol information and display
 * a histogram of results, along various sorting keys.
 */
#include "builtin.h"

#include "util/util.h"

#include "util/color.h"
13
#include <linux/list.h>
14
#include "util/cache.h"
15
#include <linux/rbtree.h>
16 17 18
#include "util/symbol.h"

#include "perf.h"
19
#include "util/debug.h"
20

21
#include "util/event.h"
22 23
#include "util/parse-options.h"
#include "util/parse-events.h"
24
#include "util/thread.h"
25
#include "util/sort.h"
26
#include "util/hist.h"
27
#include "util/session.h"
28 29 30

/* Path of the perf data file to read; set through the -i/--input option. */
static char		const *input_name = "perf.data";

31
/* Set by -f/--force and handed to perf_session__new(). */
static bool		force;
32

33
/* Set by -P/--full-paths: show the DSO's long name instead of its basename. */
static bool		full_paths;
34

35
/* Set by -l/--print-line: resolve and print matching source lines. */
static bool		print_line;
36

37 38 39 40 41
/*
 * Per-symbol sample histogram: a running total followed by one counter
 * per byte offset inside the symbol (see sym__alloc_hist() for sizing).
 */
struct sym_hist {
	u64		sum;	/* total number of hits accounted to the symbol */
	u64		ip[0];	/* trailing per-offset hit counters */
};

42
struct sym_ext {
43
	struct rb_node	node;
44 45 46 47
	double		percent;
	char		*path;
};

48 49 50 51 52 53 54
/*
 * Private area attached to every symbol (its size is registered through
 * symbol_conf.priv_size in cmd_annotate() and it is reached with
 * symbol__priv()).
 */
struct sym_priv {
	struct sym_hist	*hist;	/* hit histogram, allocated on the first hit */
	struct sym_ext	*ext;	/* per-offset source-line array, only with --print-line */
};

/* When non-NULL, only the symbol with exactly this name is accounted. */
static const char *sym_hist_filter;

55
static int sym__alloc_hist(struct symbol *self)
56
{
57 58 59 60 61 62
	struct sym_priv *priv = symbol__priv(self);
	const int size = (sizeof(*priv->hist) +
			  (self->end - self->start) * sizeof(u64));

	priv->hist = zalloc(size);
	return priv->hist == NULL ? -1 : 0;
63
}
64

65 66 67
/*
 * collect histogram counts
 */
68
static int annotate__hist_hit(struct hist_entry *he, u64 ip)
69
{
70
	unsigned int sym_size, offset;
71
	struct symbol *sym = he->ms.sym;
72 73
	struct sym_priv *priv;
	struct sym_hist *h;
74

75
	if (!sym || !he->ms.map)
76
		return 0;
77

78
	priv = symbol__priv(sym);
79 80
	if (priv->hist == NULL && sym__alloc_hist(sym) < 0)
		return -ENOMEM;
81

82 83
	sym_size = sym->end - sym->start;
	offset = ip - sym->start;
84

85
	pr_debug3("%s: ip=%#Lx\n", __func__, he->ms.map->unmap_ip(he->ms.map, ip));
86

87
	if (offset >= sym_size)
88
		return 0;
89

90 91 92
	h = priv->hist;
	h->sum++;
	h->ip[offset]++;
93

94 95
	pr_debug3("%#Lx %s: count++ [ip: %#Lx, %#Lx] => %Ld\n", he->ms.sym->start,
		  he->ms.sym->name, ip, ip - he->ms.sym->start, h->ip[offset]);
96
	return 0;
97 98
}

99
static int hists__add_entry(struct hists *self, struct addr_location *al)
100
{
101 102 103 104 105 106 107 108 109 110 111 112 113
	struct hist_entry *he;

	if (sym_hist_filter != NULL &&
	    (al->sym == NULL || strcmp(sym_hist_filter, al->sym->name) != 0)) {
		/* We're only interested in a symbol named sym_hist_filter */
		if (al->sym != NULL) {
			rb_erase(&al->sym->rb_node,
				 &al->map->dso->symbols[al->map->type]);
			symbol__delete(al->sym);
		}
		return 0;
	}

114
	he = __hists__add_entry(self, al, NULL, 1);
115
	if (he == NULL)
116
		return -ENOMEM;
117 118

	return annotate__hist_hit(he, al->addr);
119 120
}

121
/*
 * Sample callback: resolve the event to an address location and, unless
 * the location was filtered out, add it to the session's histograms.
 *
 * Returns 0 on success and -1 when the sample could not be preprocessed
 * or accounted.
 */
static int process_sample_event(event_t *event, struct perf_session *session)
{
	struct addr_location al;

	dump_printf("(IP, %d): %d: %#Lx\n", event->header.misc,
		    event->ip.pid, event->ip.ip);

	if (event__preprocess_sample(event, session, &al, NULL) < 0) {
		pr_warning("problem processing %d event, skipping it.\n",
			   event->header.type);
		return -1;
	}

	/* Filtered samples are not an error, they just aren't counted. */
	if (al.filtered)
		return 0;

	if (hists__add_entry(&session->hists, &al) != 0) {
		pr_warning("problem incrementing symbol count, "
			   "skipping event\n");
		return -1;
	}

	return 0;
}

143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183
/* One line of objdump output, queued for printing. */
struct objdump_line {
	struct list_head node;		/* linkage into the per-symbol line list */
	s64		 offset;	/* offset from the symbol start, or -1 when the line has no address */
	char		 *line;		/* heap-allocated text, released by objdump_line__free() */
};

/*
 * Allocate a list entry for one objdump line.  The entry stores the
 * @line pointer itself (no copy is made); objdump_line__free() releases
 * it.  Returns NULL when the allocation fails, in which case @line is
 * left untouched.
 */
static struct objdump_line *objdump_line__new(s64 offset, char *line)
{
	struct objdump_line *entry = malloc(sizeof(*entry));

	if (entry == NULL)
		return NULL;

	entry->offset = offset;
	entry->line = line;
	return entry;
}

/* Release an entry together with the line text it holds. */
static void objdump_line__free(struct objdump_line *self)
{
	free(self->line);
	free(self);
}

/* Append @line at the tail of the list anchored at @head. */
static void objdump__add_line(struct list_head *head, struct objdump_line *line)
{
	list_add_tail(&line->node, head);
}

static struct objdump_line *objdump__get_next_ip_line(struct list_head *head,
						      struct objdump_line *pos)
{
	list_for_each_entry_continue(pos, head, node)
		if (pos->offset >= 0)
			return pos;

	return NULL;
}

static int parse_line(FILE *file, struct hist_entry *he,
		      struct list_head *head)
184
{
185
	struct symbol *sym = he->ms.sym;
186
	struct objdump_line *objdump_line;
187 188
	char *line = NULL, *tmp, *tmp2;
	size_t line_len;
189
	s64 line_ip, offset = -1;
190 191 192 193
	char *c;

	if (getline(&line, &line_len, file) < 0)
		return -1;
194

195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223
	if (!line)
		return -1;

	c = strchr(line, '\n');
	if (c)
		*c = 0;

	line_ip = -1;

	/*
	 * Strip leading spaces:
	 */
	tmp = line;
	while (*tmp) {
		if (*tmp != ' ')
			break;
		tmp++;
	}

	if (*tmp) {
		/*
		 * Parse hexa addresses followed by ':'
		 */
		line_ip = strtoull(tmp, &tmp2, 16);
		if (*tmp2 != ':')
			line_ip = -1;
	}

	if (line_ip != -1) {
224
		u64 start = map__rip_2objdump(he->ms.map, sym->start);
225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241
		offset = line_ip - start;
	}

	objdump_line = objdump_line__new(offset, line);
	if (objdump_line == NULL) {
		free(line);
		return -1;
	}
	objdump__add_line(head, objdump_line);

	return 0;
}

/*
 * Print one queued objdump line.
 *
 * Lines without an address (offset == -1) are printed with an empty
 * percentage column.  For lines with an address, the hits (or, when
 * source-line data exists, the precomputed percentages) of every offset
 * from this line up to the next addressed line or @len are summed and
 * shown, colored according to get_percent_color().
 *
 * The last printed path and color are remembered across calls so that
 * the same filename:line is not printed twice in a row with one color.
 *
 * Always returns 0.
 */
static int objdump_line__print(struct objdump_line *self,
			       struct list_head *head,
			       struct hist_entry *he, u64 len)
{
	static const char *prev_line;
	static const char *prev_color;
	struct symbol *sym = he->ms.sym;
	struct sym_priv *priv;
	struct sym_ext *sym_ext;
	struct sym_hist *h;
	struct objdump_line *next;
	const char *path = NULL;
	const char *color;
	unsigned int hits = 0;
	double percent = 0.0;
	s64 offset;

	if (self->offset == -1) {
		if (*self->line)
			printf("         :	%s\n", self->line);
		else
			printf("         :\n");
		return 0;
	}

	priv = symbol__priv(sym);
	sym_ext = priv->ext;
	h = priv->hist;
	next = objdump__get_next_ip_line(head, self);

	/* Sum everything that belongs to this line. */
	for (offset = self->offset;
	     offset < (s64)len && (next == NULL || offset < next->offset);
	     offset++) {
		if (sym_ext == NULL) {
			hits += h->ip[offset];
			continue;
		}

		if (path == NULL)
			path = sym_ext[offset].path;
		percent += sym_ext[offset].percent;
	}

	if (sym_ext == NULL && h->sum)
		percent = 100.0 * hits / h->sum;

	color = get_percent_color(percent);

	/*
	 * Also color the filename and line if needed, with the same color
	 * as the percentage.  Don't print it twice for adjacent lines that
	 * share both the filename:line and the color.
	 */
	if (path != NULL &&
	    (prev_line == NULL || strcmp(prev_line, path) != 0 ||
	     color != prev_color)) {
		color_fprintf(stdout, color, " %s", path);
		prev_line = path;
		prev_color = color;
	}

	color_fprintf(stdout, color, " %7.2f", percent);
	printf(" :	");
	color_fprintf(stdout, PERF_COLOR_BLUE, "%s\n", self->line);

	return 0;
}

301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322
/*
 * Tree of the source-line entries of the symbol being annotated, keyed
 * by percentage (insert_source_line() links greater values to the left).
 */
static struct rb_root root_sym_ext;

/*
 * Link @sym_ext into root_sym_ext.  Entries with a strictly greater
 * percentage descend to the left, everything else to the right.
 */
static void insert_source_line(struct sym_ext *sym_ext)
{
	struct rb_node **link = &root_sym_ext.rb_node;
	struct rb_node *parent = NULL;

	while (*link != NULL) {
		struct sym_ext *cur;

		parent = *link;
		cur = rb_entry(parent, struct sym_ext, node);

		link = sym_ext->percent > cur->percent ? &parent->rb_left
						       : &parent->rb_right;
	}

	rb_link_node(&sym_ext->node, parent, link);
	rb_insert_color(&sym_ext->node, &root_sym_ext);
}

323
static void free_source_line(struct hist_entry *he, int len)
324
{
325
	struct sym_priv *priv = symbol__priv(he->ms.sym);
326
	struct sym_ext *sym_ext = priv->ext;
327 328 329 330 331 332 333 334 335
	int i;

	if (!sym_ext)
		return;

	for (i = 0; i < len; i++)
		free(sym_ext[i].path);
	free(sym_ext);

336
	priv->ext = NULL;
337
	root_sym_ext = RB_ROOT;
338 339 340
}

/* Get the filename:line for the colored entries */
341
static void
342
get_source_line(struct hist_entry *he, int len, const char *filename)
343
{
344
	struct symbol *sym = he->ms.sym;
345
	u64 start;
346 347 348
	int i;
	char cmd[PATH_MAX * 2];
	struct sym_ext *sym_ext;
349
	struct sym_priv *priv = symbol__priv(sym);
350
	struct sym_hist *h = priv->hist;
351

352
	if (!h->sum)
353 354
		return;

355 356
	sym_ext = priv->ext = calloc(len, sizeof(struct sym_ext));
	if (!priv->ext)
357 358
		return;

359
	start = he->ms.map->unmap_ip(he->ms.map, sym->start);
360 361 362 363

	for (i = 0; i < len; i++) {
		char *path = NULL;
		size_t line_len;
364
		u64 offset;
365 366
		FILE *fp;

367
		sym_ext[i].percent = 100.0 * h->ip[i] / h->sum;
368 369 370
		if (sym_ext[i].percent <= 0.5)
			continue;

371
		offset = start + i;
372
		sprintf(cmd, "addr2line -e %s %016llx", filename, offset);
373 374 375 376 377 378 379
		fp = popen(cmd, "r");
		if (!fp)
			continue;

		if (getline(&path, &line_len, fp) < 0 || !line_len)
			goto next;

380
		sym_ext[i].path = malloc(sizeof(char) * line_len + 1);
381 382 383 384
		if (!sym_ext[i].path)
			goto next;

		strcpy(sym_ext[i].path, path);
385
		insert_source_line(&sym_ext[i]);
386 387 388 389 390 391

	next:
		pclose(fp);
	}
}

392
static void print_summary(const char *filename)
393 394 395 396 397 398 399 400 401 402 403 404 405 406 407
{
	struct sym_ext *sym_ext;
	struct rb_node *node;

	printf("\nSorted summary for file %s\n", filename);
	printf("----------------------------------------------\n\n");

	if (RB_EMPTY_ROOT(&root_sym_ext)) {
		printf(" Nothing higher than %1.1f%%\n", MIN_GREEN);
		return;
	}

	node = rb_first(&root_sym_ext);
	while (node) {
		double percent;
408
		const char *color;
409 410 411 412
		char *path;

		sym_ext = rb_entry(node, struct sym_ext, node);
		percent = sym_ext->percent;
413
		color = get_percent_color(percent);
414 415 416 417 418 419 420
		path = sym_ext->path;

		color_fprintf(stdout, color, " %7.2f %s", percent, path);
		node = rb_next(node);
	}
}

421 422
static void hist_entry__print_hits(struct hist_entry *self)
{
423
	struct symbol *sym = self->ms.sym;
424 425 426 427 428 429 430 431 432 433 434
	struct sym_priv *priv = symbol__priv(sym);
	struct sym_hist *h = priv->hist;
	u64 len = sym->end - sym->start, offset;

	for (offset = 0; offset < len; ++offset)
		if (h->ip[offset] != 0)
			printf("%*Lx: %Lu\n", BITS_PER_LONG / 2,
			       sym->start + offset, h->ip[offset]);
	printf("%*s: %Lu\n", BITS_PER_LONG / 2, "h->sum", h->sum);
}

435
static void annotate_sym(struct hist_entry *he)
436
{
437
	struct map *map = he->ms.map;
438
	struct dso *dso = map->dso;
439
	struct symbol *sym = he->ms.sym;
440 441
	const char *filename = dso->long_name, *d_filename;
	u64 len;
442 443
	char command[PATH_MAX*2];
	FILE *file;
444 445
	LIST_HEAD(head);
	struct objdump_line *pos, *n;
446 447 448

	if (!filename)
		return;
449

450 451 452 453 454 455 456 457 458 459
	if (dso->origin == DSO__ORIG_KERNEL) {
		if (dso->annotate_warned)
			return;
		dso->annotate_warned = 1;
		pr_err("Can't annotate %s: No vmlinux file was found in the "
		       "path:\n", sym->name);
		vmlinux_path__fprintf(stderr);
		return;
	}

460 461 462
	pr_debug("%s: filename=%s, sym=%s, start=%#Lx, end=%#Lx\n", __func__,
		 filename, sym->name, map->unmap_ip(map, sym->start),
		 map->unmap_ip(map, sym->end));
463

464 465 466 467
	if (full_paths)
		d_filename = filename;
	else
		d_filename = basename(filename);
468 469 470

	len = sym->end - sym->start;

471
	if (print_line) {
472
		get_source_line(he, len, filename);
473 474 475 476
		print_summary(filename);
	}

	printf("\n\n------------------------------------------------\n");
477
	printf(" Percent |	Source code & Disassembly of %s\n", d_filename);
478 479 480
	printf("------------------------------------------------\n");

	if (verbose >= 2)
481 482
		printf("annotating [%p] %30s : [%p] %30s\n",
		       dso, dso->long_name, sym, sym->name);
483

484
	sprintf(command, "objdump --start-address=0x%016Lx --stop-address=0x%016Lx -dS %s|grep -v %s",
485 486
		map__rip_2objdump(map, sym->start),
		map__rip_2objdump(map, sym->end),
487
		filename, filename);
488 489 490 491 492 493 494 495 496

	if (verbose >= 3)
		printf("doing: %s\n", command);

	file = popen(command, "r");
	if (!file)
		return;

	while (!feof(file)) {
497
		if (parse_line(file, he, &head) < 0)
498 499 500 501
			break;
	}

	pclose(file);
502 503 504 505 506 507 508 509 510 511

	if (verbose)
		hist_entry__print_hits(he);

	list_for_each_entry_safe(pos, n, &head, node) {
		objdump_line__print(pos, &head, he, len);
		list_del(&pos->node);
		objdump_line__free(pos);
	}

512
	if (print_line)
513
		free_source_line(he, len);
514 515
}

516
static void hists__find_annotations(struct hists *self)
517 518 519
{
	struct rb_node *nd;

520
	for (nd = rb_first(&self->entries); nd; nd = rb_next(nd)) {
521
		struct hist_entry *he = rb_entry(nd, struct hist_entry, rb_node);
522
		struct sym_priv *priv;
523

524
		if (he->ms.sym == NULL)
525
			continue;
526

527
		priv = symbol__priv(he->ms.sym);
528 529 530 531 532 533
		if (priv->hist == NULL)
			continue;

		annotate_sym(he);
		/*
		 * Since we have a hist_entry per IP for the same symbol, free
534
		 * he->ms.sym->hist to signal we already processed this symbol.
535 536 537
		 */
		free(priv->hist);
		priv->hist = NULL;
538 539 540
	}
}

541
static struct perf_event_ops event_ops = {
542 543 544 545
	.sample	= process_sample_event,
	.mmap	= event__process_mmap,
	.comm	= event__process_comm,
	.fork	= event__process_task,
L
Li Zefan 已提交
546 547
};

548 549
static int __cmd_annotate(void)
{
L
Li Zefan 已提交
550
	int ret;
551
	struct perf_session *session;
552

T
Tom Zanussi 已提交
553
	session = perf_session__new(input_name, O_RDONLY, force, false);
554 555 556
	if (session == NULL)
		return -ENOMEM;

557
	ret = perf_session__process_events(session, &event_ops);
L
Li Zefan 已提交
558
	if (ret)
559
		goto out_delete;
560

561 562
	if (dump_trace) {
		event__print_totals();
563
		goto out_delete;
564
	}
565

566
	if (verbose > 3)
567
		perf_session__fprintf(session, stdout);
568

569
	if (verbose > 2)
570
		perf_session__fprintf_dsos(session, stdout);
571

572 573 574
	hists__collapse_resort(&session->hists);
	hists__output_resort(&session->hists);
	hists__find_annotations(&session->hists);
575 576
out_delete:
	perf_session__delete(session);
577

L
Li Zefan 已提交
578
	return ret;
579 580 581 582 583 584 585 586 587 588
}

/* NULL-terminated usage strings passed to parse_options() and usage_with_options(). */
static const char * const annotate_usage[] = {
	"perf annotate [<options>] <command>",
	NULL
};

static const struct option options[] = {
	OPT_STRING('i', "input", &input_name, "file",
		    "input file name"),
589 590
	OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]",
		   "only consider symbols in these dsos"),
591
	OPT_STRING('s', "symbol", &sym_hist_filter, "symbol",
592
		    "symbol to annotate"),
593
	OPT_BOOLEAN('f', "force", &force, "don't complain, do it"),
594
	OPT_INCR('v', "verbose", &verbose,
595 596 597
		    "be more verbose (show symbol address, etc)"),
	OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
		    "dump raw trace in ASCII"),
598 599 600
	OPT_STRING('k', "vmlinux", &symbol_conf.vmlinux_name,
		   "file", "vmlinux pathname"),
	OPT_BOOLEAN('m', "modules", &symbol_conf.use_modules,
601
		    "load module symbols - WARNING: use only with -k and LIVE kernel"),
602 603
	OPT_BOOLEAN('l', "print-line", &print_line,
		    "print matching source lines (may be slow)"),
604 605
	OPT_BOOLEAN('P', "full-paths", &full_paths,
		    "Don't shorten the displayed pathnames"),
606 607 608
	OPT_END()
};

609
/*
 * Entry point of 'perf annotate': parse the command line, set up the
 * symbol layer and run the annotation.
 *
 * Returns -1 when symbol initialization fails or the field separator is
 * '.', otherwise the result of __cmd_annotate().
 */
int cmd_annotate(int argc, const char **argv, const char *prefix __used)
{
	argc = parse_options(argc, argv, options, annotate_usage, 0);

	/* Reserve room for our per-symbol private data. */
	symbol_conf.priv_size = sizeof(struct sym_priv);
	symbol_conf.try_vmlinux_path = true;

	if (symbol__init() < 0)
		return -1;

	setup_sorting(annotate_usage, options);

	/*
	 * Special case: if there's an argument left then assume that
	 * it's a symbol filter. More than one is a usage error.
	 */
	if (argc > 1)
		usage_with_options(annotate_usage, options);
	if (argc)
		sym_hist_filter = argv[0];

	setup_pager();

	if (field_sep != NULL && field_sep[0] == '.') {
		pr_err("'.' is the only non valid --field-separator argument\n");
		return -1;
	}

	return __cmd_annotate();
}