builtin-annotate.c 12.0 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12
/*
 * builtin-annotate.c
 *
 * Builtin annotate command: Analyze the perf.data input file,
 * look up and read DSOs and symbol information and display
 * a histogram of results, along various sorting keys.
 */
#include "builtin.h"

#include "util/util.h"

#include "util/color.h"
13
#include <linux/list.h>
14
#include "util/cache.h"
15
#include <linux/rbtree.h>
16 17 18 19
#include "util/symbol.h"
#include "util/string.h"

#include "perf.h"
20
#include "util/debug.h"
21

22
#include "util/event.h"
23 24
#include "util/parse-options.h"
#include "util/parse-events.h"
25
#include "util/thread.h"
26
#include "util/sort.h"
27
#include "util/hist.h"
28
#include "util/session.h"
29 30 31

static char		const *input_name = "perf.data";

32
static int		force;
33

34 35
static int		full_paths;

36 37
static int		print_line;

38 39 40 41 42
struct sym_hist {
	u64		sum;
	u64		ip[0];
};

43
struct sym_ext {
44
	struct rb_node	node;
45 46 47 48
	double		percent;
	char		*path;
};

49 50 51 52 53
struct sym_priv {
	struct sym_hist	*hist;
	struct sym_ext	*ext;
};

54 55 56 57 58
static struct symbol_conf symbol_conf = {
	.priv_size	  = sizeof(struct sym_priv),
	.try_vmlinux_path = true,
};

59 60
static const char *sym_hist_filter;

61
static int symbol_filter(struct map *map __used, struct symbol *sym)
62
{
63 64
	if (sym_hist_filter == NULL ||
	    strcmp(sym->name, sym_hist_filter) == 0) {
65
		struct sym_priv *priv = symbol__priv(sym);
66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81
		const int size = (sizeof(*priv->hist) +
				  (sym->end - sym->start) * sizeof(u64));

		priv->hist = malloc(size);
		if (priv->hist)
			memset(priv->hist, 0, size);
		return 0;
	}
	/*
	 * FIXME: We should really filter it out, as we don't want to go thru symbols
	 * we're not interested, and if a DSO ends up with no symbols, delete it too,
	 * but right now the kernel loading routines in symbol.c bail out if no symbols
	 * are found, fix it later.
	 */
	return 0;
}
82

83 84 85
/*
 * collect histogram counts
 */
86
static void hist_hit(struct hist_entry *he, u64 ip)
87
{
88 89
	unsigned int sym_size, offset;
	struct symbol *sym = he->sym;
90 91
	struct sym_priv *priv;
	struct sym_hist *h;
92

93
	he->count++;
94

95 96 97
	if (!sym || !he->map)
		return;

98
	priv = symbol__priv(sym);
99
	if (!priv->hist)
100
		return;
101

102 103
	sym_size = sym->end - sym->start;
	offset = ip - sym->start;
104

105 106 107 108
	if (verbose)
		fprintf(stderr, "%s: ip=%Lx\n", __func__,
			he->map->unmap_ip(he->map, ip));

109 110
	if (offset >= sym_size)
		return;
111

112 113 114
	h = priv->hist;
	h->sum++;
	h->ip[offset]++;
115

116 117
	if (verbose >= 3)
		printf("%p %s: count++ [ip: %p, %08Lx] => %Ld\n",
118
			(void *)(unsigned long)he->sym->start,
119
			he->sym->name,
120
			(void *)(unsigned long)ip, ip - he->sym->start,
121
			h->ip[offset]);
122 123
}

124
static int hist_entry__add(struct addr_location *al, u64 count)
125
{
126
	bool hit;
127
	struct hist_entry *he = __hist_entry__add(al, NULL, count, &hit);
128
	if (he == NULL)
129
		return -ENOMEM;
130
	hist_hit(he, al->addr);
131 132 133
	return 0;
}

134
static int process_sample_event(event_t *event, struct perf_session *session)
135
{
136
	struct addr_location al;
137

138
	dump_printf("(IP, %d): %d: %p\n", event->header.misc,
139
		    event->ip.pid, (void *)(long)event->ip.ip);
140

141
	if (event__preprocess_sample(event, session, &al, symbol_filter) < 0) {
142 143 144 145 146
		fprintf(stderr, "problem processing %d event, skipping it.\n",
			event->header.type);
		return -1;
	}

147
	if (hist_entry__add(&al, 1)) {
148 149 150
		fprintf(stderr, "problem incrementing symbol count, "
				"skipping event\n");
		return -1;
151 152 153 154 155
	}

	return 0;
}

156
static int parse_line(FILE *file, struct hist_entry *he, u64 len)
157
{
158
	struct symbol *sym = he->sym;
159
	char *line = NULL, *tmp, *tmp2;
160 161
	static const char *prev_line;
	static const char *prev_color;
162 163
	unsigned int offset;
	size_t line_len;
164
	u64 start;
165
	s64 line_ip;
166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200
	int ret;
	char *c;

	if (getline(&line, &line_len, file) < 0)
		return -1;
	if (!line)
		return -1;

	c = strchr(line, '\n');
	if (c)
		*c = 0;

	line_ip = -1;
	offset = 0;
	ret = -2;

	/*
	 * Strip leading spaces:
	 */
	tmp = line;
	while (*tmp) {
		if (*tmp != ' ')
			break;
		tmp++;
	}

	if (*tmp) {
		/*
		 * Parse hexa addresses followed by ':'
		 */
		line_ip = strtoull(tmp, &tmp2, 16);
		if (*tmp2 != ':')
			line_ip = -1;
	}

201 202
	start = he->map->unmap_ip(he->map, sym->start);

203
	if (line_ip != -1) {
204
		const char *path = NULL;
205 206
		unsigned int hits = 0;
		double percent = 0.0;
207
		const char *color;
208
		struct sym_priv *priv = symbol__priv(sym);
209 210
		struct sym_ext *sym_ext = priv->ext;
		struct sym_hist *h = priv->hist;
211

212
		offset = line_ip - start;
213
		if (offset < len)
214
			hits = h->ip[offset];
215

216
		if (offset < len && sym_ext) {
217 218
			path = sym_ext[offset].path;
			percent = sym_ext[offset].percent;
219 220
		} else if (h->sum)
			percent = 100.0 * hits / h->sum;
221

222
		color = get_percent_color(percent);
223

224 225 226 227 228 229 230 231 232 233 234 235 236 237
		/*
		 * Also color the filename and line if needed, with
		 * the same color than the percentage. Don't print it
		 * twice for close colored ip with the same filename:line
		 */
		if (path) {
			if (!prev_line || strcmp(prev_line, path)
				       || color != prev_color) {
				color_fprintf(stdout, color, " %s", path);
				prev_line = path;
				prev_color = color;
			}
		}

238 239 240 241 242 243 244 245 246 247 248 249 250
		color_fprintf(stdout, color, " %7.2f", percent);
		printf(" :	");
		color_fprintf(stdout, PERF_COLOR_BLUE, "%s\n", line);
	} else {
		if (!*line)
			printf("         :\n");
		else
			printf("         :	%s\n", line);
	}

	return 0;
}

251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272
static struct rb_root root_sym_ext;

static void insert_source_line(struct sym_ext *sym_ext)
{
	struct sym_ext *iter;
	struct rb_node **p = &root_sym_ext.rb_node;
	struct rb_node *parent = NULL;

	while (*p != NULL) {
		parent = *p;
		iter = rb_entry(parent, struct sym_ext, node);

		if (sym_ext->percent > iter->percent)
			p = &(*p)->rb_left;
		else
			p = &(*p)->rb_right;
	}

	rb_link_node(&sym_ext->node, parent, p);
	rb_insert_color(&sym_ext->node, &root_sym_ext);
}

273
static void free_source_line(struct hist_entry *he, int len)
274
{
275
	struct sym_priv *priv = symbol__priv(he->sym);
276
	struct sym_ext *sym_ext = priv->ext;
277 278 279 280 281 282 283 284 285
	int i;

	if (!sym_ext)
		return;

	for (i = 0; i < len; i++)
		free(sym_ext[i].path);
	free(sym_ext);

286
	priv->ext = NULL;
287
	root_sym_ext = RB_ROOT;
288 289 290
}

/* Get the filename:line for the colored entries */
291
static void
292
get_source_line(struct hist_entry *he, int len, const char *filename)
293
{
294 295
	struct symbol *sym = he->sym;
	u64 start;
296 297 298
	int i;
	char cmd[PATH_MAX * 2];
	struct sym_ext *sym_ext;
299
	struct sym_priv *priv = symbol__priv(sym);
300
	struct sym_hist *h = priv->hist;
301

302
	if (!h->sum)
303 304
		return;

305 306
	sym_ext = priv->ext = calloc(len, sizeof(struct sym_ext));
	if (!priv->ext)
307 308
		return;

309
	start = he->map->unmap_ip(he->map, sym->start);
310 311 312 313

	for (i = 0; i < len; i++) {
		char *path = NULL;
		size_t line_len;
314
		u64 offset;
315 316
		FILE *fp;

317
		sym_ext[i].percent = 100.0 * h->ip[i] / h->sum;
318 319 320
		if (sym_ext[i].percent <= 0.5)
			continue;

321
		offset = start + i;
322
		sprintf(cmd, "addr2line -e %s %016llx", filename, offset);
323 324 325 326 327 328 329
		fp = popen(cmd, "r");
		if (!fp)
			continue;

		if (getline(&path, &line_len, fp) < 0 || !line_len)
			goto next;

330
		sym_ext[i].path = malloc(sizeof(char) * line_len + 1);
331 332 333 334
		if (!sym_ext[i].path)
			goto next;

		strcpy(sym_ext[i].path, path);
335
		insert_source_line(&sym_ext[i]);
336 337 338 339 340 341

	next:
		pclose(fp);
	}
}

342
static void print_summary(const char *filename)
343 344 345 346 347 348 349 350 351 352 353 354 355 356 357
{
	struct sym_ext *sym_ext;
	struct rb_node *node;

	printf("\nSorted summary for file %s\n", filename);
	printf("----------------------------------------------\n\n");

	if (RB_EMPTY_ROOT(&root_sym_ext)) {
		printf(" Nothing higher than %1.1f%%\n", MIN_GREEN);
		return;
	}

	node = rb_first(&root_sym_ext);
	while (node) {
		double percent;
358
		const char *color;
359 360 361 362
		char *path;

		sym_ext = rb_entry(node, struct sym_ext, node);
		percent = sym_ext->percent;
363
		color = get_percent_color(percent);
364 365 366 367 368 369 370
		path = sym_ext->path;

		color_fprintf(stdout, color, " %7.2f %s", percent, path);
		node = rb_next(node);
	}
}

371
static void annotate_sym(struct hist_entry *he)
372
{
373 374 375
	struct map *map = he->map;
	struct dso *dso = map->dso;
	struct symbol *sym = he->sym;
376 377
	const char *filename = dso->long_name, *d_filename;
	u64 len;
378 379 380 381 382
	char command[PATH_MAX*2];
	FILE *file;

	if (!filename)
		return;
383

384 385 386 387 388 389
	if (verbose)
		fprintf(stderr, "%s: filename=%s, sym=%s, start=%Lx, end=%Lx\n",
			__func__, filename, sym->name,
			map->unmap_ip(map, sym->start),
			map->unmap_ip(map, sym->end));

390 391 392 393
	if (full_paths)
		d_filename = filename;
	else
		d_filename = basename(filename);
394 395 396

	len = sym->end - sym->start;

397
	if (print_line) {
398
		get_source_line(he, len, filename);
399 400 401 402
		print_summary(filename);
	}

	printf("\n\n------------------------------------------------\n");
403
	printf(" Percent |	Source code & Disassembly of %s\n", d_filename);
404 405 406
	printf("------------------------------------------------\n");

	if (verbose >= 2)
407 408
		printf("annotating [%p] %30s : [%p] %30s\n",
		       dso, dso->long_name, sym, sym->name);
409

410
	sprintf(command, "objdump --start-address=0x%016Lx --stop-address=0x%016Lx -dS %s|grep -v %s",
411 412
		map->unmap_ip(map, sym->start), map->unmap_ip(map, sym->end),
		filename, filename);
413 414 415 416 417 418 419 420 421

	if (verbose >= 3)
		printf("doing: %s\n", command);

	file = popen(command, "r");
	if (!file)
		return;

	while (!feof(file)) {
422
		if (parse_line(file, he, len) < 0)
423 424 425 426
			break;
	}

	pclose(file);
427
	if (print_line)
428
		free_source_line(he, len);
429 430 431 432 433 434
}

static void find_annotations(void)
{
	struct rb_node *nd;

435
	for (nd = rb_first(&hist); nd; nd = rb_next(nd)) {
436
		struct hist_entry *he = rb_entry(nd, struct hist_entry, rb_node);
437
		struct sym_priv *priv;
438

439 440
		if (he->sym == NULL)
			continue;
441

442
		priv = symbol__priv(he->sym);
443 444 445 446 447 448 449 450 451 452
		if (priv->hist == NULL)
			continue;

		annotate_sym(he);
		/*
		 * Since we have a hist_entry per IP for the same symbol, free
		 * he->sym->hist to signal we already processed this symbol.
		 */
		free(priv->hist);
		priv->hist = NULL;
453 454 455
	}
}

456
static struct perf_event_ops event_ops = {
L
Li Zefan 已提交
457 458 459 460 461 462
	.process_sample_event	= process_sample_event,
	.process_mmap_event	= event__process_mmap,
	.process_comm_event	= event__process_comm,
	.process_fork_event	= event__process_task,
};

463 464
static int __cmd_annotate(void)
{
465
	struct perf_session *session = perf_session__new(input_name, O_RDONLY,
466
							 force, &symbol_conf);
L
Li Zefan 已提交
467
	int ret;
468

469 470 471
	if (session == NULL)
		return -ENOMEM;

472
	ret = perf_session__process_events(session, &event_ops);
L
Li Zefan 已提交
473
	if (ret)
474
		goto out_delete;
475

476 477
	if (dump_trace) {
		event__print_totals();
478
		goto out_delete;
479
	}
480

481
	if (verbose > 3)
482
		perf_session__fprintf(session, stdout);
483

484
	if (verbose > 2)
485 486 487
		dsos__fprintf(stdout);

	collapse__resort();
488
	output__resort(event__total[0]);
489 490

	find_annotations();
491 492
out_delete:
	perf_session__delete(session);
493

L
Li Zefan 已提交
494
	return ret;
495 496 497 498 499 500 501 502 503 504
}

static const char * const annotate_usage[] = {
	"perf annotate [<options>] <command>",
	NULL
};

static const struct option options[] = {
	OPT_STRING('i', "input", &input_name, "file",
		    "input file name"),
505
	OPT_STRING('s', "symbol", &sym_hist_filter, "symbol",
506
		    "symbol to annotate"),
507
	OPT_BOOLEAN('f', "force", &force, "don't complain, do it"),
508 509 510 511
	OPT_BOOLEAN('v', "verbose", &verbose,
		    "be more verbose (show symbol address, etc)"),
	OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
		    "dump raw trace in ASCII"),
512 513 514
	OPT_STRING('k', "vmlinux", &symbol_conf.vmlinux_name,
		   "file", "vmlinux pathname"),
	OPT_BOOLEAN('m', "modules", &symbol_conf.use_modules,
515
		    "load module symbols - WARNING: use only with -k and LIVE kernel"),
516 517
	OPT_BOOLEAN('l', "print-line", &print_line,
		    "print matching source lines (may be slow)"),
518 519
	OPT_BOOLEAN('P', "full-paths", &full_paths,
		    "Don't shorten the displayed pathnames"),
520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537
	OPT_END()
};

static void setup_sorting(void)
{
	char *tmp, *tok, *str = strdup(sort_order);

	for (tok = strtok_r(str, ", ", &tmp);
			tok; tok = strtok_r(NULL, ", ", &tmp)) {
		if (sort_dimension__add(tok) < 0) {
			error("Unknown --sort key: `%s'", tok);
			usage_with_options(annotate_usage, options);
		}
	}

	free(str);
}

538
int cmd_annotate(int argc, const char **argv, const char *prefix __used)
539
{
540 541
	if (symbol__init(&symbol_conf) < 0)
		return -1;
542 543 544 545 546

	argc = parse_options(argc, argv, options, annotate_usage, 0);

	setup_sorting();

547 548 549 550 551 552 553 554 555 556 557
	if (argc) {
		/*
		 * Special case: if there's an argument left then assume tha
		 * it's a symbol filter:
		 */
		if (argc > 1)
			usage_with_options(annotate_usage, options);

		sym_hist_filter = argv[0];
	}

558 559
	setup_pager();

560 561 562 563 564 565
	if (field_sep && *field_sep == '.') {
		fputs("'.' is the only non valid --field-separator argument\n",
				stderr);
		exit(129);
	}

566 567
	return __cmd_annotate();
}