builtin-report.c 31.4 KB
Newer Older
1 2 3 4 5 6 7
/*
 * builtin-report.c
 *
 * Builtin report command: Analyze the perf.data input file,
 * look up and read DSOs and symbol information and display
 * a histogram of results, along various sorting keys.
 */
8
#include "builtin.h"
9

10 11
#include "util/util.h"

12
#include "util/color.h"
13
#include "util/list.h"
14
#include "util/cache.h"
15
#include "util/rbtree.h"
16
#include "util/symbol.h"
17
#include "util/string.h"
18

19
#include "perf.h"
20
#include "util/header.h"
21 22 23 24

#include "util/parse-options.h"
#include "util/parse-events.h"

25 26 27 28
#define SHOW_KERNEL	1
#define SHOW_USER	2
#define SHOW_HV		4

29
static char		const *input_name = "perf.data";
30
static char		*vmlinux = NULL;
31 32 33 34

static char		default_sort_order[] = "comm,dso";
static char		*sort_order = default_sort_order;

35 36 37
static int		input;
static int		show_mask = SHOW_KERNEL | SHOW_USER | SHOW_HV;

38
static int		dump_trace = 0;
I
Ingo Molnar 已提交
39
#define dprintf(x...)	do { if (dump_trace) printf(x); } while (0)
40
#define cdprintf(x...)	do { if (dump_trace) color_fprintf(stdout, color, x); } while (0)
I
Ingo Molnar 已提交
41

42
static int		verbose;
43 44
#define eprintf(x...)	do { if (verbose) fprintf(stderr, x); } while (0)

45
static int		full_paths;
46

47 48 49
static unsigned long	page_size;
static unsigned long	mmap_window = 32;

50 51
static char		default_parent_pattern[] = "^sys_|^do_page_fault";
static char		*parent_pattern = default_parent_pattern;
52
static regex_t		parent_regex;
53

54 55
static int		exclude_other = 1;

56 57
struct ip_event {
	struct perf_event_header header;
58 59
	u64 ip;
	u32 pid, tid;
60
	unsigned char __more_data[];
61
};
62

63
struct ip_callchain {
64 65
	u64 nr;
	u64 ips[0];
66 67
};

68 69
struct mmap_event {
	struct perf_event_header header;
70 71 72 73
	u32 pid, tid;
	u64 start;
	u64 len;
	u64 pgoff;
74 75
	char filename[PATH_MAX];
};
76

77 78
struct comm_event {
	struct perf_event_header header;
79
	u32 pid, tid;
80 81 82
	char comm[16];
};

83 84
struct fork_event {
	struct perf_event_header header;
85
	u32 pid, ppid;
86 87
};

88
struct period_event {
89
	struct perf_event_header header;
90 91 92
	u64 time;
	u64 id;
	u64 sample_period;
93 94
};

95 96
struct lost_event {
	struct perf_event_header header;
97 98
	u64 id;
	u64 lost;
99 100
};

101 102 103 104 105 106 107
typedef union event_union {
	struct perf_event_header	header;
	struct ip_event			ip;
	struct mmap_event		mmap;
	struct comm_event		comm;
	struct fork_event		fork;
	struct period_event		period;
108
	struct lost_event		lost;
109 110 111 112
} event_t;

static LIST_HEAD(dsos);
static struct dso *kernel_dso;
P
Peter Zijlstra 已提交
113
static struct dso *vdso;
114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132

static void dsos__add(struct dso *dso)
{
	list_add_tail(&dso->node, &dsos);
}

static struct dso *dsos__find(const char *name)
{
	struct dso *pos;

	list_for_each_entry(pos, &dsos, node)
		if (strcmp(pos->name, name) == 0)
			return pos;
	return NULL;
}

static struct dso *dsos__findnew(const char *name)
{
	struct dso *dso = dsos__find(name);
133
	int nr;
134

135 136 137 138 139 140
	if (dso)
		return dso;

	dso = dso__new(name, 0);
	if (!dso)
		goto out_delete_dso;
141

142
	nr = dso__load(dso, NULL, verbose);
143
	if (nr < 0) {
144
		eprintf("Failed to open: %s\n", name);
145
		goto out_delete_dso;
146
	}
147 148
	if (!nr)
		eprintf("No symbols found in: %s, maybe install a debug package?\n", name);
149 150

	dsos__add(dso);
151 152 153 154 155 156 157 158

	return dso;

out_delete_dso:
	dso__delete(dso);
	return NULL;
}

159
static void dsos__fprintf(FILE *fp)
160 161 162 163 164 165 166
{
	struct dso *pos;

	list_for_each_entry(pos, &dsos, node)
		dso__fprintf(pos, fp);
}

167
static struct symbol *vdso__find_symbol(struct dso *dso, u64 ip)
P
Peter Zijlstra 已提交
168 169 170 171
{
	return dso__find_symbol(kernel_dso, ip);
}

172 173
static int load_kernel(void)
{
174
	int err;
175

176
	kernel_dso = dso__new("[kernel]", 0);
177
	if (!kernel_dso)
178
		return -1;
179

180
	err = dso__load_kernel(kernel_dso, vmlinux, NULL, verbose);
181 182 183 184 185
	if (err) {
		dso__delete(kernel_dso);
		kernel_dso = NULL;
	} else
		dsos__add(kernel_dso);
186

P
Peter Zijlstra 已提交
187 188 189 190 191 192 193 194
	vdso = dso__new("[vdso]", 0);
	if (!vdso)
		return -1;

	vdso->find_symbol = vdso__find_symbol;

	dsos__add(vdso);

195
	return err;
196 197
}

198 199 200 201 202
static char __cwd[PATH_MAX];
static char *cwd = __cwd;
static int cwdlen;

static int strcommon(const char *pathname)
203 204 205 206 207 208 209 210 211
{
	int n = 0;

	while (pathname[n] == cwd[n] && n < cwdlen)
		++n;

	return n;
}

212 213
struct map {
	struct list_head node;
214 215 216 217
	u64	 start;
	u64	 end;
	u64	 pgoff;
	u64	 (*map_ip)(struct map *, u64);
218 219 220
	struct dso	 *dso;
};

221
static u64 map__map_ip(struct map *map, u64 ip)
P
Peter Zijlstra 已提交
222 223 224 225
{
	return ip - map->start + map->pgoff;
}

226
static u64 vdso__map_ip(struct map *map, u64 ip)
P
Peter Zijlstra 已提交
227 228 229 230
{
	return ip;
}

231 232 233 234 235
static inline int is_anon_memory(const char *filename)
{
     return strcmp(filename, "//anon") == 0;
}

236
static struct map *map__new(struct mmap_event *event)
237 238 239 240
{
	struct map *self = malloc(sizeof(*self));

	if (self != NULL) {
241 242
		const char *filename = event->filename;
		char newfilename[PATH_MAX];
243
		int anon;
244 245

		if (cwd) {
246 247
			int n = strcommon(filename);

248 249 250 251 252 253 254
			if (n == cwdlen) {
				snprintf(newfilename, sizeof(newfilename),
					 ".%s", filename + n);
				filename = newfilename;
			}
		}

255 256 257 258 259 260 261
		anon = is_anon_memory(filename);

		if (anon) {
			snprintf(newfilename, sizeof(newfilename), "/tmp/perf-%d.map", event->pid);
			filename = newfilename;
		}

262 263 264 265
		self->start = event->start;
		self->end   = event->start + event->len;
		self->pgoff = event->pgoff;

266
		self->dso = dsos__findnew(filename);
267 268
		if (self->dso == NULL)
			goto out_delete;
P
Peter Zijlstra 已提交
269

270
		if (self->dso == vdso || anon)
P
Peter Zijlstra 已提交
271 272 273
			self->map_ip = vdso__map_ip;
		else
			self->map_ip = map__map_ip;
274 275 276 277 278 279 280
	}
	return self;
out_delete:
	free(self);
	return NULL;
}

281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305
static struct map *map__clone(struct map *self)
{
	struct map *map = malloc(sizeof(*self));

	if (!map)
		return NULL;

	memcpy(map, self, sizeof(*self));

	return map;
}

static int map__overlap(struct map *l, struct map *r)
{
	if (l->start > r->start) {
		struct map *t = l;
		l = r;
		r = t;
	}

	if (l->end > r->start)
		return 1;

	return 0;
}
306

307 308
static size_t map__fprintf(struct map *self, FILE *fp)
{
309
	return fprintf(fp, " %Lx-%Lx %Lx %s\n",
310 311 312 313
		       self->start, self->end, self->pgoff, self->dso->name);
}


314
struct thread {
315
	struct rb_node	 rb_node;
316 317 318 319 320 321 322 323 324 325 326
	struct list_head maps;
	pid_t		 pid;
	char		 *comm;
};

static struct thread *thread__new(pid_t pid)
{
	struct thread *self = malloc(sizeof(*self));

	if (self != NULL) {
		self->pid = pid;
P
Peter Zijlstra 已提交
327
		self->comm = malloc(32);
328
		if (self->comm)
P
Peter Zijlstra 已提交
329
			snprintf(self->comm, 32, ":%d", self->pid);
330 331 332 333 334 335 336 337
		INIT_LIST_HEAD(&self->maps);
	}

	return self;
}

static int thread__set_comm(struct thread *self, const char *comm)
{
P
Peter Zijlstra 已提交
338 339
	if (self->comm)
		free(self->comm);
340 341 342 343
	self->comm = strdup(comm);
	return self->comm ? 0 : -ENOMEM;
}

344 345 346 347 348 349 350 351 352 353 354 355
static size_t thread__fprintf(struct thread *self, FILE *fp)
{
	struct map *pos;
	size_t ret = fprintf(fp, "Thread %d %s\n", self->pid, self->comm);

	list_for_each_entry(pos, &self->maps, node)
		ret += map__fprintf(pos, fp);

	return ret;
}


356
static struct rb_root threads;
357
static struct thread *last_match;
358

359
static struct thread *threads__findnew(pid_t pid)
360
{
361 362 363
	struct rb_node **p = &threads.rb_node;
	struct rb_node *parent = NULL;
	struct thread *th;
364

365 366 367 368 369 370 371 372
	/*
	 * Font-end cache - PID lookups come in blocks,
	 * so most of the time we dont have to look up
	 * the full rbtree:
	 */
	if (last_match && last_match->pid == pid)
		return last_match;

373 374 375
	while (*p != NULL) {
		parent = *p;
		th = rb_entry(parent, struct thread, rb_node);
376

377 378
		if (th->pid == pid) {
			last_match = th;
379
			return th;
380
		}
381

382 383 384 385
		if (pid < th->pid)
			p = &(*p)->rb_left;
		else
			p = &(*p)->rb_right;
386 387
	}

388 389 390 391
	th = thread__new(pid);
	if (th != NULL) {
		rb_link_node(&th->rb_node, parent, p);
		rb_insert_color(&th->rb_node, &threads);
392
		last_match = th;
393
	}
394

395
	return th;
396 397 398 399
}

static void thread__insert_map(struct thread *self, struct map *map)
{
400 401 402 403
	struct map *pos, *tmp;

	list_for_each_entry_safe(pos, tmp, &self->maps, node) {
		if (map__overlap(pos, map)) {
404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424
			if (verbose >= 2) {
				printf("overlapping maps:\n");
				map__fprintf(map, stdout);
				map__fprintf(pos, stdout);
			}

			if (map->start <= pos->start && map->end > pos->start)
				pos->start = map->end;

			if (map->end >= pos->end && map->start < pos->end)
				pos->end = map->start;

			if (verbose >= 2) {
				printf("after collision:\n");
				map__fprintf(pos, stdout);
			}

			if (pos->start >= pos->end) {
				list_del_init(&pos->node);
				free(pos);
			}
425 426 427
		}
	}

428 429 430
	list_add_tail(&map->node, &self->maps);
}

431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450
static int thread__fork(struct thread *self, struct thread *parent)
{
	struct map *map;

	if (self->comm)
		free(self->comm);
	self->comm = strdup(parent->comm);
	if (!self->comm)
		return -ENOMEM;

	list_for_each_entry(map, &parent->maps, node) {
		struct map *new = map__clone(map);
		if (!new)
			return -ENOMEM;
		thread__insert_map(self, new);
	}

	return 0;
}

451
static struct map *thread__find_map(struct thread *self, u64 ip)
452
{
453 454
	struct map *pos;

455 456 457 458 459 460 461 462 463 464
	if (self == NULL)
		return NULL;

	list_for_each_entry(pos, &self->maps, node)
		if (ip >= pos->start && ip <= pos->end)
			return pos;

	return NULL;
}

465 466 467 468 469 470 471 472 473 474 475 476 477 478
static size_t threads__fprintf(FILE *fp)
{
	size_t ret = 0;
	struct rb_node *nd;

	for (nd = rb_first(&threads); nd; nd = rb_next(nd)) {
		struct thread *pos = rb_entry(nd, struct thread, rb_node);

		ret += thread__fprintf(pos, fp);
	}

	return ret;
}

479 480 481 482 483 484 485 486 487 488 489 490 491
/*
 * histogram, sorted on item, collects counts
 */

static struct rb_root hist;

struct hist_entry {
	struct rb_node	 rb_node;

	struct thread	 *thread;
	struct map	 *map;
	struct dso	 *dso;
	struct symbol	 *sym;
492
	struct symbol	 *parent;
493
	u64		 ip;
494 495
	char		 level;

496
	u64		 count;
497 498
};

499 500 501 502 503 504 505
/*
 * configurable sorting bits
 */

struct sort_entry {
	struct list_head list;

506 507
	char *header;

508
	int64_t (*cmp)(struct hist_entry *, struct hist_entry *);
P
Peter Zijlstra 已提交
509
	int64_t (*collapse)(struct hist_entry *, struct hist_entry *);
510 511 512
	size_t	(*print)(FILE *fp, struct hist_entry *);
};

513 514 515 516 517 518 519 520 521 522
static int64_t cmp_null(void *l, void *r)
{
	if (!l && !r)
		return 0;
	else if (!l)
		return -1;
	else
		return 1;
}

P
Peter Zijlstra 已提交
523 524
/* --sort pid */

525
static int64_t
526
sort__thread_cmp(struct hist_entry *left, struct hist_entry *right)
527
{
528 529 530 531 532 533
	return right->thread->pid - left->thread->pid;
}

static size_t
sort__thread_print(FILE *fp, struct hist_entry *self)
{
534
	return fprintf(fp, "%16s:%5d", self->thread->comm ?: "", self->thread->pid);
535
}
536

537
static struct sort_entry sort_thread = {
538
	.header = "         Command:  Pid",
539 540 541 542
	.cmp	= sort__thread_cmp,
	.print	= sort__thread_print,
};

P
Peter Zijlstra 已提交
543 544
/* --sort comm */

545 546
static int64_t
sort__comm_cmp(struct hist_entry *left, struct hist_entry *right)
P
Peter Zijlstra 已提交
547 548 549 550 551 552
{
	return right->thread->pid - left->thread->pid;
}

static int64_t
sort__comm_collapse(struct hist_entry *left, struct hist_entry *right)
553 554 555 556
{
	char *comm_l = left->thread->comm;
	char *comm_r = right->thread->comm;

557 558
	if (!comm_l || !comm_r)
		return cmp_null(comm_l, comm_r);
559 560 561 562 563 564 565

	return strcmp(comm_l, comm_r);
}

static size_t
sort__comm_print(FILE *fp, struct hist_entry *self)
{
566
	return fprintf(fp, "%16s", self->thread->comm);
567 568 569
}

static struct sort_entry sort_comm = {
570
	.header		= "         Command",
P
Peter Zijlstra 已提交
571 572 573
	.cmp		= sort__comm_cmp,
	.collapse	= sort__comm_collapse,
	.print		= sort__comm_print,
574 575
};

P
Peter Zijlstra 已提交
576 577
/* --sort dso */

578 579 580 581 582 583
static int64_t
sort__dso_cmp(struct hist_entry *left, struct hist_entry *right)
{
	struct dso *dso_l = left->dso;
	struct dso *dso_r = right->dso;

584 585
	if (!dso_l || !dso_r)
		return cmp_null(dso_l, dso_r);
586 587 588 589 590 591 592

	return strcmp(dso_l->name, dso_r->name);
}

static size_t
sort__dso_print(FILE *fp, struct hist_entry *self)
{
593
	if (self->dso)
594
		return fprintf(fp, "%-25s", self->dso->name);
595

596
	return fprintf(fp, "%016llx         ", (u64)self->ip);
597 598 599
}

static struct sort_entry sort_dso = {
600
	.header = "Shared Object            ",
601 602 603 604
	.cmp	= sort__dso_cmp,
	.print	= sort__dso_print,
};

P
Peter Zijlstra 已提交
605 606
/* --sort symbol */

607 608 609
static int64_t
sort__sym_cmp(struct hist_entry *left, struct hist_entry *right)
{
610
	u64 ip_l, ip_r;
611 612 613 614 615 616 617 618 619 620

	if (left->sym == right->sym)
		return 0;

	ip_l = left->sym ? left->sym->start : left->ip;
	ip_r = right->sym ? right->sym->start : right->ip;

	return (int64_t)(ip_r - ip_l);
}

621 622 623 624 625 626
static size_t
sort__sym_print(FILE *fp, struct hist_entry *self)
{
	size_t ret = 0;

	if (verbose)
627
		ret += fprintf(fp, "%#018llx  ", (u64)self->ip);
628

629 630 631 632
	if (self->sym) {
		ret += fprintf(fp, "[%c] %s",
			self->dso == kernel_dso ? 'k' : '.', self->sym->name);
	} else {
633
		ret += fprintf(fp, "%#016llx", (u64)self->ip);
634
	}
635 636 637 638 639

	return ret;
}

static struct sort_entry sort_sym = {
640
	.header = "Symbol",
641 642
	.cmp	= sort__sym_cmp,
	.print	= sort__sym_print,
643 644
};

645
/* --sort parent */
646 647

static int64_t
648
sort__parent_cmp(struct hist_entry *left, struct hist_entry *right)
649
{
650 651
	struct symbol *sym_l = left->parent;
	struct symbol *sym_r = right->parent;
652 653 654 655 656 657 658 659

	if (!sym_l || !sym_r)
		return cmp_null(sym_l, sym_r);

	return strcmp(sym_l->name, sym_r->name);
}

static size_t
660
sort__parent_print(FILE *fp, struct hist_entry *self)
661 662 663
{
	size_t ret = 0;

664
	ret += fprintf(fp, "%-20s", self->parent ? self->parent->name : "[other]");
665 666 667 668

	return ret;
}

669 670 671 672
static struct sort_entry sort_parent = {
	.header = "Parent symbol       ",
	.cmp	= sort__parent_cmp,
	.print	= sort__parent_print,
673 674
};

P
Peter Zijlstra 已提交
675
static int sort__need_collapse = 0;
676
static int sort__has_parent = 0;
P
Peter Zijlstra 已提交
677

678
struct sort_dimension {
679 680 681
	char			*name;
	struct sort_entry	*entry;
	int			taken;
682 683 684 685
};

static struct sort_dimension sort_dimensions[] = {
	{ .name = "pid",	.entry = &sort_thread,	},
686
	{ .name = "comm",	.entry = &sort_comm,	},
687
	{ .name = "dso",	.entry = &sort_dso,	},
688
	{ .name = "symbol",	.entry = &sort_sym,	},
689
	{ .name = "parent",	.entry = &sort_parent,	},
690 691
};

692 693
static LIST_HEAD(hist_entry__sort_list);

694 695 696 697 698 699 700 701 702 703
static int sort_dimension__add(char *tok)
{
	int i;

	for (i = 0; i < ARRAY_SIZE(sort_dimensions); i++) {
		struct sort_dimension *sd = &sort_dimensions[i];

		if (sd->taken)
			continue;

704
		if (strncasecmp(tok, sd->name, strlen(tok)))
705 706
			continue;

P
Peter Zijlstra 已提交
707 708 709
		if (sd->entry->collapse)
			sort__need_collapse = 1;

710 711
		if (sd->entry == &sort_parent) {
			int ret = regcomp(&parent_regex, parent_pattern, REG_EXTENDED);
712 713 714
			if (ret) {
				char err[BUFSIZ];

715 716 717
				regerror(ret, &parent_regex, err, sizeof(err));
				fprintf(stderr, "Invalid regex: %s\n%s",
					parent_pattern, err);
718 719
				exit(-1);
			}
720
			sort__has_parent = 1;
721 722
		}

723 724
		list_add_tail(&sd->entry->list, &hist_entry__sort_list);
		sd->taken = 1;
725

726 727 728 729 730 731
		return 0;
	}

	return -ESRCH;
}

732 733 734 735 736 737 738 739 740 741 742 743 744 745 746
static int64_t
hist_entry__cmp(struct hist_entry *left, struct hist_entry *right)
{
	struct sort_entry *se;
	int64_t cmp = 0;

	list_for_each_entry(se, &hist_entry__sort_list, list) {
		cmp = se->cmp(left, right);
		if (cmp)
			break;
	}

	return cmp;
}

P
Peter Zijlstra 已提交
747 748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765
static int64_t
hist_entry__collapse(struct hist_entry *left, struct hist_entry *right)
{
	struct sort_entry *se;
	int64_t cmp = 0;

	list_for_each_entry(se, &hist_entry__sort_list, list) {
		int64_t (*f)(struct hist_entry *, struct hist_entry *);

		f = se->collapse ?: se->cmp;

		cmp = f(left, right);
		if (cmp)
			break;
	}

	return cmp;
}

766
static size_t
767
hist_entry__fprintf(FILE *fp, struct hist_entry *self, u64 total_samples)
768 769 770 771
{
	struct sort_entry *se;
	size_t ret;

772 773 774
	if (exclude_other && !self->parent)
		return 0;

775
	if (total_samples) {
776 777 778 779
		double percent = self->count * 100.0 / total_samples;
		char *color = PERF_COLOR_NORMAL;

		/*
780 781 782
		 * We color high-overhead entries in red, mid-overhead
		 * entries in green - and keep the low overhead places
		 * normal:
783
		 */
784
		if (percent >= 5.0) {
785
			color = PERF_COLOR_RED;
786 787 788 789
		} else {
			if (percent >= 0.5)
				color = PERF_COLOR_GREEN;
		}
790 791

		ret = color_fprintf(fp, color, "   %6.2f%%",
792 793
				(self->count * 100.0) / total_samples);
	} else
794
		ret = fprintf(fp, "%12Ld ", self->count);
795

796
	list_for_each_entry(se, &hist_entry__sort_list, list) {
797 798 799
		if (exclude_other && (se == &sort_parent))
			continue;

800
		fprintf(fp, "  ");
801
		ret += se->print(fp, self);
802
	}
803 804 805 806 807 808

	ret += fprintf(fp, "\n");

	return ret;
}

809 810 811 812 813 814
/*
 *
 */

static struct symbol *
resolve_symbol(struct thread *thread, struct map **mapp,
815
	       struct dso **dsop, u64 *ipp)
816 817 818
{
	struct dso *dso = dsop ? *dsop : NULL;
	struct map *map = mapp ? *mapp : NULL;
819
	u64 ip = *ipp;
820 821 822 823 824 825 826 827 828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848

	if (!thread)
		return NULL;

	if (dso)
		goto got_dso;

	if (map)
		goto got_map;

	map = thread__find_map(thread, ip);
	if (map != NULL) {
		if (mapp)
			*mapp = map;
got_map:
		ip = map->map_ip(map, ip);

		dso = map->dso;
	} else {
		/*
		 * If this is outside of all known maps,
		 * and is a negative address, try to look it
		 * up in the kernel dso, as it might be a
		 * vsyscall (which executes in user-mode):
		 */
		if ((long long)ip < 0)
		dso = kernel_dso;
	}
	dprintf(" ...... dso: %s\n", dso ? dso->name : "<not found>");
849 850
	dprintf(" ...... map: %Lx -> %Lx\n", *ipp, ip);
	*ipp  = ip;
851 852 853 854 855 856 857 858 859 860

	if (dsop)
		*dsop = dso;

	if (!dso)
		return NULL;
got_dso:
	return dso->find_symbol(dso, ip);
}

861
static int call__match(struct symbol *sym)
862
{
863
	if (sym->name && !regexec(&parent_regex, sym->name, 0, NULL, 0))
864
		return 1;
865

866
	return 0;
867 868
}

869 870 871 872
/*
 * collect histogram counts
 */

873 874
static int
hist_entry__add(struct thread *thread, struct map *map, struct dso *dso,
875 876
		struct symbol *sym, u64 ip, struct ip_callchain *chain,
		char level, u64 count)
877
{
878 879 880 881 882 883 884 885 886 887
	struct rb_node **p = &hist.rb_node;
	struct rb_node *parent = NULL;
	struct hist_entry *he;
	struct hist_entry entry = {
		.thread	= thread,
		.map	= map,
		.dso	= dso,
		.sym	= sym,
		.ip	= ip,
		.level	= level,
888
		.count	= count,
889
		.parent = NULL,
890 891 892
	};
	int cmp;

893
	if (sort__has_parent && chain) {
894
		u64 context = PERF_CONTEXT_MAX;
895 896 897
		int i;

		for (i = 0; i < chain->nr; i++) {
898
			u64 ip = chain->ips[i];
899 900 901 902 903 904 905 906 907 908 909 910 911 912 913 914
			struct dso *dso = NULL;
			struct symbol *sym;

			if (ip >= PERF_CONTEXT_MAX) {
				context = ip;
				continue;
			}

			switch (context) {
			case PERF_CONTEXT_KERNEL:
				dso = kernel_dso;
				break;
			default:
				break;
			}

915
			sym = resolve_symbol(thread, NULL, &dso, &ip);
916 917 918 919 920

			if (sym && call__match(sym)) {
				entry.parent = sym;
				break;
			}
921 922 923
		}
	}

924 925 926 927 928 929 930
	while (*p != NULL) {
		parent = *p;
		he = rb_entry(parent, struct hist_entry, rb_node);

		cmp = hist_entry__cmp(&entry, he);

		if (!cmp) {
931
			he->count += count;
932 933 934 935 936 937 938
			return 0;
		}

		if (cmp < 0)
			p = &(*p)->rb_left;
		else
			p = &(*p)->rb_right;
939
	}
940 941 942 943 944 945 946 947 948

	he = malloc(sizeof(*he));
	if (!he)
		return -ENOMEM;
	*he = entry;
	rb_link_node(&he->rb_node, parent, p);
	rb_insert_color(&he->rb_node, &hist);

	return 0;
949 950
}

P
Peter Zijlstra 已提交
951 952 953 954 955 956 957 958 959 960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008
static void hist_entry__free(struct hist_entry *he)
{
	free(he);
}

/*
 * collapse the histogram
 */

static struct rb_root collapse_hists;

static void collapse__insert_entry(struct hist_entry *he)
{
	struct rb_node **p = &collapse_hists.rb_node;
	struct rb_node *parent = NULL;
	struct hist_entry *iter;
	int64_t cmp;

	while (*p != NULL) {
		parent = *p;
		iter = rb_entry(parent, struct hist_entry, rb_node);

		cmp = hist_entry__collapse(iter, he);

		if (!cmp) {
			iter->count += he->count;
			hist_entry__free(he);
			return;
		}

		if (cmp < 0)
			p = &(*p)->rb_left;
		else
			p = &(*p)->rb_right;
	}

	rb_link_node(&he->rb_node, parent, p);
	rb_insert_color(&he->rb_node, &collapse_hists);
}

static void collapse__resort(void)
{
	struct rb_node *next;
	struct hist_entry *n;

	if (!sort__need_collapse)
		return;

	next = rb_first(&hist);
	while (next) {
		n = rb_entry(next, struct hist_entry, rb_node);
		next = rb_next(&n->rb_node);

		rb_erase(&n->rb_node, &hist);
		collapse__insert_entry(n);
	}
}

1009 1010 1011 1012 1013 1014 1015
/*
 * reverse the map, sort on count.
 */

static struct rb_root output_hists;

static void output__insert_entry(struct hist_entry *he)
1016
{
1017
	struct rb_node **p = &output_hists.rb_node;
1018
	struct rb_node *parent = NULL;
1019
	struct hist_entry *iter;
1020 1021 1022

	while (*p != NULL) {
		parent = *p;
1023
		iter = rb_entry(parent, struct hist_entry, rb_node);
1024

1025
		if (he->count > iter->count)
1026 1027 1028 1029 1030
			p = &(*p)->rb_left;
		else
			p = &(*p)->rb_right;
	}

1031 1032
	rb_link_node(&he->rb_node, parent, p);
	rb_insert_color(&he->rb_node, &output_hists);
1033 1034
}

1035
static void output__resort(void)
1036
{
P
Peter Zijlstra 已提交
1037
	struct rb_node *next;
1038
	struct hist_entry *n;
1039
	struct rb_root *tree = &hist;
1040

P
Peter Zijlstra 已提交
1041
	if (sort__need_collapse)
1042 1043 1044
		tree = &collapse_hists;

	next = rb_first(tree);
P
Peter Zijlstra 已提交
1045

1046 1047 1048
	while (next) {
		n = rb_entry(next, struct hist_entry, rb_node);
		next = rb_next(&n->rb_node);
1049

1050
		rb_erase(&n->rb_node, tree);
1051
		output__insert_entry(n);
1052 1053 1054
	}
}

1055
static size_t output__fprintf(FILE *fp, u64 total_samples)
1056
{
1057
	struct hist_entry *pos;
1058
	struct sort_entry *se;
1059 1060 1061
	struct rb_node *nd;
	size_t ret = 0;

1062
	fprintf(fp, "\n");
1063
	fprintf(fp, "#\n");
1064
	fprintf(fp, "# (%Ld samples)\n", (u64)total_samples);
1065 1066 1067
	fprintf(fp, "#\n");

	fprintf(fp, "# Overhead");
1068 1069 1070
	list_for_each_entry(se, &hist_entry__sort_list, list) {
		if (exclude_other && (se == &sort_parent))
			continue;
1071
		fprintf(fp, "  %s", se->header);
1072
	}
1073 1074 1075
	fprintf(fp, "\n");

	fprintf(fp, "# ........");
1076
	list_for_each_entry(se, &hist_entry__sort_list, list) {
1077 1078
		int i;

1079 1080 1081
		if (exclude_other && (se == &sort_parent))
			continue;

1082
		fprintf(fp, "  ");
1083
		for (i = 0; i < strlen(se->header); i++)
1084
			fprintf(fp, ".");
1085
	}
1086 1087 1088
	fprintf(fp, "\n");

	fprintf(fp, "#\n");
1089

1090 1091 1092
	for (nd = rb_first(&output_hists); nd; nd = rb_next(nd)) {
		pos = rb_entry(nd, struct hist_entry, rb_node);
		ret += hist_entry__fprintf(fp, pos, total_samples);
1093 1094
	}

1095 1096
	if (sort_order == default_sort_order &&
			parent_pattern == default_parent_pattern) {
1097
		fprintf(fp, "#\n");
1098
		fprintf(fp, "# (For more details, try: perf report --sort comm,dso,symbol)\n");
1099 1100
		fprintf(fp, "#\n");
	}
1101
	fprintf(fp, "\n");
1102

1103 1104 1105
	return ret;
}

1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116
static void register_idle_thread(void)
{
	struct thread *thread = threads__findnew(0);

	if (thread == NULL ||
			thread__set_comm(thread, "[idle]")) {
		fprintf(stderr, "problem inserting idle task.\n");
		exit(-1);
	}
}

1117 1118 1119 1120
static unsigned long total = 0,
		     total_mmap = 0,
		     total_comm = 0,
		     total_fork = 0,
1121 1122
		     total_unknown = 0,
		     total_lost = 0;
1123

1124
static int validate_chain(struct ip_callchain *chain, event_t *event)
1125 1126 1127 1128 1129 1130
{
	unsigned int chain_size;

	chain_size = event->header.size;
	chain_size -= (unsigned long)&event->ip.__more_data - (unsigned long)event;

1131
	if (chain->nr*sizeof(u64) > chain_size)
1132 1133 1134 1135 1136
		return -1;

	return 0;
}

1137
static int
1138 1139 1140 1141 1142 1143
process_overflow_event(event_t *event, unsigned long offset, unsigned long head)
{
	char level;
	int show = 0;
	struct dso *dso = NULL;
	struct thread *thread = threads__findnew(event->ip.pid);
1144 1145
	u64 ip = event->ip.ip;
	u64 period = 1;
1146
	struct map *map = NULL;
1147
	void *more_data = event->ip.__more_data;
1148
	struct ip_callchain *chain = NULL;
1149

1150
	if (event->header.type & PERF_SAMPLE_PERIOD) {
1151 1152
		period = *(u64 *)more_data;
		more_data += sizeof(u64);
1153
	}
1154

1155
	dprintf("%p [%p]: PERF_EVENT (IP, %d): %d: %p period: %Ld\n",
1156 1157 1158 1159
		(void *)(offset + head),
		(void *)(long)(event->header.size),
		event->header.misc,
		event->ip.pid,
1160
		(void *)(long)ip,
1161
		(long long)period);
1162

1163 1164 1165 1166 1167
	if (event->header.type & PERF_SAMPLE_CALLCHAIN) {
		int i;

		chain = (void *)more_data;

1168
		dprintf("... chain: nr:%Lu\n", chain->nr);
1169

1170 1171 1172 1173 1174 1175
		if (validate_chain(chain, event) < 0) {
			eprintf("call-chain problem with event, skipping it.\n");
			return 0;
		}

		if (dump_trace) {
1176
			for (i = 0; i < chain->nr; i++)
1177
				dprintf("..... %2d: %016Lx\n", i, chain->ips[i]);
1178 1179 1180
		}
	}

1181 1182 1183
	dprintf(" ... thread: %s:%d\n", thread->comm, thread->pid);

	if (thread == NULL) {
1184
		eprintf("problem processing %d event, skipping it.\n",
1185 1186 1187
			event->header.type);
		return -1;
	}
1188

1189 1190 1191
	if (event->header.misc & PERF_EVENT_MISC_KERNEL) {
		show = SHOW_KERNEL;
		level = 'k';
1192

1193
		dso = kernel_dso;
1194

1195
		dprintf(" ...... dso: %s\n", dso->name);
1196

1197
	} else if (event->header.misc & PERF_EVENT_MISC_USER) {
1198

1199 1200
		show = SHOW_USER;
		level = '.';
1201

1202 1203 1204 1205 1206
	} else {
		show = SHOW_HV;
		level = 'H';
		dprintf(" ...... dso: [hypervisor]\n");
	}
1207

1208
	if (show & show_mask) {
1209
		struct symbol *sym = resolve_symbol(thread, &map, &dso, &ip);
1210

1211
		if (hist_entry__add(thread, map, dso, sym, ip, chain, level, period)) {
1212
			eprintf("problem incrementing symbol count, skipping event\n");
1213
			return -1;
1214
		}
1215
	}
1216
	total += period;
1217

1218 1219
	return 0;
}
I
Ingo Molnar 已提交
1220

1221 1222 1223 1224 1225 1226
static int
process_mmap_event(event_t *event, unsigned long offset, unsigned long head)
{
	struct thread *thread = threads__findnew(event->mmap.pid);
	struct map *map = map__new(&event->mmap);

1227
	dprintf("%p [%p]: PERF_EVENT_MMAP %d: [%p(%p) @ %p]: %s\n",
1228 1229
		(void *)(offset + head),
		(void *)(long)(event->header.size),
1230
		event->mmap.pid,
1231 1232 1233 1234 1235 1236 1237
		(void *)(long)event->mmap.start,
		(void *)(long)event->mmap.len,
		(void *)(long)event->mmap.pgoff,
		event->mmap.filename);

	if (thread == NULL || map == NULL) {
		dprintf("problem processing PERF_EVENT_MMAP, skipping event.\n");
1238
		return 0;
1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256 1257 1258 1259 1260
	}

	thread__insert_map(thread, map);
	total_mmap++;

	return 0;
}

static int
process_comm_event(event_t *event, unsigned long offset, unsigned long head)
{
	struct thread *thread = threads__findnew(event->comm.pid);

	dprintf("%p [%p]: PERF_EVENT_COMM: %s:%d\n",
		(void *)(offset + head),
		(void *)(long)(event->header.size),
		event->comm.comm, event->comm.pid);

	if (thread == NULL ||
	    thread__set_comm(thread, event->comm.comm)) {
		dprintf("problem processing PERF_EVENT_COMM, skipping event.\n");
		return -1;
1261
	}
1262 1263 1264 1265 1266
	total_comm++;

	return 0;
}

1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286
static int
process_fork_event(event_t *event, unsigned long offset, unsigned long head)
{
	struct thread *thread = threads__findnew(event->fork.pid);
	struct thread *parent = threads__findnew(event->fork.ppid);

	dprintf("%p [%p]: PERF_EVENT_FORK: %d:%d\n",
		(void *)(offset + head),
		(void *)(long)(event->header.size),
		event->fork.pid, event->fork.ppid);

	if (!thread || !parent || thread__fork(thread, parent)) {
		dprintf("problem processing PERF_EVENT_FORK, skipping event.\n");
		return -1;
	}
	total_fork++;

	return 0;
}

1287 1288 1289 1290 1291 1292 1293 1294 1295 1296 1297 1298 1299
static int
process_period_event(event_t *event, unsigned long offset, unsigned long head)
{
	dprintf("%p [%p]: PERF_EVENT_PERIOD: time:%Ld, id:%Ld: period:%Ld\n",
		(void *)(offset + head),
		(void *)(long)(event->header.size),
		event->period.time,
		event->period.id,
		event->period.sample_period);

	return 0;
}

1300 1301 1302 1303 1304 1305 1306 1307 1308 1309 1310 1311 1312 1313
static int
process_lost_event(event_t *event, unsigned long offset, unsigned long head)
{
	dprintf("%p [%p]: PERF_EVENT_LOST: id:%Ld: lost:%Ld\n",
		(void *)(offset + head),
		(void *)(long)(event->header.size),
		event->lost.id,
		event->lost.lost);

	total_lost += event->lost.lost;

	return 0;
}

1314 1315 1316
static void trace_event(event_t *event)
{
	unsigned char *raw_event = (void *)event;
1317
	char *color = PERF_COLOR_BLUE;
1318 1319 1320 1321 1322
	int i, j;

	if (!dump_trace)
		return;

1323 1324
	dprintf(".");
	cdprintf("\n. ... raw event: size %d bytes\n", event->header.size);
1325 1326

	for (i = 0; i < event->header.size; i++) {
1327 1328 1329 1330
		if ((i & 15) == 0) {
			dprintf(".");
			cdprintf("  %04x: ", i);
		}
1331

1332
		cdprintf(" %02x", raw_event[i]);
1333 1334

		if (((i & 15) == 15) || i == event->header.size-1) {
1335
			cdprintf("  ");
1336
			for (j = 0; j < 15-(i & 15); j++)
1337
				cdprintf("   ");
1338
			for (j = 0; j < (i & 15); j++) {
1339
				if (isprint(raw_event[i-15+j]))
1340
					cdprintf("%c", raw_event[i-15+j]);
1341
				else
1342
					cdprintf(".");
1343
			}
1344
			cdprintf("\n");
1345 1346 1347 1348 1349
		}
	}
	dprintf(".\n");
}

1350 1351 1352
static int
process_event(event_t *event, unsigned long offset, unsigned long head)
{
1353 1354
	trace_event(event);

1355 1356 1357 1358 1359 1360 1361 1362 1363 1364
	if (event->header.misc & PERF_EVENT_MISC_OVERFLOW)
		return process_overflow_event(event, offset, head);

	switch (event->header.type) {
	case PERF_EVENT_MMAP:
		return process_mmap_event(event, offset, head);

	case PERF_EVENT_COMM:
		return process_comm_event(event, offset, head);

1365 1366 1367
	case PERF_EVENT_FORK:
		return process_fork_event(event, offset, head);

1368 1369
	case PERF_EVENT_PERIOD:
		return process_period_event(event, offset, head);
1370 1371 1372 1373

	case PERF_EVENT_LOST:
		return process_lost_event(event, offset, head);

1374 1375 1376
	/*
	 * We dont process them right now but they are fine:
	 */
1377

1378 1379 1380 1381
	case PERF_EVENT_THROTTLE:
	case PERF_EVENT_UNTHROTTLE:
		return 0;

1382 1383 1384 1385 1386 1387 1388
	default:
		return -1;
	}

	return 0;
}

1389 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403
static struct perf_header	*header;

static int perf_header__has_sample(u64 sample_mask)
{
	int i;

	for (i = 0; i < header->attrs; i++) {
		struct perf_header_attr *attr = header->attr[i];

		if (!(attr->attr.sample_type & sample_mask))
			return 0;
	}

	return 1;
}
1404

1405 1406
static int __cmd_report(void)
{
1407
	int ret, rc = EXIT_FAILURE;
1408
	unsigned long offset = 0;
1409
	unsigned long head, shift;
1410 1411 1412
	struct stat stat;
	event_t *event;
	uint32_t size;
1413
	char *buf;
1414 1415 1416 1417 1418

	register_idle_thread();

	input = open(input_name, O_RDONLY);
	if (input < 0) {
1419 1420 1421 1422
		fprintf(stderr, " failed to open file: %s", input_name);
		if (!strcmp(input_name, "perf.data"))
			fprintf(stderr, "  (try 'perf record' first)");
		fprintf(stderr, "\n");
1423 1424 1425 1426 1427 1428 1429 1430 1431 1432 1433 1434 1435 1436
		exit(-1);
	}

	ret = fstat(input, &stat);
	if (ret < 0) {
		perror("failed to stat file");
		exit(-1);
	}

	if (!stat.st_size) {
		fprintf(stderr, "zero-sized file, nothing to do!\n");
		exit(0);
	}

1437 1438
	header = perf_header__read(input);
	head = header->data_offset;
1439 1440

	if (sort__has_parent &&
1441
	    !perf_header__has_sample(PERF_SAMPLE_CALLCHAIN)) {
1442 1443 1444 1445
		fprintf(stderr, "selected --sort parent, but no callchain data\n");
		exit(-1);
	}

1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 1457 1458 1459 1460
	if (load_kernel() < 0) {
		perror("failed to load kernel symbols");
		return EXIT_FAILURE;
	}

	if (!full_paths) {
		if (getcwd(__cwd, sizeof(__cwd)) == NULL) {
			perror("failed to get the current directory");
			return EXIT_FAILURE;
		}
		cwdlen = strlen(cwd);
	} else {
		cwd = NULL;
		cwdlen = 0;
	}
1461 1462 1463 1464 1465

	shift = page_size * (head / page_size);
	offset += shift;
	head -= shift;

1466 1467 1468 1469 1470 1471 1472 1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483
remap:
	buf = (char *)mmap(NULL, page_size * mmap_window, PROT_READ,
			   MAP_SHARED, input, offset);
	if (buf == MAP_FAILED) {
		perror("failed to mmap file");
		exit(-1);
	}

more:
	event = (event_t *)(buf + head);

	size = event->header.size;
	if (!size)
		size = 8;

	if (head + event->header.size >= page_size * mmap_window) {
		int ret;

1484 1485
		shift = page_size * (head / page_size);

1486 1487 1488 1489 1490 1491 1492 1493 1494 1495
		ret = munmap(buf, page_size * mmap_window);
		assert(ret == 0);

		offset += shift;
		head -= shift;
		goto remap;
	}

	size = event->header.size;

1496
	dprintf("\n%p [%p]: event: %d\n",
1497 1498 1499 1500
			(void *)(offset + head),
			(void *)(long)event->header.size,
			event->header.type);

1501 1502
	if (!size || process_event(event, offset, head) < 0) {

I
Ingo Molnar 已提交
1503 1504 1505 1506
		dprintf("%p [%p]: skipping unknown header type: %d\n",
			(void *)(offset + head),
			(void *)(long)(event->header.size),
			event->header.type);
1507

1508
		total_unknown++;
1509 1510 1511 1512 1513 1514 1515 1516 1517 1518

		/*
		 * assume we lost track of the stream, check alignment, and
		 * increment a single u64 in the hope to catch on again 'soon'.
		 */

		if (unlikely(head & 7))
			head &= ~7ULL;

		size = 8;
1519
	}
1520

1521
	head += size;
I
Ingo Molnar 已提交
1522

1523
	if (offset + head >= header->data_offset + header->data_size)
1524 1525
		goto done;

1526 1527 1528
	if (offset + head < stat.st_size)
		goto more;

1529
done:
1530 1531
	rc = EXIT_SUCCESS;
	close(input);
1532

I
Ingo Molnar 已提交
1533 1534 1535
	dprintf("      IP events: %10ld\n", total);
	dprintf("    mmap events: %10ld\n", total_mmap);
	dprintf("    comm events: %10ld\n", total_comm);
1536
	dprintf("    fork events: %10ld\n", total_fork);
1537
	dprintf("    lost events: %10ld\n", total_lost);
I
Ingo Molnar 已提交
1538
	dprintf(" unknown events: %10ld\n", total_unknown);
1539

I
Ingo Molnar 已提交
1540
	if (dump_trace)
1541 1542
		return 0;

1543 1544 1545
	if (verbose >= 3)
		threads__fprintf(stdout);

1546
	if (verbose >= 2)
1547 1548
		dsos__fprintf(stdout);

P
Peter Zijlstra 已提交
1549
	collapse__resort();
1550 1551
	output__resort();
	output__fprintf(stdout, total);
1552 1553 1554 1555

	return rc;
}

1556 1557 1558 1559 1560 1561 1562 1563
static const char * const report_usage[] = {
	"perf report [<options>] <command>",
	NULL
};

static const struct option options[] = {
	OPT_STRING('i', "input", &input_name, "file",
		    "input file name"),
1564 1565
	OPT_BOOLEAN('v', "verbose", &verbose,
		    "be more verbose (show symbol address, etc)"),
1566 1567
	OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
		    "dump raw trace in ASCII"),
1568
	OPT_STRING('k', "vmlinux", &vmlinux, "file", "vmlinux pathname"),
1569
	OPT_STRING('s', "sort", &sort_order, "key[,key2...]",
1570
		   "sort by key(s): pid, comm, dso, symbol, parent"),
1571 1572
	OPT_BOOLEAN('P', "full-paths", &full_paths,
		    "Don't shorten the pathnames taking into account the cwd"),
1573 1574
	OPT_STRING('p', "parent", &parent_pattern, "regex",
		   "regex filter to identify parent, see: '--sort parent'"),
1575 1576
	OPT_BOOLEAN('x', "exclude-other", &exclude_other,
		    "Only display entries with parent-match"),
1577 1578 1579
	OPT_END()
};

1580 1581 1582 1583 1584 1585 1586 1587 1588 1589 1590 1591 1592 1593 1594
static void setup_sorting(void)
{
	char *tmp, *tok, *str = strdup(sort_order);

	for (tok = strtok_r(str, ", ", &tmp);
			tok; tok = strtok_r(NULL, ", ", &tmp)) {
		if (sort_dimension__add(tok) < 0) {
			error("Unknown --sort key: `%s'", tok);
			usage_with_options(report_usage, options);
		}
	}

	free(str);
}

1595 1596
int cmd_report(int argc, const char **argv, const char *prefix)
{
1597
	symbol__init();
1598 1599 1600

	page_size = getpagesize();

1601
	argc = parse_options(argc, argv, options, report_usage, 0);
1602

1603 1604
	setup_sorting();

1605 1606 1607 1608 1609
	if (parent_pattern != default_parent_pattern)
		sort_dimension__add("parent");
	else
		exclude_other = 0;

1610 1611 1612 1613 1614 1615
	/*
	 * Any (unrecognized) arguments left?
	 */
	if (argc)
		usage_with_options(report_usage, options);

1616 1617
	setup_pager();

1618 1619
	return __cmd_report();
}