builtin-report.c 25.4 KB
Newer Older
1 2 3 4 5 6 7
/*
 * builtin-report.c
 *
 * Builtin report command: Analyze the perf.data input file,
 * look up and read DSOs and symbol information and display
 * a histogram of results, along various sorting keys.
 */
8
#include "builtin.h"
9

10
#include "util/util.h"
11
#include "util/cache.h"
12

13
#include "util/annotate.h"
14
#include "util/color.h"
15
#include <linux/list.h>
16
#include <linux/rbtree.h>
17
#include "util/symbol.h"
18
#include "util/callchain.h"
19
#include "util/strlist.h"
20
#include "util/values.h"
21

22
#include "perf.h"
23
#include "util/debug.h"
24 25
#include "util/evlist.h"
#include "util/evsel.h"
26
#include "util/header.h"
27
#include "util/session.h"
28
#include "util/tool.h"
29 30 31 32

#include "util/parse-options.h"
#include "util/parse-events.h"

33
#include "util/thread.h"
34
#include "util/sort.h"
35
#include "util/hist.h"
36
#include "util/data.h"
37
#include "arch/common.h"
38

39
#include <dlfcn.h>
40 41
#include <linux/bitmap.h>

42
struct report {
43
	struct perf_tool	tool;
44
	struct perf_session	*session;
45
	bool			force, use_tui, use_gtk, use_stdio;
46 47 48 49 50
	bool			hide_unresolved;
	bool			dont_use_callchains;
	bool			show_full_info;
	bool			show_threads;
	bool			inverted_callchain;
51
	bool			mem_mode;
52 53
	bool			header;
	bool			header_only;
54
	int			max_stack;
55 56 57
	struct perf_read_values	show_threads_values;
	const char		*pretty_printing_style;
	const char		*cpu_list;
58
	const char		*symbol_filter_str;
59
	float			min_percent;
60
	u64			nr_entries;
61
	DECLARE_BITMAP(cpu_bitmap, MAX_NR_CPUS);
62
};
63

64
static int report__config(const char *var, const char *value, void *cb)
65 66 67 68 69
{
	if (!strcmp(var, "report.group")) {
		symbol_conf.event_group = perf_config_bool(var, value);
		return 0;
	}
70
	if (!strcmp(var, "report.percent-limit")) {
71
		struct report *rep = cb;
72 73 74
		rep->min_percent = strtof(value, NULL);
		return 0;
	}
75 76 77 78

	return perf_default_config(var, value, cb);
}

79 80 81 82 83 84 85 86 87
static void report__inc_stats(struct report *rep, struct hist_entry *he)
{
	/*
	 * The @he is either of a newly created one or an existing one
	 * merging current sample.  We only want to count a new one so
	 * checking ->nr_events being 1.
	 */
	if (he->stat.nr_events == 1)
		rep->nr_entries++;
88 89 90 91 92 93 94 95 96 97

	/*
	 * Only counts number of samples at this stage as it's more
	 * natural to do it here and non-sample events are also
	 * counted in perf_session_deliver_event().  The dump_trace
	 * requires this info is ready before going to the output tree.
	 */
	hists__inc_nr_events(he->hists, PERF_RECORD_SAMPLE);
	if (!he->filtered)
		he->hists->stats.nr_non_filtered_samples++;
98 99
}

100
static int report__add_mem_hist_entry(struct report *rep, struct addr_location *al,
101
				      struct perf_sample *sample, struct perf_evsel *evsel)
102 103 104 105 106
{
	struct symbol *parent = NULL;
	struct hist_entry *he;
	struct mem_info *mi, *mx;
	uint64_t cost;
107
	int err = sample__resolve_callchain(sample, &parent, evsel, al, rep->max_stack);
108

109 110
	if (err)
		return err;
111

112
	mi = sample__resolve_mem(sample, al);
113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129
	if (!mi)
		return -ENOMEM;

	if (rep->hide_unresolved && !al->sym)
		return 0;

	cost = sample->weight;
	if (!cost)
		cost = 1;

	/*
	 * must pass period=weight in order to get the correct
	 * sorting from hists__collapse_resort() which is solely
	 * based on periods. We want sorting be done on nr_events * weight
	 * and this is indirectly achieved by passing period=weight here
	 * and the he_stat__add_period() function.
	 */
130 131
	he = __hists__add_entry(&evsel->hists, al, parent, NULL, mi,
				cost, cost, 0);
132 133 134
	if (!he)
		return -ENOMEM;

135 136 137 138
	if (ui__has_annotation()) {
		err = hist_entry__inc_addr_samples(he, evsel->idx, al->addr);
		if (err)
			goto out;
139

140 141 142 143 144
		mx = he->mem_info;
		err = addr_map_symbol__inc_samples(&mx->daddr, evsel->idx);
		if (err)
			goto out;
	}
145

146 147
	report__inc_stats(rep, he);

148
	err = hist_entry__append_callchain(he, sample);
149 150 151 152
out:
	return err;
}

153
static int report__add_branch_hist_entry(struct report *rep, struct addr_location *al,
154
					 struct perf_sample *sample, struct perf_evsel *evsel)
155 156 157 158
{
	struct symbol *parent = NULL;
	unsigned i;
	struct hist_entry *he;
159
	struct branch_info *bi, *bx;
160
	int err = sample__resolve_callchain(sample, &parent, evsel, al, rep->max_stack);
161

162 163
	if (err)
		return err;
164

165
	bi = sample__resolve_bstack(sample, al);
166 167 168 169 170 171
	if (!bi)
		return -ENOMEM;

	for (i = 0; i < sample->branch_stack->nr; i++) {
		if (rep->hide_unresolved && !(bi[i].from.sym && bi[i].to.sym))
			continue;
172 173 174

		err = -ENOMEM;

175 176 177 178
		/* overwrite the 'al' to branch-to info */
		al->map = bi[i].to.map;
		al->sym = bi[i].to.sym;
		al->addr = bi[i].to.addr;
179 180 181 182
		/*
		 * The report shows the percentage of total branches captured
		 * and not events sampled. Thus we use a pseudo period of 1.
		 */
183 184
		he = __hists__add_entry(&evsel->hists, al, parent, &bi[i], NULL,
					1, 1, 0);
185
		if (he) {
186 187 188 189 190 191 192 193 194 195 196 197
			if (ui__has_annotation()) {
				bx = he->branch_info;
				err = addr_map_symbol__inc_samples(&bx->from,
								   evsel->idx);
				if (err)
					goto out;

				err = addr_map_symbol__inc_samples(&bx->to,
								   evsel->idx);
				if (err)
					goto out;
			}
198
			report__inc_stats(rep, he);
199
		} else
200
			goto out;
201
	}
202
	err = 0;
203
out:
204
	free(bi);
205 206 207
	return err;
}

208
static int report__add_hist_entry(struct report *rep, struct perf_evsel *evsel,
209
				  struct addr_location *al, struct perf_sample *sample)
210
{
211
	struct symbol *parent = NULL;
212
	struct hist_entry *he;
213
	int err = sample__resolve_callchain(sample, &parent, evsel, al, rep->max_stack);
214

215 216
	if (err)
		return err;
217

218 219 220
	he = __hists__add_entry(&evsel->hists, al, parent, NULL, NULL,
				sample->period, sample->weight,
				sample->transaction);
221
	if (he == NULL)
222 223
		return -ENOMEM;

224 225 226
	err = hist_entry__append_callchain(he, sample);
	if (err)
		goto out;
227

228 229 230
	if (ui__has_annotation())
		err = hist_entry__inc_addr_samples(he, evsel->idx, al->addr);

231 232
	report__inc_stats(rep, he);

233
out:
234
	return err;
235 236
}

237

238
static int process_sample_event(struct perf_tool *tool,
239
				union perf_event *event,
240
				struct perf_sample *sample,
241
				struct perf_evsel *evsel,
242
				struct machine *machine)
243
{
244
	struct report *rep = container_of(tool, struct report, tool);
245
	struct addr_location al;
246
	int ret;
247

248
	if (perf_event__preprocess_sample(event, machine, &al, sample) < 0) {
249 250
		pr_debug("problem processing %d event, skipping it.\n",
			 event->header.type);
251 252
		return -1;
	}
253

254
	if (rep->hide_unresolved && al.sym == NULL)
255
		return 0;
256

257
	if (rep->cpu_list && !test_bit(sample->cpu, rep->cpu_bitmap))
258 259
		return 0;

260
	if (sort__mode == SORT_MODE__BRANCH) {
261
		ret = report__add_branch_hist_entry(rep, &al, sample, evsel);
262
		if (ret < 0)
263
			pr_debug("problem adding lbr entry, skipping event\n");
264
	} else if (rep->mem_mode == 1) {
265
		ret = report__add_mem_hist_entry(rep, &al, sample, evsel);
266
		if (ret < 0)
267
			pr_debug("problem adding mem entry, skipping event\n");
268 269 270
	} else {
		if (al.map != NULL)
			al.map->dso->hit = 1;
271

272
		ret = report__add_hist_entry(rep, evsel, &al, sample);
273
		if (ret < 0)
274
			pr_debug("problem incrementing symbol period, skipping event\n");
275
	}
276
	return ret;
277
}
I
Ingo Molnar 已提交
278

279
static int process_read_event(struct perf_tool *tool,
280
			      union perf_event *event,
281
			      struct perf_sample *sample __maybe_unused,
282
			      struct perf_evsel *evsel,
283
			      struct machine *machine __maybe_unused)
284
{
285
	struct report *rep = container_of(tool, struct report, tool);
286

287
	if (rep->show_threads) {
288
		const char *name = evsel ? perf_evsel__name(evsel) : "unknown";
289
		perf_read_values_add_value(&rep->show_threads_values,
290 291 292 293 294 295
					   event->read.pid, event->read.tid,
					   event->read.id,
					   name,
					   event->read.value);
	}

296
	dump_printf(": %d %d %s %" PRIu64 "\n", event->read.pid, event->read.tid,
297
		    evsel ? perf_evsel__name(evsel) : "FAIL",
298
		    event->read.value);
299 300 301 302

	return 0;
}

303
/* For pipe mode, sample_type is not currently set */
304
static int report__setup_sample_type(struct report *rep)
305
{
306 307 308
	struct perf_session *session = rep->session;
	u64 sample_type = perf_evlist__combined_sample_type(session->evlist);
	bool is_pipe = perf_data_file__is_pipe(session->file);
309

310
	if (!is_pipe && !(sample_type & PERF_SAMPLE_CALLCHAIN)) {
311
		if (sort__has_parent) {
312
			ui__error("Selected --sort parent, but no "
313 314
				    "callchain data. Did you call "
				    "'perf record' without -g?\n");
315
			return -EINVAL;
316
		}
317
		if (symbol_conf.use_callchain) {
318
			ui__error("Selected -g but no callchain data. Did "
319
				    "you call 'perf record' without -g?\n");
320
			return -1;
321
		}
322 323
	} else if (!rep->dont_use_callchains &&
		   callchain_param.mode != CHAIN_NONE &&
324
		   !symbol_conf.use_callchain) {
325
			symbol_conf.use_callchain = true;
326
			if (callchain_register_param(&callchain_param) < 0) {
327
				ui__error("Can't register callchain params.\n");
328
				return -EINVAL;
329
			}
330 331
	}

332
	if (sort__mode == SORT_MODE__BRANCH) {
333
		if (!is_pipe &&
334
		    !(sample_type & PERF_SAMPLE_BRANCH_STACK)) {
335 336
			ui__error("Selected -b but no branch data. "
				  "Did you call perf record without -b?\n");
337 338 339 340
			return -1;
		}
	}

341 342
	return 0;
}
343

344
static void sig_handler(int sig __maybe_unused)
345 346 347 348
{
	session_done = 1;
}

349
static size_t hists__fprintf_nr_sample_events(struct hists *hists, struct report *rep,
350 351 352 353
					      const char *evname, FILE *fp)
{
	size_t ret;
	char unit;
354 355 356
	unsigned long nr_samples = hists->stats.nr_events[PERF_RECORD_SAMPLE];
	u64 nr_events = hists->stats.total_period;
	struct perf_evsel *evsel = hists_to_evsel(hists);
357 358 359
	char buf[512];
	size_t size = sizeof(buf);

360 361 362 363 364
	if (symbol_conf.filter_relative) {
		nr_samples = hists->stats.nr_non_filtered_samples;
		nr_events = hists->stats.total_non_filtered_period;
	}

365
	if (perf_evsel__is_group_event(evsel)) {
366 367 368 369 370 371
		struct perf_evsel *pos;

		perf_evsel__group_desc(evsel, buf, size);
		evname = buf;

		for_each_group_member(pos, evsel) {
372 373 374 375 376 377 378
			if (symbol_conf.filter_relative) {
				nr_samples += pos->hists.stats.nr_non_filtered_samples;
				nr_events += pos->hists.stats.total_non_filtered_period;
			} else {
				nr_samples += pos->hists.stats.nr_events[PERF_RECORD_SAMPLE];
				nr_events += pos->hists.stats.total_period;
			}
379 380
		}
	}
381

382 383
	nr_samples = convert_unit(nr_samples, &unit);
	ret = fprintf(fp, "# Samples: %lu%c", nr_samples, unit);
384
	if (evname != NULL)
385 386
		ret += fprintf(fp, " of event '%s'", evname);

387 388 389 390 391
	if (rep->mem_mode) {
		ret += fprintf(fp, "\n# Total weight : %" PRIu64, nr_events);
		ret += fprintf(fp, "\n# Sort order   : %s", sort_order);
	} else
		ret += fprintf(fp, "\n# Event count (approx.): %" PRIu64, nr_events);
392 393 394
	return ret + fprintf(fp, "\n#\n");
}

395
static int perf_evlist__tty_browse_hists(struct perf_evlist *evlist,
396
					 struct report *rep,
397
					 const char *help)
398
{
399
	struct perf_evsel *pos;
400

401
	evlist__for_each(evlist, pos) {
402
		struct hists *hists = &pos->hists;
403
		const char *evname = perf_evsel__name(pos);
404

405 406 407 408
		if (symbol_conf.event_group &&
		    !perf_evsel__is_group_leader(pos))
			continue;

409
		hists__fprintf_nr_sample_events(hists, rep, evname, stdout);
410
		hists__fprintf(hists, true, 0, 0, rep->min_percent, stdout);
411 412 413 414 415 416 417
		fprintf(stdout, "\n\n");
	}

	if (sort_order == default_sort_order &&
	    parent_pattern == default_parent_pattern) {
		fprintf(stdout, "#\n# (%s)\n#\n", help);

418 419 420
		if (rep->show_threads) {
			bool style = !strcmp(rep->pretty_printing_style, "raw");
			perf_read_values_display(stdout, &rep->show_threads_values,
421
						 style);
422
			perf_read_values_destroy(&rep->show_threads_values);
423 424 425 426 427 428
		}
	}

	return 0;
}

429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457
static void report__warn_kptr_restrict(const struct report *rep)
{
	struct map *kernel_map = rep->session->machines.host.vmlinux_maps[MAP__FUNCTION];
	struct kmap *kernel_kmap = map__kmap(kernel_map);

	if (kernel_map == NULL ||
	    (kernel_map->dso->hit &&
	     (kernel_kmap->ref_reloc_sym == NULL ||
	      kernel_kmap->ref_reloc_sym->addr == 0))) {
		const char *desc =
		    "As no suitable kallsyms nor vmlinux was found, kernel samples\n"
		    "can't be resolved.";

		if (kernel_map) {
			const struct dso *kdso = kernel_map->dso;
			if (!RB_EMPTY_ROOT(&kdso->symbols[MAP__FUNCTION])) {
				desc = "If some relocation was applied (e.g. "
				       "kexec) symbols may be misresolved.";
			}
		}

		ui__warning(
"Kernel address maps (/proc/{kallsyms,modules}) were restricted.\n\n"
"Check /proc/sys/kernel/kptr_restrict before running 'perf record'.\n\n%s\n\n"
"Samples in kernel modules can't be resolved as well.\n\n",
		desc);
	}
}

458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502
static int report__gtk_browse_hists(struct report *rep, const char *help)
{
	int (*hist_browser)(struct perf_evlist *evlist, const char *help,
			    struct hist_browser_timer *timer, float min_pcnt);

	hist_browser = dlsym(perf_gtk_handle, "perf_evlist__gtk_browse_hists");

	if (hist_browser == NULL) {
		ui__error("GTK browser not found!\n");
		return -1;
	}

	return hist_browser(rep->session->evlist, help, NULL, rep->min_percent);
}

static int report__browse_hists(struct report *rep)
{
	int ret;
	struct perf_session *session = rep->session;
	struct perf_evlist *evlist = session->evlist;
	const char *help = "For a higher level overview, try: perf report --sort comm,dso";

	switch (use_browser) {
	case 1:
		ret = perf_evlist__tui_browse_hists(evlist, help, NULL,
						    rep->min_percent,
						    &session->header.env);
		/*
		 * Usually "ret" is the last pressed key, and we only
		 * care if the key notifies us to switch data file.
		 */
		if (ret != K_SWITCH_INPUT_DATA)
			ret = 0;
		break;
	case 2:
		ret = report__gtk_browse_hists(rep, help);
		break;
	default:
		ret = perf_evlist__tty_browse_hists(evlist, rep, help);
		break;
	}

	return ret;
}

503
static void report__collapse_hists(struct report *rep)
504 505 506 507
{
	struct ui_progress prog;
	struct perf_evsel *pos;

508
	ui_progress__init(&prog, rep->nr_entries, "Merging related events...");
509

510
	evlist__for_each(rep->session->evlist, pos) {
511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530
		struct hists *hists = &pos->hists;

		if (pos->idx == 0)
			hists->symbol_filter_str = rep->symbol_filter_str;

		hists__collapse_resort(hists, &prog);

		/* Non-group events are considered as leader */
		if (symbol_conf.event_group &&
		    !perf_evsel__is_group_leader(pos)) {
			struct hists *leader_hists = &pos->leader->hists;

			hists__match(leader_hists, hists);
			hists__link(leader_hists, hists);
		}
	}

	ui_progress__finish();
}

531
static int __cmd_report(struct report *rep)
532
{
533
	int ret;
534
	struct perf_session *session = rep->session;
535
	struct perf_evsel *pos;
536
	struct perf_data_file *file = session->file;
537

538 539
	signal(SIGINT, sig_handler);

540 541 542
	if (rep->cpu_list) {
		ret = perf_session__cpu_bitmap(session, rep->cpu_list,
					       rep->cpu_bitmap);
543
		if (ret)
544
			return ret;
545 546
	}

547 548
	if (rep->show_threads)
		perf_read_values_init(&rep->show_threads_values);
549

550
	ret = report__setup_sample_type(rep);
551
	if (ret)
552
		return ret;
553

554
	ret = perf_session__process_events(session, &rep->tool);
555
	if (ret)
556
		return ret;
557

558
	report__warn_kptr_restrict(rep);
559

560 561 562
	if (use_browser == 0) {
		if (verbose > 3)
			perf_session__fprintf(session, stdout);
563

564 565
		if (verbose > 2)
			perf_session__fprintf_dsos(session, stdout);
566

567 568 569 570
		if (dump_trace) {
			perf_session__fprintf_nr_events(session, stdout);
			return 0;
		}
571 572
	}

573
	report__collapse_hists(rep);
574

575 576 577
	if (session_done())
		return 0;

578
	if (rep->nr_entries == 0) {
579
		ui__error("The %s file has no samples!\n", file->path);
580
		return 0;
581 582
	}

583
	evlist__for_each(session->evlist, pos)
584 585
		hists__output_resort(&pos->hists);

586
	return report__browse_hists(rep);
587 588
}

589
static int
590
report_parse_callchain_opt(const struct option *opt, const char *arg, int unset)
591
{
592
	struct report *rep = (struct report *)opt->value;
593

594 595 596 597
	/*
	 * --no-call-graph
	 */
	if (unset) {
598
		rep->dont_use_callchains = true;
599 600 601
		return 0;
	}

602
	return parse_callchain_report_opt(arg);
603 604
}

605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622
int
report_parse_ignore_callees_opt(const struct option *opt __maybe_unused,
				const char *arg, int unset __maybe_unused)
{
	if (arg) {
		int err = regcomp(&ignore_callees_regex, arg, REG_EXTENDED);
		if (err) {
			char buf[BUFSIZ];
			regerror(err, &ignore_callees_regex, buf, sizeof(buf));
			pr_err("Invalid --ignore-callees regex: %s\n%s", arg, buf);
			return -1;
		}
		have_ignore_callees = 1;
	}

	return 0;
}

623
static int
624 625
parse_branch_mode(const struct option *opt __maybe_unused,
		  const char *str __maybe_unused, int unset)
626
{
627 628 629
	int *branch_mode = opt->value;

	*branch_mode = !unset;
630 631 632
	return 0;
}

633 634 635 636
static int
parse_percent_limit(const struct option *opt, const char *str,
		    int unset __maybe_unused)
{
637
	struct report *rep = opt->value;
638 639 640 641 642

	rep->min_percent = strtof(str, NULL);
	return 0;
}

643
int cmd_report(int argc, const char **argv, const char *prefix __maybe_unused)
644
{
645
	struct perf_session *session;
646
	struct stat st;
647
	bool has_br_stack = false;
648
	int branch_mode = -1;
649
	int ret = -1;
650 651
	char callchain_default_opt[] = "fractal,0.5,callee";
	const char * const report_usage[] = {
N
Namhyung Kim 已提交
652
		"perf report [<options>]",
653 654
		NULL
	};
655
	struct report report = {
656
		.tool = {
657 658
			.sample		 = process_sample_event,
			.mmap		 = perf_event__process_mmap,
659
			.mmap2		 = perf_event__process_mmap2,
660
			.comm		 = perf_event__process_comm,
661 662
			.exit		 = perf_event__process_exit,
			.fork		 = perf_event__process_fork,
663 664 665 666 667 668 669 670
			.lost		 = perf_event__process_lost,
			.read		 = process_read_event,
			.attr		 = perf_event__process_attr,
			.tracing_data	 = perf_event__process_tracing_data,
			.build_id	 = perf_event__process_build_id,
			.ordered_samples = true,
			.ordering_requires_timestamps = true,
		},
671
		.max_stack		 = PERF_MAX_STACK_DEPTH,
672 673 674
		.pretty_printing_style	 = "normal",
	};
	const struct option options[] = {
675
	OPT_STRING('i', "input", &input_name, "file",
676
		    "input file name"),
677
	OPT_INCR('v', "verbose", &verbose,
678
		    "be more verbose (show symbol address, etc)"),
679 680
	OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
		    "dump raw trace in ASCII"),
681 682
	OPT_STRING('k', "vmlinux", &symbol_conf.vmlinux_name,
		   "file", "vmlinux pathname"),
683 684
	OPT_STRING(0, "kallsyms", &symbol_conf.kallsyms_name,
		   "file", "kallsyms pathname"),
685
	OPT_BOOLEAN('f', "force", &report.force, "don't complain, do it"),
686
	OPT_BOOLEAN('m', "modules", &symbol_conf.use_modules,
687
		    "load module symbols - WARNING: use only with -k and LIVE kernel"),
688
	OPT_BOOLEAN('n', "show-nr-samples", &symbol_conf.show_nr_samples,
689
		    "Show a column with the number of samples"),
690
	OPT_BOOLEAN('T', "threads", &report.show_threads,
691
		    "Show per-thread event counters"),
692
	OPT_STRING(0, "pretty", &report.pretty_printing_style, "key",
693
		   "pretty printing style key: normal raw"),
694
	OPT_BOOLEAN(0, "tui", &report.use_tui, "Use the TUI interface"),
695
	OPT_BOOLEAN(0, "gtk", &report.use_gtk, "Use the GTK2 interface"),
696 697
	OPT_BOOLEAN(0, "stdio", &report.use_stdio,
		    "Use the stdio interface"),
698 699 700
	OPT_BOOLEAN(0, "header", &report.header, "Show data header."),
	OPT_BOOLEAN(0, "header-only", &report.header_only,
		    "Show only data header."),
701
	OPT_STRING('s', "sort", &sort_order, "key[,key2...]",
702
		   "sort by key(s): pid, comm, dso, symbol, parent, cpu, srcline,"
703
		   " dso_to, dso_from, symbol_to, symbol_from, mispredict,"
704
		   " weight, local_weight, mem, symbol_daddr, dso_daddr, tlb, "
705
		   "snoop, locked, abort, in_tx, transaction"),
706 707
	OPT_BOOLEAN(0, "showcpuutilization", &symbol_conf.show_cpu_utilization,
		    "Show sample percentage for different cpu modes"),
708 709
	OPT_STRING('p', "parent", &parent_pattern, "regex",
		   "regex filter to identify parent, see: '--sort parent'"),
710
	OPT_BOOLEAN('x', "exclude-other", &symbol_conf.exclude_other,
711
		    "Only display entries with parent-match"),
712
	OPT_CALLBACK_DEFAULT('g', "call-graph", &report, "output_type,min_percent[,print_limit],call_order",
713
		     "Display callchains using output_type (graph, flat, fractal, or none) , min percent threshold, optional print limit, callchain order, key (function or address). "
714
		     "Default: fractal,0.5,callee,function", &report_parse_callchain_opt, callchain_default_opt),
715 716 717 718
	OPT_INTEGER(0, "max-stack", &report.max_stack,
		    "Set the maximum stack depth when parsing the callchain, "
		    "anything beyond the specified depth will be ignored. "
		    "Default: " __stringify(PERF_MAX_STACK_DEPTH)),
719 720
	OPT_BOOLEAN('G', "inverted", &report.inverted_callchain,
		    "alias for inverted call graph"),
721 722 723
	OPT_CALLBACK(0, "ignore-callees", NULL, "regex",
		   "ignore callees of these functions in call graphs",
		   report_parse_ignore_callees_opt),
724
	OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]",
725
		   "only consider symbols in these dsos"),
726
	OPT_STRING('c', "comms", &symbol_conf.comm_list_str, "comm[,comm...]",
727
		   "only consider symbols in these comms"),
728
	OPT_STRING('S', "symbols", &symbol_conf.sym_list_str, "symbol[,symbol...]",
729
		   "only consider these symbols"),
730 731
	OPT_STRING(0, "symbol-filter", &report.symbol_filter_str, "filter",
		   "only show symbols that (partially) match with this filter"),
732
	OPT_STRING('w', "column-widths", &symbol_conf.col_width_list_str,
733 734
		   "width[,width...]",
		   "don't try to adjust column width, use these fixed values"),
735
	OPT_STRING('t', "field-separator", &symbol_conf.field_sep, "separator",
736 737
		   "separator for columns, no spaces will be added between "
		   "columns '.' is reserved."),
738
	OPT_BOOLEAN('U', "hide-unresolved", &report.hide_unresolved,
739
		    "Only display entries resolved to a symbol"),
740 741
	OPT_STRING(0, "symfs", &symbol_conf.symfs, "directory",
		    "Look for files with symbols relative to this directory"),
742
	OPT_STRING('C', "cpu", &report.cpu_list, "cpu",
743 744
		   "list of cpus to profile"),
	OPT_BOOLEAN('I', "show-info", &report.show_full_info,
745
		    "Display extended information about perf.data file"),
746 747 748 749
	OPT_BOOLEAN(0, "source", &symbol_conf.annotate_src,
		    "Interleave source code with assembly code (default)"),
	OPT_BOOLEAN(0, "asm-raw", &symbol_conf.annotate_asm_raw,
		    "Display raw encoding of assembly instructions (default)"),
750 751
	OPT_STRING('M', "disassembler-style", &disassembler_style, "disassembler style",
		   "Specify disassembler style (e.g. -M intel for intel syntax)"),
752 753
	OPT_BOOLEAN(0, "show-total-period", &symbol_conf.show_total_period,
		    "Show a column with the sum of periods"),
N
Namhyung Kim 已提交
754 755
	OPT_BOOLEAN(0, "group", &symbol_conf.event_group,
		    "Show event group information together"),
756
	OPT_CALLBACK_NOOPT('b', "branch-stack", &branch_mode, "",
757
		    "use branch records for histogram filling", parse_branch_mode),
758 759
	OPT_STRING(0, "objdump", &objdump_path, "path",
		   "objdump binary to use for disassembly and annotations"),
760 761
	OPT_BOOLEAN(0, "demangle", &symbol_conf.demangle,
		    "Disable symbol demangling"),
762
	OPT_BOOLEAN(0, "mem-mode", &report.mem_mode, "mem access profile"),
763 764
	OPT_CALLBACK(0, "percent-limit", &report, "percent",
		     "Don't show entries under that percent", parse_percent_limit),
765
	OPT_CALLBACK(0, "percentage", NULL, "relative|absolute",
N
Namhyung Kim 已提交
766
		     "how to display percentage of filtered entries", parse_filter_percentage),
767
	OPT_END()
768
	};
769 770 771
	struct perf_data_file file = {
		.mode  = PERF_DATA_MODE_READ,
	};
772

773
	perf_config(report__config, &report);
774

775 776
	argc = parse_options(argc, argv, options, report_usage, 0);

777
	if (report.use_stdio)
778
		use_browser = 0;
779
	else if (report.use_tui)
780
		use_browser = 1;
781 782
	else if (report.use_gtk)
		use_browser = 2;
783

784
	if (report.inverted_callchain)
785 786
		callchain_param.order = ORDER_CALLER;

787
	if (!input_name || !strlen(input_name)) {
788
		if (!fstat(STDIN_FILENO, &st) && S_ISFIFO(st.st_mode))
789
			input_name = "-";
790
		else
791
			input_name = "perf.data";
792
	}
793

794 795 796
	file.path  = input_name;
	file.force = report.force;

797
repeat:
798
	session = perf_session__new(&file, false, &report.tool);
799 800 801 802 803 804 805
	if (session == NULL)
		return -ENOMEM;

	report.session = session;

	has_br_stack = perf_header__has_feat(&session->header,
					     HEADER_BRANCH_STACK);
806

807 808
	if (branch_mode == -1 && has_br_stack)
		sort__mode = SORT_MODE__BRANCH;
809

810 811
	/* sort__mode could be NORMAL if --no-branch-stack */
	if (sort__mode == SORT_MODE__BRANCH) {
812
		/*
813 814
		 * if no sort_order is provided, then specify
		 * branch-mode specific order
815 816 817 818 819
		 */
		if (sort_order == default_sort_order)
			sort_order = "comm,dso_from,symbol_from,"
				     "dso_to,symbol_to";

820
	}
821
	if (report.mem_mode) {
822
		if (sort__mode == SORT_MODE__BRANCH) {
823
			pr_err("branch and mem mode incompatible\n");
824 825
			goto error;
		}
826 827
		sort__mode = SORT_MODE__MEMORY;

828 829 830 831 832 833 834
		/*
		 * if no sort_order is provided, then specify
		 * branch-mode specific order
		 */
		if (sort_order == default_sort_order)
			sort_order = "local_weight,mem,sym,dso,symbol_daddr,dso_daddr,snoop,tlb,locked";
	}
835

836 837 838 839
	if (setup_sorting() < 0) {
		parse_options_usage(report_usage, options, "s", 1);
		goto error;
	}
840

841 842 843 844 845
	if (parent_pattern != default_parent_pattern) {
		if (sort_dimension__add("parent") < 0)
			goto error;
	}

846 847 848 849
	/* Force tty output for header output. */
	if (report.header || report.header_only)
		use_browser = 0;

850 851 852 853 854 855 856
	if (strcmp(input_name, "-") != 0)
		setup_browser(true);
	else {
		use_browser = 0;
		perf_hpp__init();
	}

857 858 859 860 861 862 863 864 865 866
	if (report.header || report.header_only) {
		perf_session__fprintf_info(session, stdout,
					   report.show_full_info);
		if (report.header_only)
			return 0;
	} else if (use_browser == 0) {
		fputs("# To display the perf.data header info, please use --header/--header-only options.\n#\n",
		      stdout);
	}

867
	/*
868
	 * Only in the TUI browser we are doing integrated annotation,
869 870 871
	 * so don't allocate extra space that won't be used in the stdio
	 * implementation.
	 */
872
	if (ui__has_annotation()) {
873
		symbol_conf.priv_size = sizeof(struct annotation);
874 875
		machines__set_symbol_filter(&session->machines,
					    symbol__annotate_init);
876 877 878 879 880 881 882 883 884 885 886 887 888 889 890 891
		/*
 		 * For searching by name on the "Browse map details".
 		 * providing it only in verbose mode not to bloat too
 		 * much struct symbol.
 		 */
		if (verbose) {
			/*
			 * XXX: Need to provide a less kludgy way to ask for
			 * more space per symbol, the u32 is for the index on
			 * the ui browser.
			 * See symbol__browser_index.
			 */
			symbol_conf.priv_size += sizeof(u32);
			symbol_conf.sort_by_name = true;
		}
	}
892

893
	if (symbol__init() < 0)
894
		goto error;
895

896 897 898 899 900 901 902 903 904 905
	if (argc) {
		/*
		 * Special case: if there's an argument left then assume that
		 * it's a symbol filter:
		 */
		if (argc > 1)
			usage_with_options(report_usage, options);

		report.symbol_filter_str = argv[0];
	}
906

907
	sort__setup_elide(stdout);
908

909
	ret = __cmd_report(&report);
910 911 912 913 914 915
	if (ret == K_SWITCH_INPUT_DATA) {
		perf_session__delete(session);
		goto repeat;
	} else
		ret = 0;

916 917 918
error:
	perf_session__delete(session);
	return ret;
919
}