builtin-report.c 26.8 KB
Newer Older
1 2 3 4 5 6 7
/*
 * builtin-report.c
 *
 * Builtin report command: Analyze the perf.data input file,
 * look up and read DSOs and symbol information and display
 * a histogram of results, along various sorting keys.
 */
8
#include "builtin.h"
9

10
#include "util/util.h"
11
#include "util/cache.h"
12

13
#include "util/annotate.h"
14
#include "util/color.h"
15
#include <linux/list.h>
16
#include <linux/rbtree.h>
17
#include "util/symbol.h"
18
#include "util/callchain.h"
19
#include "util/strlist.h"
20
#include "util/values.h"
21

22
#include "perf.h"
23
#include "util/debug.h"
24 25
#include "util/evlist.h"
#include "util/evsel.h"
26
#include "util/header.h"
27
#include "util/session.h"
28
#include "util/tool.h"
29 30 31 32

#include "util/parse-options.h"
#include "util/parse-events.h"

33
#include "util/thread.h"
34
#include "util/sort.h"
35
#include "util/hist.h"
36
#include "arch/common.h"
37

38 39
#include <linux/bitmap.h>

40
struct perf_report {
41
	struct perf_tool	tool;
42
	struct perf_session	*session;
43
	bool			force, use_tui, use_gtk, use_stdio;
44 45 46 47 48
	bool			hide_unresolved;
	bool			dont_use_callchains;
	bool			show_full_info;
	bool			show_threads;
	bool			inverted_callchain;
49
	bool			mem_mode;
50 51 52
	struct perf_read_values	show_threads_values;
	const char		*pretty_printing_style;
	const char		*cpu_list;
53
	const char		*symbol_filter_str;
54
	float			min_percent;
55
	DECLARE_BITMAP(cpu_bitmap, MAX_NR_CPUS);
56
};
57

58 59 60 61 62 63
static int perf_report_config(const char *var, const char *value, void *cb)
{
	if (!strcmp(var, "report.group")) {
		symbol_conf.event_group = perf_config_bool(var, value);
		return 0;
	}
64 65 66 67 68
	if (!strcmp(var, "report.percent-limit")) {
		struct perf_report *rep = cb;
		rep->min_percent = strtof(value, NULL);
		return 0;
	}
69 70 71 72

	return perf_default_config(var, value, cb);
}

73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90
static int perf_report__add_mem_hist_entry(struct perf_tool *tool,
					   struct addr_location *al,
					   struct perf_sample *sample,
					   struct perf_evsel *evsel,
					   struct machine *machine,
					   union perf_event *event)
{
	struct perf_report *rep = container_of(tool, struct perf_report, tool);
	struct symbol *parent = NULL;
	u8 cpumode = event->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;
	int err = 0;
	struct hist_entry *he;
	struct mem_info *mi, *mx;
	uint64_t cost;

	if ((sort__has_parent || symbol_conf.use_callchain) &&
	    sample->callchain) {
		err = machine__resolve_callchain(machine, evsel, al->thread,
91
						 sample, &parent, al);
92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118
		if (err)
			return err;
	}

	mi = machine__resolve_mem(machine, al->thread, sample, cpumode);
	if (!mi)
		return -ENOMEM;

	if (rep->hide_unresolved && !al->sym)
		return 0;

	cost = sample->weight;
	if (!cost)
		cost = 1;

	/*
	 * must pass period=weight in order to get the correct
	 * sorting from hists__collapse_resort() which is solely
	 * based on periods. We want sorting be done on nr_events * weight
	 * and this is indirectly achieved by passing period=weight here
	 * and the he_stat__add_period() function.
	 */
	he = __hists__add_mem_entry(&evsel->hists, al, parent, mi, cost, cost);
	if (!he)
		return -ENOMEM;

	/*
119
	 * In the TUI browser, we are doing integrated annotation,
120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165
	 * so we don't allocate the extra space needed because the stdio
	 * code will not use it.
	 */
	if (sort__has_sym && he->ms.sym && use_browser > 0) {
		struct annotation *notes = symbol__annotation(he->ms.sym);

		assert(evsel != NULL);

		if (notes->src == NULL && symbol__alloc_hist(he->ms.sym) < 0)
			goto out;

		err = hist_entry__inc_addr_samples(he, evsel->idx, al->addr);
		if (err)
			goto out;
	}

	if (sort__has_sym && he->mem_info->daddr.sym && use_browser > 0) {
		struct annotation *notes;

		mx = he->mem_info;

		notes = symbol__annotation(mx->daddr.sym);
		if (notes->src == NULL && symbol__alloc_hist(mx->daddr.sym) < 0)
			goto out;

		err = symbol__inc_addr_samples(mx->daddr.sym,
					       mx->daddr.map,
					       evsel->idx,
					       mx->daddr.al_addr);
		if (err)
			goto out;
	}

	evsel->hists.stats.total_period += cost;
	hists__inc_nr_events(&evsel->hists, PERF_RECORD_SAMPLE);
	err = 0;

	if (symbol_conf.use_callchain) {
		err = callchain_append(he->callchain,
				       &callchain_cursor,
				       sample->period);
	}
out:
	return err;
}

166 167 168 169 170 171 172 173 174 175 176
static int perf_report__add_branch_hist_entry(struct perf_tool *tool,
					struct addr_location *al,
					struct perf_sample *sample,
					struct perf_evsel *evsel,
				      struct machine *machine)
{
	struct perf_report *rep = container_of(tool, struct perf_report, tool);
	struct symbol *parent = NULL;
	int err = 0;
	unsigned i;
	struct hist_entry *he;
177
	struct branch_info *bi, *bx;
178 179 180

	if ((sort__has_parent || symbol_conf.use_callchain)
	    && sample->callchain) {
181
		err = machine__resolve_callchain(machine, evsel, al->thread,
182
						 sample, &parent, al);
183 184 185 186 187 188 189 190 191 192 193 194
		if (err)
			return err;
	}

	bi = machine__resolve_bstack(machine, al->thread,
				     sample->branch_stack);
	if (!bi)
		return -ENOMEM;

	for (i = 0; i < sample->branch_stack->nr; i++) {
		if (rep->hide_unresolved && !(bi[i].from.sym && bi[i].to.sym))
			continue;
195 196 197

		err = -ENOMEM;

198 199 200 201 202
		/*
		 * The report shows the percentage of total branches captured
		 * and not events sampled. Thus we use a pseudo period of 1.
		 */
		he = __hists__add_branch_entry(&evsel->hists, al, parent,
203
				&bi[i], 1, 1);
204
		if (he) {
205 206
			struct annotation *notes;
			bx = he->branch_info;
207
			if (bx->from.sym && use_browser == 1 && sort__has_sym) {
208 209 210 211 212 213 214 215 216 217 218 219 220
				notes = symbol__annotation(bx->from.sym);
				if (!notes->src
				    && symbol__alloc_hist(bx->from.sym) < 0)
					goto out;

				err = symbol__inc_addr_samples(bx->from.sym,
							       bx->from.map,
							       evsel->idx,
							       bx->from.al_addr);
				if (err)
					goto out;
			}

221
			if (bx->to.sym && use_browser == 1 && sort__has_sym) {
222 223 224 225 226 227 228 229 230 231 232 233
				notes = symbol__annotation(bx->to.sym);
				if (!notes->src
				    && symbol__alloc_hist(bx->to.sym) < 0)
					goto out;

				err = symbol__inc_addr_samples(bx->to.sym,
							       bx->to.map,
							       evsel->idx,
							       bx->to.al_addr);
				if (err)
					goto out;
			}
234 235 236
			evsel->hists.stats.total_period += 1;
			hists__inc_nr_events(&evsel->hists, PERF_RECORD_SAMPLE);
		} else
237
			goto out;
238
	}
239
	err = 0;
240
out:
241
	free(bi);
242 243 244
	return err;
}

245 246 247 248
static int perf_evsel__add_hist_entry(struct perf_evsel *evsel,
				      struct addr_location *al,
				      struct perf_sample *sample,
				      struct machine *machine)
249
{
250
	struct symbol *parent = NULL;
251
	int err = 0;
252 253
	struct hist_entry *he;

254
	if ((sort__has_parent || symbol_conf.use_callchain) && sample->callchain) {
255
		err = machine__resolve_callchain(machine, evsel, al->thread,
256
						 sample, &parent, al);
257 258
		if (err)
			return err;
259
	}
260

261 262
	he = __hists__add_entry(&evsel->hists, al, parent, sample->period,
					sample->weight);
263
	if (he == NULL)
264 265
		return -ENOMEM;

266
	if (symbol_conf.use_callchain) {
267
		err = callchain_append(he->callchain,
268
				       &callchain_cursor,
269
				       sample->period);
270
		if (err)
271
			return err;
272 273
	}
	/*
274
	 * Only in the TUI browser we are doing integrated annotation,
275 276 277
	 * so we don't allocated the extra space needed because the stdio
	 * code will not use it.
	 */
278
	if (he->ms.sym != NULL && use_browser == 1 && sort__has_sym) {
279
		struct annotation *notes = symbol__annotation(he->ms.sym);
280 281 282 283

		assert(evsel != NULL);

		err = -ENOMEM;
284
		if (notes->src == NULL && symbol__alloc_hist(he->ms.sym) < 0)
285 286 287
			goto out;

		err = hist_entry__inc_addr_samples(he, evsel->idx, al->addr);
288
	}
289

290 291 292
	evsel->hists.stats.total_period += sample->period;
	hists__inc_nr_events(&evsel->hists, PERF_RECORD_SAMPLE);
out:
293
	return err;
294 295
}

296

297
static int process_sample_event(struct perf_tool *tool,
298
				union perf_event *event,
299
				struct perf_sample *sample,
300
				struct perf_evsel *evsel,
301
				struct machine *machine)
302
{
303
	struct perf_report *rep = container_of(tool, struct perf_report, tool);
304
	struct addr_location al;
305
	int ret;
306

307
	if (perf_event__preprocess_sample(event, machine, &al, sample) < 0) {
308
		fprintf(stderr, "problem processing %d event, skipping it.\n",
309 310 311
			event->header.type);
		return -1;
	}
312

313
	if (al.filtered || (rep->hide_unresolved && al.sym == NULL))
314
		return 0;
315

316
	if (rep->cpu_list && !test_bit(sample->cpu, rep->cpu_bitmap))
317 318
		return 0;

319
	if (sort__mode == SORT_MODE__BRANCH) {
320 321 322
		ret = perf_report__add_branch_hist_entry(tool, &al, sample,
							 evsel, machine);
		if (ret < 0)
323
			pr_debug("problem adding lbr entry, skipping event\n");
324
	} else if (rep->mem_mode == 1) {
325 326 327
		ret = perf_report__add_mem_hist_entry(tool, &al, sample,
						      evsel, machine, event);
		if (ret < 0)
328
			pr_debug("problem adding mem entry, skipping event\n");
329 330 331
	} else {
		if (al.map != NULL)
			al.map->dso->hit = 1;
332

333 334
		ret = perf_evsel__add_hist_entry(evsel, &al, sample, machine);
		if (ret < 0)
335
			pr_debug("problem incrementing symbol period, skipping event\n");
336
	}
337
	return ret;
338
}
I
Ingo Molnar 已提交
339

340
static int process_read_event(struct perf_tool *tool,
341
			      union perf_event *event,
342
			      struct perf_sample *sample __maybe_unused,
343
			      struct perf_evsel *evsel,
344
			      struct machine *machine __maybe_unused)
345
{
346
	struct perf_report *rep = container_of(tool, struct perf_report, tool);
347

348
	if (rep->show_threads) {
349
		const char *name = evsel ? perf_evsel__name(evsel) : "unknown";
350
		perf_read_values_add_value(&rep->show_threads_values,
351 352 353 354 355 356
					   event->read.pid, event->read.tid,
					   event->read.id,
					   name,
					   event->read.value);
	}

357
	dump_printf(": %d %d %s %" PRIu64 "\n", event->read.pid, event->read.tid,
358
		    evsel ? perf_evsel__name(evsel) : "FAIL",
359
		    event->read.value);
360 361 362 363

	return 0;
}

364
/* For pipe mode, sample_type is not currently set */
365
static int perf_report__setup_sample_type(struct perf_report *rep)
366
{
367
	struct perf_session *self = rep->session;
368
	u64 sample_type = perf_evlist__combined_sample_type(self->evlist);
369

370
	if (!self->fd_pipe && !(sample_type & PERF_SAMPLE_CALLCHAIN)) {
371
		if (sort__has_parent) {
372
			ui__error("Selected --sort parent, but no "
373 374
				    "callchain data. Did you call "
				    "'perf record' without -g?\n");
375
			return -EINVAL;
376
		}
377
		if (symbol_conf.use_callchain) {
378
			ui__error("Selected -g but no callchain data. Did "
379
				    "you call 'perf record' without -g?\n");
380
			return -1;
381
		}
382 383
	} else if (!rep->dont_use_callchains &&
		   callchain_param.mode != CHAIN_NONE &&
384
		   !symbol_conf.use_callchain) {
385
			symbol_conf.use_callchain = true;
386
			if (callchain_register_param(&callchain_param) < 0) {
387
				ui__error("Can't register callchain params.\n");
388
				return -EINVAL;
389
			}
390 391
	}

392
	if (sort__mode == SORT_MODE__BRANCH) {
393
		if (!self->fd_pipe &&
394
		    !(sample_type & PERF_SAMPLE_BRANCH_STACK)) {
395 396
			ui__error("Selected -b but no branch data. "
				  "Did you call perf record without -b?\n");
397 398 399 400
			return -1;
		}
	}

401 402
	return 0;
}
403

404
static void sig_handler(int sig __maybe_unused)
405 406 407 408
{
	session_done = 1;
}

409 410
static size_t hists__fprintf_nr_sample_events(struct perf_report *rep,
					      struct hists *self,
411 412 413 414
					      const char *evname, FILE *fp)
{
	size_t ret;
	char unit;
415 416
	unsigned long nr_samples = self->stats.nr_events[PERF_RECORD_SAMPLE];
	u64 nr_events = self->stats.total_period;
417 418 419 420
	struct perf_evsel *evsel = hists_to_evsel(self);
	char buf[512];
	size_t size = sizeof(buf);

421
	if (perf_evsel__is_group_event(evsel)) {
422 423 424 425 426 427 428 429 430 431
		struct perf_evsel *pos;

		perf_evsel__group_desc(evsel, buf, size);
		evname = buf;

		for_each_group_member(pos, evsel) {
			nr_samples += pos->hists.stats.nr_events[PERF_RECORD_SAMPLE];
			nr_events += pos->hists.stats.total_period;
		}
	}
432

433 434
	nr_samples = convert_unit(nr_samples, &unit);
	ret = fprintf(fp, "# Samples: %lu%c", nr_samples, unit);
435
	if (evname != NULL)
436 437
		ret += fprintf(fp, " of event '%s'", evname);

438 439 440 441 442
	if (rep->mem_mode) {
		ret += fprintf(fp, "\n# Total weight : %" PRIu64, nr_events);
		ret += fprintf(fp, "\n# Sort order   : %s", sort_order);
	} else
		ret += fprintf(fp, "\n# Event count (approx.): %" PRIu64, nr_events);
443 444 445
	return ret + fprintf(fp, "\n#\n");
}

446
static int perf_evlist__tty_browse_hists(struct perf_evlist *evlist,
447
					 struct perf_report *rep,
448
					 const char *help)
449
{
450
	struct perf_evsel *pos;
451

452 453
	list_for_each_entry(pos, &evlist->entries, node) {
		struct hists *hists = &pos->hists;
454
		const char *evname = perf_evsel__name(pos);
455

456 457 458 459
		if (symbol_conf.event_group &&
		    !perf_evsel__is_group_leader(pos))
			continue;

460
		hists__fprintf_nr_sample_events(rep, hists, evname, stdout);
461
		hists__fprintf(hists, true, 0, 0, rep->min_percent, stdout);
462 463 464 465 466 467 468
		fprintf(stdout, "\n\n");
	}

	if (sort_order == default_sort_order &&
	    parent_pattern == default_parent_pattern) {
		fprintf(stdout, "#\n# (%s)\n#\n", help);

469 470 471
		if (rep->show_threads) {
			bool style = !strcmp(rep->pretty_printing_style, "raw");
			perf_read_values_display(stdout, &rep->show_threads_values,
472
						 style);
473
			perf_read_values_destroy(&rep->show_threads_values);
474 475 476 477 478 479
		}
	}

	return 0;
}

480
static int __cmd_report(struct perf_report *rep)
481
{
482
	int ret = -EINVAL;
483
	u64 nr_samples;
484
	struct perf_session *session = rep->session;
485
	struct perf_evsel *pos;
486 487
	struct map *kernel_map;
	struct kmap *kernel_kmap;
488
	const char *help = "For a higher level overview, try: perf report --sort comm,dso";
489

490 491
	signal(SIGINT, sig_handler);

492 493 494
	if (rep->cpu_list) {
		ret = perf_session__cpu_bitmap(session, rep->cpu_list,
					       rep->cpu_bitmap);
495
		if (ret)
496
			return ret;
497 498
	}

499
	if (use_browser <= 0)
500
		perf_session__fprintf_info(session, stdout, rep->show_full_info);
501

502 503
	if (rep->show_threads)
		perf_read_values_init(&rep->show_threads_values);
504

505
	ret = perf_report__setup_sample_type(rep);
506
	if (ret)
507
		return ret;
508

509
	ret = perf_session__process_events(session, &rep->tool);
510
	if (ret)
511
		return ret;
512

513
	kernel_map = session->machines.host.vmlinux_maps[MAP__FUNCTION];
514 515 516 517 518
	kernel_kmap = map__kmap(kernel_map);
	if (kernel_map == NULL ||
	    (kernel_map->dso->hit &&
	     (kernel_kmap->ref_reloc_sym == NULL ||
	      kernel_kmap->ref_reloc_sym->addr == 0))) {
519 520 521 522 523 524 525 526 527 528 529
		const char *desc =
		    "As no suitable kallsyms nor vmlinux was found, kernel samples\n"
		    "can't be resolved.";

		if (kernel_map) {
			const struct dso *kdso = kernel_map->dso;
			if (!RB_EMPTY_ROOT(&kdso->symbols[MAP__FUNCTION])) {
				desc = "If some relocation was applied (e.g. "
				       "kexec) symbols may be misresolved.";
			}
		}
530

531 532 533 534
		ui__warning(
"Kernel address maps (/proc/{kallsyms,modules}) were restricted.\n\n"
"Check /proc/sys/kernel/kptr_restrict before running 'perf record'.\n\n%s\n\n"
"Samples in kernel modules can't be resolved as well.\n\n",
535
		desc);
536 537
	}

538
	if (verbose > 3)
539
		perf_session__fprintf(session, stdout);
540

541
	if (verbose > 2)
542
		perf_session__fprintf_dsos(session, stdout);
543

544 545
	if (dump_trace) {
		perf_session__fprintf_nr_events(session, stdout);
546
		return 0;
547 548
	}

549 550 551
	nr_samples = 0;
	list_for_each_entry(pos, &session->evlist->entries, node) {
		struct hists *hists = &pos->hists;
552

553 554 555
		if (pos->idx == 0)
			hists->symbol_filter_str = rep->symbol_filter_str;

556
		hists__collapse_resort(hists);
557
		nr_samples += hists->stats.nr_events[PERF_RECORD_SAMPLE];
558 559 560 561 562 563 564 565 566

		/* Non-group events are considered as leader */
		if (symbol_conf.event_group &&
		    !perf_evsel__is_group_leader(pos)) {
			struct hists *leader_hists = &pos->leader->hists;

			hists__match(leader_hists, hists);
			hists__link(leader_hists, hists);
		}
567 568
	}

569 570 571
	if (session_done())
		return 0;

572
	if (nr_samples == 0) {
573
		ui__error("The %s file has no samples!\n", session->filename);
574
		return 0;
575 576
	}

577 578 579
	list_for_each_entry(pos, &session->evlist->entries, node)
		hists__output_resort(&pos->hists);

580
	if (use_browser > 0) {
581
		if (use_browser == 1) {
582
			ret = perf_evlist__tui_browse_hists(session->evlist,
583 584
							help, NULL,
							rep->min_percent,
585 586 587 588 589 590 591 592
							&session->header.env);
			/*
			 * Usually "ret" is the last pressed key, and we only
			 * care if the key notifies us to switch data file.
			 */
			if (ret != K_SWITCH_INPUT_DATA)
				ret = 0;

593 594
		} else if (use_browser == 2) {
			perf_evlist__gtk_browse_hists(session->evlist, help,
595
						      NULL, rep->min_percent);
596
		}
597
	} else
598
		perf_evlist__tty_browse_hists(session->evlist, rep, help);
599

600
	return ret;
601 602
}

603
static int
604
parse_callchain_opt(const struct option *opt, const char *arg, int unset)
605
{
606
	struct perf_report *rep = (struct perf_report *)opt->value;
607
	char *tok, *tok2;
608 609
	char *endptr;

610 611 612 613
	/*
	 * --no-call-graph
	 */
	if (unset) {
614
		rep->dont_use_callchains = true;
615 616 617
		return 0;
	}

618
	symbol_conf.use_callchain = true;
619 620 621 622

	if (!arg)
		return 0;

623 624 625 626 627 628
	tok = strtok((char *)arg, ",");
	if (!tok)
		return -1;

	/* get the output mode */
	if (!strncmp(tok, "graph", strlen(arg)))
629
		callchain_param.mode = CHAIN_GRAPH_ABS;
630

631
	else if (!strncmp(tok, "flat", strlen(arg)))
632 633 634 635 636
		callchain_param.mode = CHAIN_FLAT;

	else if (!strncmp(tok, "fractal", strlen(arg)))
		callchain_param.mode = CHAIN_GRAPH_REL;

637 638
	else if (!strncmp(tok, "none", strlen(arg))) {
		callchain_param.mode = CHAIN_NONE;
639
		symbol_conf.use_callchain = false;
640 641 642 643

		return 0;
	}

644 645 646
	else
		return -1;

647 648 649
	/* get the min percentage */
	tok = strtok(NULL, ",");
	if (!tok)
650
		goto setup;
651

652
	callchain_param.min_percent = strtod(tok, &endptr);
653 654 655
	if (tok == endptr)
		return -1;

656 657 658 659 660 661
	/* get the print limit */
	tok2 = strtok(NULL, ",");
	if (!tok2)
		goto setup;

	if (tok2[0] != 'c') {
662
		callchain_param.print_limit = strtoul(tok2, &endptr, 0);
663 664 665 666 667 668
		tok2 = strtok(NULL, ",");
		if (!tok2)
			goto setup;
	}

	/* get the call chain order */
669
	if (!strncmp(tok2, "caller", strlen("caller")))
670
		callchain_param.order = ORDER_CALLER;
671
	else if (!strncmp(tok2, "callee", strlen("callee")))
672 673 674
		callchain_param.order = ORDER_CALLEE;
	else
		return -1;
675 676 677 678 679 680 681 682 683 684 685

	/* Get the sort key */
	tok2 = strtok(NULL, ",");
	if (!tok2)
		goto setup;
	if (!strncmp(tok2, "function", strlen("function")))
		callchain_param.key = CCKEY_FUNCTION;
	else if (!strncmp(tok2, "address", strlen("address")))
		callchain_param.key = CCKEY_ADDRESS;
	else
		return -1;
686
setup:
687
	if (callchain_register_param(&callchain_param) < 0) {
688 689 690
		fprintf(stderr, "Can't register callchain params\n");
		return -1;
	}
691 692 693
	return 0;
}

694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711
int
report_parse_ignore_callees_opt(const struct option *opt __maybe_unused,
				const char *arg, int unset __maybe_unused)
{
	if (arg) {
		int err = regcomp(&ignore_callees_regex, arg, REG_EXTENDED);
		if (err) {
			char buf[BUFSIZ];
			regerror(err, &ignore_callees_regex, buf, sizeof(buf));
			pr_err("Invalid --ignore-callees regex: %s\n%s", arg, buf);
			return -1;
		}
		have_ignore_callees = 1;
	}

	return 0;
}

712
static int
713 714
parse_branch_mode(const struct option *opt __maybe_unused,
		  const char *str __maybe_unused, int unset)
715
{
716 717 718
	int *branch_mode = opt->value;

	*branch_mode = !unset;
719 720 721
	return 0;
}

722 723 724 725 726 727 728 729 730 731
static int
parse_percent_limit(const struct option *opt, const char *str,
		    int unset __maybe_unused)
{
	struct perf_report *rep = opt->value;

	rep->min_percent = strtof(str, NULL);
	return 0;
}

732
int cmd_report(int argc, const char **argv, const char *prefix __maybe_unused)
733
{
734
	struct perf_session *session;
735
	struct stat st;
736
	bool has_br_stack = false;
737
	int branch_mode = -1;
738
	int ret = -1;
739 740
	char callchain_default_opt[] = "fractal,0.5,callee";
	const char * const report_usage[] = {
N
Namhyung Kim 已提交
741
		"perf report [<options>]",
742 743 744
		NULL
	};
	struct perf_report report = {
745
		.tool = {
746 747
			.sample		 = process_sample_event,
			.mmap		 = perf_event__process_mmap,
748
			.mmap2		 = perf_event__process_mmap2,
749
			.comm		 = perf_event__process_comm,
750 751
			.exit		 = perf_event__process_exit,
			.fork		 = perf_event__process_fork,
752 753 754 755 756 757 758 759 760 761 762
			.lost		 = perf_event__process_lost,
			.read		 = process_read_event,
			.attr		 = perf_event__process_attr,
			.tracing_data	 = perf_event__process_tracing_data,
			.build_id	 = perf_event__process_build_id,
			.ordered_samples = true,
			.ordering_requires_timestamps = true,
		},
		.pretty_printing_style	 = "normal",
	};
	const struct option options[] = {
763
	OPT_STRING('i', "input", &input_name, "file",
764
		    "input file name"),
765
	OPT_INCR('v', "verbose", &verbose,
766
		    "be more verbose (show symbol address, etc)"),
767 768
	OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
		    "dump raw trace in ASCII"),
769 770
	OPT_STRING('k', "vmlinux", &symbol_conf.vmlinux_name,
		   "file", "vmlinux pathname"),
771 772
	OPT_STRING(0, "kallsyms", &symbol_conf.kallsyms_name,
		   "file", "kallsyms pathname"),
773
	OPT_BOOLEAN('f', "force", &report.force, "don't complain, do it"),
774
	OPT_BOOLEAN('m', "modules", &symbol_conf.use_modules,
775
		    "load module symbols - WARNING: use only with -k and LIVE kernel"),
776
	OPT_BOOLEAN('n', "show-nr-samples", &symbol_conf.show_nr_samples,
777
		    "Show a column with the number of samples"),
778
	OPT_BOOLEAN('T', "threads", &report.show_threads,
779
		    "Show per-thread event counters"),
780
	OPT_STRING(0, "pretty", &report.pretty_printing_style, "key",
781
		   "pretty printing style key: normal raw"),
782
	OPT_BOOLEAN(0, "tui", &report.use_tui, "Use the TUI interface"),
783
	OPT_BOOLEAN(0, "gtk", &report.use_gtk, "Use the GTK2 interface"),
784 785
	OPT_BOOLEAN(0, "stdio", &report.use_stdio,
		    "Use the stdio interface"),
786
	OPT_STRING('s', "sort", &sort_order, "key[,key2...]",
787
		   "sort by key(s): pid, comm, dso, symbol, parent, cpu, srcline,"
788
		   " dso_to, dso_from, symbol_to, symbol_from, mispredict,"
789
		   " weight, local_weight, mem, symbol_daddr, dso_daddr, tlb, "
790
		   "snoop, locked, abort, in_tx"),
791 792
	OPT_BOOLEAN(0, "showcpuutilization", &symbol_conf.show_cpu_utilization,
		    "Show sample percentage for different cpu modes"),
793 794
	OPT_STRING('p', "parent", &parent_pattern, "regex",
		   "regex filter to identify parent, see: '--sort parent'"),
795
	OPT_BOOLEAN('x', "exclude-other", &symbol_conf.exclude_other,
796
		    "Only display entries with parent-match"),
797
	OPT_CALLBACK_DEFAULT('g', "call-graph", &report, "output_type,min_percent[,print_limit],call_order",
798 799
		     "Display callchains using output_type (graph, flat, fractal, or none) , min percent threshold, optional print limit, callchain order, key (function or address). "
		     "Default: fractal,0.5,callee,function", &parse_callchain_opt, callchain_default_opt),
800 801
	OPT_BOOLEAN('G', "inverted", &report.inverted_callchain,
		    "alias for inverted call graph"),
802 803 804
	OPT_CALLBACK(0, "ignore-callees", NULL, "regex",
		   "ignore callees of these functions in call graphs",
		   report_parse_ignore_callees_opt),
805
	OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]",
806
		   "only consider symbols in these dsos"),
807
	OPT_STRING('c', "comms", &symbol_conf.comm_list_str, "comm[,comm...]",
808
		   "only consider symbols in these comms"),
809
	OPT_STRING('S', "symbols", &symbol_conf.sym_list_str, "symbol[,symbol...]",
810
		   "only consider these symbols"),
811 812
	OPT_STRING(0, "symbol-filter", &report.symbol_filter_str, "filter",
		   "only show symbols that (partially) match with this filter"),
813
	OPT_STRING('w', "column-widths", &symbol_conf.col_width_list_str,
814 815
		   "width[,width...]",
		   "don't try to adjust column width, use these fixed values"),
816
	OPT_STRING('t', "field-separator", &symbol_conf.field_sep, "separator",
817 818
		   "separator for columns, no spaces will be added between "
		   "columns '.' is reserved."),
819
	OPT_BOOLEAN('U', "hide-unresolved", &report.hide_unresolved,
820
		    "Only display entries resolved to a symbol"),
821 822
	OPT_STRING(0, "symfs", &symbol_conf.symfs, "directory",
		    "Look for files with symbols relative to this directory"),
823
	OPT_STRING('C', "cpu", &report.cpu_list, "cpu",
824 825
		   "list of cpus to profile"),
	OPT_BOOLEAN('I', "show-info", &report.show_full_info,
826
		    "Display extended information about perf.data file"),
827 828 829 830
	OPT_BOOLEAN(0, "source", &symbol_conf.annotate_src,
		    "Interleave source code with assembly code (default)"),
	OPT_BOOLEAN(0, "asm-raw", &symbol_conf.annotate_asm_raw,
		    "Display raw encoding of assembly instructions (default)"),
831 832
	OPT_STRING('M', "disassembler-style", &disassembler_style, "disassembler style",
		   "Specify disassembler style (e.g. -M intel for intel syntax)"),
833 834
	OPT_BOOLEAN(0, "show-total-period", &symbol_conf.show_total_period,
		    "Show a column with the sum of periods"),
N
Namhyung Kim 已提交
835 836
	OPT_BOOLEAN(0, "group", &symbol_conf.event_group,
		    "Show event group information together"),
837
	OPT_CALLBACK_NOOPT('b', "branch-stack", &branch_mode, "",
838
		    "use branch records for histogram filling", parse_branch_mode),
839 840
	OPT_STRING(0, "objdump", &objdump_path, "path",
		   "objdump binary to use for disassembly and annotations"),
841 842
	OPT_BOOLEAN(0, "demangle", &symbol_conf.demangle,
		    "Disable symbol demangling"),
843
	OPT_BOOLEAN(0, "mem-mode", &report.mem_mode, "mem access profile"),
844 845
	OPT_CALLBACK(0, "percent-limit", &report, "percent",
		     "Don't show entries under that percent", parse_percent_limit),
846
	OPT_END()
847
	};
848

849
	perf_config(perf_report_config, &report);
850

851 852
	argc = parse_options(argc, argv, options, report_usage, 0);

853
	if (report.use_stdio)
854
		use_browser = 0;
855
	else if (report.use_tui)
856
		use_browser = 1;
857 858
	else if (report.use_gtk)
		use_browser = 2;
859

860
	if (report.inverted_callchain)
861 862
		callchain_param.order = ORDER_CALLER;

863
	if (!input_name || !strlen(input_name)) {
864
		if (!fstat(STDIN_FILENO, &st) && S_ISFIFO(st.st_mode))
865
			input_name = "-";
866
		else
867
			input_name = "perf.data";
868
	}
869 870 871 872 873 874 875 876 877

	if (strcmp(input_name, "-") != 0)
		setup_browser(true);
	else {
		use_browser = 0;
		perf_hpp__init();
	}

repeat:
878
	session = perf_session__new(input_name, O_RDONLY,
879 880 881 882 883 884 885 886
				    report.force, false, &report.tool);
	if (session == NULL)
		return -ENOMEM;

	report.session = session;

	has_br_stack = perf_header__has_feat(&session->header,
					     HEADER_BRANCH_STACK);
887

888 889
	if (branch_mode == -1 && has_br_stack)
		sort__mode = SORT_MODE__BRANCH;
890

891 892
	/* sort__mode could be NORMAL if --no-branch-stack */
	if (sort__mode == SORT_MODE__BRANCH) {
893
		/*
894 895
		 * if no sort_order is provided, then specify
		 * branch-mode specific order
896 897 898 899 900
		 */
		if (sort_order == default_sort_order)
			sort_order = "comm,dso_from,symbol_from,"
				     "dso_to,symbol_to";

901
	}
902
	if (report.mem_mode) {
903
		if (sort__mode == SORT_MODE__BRANCH) {
904 905 906
			fprintf(stderr, "branch and mem mode incompatible\n");
			goto error;
		}
907 908
		sort__mode = SORT_MODE__MEMORY;

909 910 911 912 913 914 915
		/*
		 * if no sort_order is provided, then specify
		 * branch-mode specific order
		 */
		if (sort_order == default_sort_order)
			sort_order = "local_weight,mem,sym,dso,symbol_daddr,dso_daddr,snoop,tlb,locked";
	}
916

917 918
	if (setup_sorting() < 0)
		usage_with_options(report_usage, options);
919

920
	/*
921
	 * Only in the TUI browser we are doing integrated annotation,
922 923 924
	 * so don't allocate extra space that won't be used in the stdio
	 * implementation.
	 */
925
	if (use_browser == 1 && sort__has_sym) {
926
		symbol_conf.priv_size = sizeof(struct annotation);
927 928
		machines__set_symbol_filter(&session->machines,
					    symbol__annotate_init);
929 930 931 932 933 934 935 936 937 938 939 940 941 942 943 944
		/*
 		 * For searching by name on the "Browse map details".
 		 * providing it only in verbose mode not to bloat too
 		 * much struct symbol.
 		 */
		if (verbose) {
			/*
			 * XXX: Need to provide a less kludgy way to ask for
			 * more space per symbol, the u32 is for the index on
			 * the ui browser.
			 * See symbol__browser_index.
			 */
			symbol_conf.priv_size += sizeof(u32);
			symbol_conf.sort_by_name = true;
		}
	}
945

946
	if (symbol__init() < 0)
947
		goto error;
948

949
	if (parent_pattern != default_parent_pattern) {
950
		if (sort_dimension__add("parent") < 0)
951
			goto error;
952
	}
953

954 955 956 957 958 959 960 961 962 963
	if (argc) {
		/*
		 * Special case: if there's an argument left then assume that
		 * it's a symbol filter:
		 */
		if (argc > 1)
			usage_with_options(report_usage, options);

		report.symbol_filter_str = argv[0];
	}
964

965
	sort__setup_elide(stdout);
966

967
	ret = __cmd_report(&report);
968 969 970 971 972 973
	if (ret == K_SWITCH_INPUT_DATA) {
		perf_session__delete(session);
		goto repeat;
	} else
		ret = 0;

974 975 976
error:
	perf_session__delete(session);
	return ret;
977
}