builtin-report.c 27.2 KB
Newer Older
1 2 3 4 5 6 7
/*
 * builtin-report.c
 *
 * Builtin report command: Analyze the perf.data input file,
 * look up and read DSOs and symbol information and display
 * a histogram of results, along various sorting keys.
 */
8
#include "builtin.h"
9

10
#include "util/util.h"
11
#include "util/cache.h"
12

13
#include "util/annotate.h"
14
#include "util/color.h"
15
#include <linux/list.h>
16
#include <linux/rbtree.h>
17
#include "util/symbol.h"
18
#include "util/callchain.h"
19
#include "util/strlist.h"
20
#include "util/values.h"
21

22
#include "perf.h"
23
#include "util/debug.h"
24 25
#include "util/evlist.h"
#include "util/evsel.h"
26
#include "util/header.h"
27
#include "util/session.h"
28
#include "util/tool.h"
29 30 31 32

#include "util/parse-options.h"
#include "util/parse-events.h"

33
#include "util/thread.h"
34
#include "util/sort.h"
35
#include "util/hist.h"
36
#include "util/data.h"
37
#include "arch/common.h"
38

39
#include <dlfcn.h>
40 41
#include <linux/bitmap.h>

42
struct perf_report {
43
	struct perf_tool	tool;
44
	struct perf_session	*session;
45
	bool			force, use_tui, use_gtk, use_stdio;
46 47 48 49 50
	bool			hide_unresolved;
	bool			dont_use_callchains;
	bool			show_full_info;
	bool			show_threads;
	bool			inverted_callchain;
51
	bool			mem_mode;
52 53 54
	struct perf_read_values	show_threads_values;
	const char		*pretty_printing_style;
	const char		*cpu_list;
55
	const char		*symbol_filter_str;
56
	float			min_percent;
57
	DECLARE_BITMAP(cpu_bitmap, MAX_NR_CPUS);
58
};
59

60 61 62 63 64 65
static int perf_report_config(const char *var, const char *value, void *cb)
{
	if (!strcmp(var, "report.group")) {
		symbol_conf.event_group = perf_config_bool(var, value);
		return 0;
	}
66 67 68 69 70
	if (!strcmp(var, "report.percent-limit")) {
		struct perf_report *rep = cb;
		rep->min_percent = strtof(value, NULL);
		return 0;
	}
71 72 73 74

	return perf_default_config(var, value, cb);
}

75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92
static int perf_report__add_mem_hist_entry(struct perf_tool *tool,
					   struct addr_location *al,
					   struct perf_sample *sample,
					   struct perf_evsel *evsel,
					   struct machine *machine,
					   union perf_event *event)
{
	struct perf_report *rep = container_of(tool, struct perf_report, tool);
	struct symbol *parent = NULL;
	u8 cpumode = event->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;
	int err = 0;
	struct hist_entry *he;
	struct mem_info *mi, *mx;
	uint64_t cost;

	if ((sort__has_parent || symbol_conf.use_callchain) &&
	    sample->callchain) {
		err = machine__resolve_callchain(machine, evsel, al->thread,
93
						 sample, &parent, al);
94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120
		if (err)
			return err;
	}

	mi = machine__resolve_mem(machine, al->thread, sample, cpumode);
	if (!mi)
		return -ENOMEM;

	if (rep->hide_unresolved && !al->sym)
		return 0;

	cost = sample->weight;
	if (!cost)
		cost = 1;

	/*
	 * must pass period=weight in order to get the correct
	 * sorting from hists__collapse_resort() which is solely
	 * based on periods. We want sorting be done on nr_events * weight
	 * and this is indirectly achieved by passing period=weight here
	 * and the he_stat__add_period() function.
	 */
	he = __hists__add_mem_entry(&evsel->hists, al, parent, mi, cost, cost);
	if (!he)
		return -ENOMEM;

	/*
121
	 * In the TUI browser, we are doing integrated annotation,
122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167
	 * so we don't allocate the extra space needed because the stdio
	 * code will not use it.
	 */
	if (sort__has_sym && he->ms.sym && use_browser > 0) {
		struct annotation *notes = symbol__annotation(he->ms.sym);

		assert(evsel != NULL);

		if (notes->src == NULL && symbol__alloc_hist(he->ms.sym) < 0)
			goto out;

		err = hist_entry__inc_addr_samples(he, evsel->idx, al->addr);
		if (err)
			goto out;
	}

	if (sort__has_sym && he->mem_info->daddr.sym && use_browser > 0) {
		struct annotation *notes;

		mx = he->mem_info;

		notes = symbol__annotation(mx->daddr.sym);
		if (notes->src == NULL && symbol__alloc_hist(mx->daddr.sym) < 0)
			goto out;

		err = symbol__inc_addr_samples(mx->daddr.sym,
					       mx->daddr.map,
					       evsel->idx,
					       mx->daddr.al_addr);
		if (err)
			goto out;
	}

	evsel->hists.stats.total_period += cost;
	hists__inc_nr_events(&evsel->hists, PERF_RECORD_SAMPLE);
	err = 0;

	if (symbol_conf.use_callchain) {
		err = callchain_append(he->callchain,
				       &callchain_cursor,
				       sample->period);
	}
out:
	return err;
}

168 169 170 171 172 173 174 175 176 177 178
static int perf_report__add_branch_hist_entry(struct perf_tool *tool,
					struct addr_location *al,
					struct perf_sample *sample,
					struct perf_evsel *evsel,
				      struct machine *machine)
{
	struct perf_report *rep = container_of(tool, struct perf_report, tool);
	struct symbol *parent = NULL;
	int err = 0;
	unsigned i;
	struct hist_entry *he;
179
	struct branch_info *bi, *bx;
180 181 182

	if ((sort__has_parent || symbol_conf.use_callchain)
	    && sample->callchain) {
183
		err = machine__resolve_callchain(machine, evsel, al->thread,
184
						 sample, &parent, al);
185 186 187 188 189 190 191 192 193 194 195 196
		if (err)
			return err;
	}

	bi = machine__resolve_bstack(machine, al->thread,
				     sample->branch_stack);
	if (!bi)
		return -ENOMEM;

	for (i = 0; i < sample->branch_stack->nr; i++) {
		if (rep->hide_unresolved && !(bi[i].from.sym && bi[i].to.sym))
			continue;
197 198 199

		err = -ENOMEM;

200 201 202 203 204
		/*
		 * The report shows the percentage of total branches captured
		 * and not events sampled. Thus we use a pseudo period of 1.
		 */
		he = __hists__add_branch_entry(&evsel->hists, al, parent,
205
				&bi[i], 1, 1);
206
		if (he) {
207 208
			struct annotation *notes;
			bx = he->branch_info;
209
			if (bx->from.sym && use_browser == 1 && sort__has_sym) {
210 211 212 213 214 215 216 217 218 219 220 221 222
				notes = symbol__annotation(bx->from.sym);
				if (!notes->src
				    && symbol__alloc_hist(bx->from.sym) < 0)
					goto out;

				err = symbol__inc_addr_samples(bx->from.sym,
							       bx->from.map,
							       evsel->idx,
							       bx->from.al_addr);
				if (err)
					goto out;
			}

223
			if (bx->to.sym && use_browser == 1 && sort__has_sym) {
224 225 226 227 228 229 230 231 232 233 234 235
				notes = symbol__annotation(bx->to.sym);
				if (!notes->src
				    && symbol__alloc_hist(bx->to.sym) < 0)
					goto out;

				err = symbol__inc_addr_samples(bx->to.sym,
							       bx->to.map,
							       evsel->idx,
							       bx->to.al_addr);
				if (err)
					goto out;
			}
236 237 238
			evsel->hists.stats.total_period += 1;
			hists__inc_nr_events(&evsel->hists, PERF_RECORD_SAMPLE);
		} else
239
			goto out;
240
	}
241
	err = 0;
242
out:
243
	free(bi);
244 245 246
	return err;
}

247 248 249 250
static int perf_evsel__add_hist_entry(struct perf_evsel *evsel,
				      struct addr_location *al,
				      struct perf_sample *sample,
				      struct machine *machine)
251
{
252
	struct symbol *parent = NULL;
253
	int err = 0;
254 255
	struct hist_entry *he;

256
	if ((sort__has_parent || symbol_conf.use_callchain) && sample->callchain) {
257
		err = machine__resolve_callchain(machine, evsel, al->thread,
258
						 sample, &parent, al);
259 260
		if (err)
			return err;
261
	}
262

263
	he = __hists__add_entry(&evsel->hists, al, parent, sample->period,
264
				sample->weight, sample->transaction);
265
	if (he == NULL)
266 267
		return -ENOMEM;

268
	if (symbol_conf.use_callchain) {
269
		err = callchain_append(he->callchain,
270
				       &callchain_cursor,
271
				       sample->period);
272
		if (err)
273
			return err;
274 275
	}
	/*
276
	 * Only in the TUI browser we are doing integrated annotation,
277 278 279
	 * so we don't allocated the extra space needed because the stdio
	 * code will not use it.
	 */
280
	if (he->ms.sym != NULL && use_browser == 1 && sort__has_sym) {
281
		struct annotation *notes = symbol__annotation(he->ms.sym);
282 283 284 285

		assert(evsel != NULL);

		err = -ENOMEM;
286
		if (notes->src == NULL && symbol__alloc_hist(he->ms.sym) < 0)
287 288 289
			goto out;

		err = hist_entry__inc_addr_samples(he, evsel->idx, al->addr);
290
	}
291

292 293 294
	evsel->hists.stats.total_period += sample->period;
	hists__inc_nr_events(&evsel->hists, PERF_RECORD_SAMPLE);
out:
295
	return err;
296 297
}

298

299
static int process_sample_event(struct perf_tool *tool,
300
				union perf_event *event,
301
				struct perf_sample *sample,
302
				struct perf_evsel *evsel,
303
				struct machine *machine)
304
{
305
	struct perf_report *rep = container_of(tool, struct perf_report, tool);
306
	struct addr_location al;
307
	int ret;
308

309
	if (perf_event__preprocess_sample(event, machine, &al, sample) < 0) {
310
		fprintf(stderr, "problem processing %d event, skipping it.\n",
311 312 313
			event->header.type);
		return -1;
	}
314

315
	if (al.filtered || (rep->hide_unresolved && al.sym == NULL))
316
		return 0;
317

318
	if (rep->cpu_list && !test_bit(sample->cpu, rep->cpu_bitmap))
319 320
		return 0;

321
	if (sort__mode == SORT_MODE__BRANCH) {
322 323 324
		ret = perf_report__add_branch_hist_entry(tool, &al, sample,
							 evsel, machine);
		if (ret < 0)
325
			pr_debug("problem adding lbr entry, skipping event\n");
326
	} else if (rep->mem_mode == 1) {
327 328 329
		ret = perf_report__add_mem_hist_entry(tool, &al, sample,
						      evsel, machine, event);
		if (ret < 0)
330
			pr_debug("problem adding mem entry, skipping event\n");
331 332 333
	} else {
		if (al.map != NULL)
			al.map->dso->hit = 1;
334

335 336
		ret = perf_evsel__add_hist_entry(evsel, &al, sample, machine);
		if (ret < 0)
337
			pr_debug("problem incrementing symbol period, skipping event\n");
338
	}
339
	return ret;
340
}
I
Ingo Molnar 已提交
341

342
static int process_read_event(struct perf_tool *tool,
343
			      union perf_event *event,
344
			      struct perf_sample *sample __maybe_unused,
345
			      struct perf_evsel *evsel,
346
			      struct machine *machine __maybe_unused)
347
{
348
	struct perf_report *rep = container_of(tool, struct perf_report, tool);
349

350
	if (rep->show_threads) {
351
		const char *name = evsel ? perf_evsel__name(evsel) : "unknown";
352
		perf_read_values_add_value(&rep->show_threads_values,
353 354 355 356 357 358
					   event->read.pid, event->read.tid,
					   event->read.id,
					   name,
					   event->read.value);
	}

359
	dump_printf(": %d %d %s %" PRIu64 "\n", event->read.pid, event->read.tid,
360
		    evsel ? perf_evsel__name(evsel) : "FAIL",
361
		    event->read.value);
362 363 364 365

	return 0;
}

366
/* For pipe mode, sample_type is not currently set */
367
static int perf_report__setup_sample_type(struct perf_report *rep)
368
{
369
	struct perf_session *self = rep->session;
370
	u64 sample_type = perf_evlist__combined_sample_type(self->evlist);
371

372
	if (!self->fd_pipe && !(sample_type & PERF_SAMPLE_CALLCHAIN)) {
373
		if (sort__has_parent) {
374
			ui__error("Selected --sort parent, but no "
375 376
				    "callchain data. Did you call "
				    "'perf record' without -g?\n");
377
			return -EINVAL;
378
		}
379
		if (symbol_conf.use_callchain) {
380
			ui__error("Selected -g but no callchain data. Did "
381
				    "you call 'perf record' without -g?\n");
382
			return -1;
383
		}
384 385
	} else if (!rep->dont_use_callchains &&
		   callchain_param.mode != CHAIN_NONE &&
386
		   !symbol_conf.use_callchain) {
387
			symbol_conf.use_callchain = true;
388
			if (callchain_register_param(&callchain_param) < 0) {
389
				ui__error("Can't register callchain params.\n");
390
				return -EINVAL;
391
			}
392 393
	}

394
	if (sort__mode == SORT_MODE__BRANCH) {
395
		if (!self->fd_pipe &&
396
		    !(sample_type & PERF_SAMPLE_BRANCH_STACK)) {
397 398
			ui__error("Selected -b but no branch data. "
				  "Did you call perf record without -b?\n");
399 400 401 402
			return -1;
		}
	}

403 404
	return 0;
}
405

406
static void sig_handler(int sig __maybe_unused)
407 408 409 410
{
	session_done = 1;
}

411 412
static size_t hists__fprintf_nr_sample_events(struct perf_report *rep,
					      struct hists *self,
413 414 415 416
					      const char *evname, FILE *fp)
{
	size_t ret;
	char unit;
417 418
	unsigned long nr_samples = self->stats.nr_events[PERF_RECORD_SAMPLE];
	u64 nr_events = self->stats.total_period;
419 420 421 422
	struct perf_evsel *evsel = hists_to_evsel(self);
	char buf[512];
	size_t size = sizeof(buf);

423
	if (perf_evsel__is_group_event(evsel)) {
424 425 426 427 428 429 430 431 432 433
		struct perf_evsel *pos;

		perf_evsel__group_desc(evsel, buf, size);
		evname = buf;

		for_each_group_member(pos, evsel) {
			nr_samples += pos->hists.stats.nr_events[PERF_RECORD_SAMPLE];
			nr_events += pos->hists.stats.total_period;
		}
	}
434

435 436
	nr_samples = convert_unit(nr_samples, &unit);
	ret = fprintf(fp, "# Samples: %lu%c", nr_samples, unit);
437
	if (evname != NULL)
438 439
		ret += fprintf(fp, " of event '%s'", evname);

440 441 442 443 444
	if (rep->mem_mode) {
		ret += fprintf(fp, "\n# Total weight : %" PRIu64, nr_events);
		ret += fprintf(fp, "\n# Sort order   : %s", sort_order);
	} else
		ret += fprintf(fp, "\n# Event count (approx.): %" PRIu64, nr_events);
445 446 447
	return ret + fprintf(fp, "\n#\n");
}

448
static int perf_evlist__tty_browse_hists(struct perf_evlist *evlist,
449
					 struct perf_report *rep,
450
					 const char *help)
451
{
452
	struct perf_evsel *pos;
453

454 455
	list_for_each_entry(pos, &evlist->entries, node) {
		struct hists *hists = &pos->hists;
456
		const char *evname = perf_evsel__name(pos);
457

458 459 460 461
		if (symbol_conf.event_group &&
		    !perf_evsel__is_group_leader(pos))
			continue;

462
		hists__fprintf_nr_sample_events(rep, hists, evname, stdout);
463
		hists__fprintf(hists, true, 0, 0, rep->min_percent, stdout);
464 465 466 467 468 469 470
		fprintf(stdout, "\n\n");
	}

	if (sort_order == default_sort_order &&
	    parent_pattern == default_parent_pattern) {
		fprintf(stdout, "#\n# (%s)\n#\n", help);

471 472 473
		if (rep->show_threads) {
			bool style = !strcmp(rep->pretty_printing_style, "raw");
			perf_read_values_display(stdout, &rep->show_threads_values,
474
						 style);
475
			perf_read_values_destroy(&rep->show_threads_values);
476 477 478 479 480 481
		}
	}

	return 0;
}

482
static int __cmd_report(struct perf_report *rep)
483
{
484
	int ret = -EINVAL;
485
	u64 nr_samples;
486
	struct perf_session *session = rep->session;
487
	struct perf_evsel *pos;
488 489
	struct map *kernel_map;
	struct kmap *kernel_kmap;
490
	const char *help = "For a higher level overview, try: perf report --sort comm,dso";
491

492 493
	signal(SIGINT, sig_handler);

494 495 496
	if (rep->cpu_list) {
		ret = perf_session__cpu_bitmap(session, rep->cpu_list,
					       rep->cpu_bitmap);
497
		if (ret)
498
			return ret;
499 500
	}

501
	if (use_browser <= 0)
502
		perf_session__fprintf_info(session, stdout, rep->show_full_info);
503

504 505
	if (rep->show_threads)
		perf_read_values_init(&rep->show_threads_values);
506

507
	ret = perf_report__setup_sample_type(rep);
508
	if (ret)
509
		return ret;
510

511
	ret = perf_session__process_events(session, &rep->tool);
512
	if (ret)
513
		return ret;
514

515
	kernel_map = session->machines.host.vmlinux_maps[MAP__FUNCTION];
516 517 518 519 520
	kernel_kmap = map__kmap(kernel_map);
	if (kernel_map == NULL ||
	    (kernel_map->dso->hit &&
	     (kernel_kmap->ref_reloc_sym == NULL ||
	      kernel_kmap->ref_reloc_sym->addr == 0))) {
521 522 523 524 525 526 527 528 529 530 531
		const char *desc =
		    "As no suitable kallsyms nor vmlinux was found, kernel samples\n"
		    "can't be resolved.";

		if (kernel_map) {
			const struct dso *kdso = kernel_map->dso;
			if (!RB_EMPTY_ROOT(&kdso->symbols[MAP__FUNCTION])) {
				desc = "If some relocation was applied (e.g. "
				       "kexec) symbols may be misresolved.";
			}
		}
532

533 534 535 536
		ui__warning(
"Kernel address maps (/proc/{kallsyms,modules}) were restricted.\n\n"
"Check /proc/sys/kernel/kptr_restrict before running 'perf record'.\n\n%s\n\n"
"Samples in kernel modules can't be resolved as well.\n\n",
537
		desc);
538 539
	}

540
	if (verbose > 3)
541
		perf_session__fprintf(session, stdout);
542

543
	if (verbose > 2)
544
		perf_session__fprintf_dsos(session, stdout);
545

546 547
	if (dump_trace) {
		perf_session__fprintf_nr_events(session, stdout);
548
		return 0;
549 550
	}

551 552 553
	nr_samples = 0;
	list_for_each_entry(pos, &session->evlist->entries, node) {
		struct hists *hists = &pos->hists;
554

555 556 557
		if (pos->idx == 0)
			hists->symbol_filter_str = rep->symbol_filter_str;

558
		hists__collapse_resort(hists);
559
		nr_samples += hists->stats.nr_events[PERF_RECORD_SAMPLE];
560 561 562 563 564 565 566 567 568

		/* Non-group events are considered as leader */
		if (symbol_conf.event_group &&
		    !perf_evsel__is_group_leader(pos)) {
			struct hists *leader_hists = &pos->leader->hists;

			hists__match(leader_hists, hists);
			hists__link(leader_hists, hists);
		}
569 570
	}

571 572 573
	if (session_done())
		return 0;

574
	if (nr_samples == 0) {
575
		ui__error("The %s file has no samples!\n", session->filename);
576
		return 0;
577 578
	}

579 580 581
	list_for_each_entry(pos, &session->evlist->entries, node)
		hists__output_resort(&pos->hists);

582
	if (use_browser > 0) {
583
		if (use_browser == 1) {
584
			ret = perf_evlist__tui_browse_hists(session->evlist,
585 586
							help, NULL,
							rep->min_percent,
587 588 589 590 591 592 593 594
							&session->header.env);
			/*
			 * Usually "ret" is the last pressed key, and we only
			 * care if the key notifies us to switch data file.
			 */
			if (ret != K_SWITCH_INPUT_DATA)
				ret = 0;

595
		} else if (use_browser == 2) {
596 597 598 599 600 601 602 603 604 605 606 607 608
			int (*hist_browser)(struct perf_evlist *,
					    const char *,
					    struct hist_browser_timer *,
					    float min_pcnt);

			hist_browser = dlsym(perf_gtk_handle,
					     "perf_evlist__gtk_browse_hists");
			if (hist_browser == NULL) {
				ui__error("GTK browser not found!\n");
				return ret;
			}
			hist_browser(session->evlist, help, NULL,
				     rep->min_percent);
609
		}
610
	} else
611
		perf_evlist__tty_browse_hists(session->evlist, rep, help);
612

613
	return ret;
614 615
}

616
static int
617
parse_callchain_opt(const struct option *opt, const char *arg, int unset)
618
{
619
	struct perf_report *rep = (struct perf_report *)opt->value;
620
	char *tok, *tok2;
621 622
	char *endptr;

623 624 625 626
	/*
	 * --no-call-graph
	 */
	if (unset) {
627
		rep->dont_use_callchains = true;
628 629 630
		return 0;
	}

631
	symbol_conf.use_callchain = true;
632 633 634 635

	if (!arg)
		return 0;

636 637 638 639 640 641
	tok = strtok((char *)arg, ",");
	if (!tok)
		return -1;

	/* get the output mode */
	if (!strncmp(tok, "graph", strlen(arg)))
642
		callchain_param.mode = CHAIN_GRAPH_ABS;
643

644
	else if (!strncmp(tok, "flat", strlen(arg)))
645 646 647 648 649
		callchain_param.mode = CHAIN_FLAT;

	else if (!strncmp(tok, "fractal", strlen(arg)))
		callchain_param.mode = CHAIN_GRAPH_REL;

650 651
	else if (!strncmp(tok, "none", strlen(arg))) {
		callchain_param.mode = CHAIN_NONE;
652
		symbol_conf.use_callchain = false;
653 654 655 656

		return 0;
	}

657 658 659
	else
		return -1;

660 661 662
	/* get the min percentage */
	tok = strtok(NULL, ",");
	if (!tok)
663
		goto setup;
664

665
	callchain_param.min_percent = strtod(tok, &endptr);
666 667 668
	if (tok == endptr)
		return -1;

669 670 671 672 673 674
	/* get the print limit */
	tok2 = strtok(NULL, ",");
	if (!tok2)
		goto setup;

	if (tok2[0] != 'c') {
675
		callchain_param.print_limit = strtoul(tok2, &endptr, 0);
676 677 678 679 680 681
		tok2 = strtok(NULL, ",");
		if (!tok2)
			goto setup;
	}

	/* get the call chain order */
682
	if (!strncmp(tok2, "caller", strlen("caller")))
683
		callchain_param.order = ORDER_CALLER;
684
	else if (!strncmp(tok2, "callee", strlen("callee")))
685 686 687
		callchain_param.order = ORDER_CALLEE;
	else
		return -1;
688 689 690 691 692 693 694 695 696 697 698

	/* Get the sort key */
	tok2 = strtok(NULL, ",");
	if (!tok2)
		goto setup;
	if (!strncmp(tok2, "function", strlen("function")))
		callchain_param.key = CCKEY_FUNCTION;
	else if (!strncmp(tok2, "address", strlen("address")))
		callchain_param.key = CCKEY_ADDRESS;
	else
		return -1;
699
setup:
700
	if (callchain_register_param(&callchain_param) < 0) {
701 702 703
		fprintf(stderr, "Can't register callchain params\n");
		return -1;
	}
704 705 706
	return 0;
}

707 708 709 710 711 712 713 714 715 716 717 718 719 720 721 722 723 724
int
report_parse_ignore_callees_opt(const struct option *opt __maybe_unused,
				const char *arg, int unset __maybe_unused)
{
	if (arg) {
		int err = regcomp(&ignore_callees_regex, arg, REG_EXTENDED);
		if (err) {
			char buf[BUFSIZ];
			regerror(err, &ignore_callees_regex, buf, sizeof(buf));
			pr_err("Invalid --ignore-callees regex: %s\n%s", arg, buf);
			return -1;
		}
		have_ignore_callees = 1;
	}

	return 0;
}

725
static int
726 727
parse_branch_mode(const struct option *opt __maybe_unused,
		  const char *str __maybe_unused, int unset)
728
{
729 730 731
	int *branch_mode = opt->value;

	*branch_mode = !unset;
732 733 734
	return 0;
}

735 736 737 738 739 740 741 742 743 744
static int
parse_percent_limit(const struct option *opt, const char *str,
		    int unset __maybe_unused)
{
	struct perf_report *rep = opt->value;

	rep->min_percent = strtof(str, NULL);
	return 0;
}

745
int cmd_report(int argc, const char **argv, const char *prefix __maybe_unused)
746
{
747
	struct perf_session *session;
748
	struct stat st;
749
	bool has_br_stack = false;
750
	int branch_mode = -1;
751
	int ret = -1;
752 753
	char callchain_default_opt[] = "fractal,0.5,callee";
	const char * const report_usage[] = {
N
Namhyung Kim 已提交
754
		"perf report [<options>]",
755 756 757
		NULL
	};
	struct perf_report report = {
758
		.tool = {
759 760
			.sample		 = process_sample_event,
			.mmap		 = perf_event__process_mmap,
761
			.mmap2		 = perf_event__process_mmap2,
762
			.comm		 = perf_event__process_comm,
763 764
			.exit		 = perf_event__process_exit,
			.fork		 = perf_event__process_fork,
765 766 767 768 769 770 771 772 773 774 775
			.lost		 = perf_event__process_lost,
			.read		 = process_read_event,
			.attr		 = perf_event__process_attr,
			.tracing_data	 = perf_event__process_tracing_data,
			.build_id	 = perf_event__process_build_id,
			.ordered_samples = true,
			.ordering_requires_timestamps = true,
		},
		.pretty_printing_style	 = "normal",
	};
	const struct option options[] = {
776
	OPT_STRING('i', "input", &input_name, "file",
777
		    "input file name"),
778
	OPT_INCR('v', "verbose", &verbose,
779
		    "be more verbose (show symbol address, etc)"),
780 781
	OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
		    "dump raw trace in ASCII"),
782 783
	OPT_STRING('k', "vmlinux", &symbol_conf.vmlinux_name,
		   "file", "vmlinux pathname"),
784 785
	OPT_STRING(0, "kallsyms", &symbol_conf.kallsyms_name,
		   "file", "kallsyms pathname"),
786
	OPT_BOOLEAN('f', "force", &report.force, "don't complain, do it"),
787
	OPT_BOOLEAN('m', "modules", &symbol_conf.use_modules,
788
		    "load module symbols - WARNING: use only with -k and LIVE kernel"),
789
	OPT_BOOLEAN('n', "show-nr-samples", &symbol_conf.show_nr_samples,
790
		    "Show a column with the number of samples"),
791
	OPT_BOOLEAN('T', "threads", &report.show_threads,
792
		    "Show per-thread event counters"),
793
	OPT_STRING(0, "pretty", &report.pretty_printing_style, "key",
794
		   "pretty printing style key: normal raw"),
795
	OPT_BOOLEAN(0, "tui", &report.use_tui, "Use the TUI interface"),
796
	OPT_BOOLEAN(0, "gtk", &report.use_gtk, "Use the GTK2 interface"),
797 798
	OPT_BOOLEAN(0, "stdio", &report.use_stdio,
		    "Use the stdio interface"),
799
	OPT_STRING('s', "sort", &sort_order, "key[,key2...]",
800
		   "sort by key(s): pid, comm, dso, symbol, parent, cpu, srcline,"
801
		   " dso_to, dso_from, symbol_to, symbol_from, mispredict,"
802
		   " weight, local_weight, mem, symbol_daddr, dso_daddr, tlb, "
803
		   "snoop, locked, abort, in_tx, transaction"),
804 805
	OPT_BOOLEAN(0, "showcpuutilization", &symbol_conf.show_cpu_utilization,
		    "Show sample percentage for different cpu modes"),
806 807
	OPT_STRING('p', "parent", &parent_pattern, "regex",
		   "regex filter to identify parent, see: '--sort parent'"),
808
	OPT_BOOLEAN('x', "exclude-other", &symbol_conf.exclude_other,
809
		    "Only display entries with parent-match"),
810
	OPT_CALLBACK_DEFAULT('g', "call-graph", &report, "output_type,min_percent[,print_limit],call_order",
811 812
		     "Display callchains using output_type (graph, flat, fractal, or none) , min percent threshold, optional print limit, callchain order, key (function or address). "
		     "Default: fractal,0.5,callee,function", &parse_callchain_opt, callchain_default_opt),
813 814
	OPT_BOOLEAN('G', "inverted", &report.inverted_callchain,
		    "alias for inverted call graph"),
815 816 817
	OPT_CALLBACK(0, "ignore-callees", NULL, "regex",
		   "ignore callees of these functions in call graphs",
		   report_parse_ignore_callees_opt),
818
	OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]",
819
		   "only consider symbols in these dsos"),
820
	OPT_STRING('c', "comms", &symbol_conf.comm_list_str, "comm[,comm...]",
821
		   "only consider symbols in these comms"),
822
	OPT_STRING('S', "symbols", &symbol_conf.sym_list_str, "symbol[,symbol...]",
823
		   "only consider these symbols"),
824 825
	OPT_STRING(0, "symbol-filter", &report.symbol_filter_str, "filter",
		   "only show symbols that (partially) match with this filter"),
826
	OPT_STRING('w', "column-widths", &symbol_conf.col_width_list_str,
827 828
		   "width[,width...]",
		   "don't try to adjust column width, use these fixed values"),
829
	OPT_STRING('t', "field-separator", &symbol_conf.field_sep, "separator",
830 831
		   "separator for columns, no spaces will be added between "
		   "columns '.' is reserved."),
832
	OPT_BOOLEAN('U', "hide-unresolved", &report.hide_unresolved,
833
		    "Only display entries resolved to a symbol"),
834 835
	OPT_STRING(0, "symfs", &symbol_conf.symfs, "directory",
		    "Look for files with symbols relative to this directory"),
836
	OPT_STRING('C', "cpu", &report.cpu_list, "cpu",
837 838
		   "list of cpus to profile"),
	OPT_BOOLEAN('I', "show-info", &report.show_full_info,
839
		    "Display extended information about perf.data file"),
840 841 842 843
	OPT_BOOLEAN(0, "source", &symbol_conf.annotate_src,
		    "Interleave source code with assembly code (default)"),
	OPT_BOOLEAN(0, "asm-raw", &symbol_conf.annotate_asm_raw,
		    "Display raw encoding of assembly instructions (default)"),
844 845
	OPT_STRING('M', "disassembler-style", &disassembler_style, "disassembler style",
		   "Specify disassembler style (e.g. -M intel for intel syntax)"),
846 847
	OPT_BOOLEAN(0, "show-total-period", &symbol_conf.show_total_period,
		    "Show a column with the sum of periods"),
N
Namhyung Kim 已提交
848 849
	OPT_BOOLEAN(0, "group", &symbol_conf.event_group,
		    "Show event group information together"),
850
	OPT_CALLBACK_NOOPT('b', "branch-stack", &branch_mode, "",
851
		    "use branch records for histogram filling", parse_branch_mode),
852 853
	OPT_STRING(0, "objdump", &objdump_path, "path",
		   "objdump binary to use for disassembly and annotations"),
854 855
	OPT_BOOLEAN(0, "demangle", &symbol_conf.demangle,
		    "Disable symbol demangling"),
856
	OPT_BOOLEAN(0, "mem-mode", &report.mem_mode, "mem access profile"),
857 858
	OPT_CALLBACK(0, "percent-limit", &report, "percent",
		     "Don't show entries under that percent", parse_percent_limit),
859
	OPT_END()
860
	};
861 862 863
	struct perf_data_file file = {
		.mode  = PERF_DATA_MODE_READ,
	};
864

865
	perf_config(perf_report_config, &report);
866

867 868
	argc = parse_options(argc, argv, options, report_usage, 0);

869
	if (report.use_stdio)
870
		use_browser = 0;
871
	else if (report.use_tui)
872
		use_browser = 1;
873 874
	else if (report.use_gtk)
		use_browser = 2;
875

876
	if (report.inverted_callchain)
877 878
		callchain_param.order = ORDER_CALLER;

879
	if (!input_name || !strlen(input_name)) {
880
		if (!fstat(STDIN_FILENO, &st) && S_ISFIFO(st.st_mode))
881
			input_name = "-";
882
		else
883
			input_name = "perf.data";
884
	}
885 886 887 888 889 890 891 892

	if (strcmp(input_name, "-") != 0)
		setup_browser(true);
	else {
		use_browser = 0;
		perf_hpp__init();
	}

893 894 895
	file.path  = input_name;
	file.force = report.force;

896
repeat:
897
	session = perf_session__new(&file, false, &report.tool);
898 899 900 901 902 903 904
	if (session == NULL)
		return -ENOMEM;

	report.session = session;

	has_br_stack = perf_header__has_feat(&session->header,
					     HEADER_BRANCH_STACK);
905

906 907
	if (branch_mode == -1 && has_br_stack)
		sort__mode = SORT_MODE__BRANCH;
908

909 910
	/* sort__mode could be NORMAL if --no-branch-stack */
	if (sort__mode == SORT_MODE__BRANCH) {
911
		/*
912 913
		 * if no sort_order is provided, then specify
		 * branch-mode specific order
914 915 916 917 918
		 */
		if (sort_order == default_sort_order)
			sort_order = "comm,dso_from,symbol_from,"
				     "dso_to,symbol_to";

919
	}
920
	if (report.mem_mode) {
921
		if (sort__mode == SORT_MODE__BRANCH) {
922 923 924
			fprintf(stderr, "branch and mem mode incompatible\n");
			goto error;
		}
925 926
		sort__mode = SORT_MODE__MEMORY;

927 928 929 930 931 932 933
		/*
		 * if no sort_order is provided, then specify
		 * branch-mode specific order
		 */
		if (sort_order == default_sort_order)
			sort_order = "local_weight,mem,sym,dso,symbol_daddr,dso_daddr,snoop,tlb,locked";
	}
934

935 936
	if (setup_sorting() < 0)
		usage_with_options(report_usage, options);
937

938
	/*
939
	 * Only in the TUI browser we are doing integrated annotation,
940 941 942
	 * so don't allocate extra space that won't be used in the stdio
	 * implementation.
	 */
943
	if (use_browser == 1 && sort__has_sym) {
944
		symbol_conf.priv_size = sizeof(struct annotation);
945 946
		machines__set_symbol_filter(&session->machines,
					    symbol__annotate_init);
947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962
		/*
 		 * For searching by name on the "Browse map details".
 		 * providing it only in verbose mode not to bloat too
 		 * much struct symbol.
 		 */
		if (verbose) {
			/*
			 * XXX: Need to provide a less kludgy way to ask for
			 * more space per symbol, the u32 is for the index on
			 * the ui browser.
			 * See symbol__browser_index.
			 */
			symbol_conf.priv_size += sizeof(u32);
			symbol_conf.sort_by_name = true;
		}
	}
963

964
	if (symbol__init() < 0)
965
		goto error;
966

967
	if (parent_pattern != default_parent_pattern) {
968
		if (sort_dimension__add("parent") < 0)
969
			goto error;
970
	}
971

972 973 974 975 976 977 978 979 980 981
	if (argc) {
		/*
		 * Special case: if there's an argument left then assume that
		 * it's a symbol filter:
		 */
		if (argc > 1)
			usage_with_options(report_usage, options);

		report.symbol_filter_str = argv[0];
	}
982

983
	sort__setup_elide(stdout);
984

985
	ret = __cmd_report(&report);
986 987 988 989 990 991
	if (ret == K_SWITCH_INPUT_DATA) {
		perf_session__delete(session);
		goto repeat;
	} else
		ret = 0;

992 993 994
error:
	perf_session__delete(session);
	return ret;
995
}