annotate.c 78.2 KB
Newer Older
1
// SPDX-License-Identifier: GPL-2.0-only
2 3 4 5 6 7 8
/*
 * Copyright (C) 2011, Red Hat Inc, Arnaldo Carvalho de Melo <acme@redhat.com>
 *
 * Parts came from builtin-annotate.c, see those files for further
 * copyright notes.
 */

9
#include <errno.h>
10
#include <inttypes.h>
11
#include <libgen.h>
12
#include <stdlib.h>
13 14 15 16
#include <bpf/bpf.h>
#include <bpf/btf.h>
#include <bpf/libbpf.h>
#include <linux/btf.h>
17
#include "util.h" // hex_width()
18 19
#include "ui/ui.h"
#include "sort.h"
20 21
#include "build-id.h"
#include "color.h"
22
#include "config.h"
23
#include "dso.h"
24
#include "env.h"
25
#include "map.h"
26
#include "maps.h"
27
#include "symbol.h"
28
#include "srcline.h"
29
#include "units.h"
30 31
#include "debug.h"
#include "annotate.h"
32
#include "evsel.h"
33
#include "evlist.h"
34
#include "bpf-event.h"
35
#include "block-range.h"
36
#include "string2.h"
37
#include "util/event.h"
38
#include "arch/common.h"
39
#include <regex.h>
40
#include <pthread.h>
41
#include <linux/bitops.h>
42
#include <linux/kernel.h>
43
#include <linux/string.h>
44
#include <subcmd/parse-options.h>
45
#include <subcmd/run-command.h>
46

47 48 49 50 51 52 53
/* FIXME: For the HE_COLORSET */
#include "ui/browser.h"

/*
 * FIXME: Using the same values as slang.h,
 * but that header may not be available everywhere
 */
54 55 56 57
#define LARROW_CHAR	((unsigned char)',')
#define RARROW_CHAR	((unsigned char)'+')
#define DARROW_CHAR	((unsigned char)'.')
#define UARROW_CHAR	((unsigned char)'-')
58

59
#include <linux/ctype.h>
60

61 62 63
struct annotation_options annotation__default_options = {
	.use_offset     = true,
	.jump_arrows    = true,
64
	.annotate_src	= true,
65
	.offset_level	= ANNOTATION__OFFSET_JUMP_TARGETS,
66
	.percent_type	= PERCENT_PERIOD_LOCAL,
67 68
};

69
static regex_t	 file_lineno;
70

71
static struct ins_ops *ins__find(struct arch *arch, const char *name);
72
static void ins__sort(struct arch *arch);
73
static int disasm_line__parse(char *line, const char **namep, char **rawp);
74

75 76
/*
 * Per-architecture description used while parsing disassembly output.
 */
struct arch {
	/* Key used by arch__find() to look the architecture up. */
	const char	*name;
	/* Mnemonic -> ins_ops table, kept sorted by name for bsearch(). */
	struct ins	*instructions;
	/* Number of entries in use in ->instructions. */
	size_t		nr_instructions;
	/*
	 * Capacity of ->instructions when heap allocated; 0 while
	 * ->instructions still points at a statically defined table.
	 */
	size_t		nr_instructions_allocated;
	/* Fallback consulted by ins__find() when the table lookup fails. */
	struct ins_ops  *(*associate_instruction_ops)(struct arch *arch, const char *name);
	/* Set once __ins__find() has sorted ->instructions. */
	bool		sorted_instructions;
	/* NOTE(review): presumably set once ->init() has run; not used in this chunk. */
	bool		initialized;
	void		*priv;
	unsigned int	model;
	unsigned int	family;
	int		(*init)(struct arch *arch, char *cpuid);
	/* Optional; called by ins__is_fused(). */
	bool		(*ins_is_fused)(struct arch *arch, const char *ins1,
					const char *ins2);
	struct		{
		/* Character that starts a trailing comment in an operand string. */
		char comment_char;
		/* When set, call targets whose name contains it are rejected. */
		char skip_functions_char;
	} objdump;
};

95 96 97 98 99 100 101 102
static struct ins_ops call_ops;
static struct ins_ops dec_ops;
static struct ins_ops jump_ops;
static struct ins_ops mov_ops;
static struct ins_ops nop_ops;
static struct ins_ops lock_ops;
static struct ins_ops ret_ops;

103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130
/*
 * Make room for 128 more entries in arch->instructions.
 *
 * When the table is still the statically defined one (non-NULL pointer with
 * nr_instructions_allocated == 0) it cannot be realloc()ed, so a fresh heap
 * table is allocated and the existing entries are copied over.
 *
 * Returns 0 on success, -1 on allocation failure (arch is left untouched).
 */
static int arch__grow_instructions(struct arch *arch)
{
	struct ins *new_instructions;
	size_t new_nr_allocated;

	if (arch->nr_instructions_allocated == 0 && arch->instructions) {
		new_nr_allocated = arch->nr_instructions + 128;
		new_instructions = calloc(new_nr_allocated, sizeof(struct ins));
		if (new_instructions == NULL)
			return -1;

		/* memcpy() takes a byte count, not an element count. */
		memcpy(new_instructions, arch->instructions,
		       arch->nr_instructions * sizeof(struct ins));
	} else {
		new_nr_allocated = arch->nr_instructions_allocated + 128;
		new_instructions = realloc(arch->instructions,
					   new_nr_allocated * sizeof(struct ins));
		if (new_instructions == NULL)
			return -1;
	}

	arch->instructions = new_instructions;
	arch->nr_instructions_allocated = new_nr_allocated;
	return 0;
}

131
static int arch__associate_ins_ops(struct arch* arch, const char *name, struct ins_ops *ops)
132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150
{
	struct ins *ins;

	if (arch->nr_instructions == arch->nr_instructions_allocated &&
	    arch__grow_instructions(arch))
		return -1;

	ins = &arch->instructions[arch->nr_instructions];
	ins->name = strdup(name);
	if (!ins->name)
		return -1;

	ins->ops  = ops;
	arch->nr_instructions++;

	ins__sort(arch);
	return 0;
}

151
#include "arch/arc/annotate/instructions.c"
152
#include "arch/arm/annotate/instructions.c"
K
Kim Phillips 已提交
153
#include "arch/arm64/annotate/instructions.c"
M
Mao Han 已提交
154
#include "arch/csky/annotate/instructions.c"
155
#include "arch/x86/annotate/instructions.c"
156
#include "arch/powerpc/annotate/instructions.c"
157
#include "arch/s390/annotate/instructions.c"
D
David Miller 已提交
158
#include "arch/sparc/annotate/instructions.c"
159

160
static struct arch architectures[] = {
161 162 163 164
	{
		.name = "arc",
		.init = arc__annotate_init,
	},
165 166
	{
		.name = "arm",
167
		.init = arm__annotate_init,
168
	},
K
Kim Phillips 已提交
169 170 171 172
	{
		.name = "arm64",
		.init = arm64__annotate_init,
	},
M
Mao Han 已提交
173 174 175 176
	{
		.name = "csky",
		.init = csky__annotate_init,
	},
177 178
	{
		.name = "x86",
179
		.init = x86__annotate_init,
180 181
		.instructions = x86__instructions,
		.nr_instructions = ARRAY_SIZE(x86__instructions),
182
		.ins_is_fused = x86__ins_is_fused,
183 184 185 186
		.objdump =  {
			.comment_char = '#',
		},
	},
187 188 189 190
	{
		.name = "powerpc",
		.init = powerpc__annotate_init,
	},
191 192
	{
		.name = "s390",
193
		.init = s390__annotate_init,
194 195 196 197
		.objdump =  {
			.comment_char = '#',
		},
	},
D
David Miller 已提交
198 199 200 201 202 203 204
	{
		.name = "sparc",
		.init = sparc__annotate_init,
		.objdump = {
			.comment_char = '#',
		},
	},
205 206
};

207 208
/*
 * Release the strings owned by a parsed operand set. The ins_operands
 * structure itself is not freed. A NULL @ops is a no-op.
 */
static void ins__delete(struct ins_operands *ops)
{
	if (ops == NULL)
		return;

	zfree(&ops->source.raw);
	zfree(&ops->source.name);
	zfree(&ops->target.raw);
	zfree(&ops->target.name);
}

217
static int ins__raw_scnprintf(struct ins *ins, char *bf, size_t size,
218
			      struct ins_operands *ops, int max_ins_name)
219
{
220
	return scnprintf(bf, size, "%-*s %s", max_ins_name, ins->name, ops->raw);
221 222 223
}

int ins__scnprintf(struct ins *ins, char *bf, size_t size,
224
		   struct ins_operands *ops, int max_ins_name)
225 226
{
	if (ins->ops->scnprintf)
227
		return ins->ops->scnprintf(ins, bf, size, ops, max_ins_name);
228

229
	return ins__raw_scnprintf(ins, bf, size, ops, max_ins_name);
230 231
}

232 233 234 235 236 237 238 239
/*
 * Ask the architecture whether @ins1 and @ins2 are fused. Returns false when
 * @arch is NULL or does not implement the ins_is_fused hook.
 */
bool ins__is_fused(struct arch *arch, const char *ins1, const char *ins2)
{
	if (arch && arch->ins_is_fused)
		return arch->ins_is_fused(arch, ins1, ins2);

	return false;
}

240
static int call__parse(struct arch *arch, struct ins_operands *ops, struct map_symbol *ms)
241
{
242
	char *endptr, *tok, *name;
243
	struct map *map = ms->map;
244
	struct addr_map_symbol target = {
245
		.ms = { .map = map, },
246
	};
247

248
	ops->target.addr = strtoull(ops->raw, &endptr, 16);
249 250 251 252 253 254 255

	name = strchr(endptr, '<');
	if (name == NULL)
		goto indirect_call;

	name++;

256 257
	if (arch->objdump.skip_functions_char &&
	    strchr(name, arch->objdump.skip_functions_char))
R
Russell King 已提交
258 259
		return -1;

260 261 262 263 264
	tok = strchr(name, '>');
	if (tok == NULL)
		return -1;

	*tok = '\0';
265
	ops->target.name = strdup(name);
266 267
	*tok = '>';

268 269 270 271
	if (ops->target.name == NULL)
		return -1;
find_target:
	target.addr = map__objdump_2mem(map, ops->target.addr);
272

273
	if (maps__find_ams(ms->maps, &target) == 0 &&
274 275
	    map__rip_2objdump(target.ms.map, map->map_ip(target.ms.map, target.addr)) == ops->target.addr)
		ops->target.sym = target.ms.sym;
276

277
	return 0;
278 279 280

indirect_call:
	tok = strchr(endptr, '*');
281 282 283 284 285 286 287 288
	if (tok != NULL) {
		endptr++;

		/* Indirect call can use a non-rip register and offset: callq  *0x8(%rbx).
		 * Do not parse such instruction.  */
		if (strstr(endptr, "(%r") == NULL)
			ops->target.addr = strtoull(endptr, NULL, 16);
	}
289
	goto find_target;
290 291
}

292
static int call__scnprintf(struct ins *ins, char *bf, size_t size,
293
			   struct ins_operands *ops, int max_ins_name)
294
{
295
	if (ops->target.sym)
296
		return scnprintf(bf, size, "%-*s %s", max_ins_name, ins->name, ops->target.sym->name);
297

298
	if (ops->target.addr == 0)
299
		return ins__raw_scnprintf(ins, bf, size, ops, max_ins_name);
300

301
	if (ops->target.name)
302
		return scnprintf(bf, size, "%-*s %s", max_ins_name, ins->name, ops->target.name);
303

304
	return scnprintf(bf, size, "%-*s *%" PRIx64, max_ins_name, ins->name, ops->target.addr);
305 306
}

307
static struct ins_ops call_ops = {
308 309
	.parse	   = call__parse,
	.scnprintf = call__scnprintf,
310 311 312 313
};

bool ins__is_call(const struct ins *ins)
{
314
	return ins->ops == &call_ops || ins->ops == &s390_call_ops;
315 316
}

317 318 319 320 321 322 323 324 325 326 327 328 329
/*
 * Reject a comma that lies inside the trailing comment of the operand string,
 * so that it is not mistaken for an operand separator, e.g.:
 * ffff200008446e70:       b.cs    ffff2000084470f4 <generic_exec_single+0x314>  // b.hs, b.nlast
 *
 * Returns @c unchanged, or NULL when @c is past ops->raw_comment.
 */
static inline const char *validate_comma(const char *c, struct ins_operands *ops)
{
	const bool in_comment = ops->raw_comment && c > ops->raw_comment;

	return in_comment ? NULL : c;
}

static int jump__parse(struct arch *arch, struct ins_operands *ops, struct map_symbol *ms)
330
{
331 332 333
	struct map *map = ms->map;
	struct symbol *sym = ms->sym;
	struct addr_map_symbol target = {
334
		.ms = { .map = map, },
335
	};
336
	const char *c = strchr(ops->raw, ',');
337
	u64 start, end;
338 339 340 341

	ops->raw_comment = strchr(ops->raw, arch->objdump.comment_char);
	c = validate_comma(c, ops);

342 343 344 345 346 347 348 349 350 351 352
	/*
	 * Examples of lines to parse for the _cpp_lex_token@@Base
	 * function:
	 *
	 * 1159e6c: jne    115aa32 <_cpp_lex_token@@Base+0xf92>
	 * 1159e8b: jne    c469be <cpp_named_operator2name@@Base+0xa72>
	 *
	 * The first is a jump to an offset inside the same function,
	 * the second is to another function, i.e. that 0xa72 is an
	 * offset in the cpp_named_operator2name@@base function.
	 */
353 354 355 356 357
	/*
	 * skip over possible up to 2 operands to get to address, e.g.:
	 * tbnz	 w0, #26, ffff0000083cd190 <security_file_permission+0xd0>
	 */
	if (c++ != NULL) {
358
		ops->target.addr = strtoull(c, NULL, 16);
359 360
		if (!ops->target.addr) {
			c = strchr(c, ',');
361
			c = validate_comma(c, ops);
362 363 364 365
			if (c++ != NULL)
				ops->target.addr = strtoull(c, NULL, 16);
		}
	} else {
366
		ops->target.addr = strtoull(ops->raw, NULL, 16);
367
	}
368

369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391
	target.addr = map__objdump_2mem(map, ops->target.addr);
	start = map->unmap_ip(map, sym->start),
	end = map->unmap_ip(map, sym->end);

	ops->target.outside = target.addr < start || target.addr > end;

	/*
	 * FIXME: things like this in _cpp_lex_token (gcc's cc1 program):

		cpp_named_operator2name@@Base+0xa72

	 * Point to a place that is after the cpp_named_operator2name
	 * boundaries, i.e.  in the ELF symbol table for cc1
	 * cpp_named_operator2name is marked as being 32-bytes long, but it in
	 * fact is much larger than that, so we seem to need a symbols__find()
	 * routine that looks for >= current->start and  < next_symbol->start,
	 * possibly just for C++ objects?
	 *
	 * For now lets just make some progress by marking jumps to outside the
	 * current function as call like.
	 *
	 * Actual navigation will come next, with further understanding of how
	 * the symbol searching and disassembly should be done.
392
	 */
393
	if (maps__find_ams(ms->maps, &target) == 0 &&
394 395
	    map__rip_2objdump(target.ms.map, map->map_ip(target.ms.map, target.addr)) == ops->target.addr)
		ops->target.sym = target.ms.sym;
396

397 398
	if (!ops->target.outside) {
		ops->target.offset = target.addr - start;
399 400 401 402
		ops->target.offset_avail = true;
	} else {
		ops->target.offset_avail = false;
	}
403 404 405 406

	return 0;
}

407
static int jump__scnprintf(struct ins *ins, char *bf, size_t size,
408
			   struct ins_operands *ops, int max_ins_name)
409
{
410
	const char *c;
411

412
	if (!ops->target.addr || ops->target.offset < 0)
413
		return ins__raw_scnprintf(ins, bf, size, ops, max_ins_name);
414

415
	if (ops->target.outside && ops->target.sym != NULL)
416
		return scnprintf(bf, size, "%-*s %s", max_ins_name, ins->name, ops->target.sym->name);
417

418
	c = strchr(ops->raw, ',');
419 420
	c = validate_comma(c, ops);

421 422 423
	if (c != NULL) {
		const char *c2 = strchr(c + 1, ',');

424
		c2 = validate_comma(c2, ops);
425 426 427 428 429 430 431 432 433 434
		/* check for 3-op insn */
		if (c2 != NULL)
			c = c2;
		c++;

		/* mirror arch objdump's space-after-comma style */
		if (*c == ' ')
			c++;
	}

435
	return scnprintf(bf, size, "%-*s %.*s%" PRIx64, max_ins_name,
436 437
			 ins->name, c ? c - ops->raw : 0, ops->raw,
			 ops->target.offset);
438 439
}

440
static struct ins_ops jump_ops = {
441 442
	.parse	   = jump__parse,
	.scnprintf = jump__scnprintf,
443 444 445 446 447 448 449
};

/* True when @ins is handled by jump_ops. */
bool ins__is_jump(const struct ins *ins)
{
	const struct ins_ops *ops = ins->ops;

	return ops == &jump_ops;
}

450 451 452 453 454 455 456 457
/*
 * For a "(%rip)"-relative operand @raw, extract the address and the "<name>"
 * that follow in the @comment text.
 *
 * *addrp is written as soon as @raw contains "(%rip)"; *namep receives a
 * strdup()ed copy of the name when a complete "<...>" pair is present.
 * Returns -1 only when an address was parsed but no '<' follows it, and 0 in
 * every other case (including when nothing was extracted).
 */
static int comment__symbol(char *raw, char *comment, u64 *addrp, char **namep)
{
	char *endptr, *name, *t;

	if (strstr(raw, "(%rip)") == NULL)
		return 0;

	*addrp = strtoull(comment, &endptr, 16);
	if (endptr == comment)
		return 0;

	name = strchr(endptr, '<');
	if (name == NULL)
		return -1;

	name++;

	t = strchr(name, '>');
	if (t == NULL)
		return 0;

	/* Temporarily terminate at '>' to duplicate just the name. */
	*t = '\0';
	*namep = strdup(name);
	*t = '>';

	return 0;
}

477
static int lock__parse(struct arch *arch, struct ins_operands *ops, struct map_symbol *ms)
478 479 480 481 482
{
	ops->locked.ops = zalloc(sizeof(*ops->locked.ops));
	if (ops->locked.ops == NULL)
		return 0;

483
	if (disasm_line__parse(ops->raw, &ops->locked.ins.name, &ops->locked.ops->raw) < 0)
484 485
		goto out_free_ops;

486
	ops->locked.ins.ops = ins__find(arch, ops->locked.ins.name);
487

488
	if (ops->locked.ins.ops == NULL)
N
Namhyung Kim 已提交
489
		goto out_free_ops;
490

491
	if (ops->locked.ins.ops->parse &&
492
	    ops->locked.ins.ops->parse(arch, ops->locked.ops, ms) < 0)
493
		goto out_free_ops;
494 495 496 497

	return 0;

out_free_ops:
498
	zfree(&ops->locked.ops);
499 500 501 502
	return 0;
}

static int lock__scnprintf(struct ins *ins, char *bf, size_t size,
503
			   struct ins_operands *ops, int max_ins_name)
504 505 506
{
	int printed;

507
	if (ops->locked.ins.ops == NULL)
508
		return ins__raw_scnprintf(ins, bf, size, ops, max_ins_name);
509

510
	printed = scnprintf(bf, size, "%-*s ", max_ins_name, ins->name);
511
	return printed + ins__scnprintf(&ops->locked.ins, bf + printed,
512
					size - printed, ops->locked.ops, max_ins_name);
513 514
}

515 516
static void lock__delete(struct ins_operands *ops)
{
517
	struct ins *ins = &ops->locked.ins;
518

519
	if (ins->ops && ins->ops->free)
520 521 522 523
		ins->ops->free(ops->locked.ops);
	else
		ins__delete(ops->locked.ops);

524 525 526
	zfree(&ops->locked.ops);
	zfree(&ops->target.raw);
	zfree(&ops->target.name);
527 528
}

529
static struct ins_ops lock_ops = {
530
	.free	   = lock__delete,
531 532 533 534
	.parse	   = lock__parse,
	.scnprintf = lock__scnprintf,
};

535
/*
 * Split a two-operand "source,target" string.
 *
 * ops->source.raw receives the text before the first comma and
 * ops->target.raw the text after it, with any trailing comment and the
 * whitespace in front of it removed. When a comment is present it is also
 * scanned for the symbol behind a "(%rip)" operand on either side.
 *
 * Returns 0 on success, -1 when there is no comma or an allocation fails.
 */
static int mov__parse(struct arch *arch, struct ins_operands *ops, struct map_symbol *ms __maybe_unused)
{
	char *s = strchr(ops->raw, ','), *target, *comment, prev;

	if (s == NULL)
		return -1;

	/* Temporarily cut at the comma to duplicate the source operand. */
	*s = '\0';
	ops->source.raw = strdup(ops->raw);
	*s = ',';

	if (ops->source.raw == NULL)
		return -1;

	target = ++s;
	comment = strchr(s, arch->objdump.comment_char);

	/* Start from the last character before the comment, or of the string. */
	if (comment != NULL)
		s = comment - 1;
	else
		s = strchr(s, '\0') - 1;

	/* Back up over trailing whitespace, then step one past the operand. */
	while (s > target && isspace(s[0]))
		--s;
	s++;
	prev = *s;
	*s = '\0';

	ops->target.raw = strdup(target);
	*s = prev;

	if (ops->target.raw == NULL)
		goto out_free_source;

	if (comment == NULL)
		return 0;

	comment = skip_spaces(comment);
	comment__symbol(ops->source.raw, comment + 1, &ops->source.addr, &ops->source.name);
	comment__symbol(ops->target.raw, comment + 1, &ops->target.addr, &ops->target.name);

	return 0;

out_free_source:
	zfree(&ops->source.raw);
	return -1;
}

static int mov__scnprintf(struct ins *ins, char *bf, size_t size,
584
			   struct ins_operands *ops, int max_ins_name)
585
{
586
	return scnprintf(bf, size, "%-*s %s,%s", max_ins_name, ins->name,
587 588 589 590 591 592 593 594 595
			 ops->source.name ?: ops->source.raw,
			 ops->target.name ?: ops->target.raw);
}

/* Operations for two-operand (source,target) instructions. */
static struct ins_ops mov_ops = {
	.scnprintf = mov__scnprintf,
	.parse	   = mov__parse,
};

596
/*
 * Parse a single-operand instruction: the first whitespace-delimited token of
 * ops->raw is duplicated into ops->target.raw and, when a comment follows, it
 * is scanned for the symbol behind a "(%rip)" operand.
 *
 * Returns 0 on success, -1 on allocation failure.
 */
static int dec__parse(struct arch *arch __maybe_unused, struct ins_operands *ops, struct map_symbol *ms __maybe_unused)
{
	char *target, *comment, *s, prev;

	target = s = ops->raw;

	/* Find the end of the first token. */
	while (s[0] != '\0' && !isspace(s[0]))
		++s;
	prev = *s;
	*s = '\0';

	ops->target.raw = strdup(target);
	*s = prev;

	if (ops->target.raw == NULL)
		return -1;

	comment = strchr(s, arch->objdump.comment_char);
	if (comment == NULL)
		return 0;

	comment = skip_spaces(comment);
	comment__symbol(ops->target.raw, comment + 1, &ops->target.addr, &ops->target.name);

	return 0;
}

static int dec__scnprintf(struct ins *ins, char *bf, size_t size,
624
			   struct ins_operands *ops, int max_ins_name)
625
{
626
	return scnprintf(bf, size, "%-*s %s", max_ins_name, ins->name,
627 628 629 630 631 632 633 634
			 ops->target.name ?: ops->target.raw);
}

/* Operations for single-operand instructions. */
static struct ins_ops dec_ops = {
	.scnprintf = dec__scnprintf,
	.parse	   = dec__parse,
};

635
/*
 * Format any instruction handled by nop_ops as a plain "nop", padded to
 * @max_ins_name columns; the actual mnemonic and operands are ignored.
 */
static int nop__scnprintf(struct ins *ins __maybe_unused, char *bf, size_t size,
			  struct ins_operands *ops __maybe_unused, int max_ins_name)
{
	return scnprintf(bf, size, "%-*s", max_ins_name, "nop");
}

/* Operations for nop instructions: formatting only, nothing to parse. */
static struct ins_ops nop_ops = { .scnprintf = nop__scnprintf, };

645 646 647 648 649 650 651 652 653
/* Operations for return instructions: printed raw, nothing to parse. */
static struct ins_ops ret_ops = { .scnprintf = ins__raw_scnprintf, };

/* True when @ins is handled by ret_ops. */
bool ins__is_ret(const struct ins *ins)
{
	const struct ins_ops *ops = ins->ops;

	return ops == &ret_ops;
}

654 655 656 657 658
/* True when @ins is handled by lock_ops. */
bool ins__is_lock(const struct ins *ins)
{
	const struct ins_ops *ops = ins->ops;

	return ops == &lock_ops;
}

659
static int ins__key_cmp(const void *name, const void *insp)
660 661 662 663 664 665
{
	const struct ins *ins = insp;

	return strcmp(name, ins->name);
}

666 667 668 669 670 671 672 673
/* qsort() comparator ordering struct ins entries by mnemonic. */
static int ins__cmp(const void *a, const void *b)
{
	const char *name_a = ((const struct ins *)a)->name;
	const char *name_b = ((const struct ins *)b)->name;

	return strcmp(name_a, name_b);
}

674
static void ins__sort(struct arch *arch)
675
{
676
	const int nmemb = arch->nr_instructions;
677

678
	qsort(arch->instructions, nmemb, sizeof(struct ins), ins__cmp);
679 680
}

681
static struct ins_ops *__ins__find(struct arch *arch, const char *name)
682
{
683
	struct ins *ins;
684
	const int nmemb = arch->nr_instructions;
685

686 687 688
	if (!arch->sorted_instructions) {
		ins__sort(arch);
		arch->sorted_instructions = true;
689
	}
690

691 692
	ins = bsearch(name, arch->instructions, nmemb, sizeof(struct ins), ins__key_cmp);
	return ins ? ins->ops : NULL;
693 694
}

695 696 697 698 699 700 701 702 703 704
/*
 * Find the ops for mnemonic @name: first in the instruction table, then via
 * the architecture's associate_instruction_ops hook when it has one.
 * Returns NULL when neither knows the instruction.
 */
static struct ins_ops *ins__find(struct arch *arch, const char *name)
{
	struct ins_ops *found = __ins__find(arch, name);

	if (found != NULL || arch->associate_instruction_ops == NULL)
		return found;

	return arch->associate_instruction_ops(arch, name);
}

705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721 722 723 724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739
/* bsearch() comparator: @name is the key string, @archp a struct arch entry. */
static int arch__key_cmp(const void *name, const void *archp)
{
	const char *arch_name = ((const struct arch *)archp)->name;

	return strcmp(name, arch_name);
}

/* qsort() comparator ordering struct arch entries by name. */
static int arch__cmp(const void *a, const void *b)
{
	const char *name_a = ((const struct arch *)a)->name;
	const char *name_b = ((const struct arch *)b)->name;

	return strcmp(name_a, name_b);
}

/* Sort the architectures[] table by name so that it can be bsearch()ed. */
static void arch__sort(void)
{
	qsort(architectures, ARRAY_SIZE(architectures),
	      sizeof(architectures[0]), arch__cmp);
}

/*
 * Return the architectures[] entry called @name, or NULL. The table is
 * sorted once, on the first call.
 */
static struct arch *arch__find(const char *name)
{
	static bool sorted;

	if (!sorted) {
		arch__sort();
		sorted = true;
	}

	return bsearch(name, architectures, ARRAY_SIZE(architectures),
		       sizeof(architectures[0]), arch__key_cmp);
}

740 741 742 743 744 745 746 747 748 749
/*
 * Allocate a zeroed annotated_source with an empty ->source list.
 * Returns NULL on allocation failure.
 */
static struct annotated_source *annotated_source__new(void)
{
	struct annotated_source *src = zalloc(sizeof(*src));

	if (src == NULL)
		return NULL;

	INIT_LIST_HEAD(&src->source);
	return src;
}

750
static __maybe_unused void annotated_source__delete(struct annotated_source *src)
751 752 753 754 755 756 757 758
{
	if (src == NULL)
		return;
	zfree(&src->histograms);
	zfree(&src->cycles_hist);
	free(src);
}

759 760
static int annotated_source__alloc_histograms(struct annotated_source *src,
					      size_t size, int nr_hists)
761
{
762 763
	size_t sizeof_sym_hist;

764 765 766 767 768 769 770 771 772 773
	/*
	 * Add buffer of one element for zero length symbol.
	 * When sample is taken from first instruction of
	 * zero length symbol, perf still resolves it and
	 * shows symbol name in perf report and allows to
	 * annotate it.
	 */
	if (size == 0)
		size = 1;

774
	/* Check for overflow when calculating sizeof_sym_hist */
775
	if (size > (SIZE_MAX - sizeof(struct sym_hist)) / sizeof(struct sym_hist_entry))
776 777
		return -1;

778
	sizeof_sym_hist = (sizeof(struct sym_hist) + size * sizeof(struct sym_hist_entry));
779 780

	/* Check for overflow in zalloc argument */
781
	if (sizeof_sym_hist > SIZE_MAX / nr_hists)
782
		return -1;
783

784 785 786 787 788 789
	src->sizeof_sym_hist = sizeof_sym_hist;
	src->nr_histograms   = nr_hists;
	src->histograms	     = calloc(nr_hists, sizeof_sym_hist) ;
	return src->histograms ? 0 : -1;
}

790 791 792 793 794 795 796 797 798 799 800 801
/*
 * Allocate the (lazily created) cycles histogram of @sym, one zeroed
 * cyc_hist per byte of the symbol. notes->src must already exist.
 * Returns 0 on success, -1 on allocation failure.
 */
static int symbol__alloc_hist_cycles(struct symbol *sym)
{
	struct annotation *notes = symbol__annotation(sym);
	const size_t size = symbol__size(sym);

	notes->src->cycles_hist = calloc(size, sizeof(struct cyc_hist));

	return notes->src->cycles_hist != NULL ? 0 : -1;
}

802 803 804 805
void symbol__annotate_zero_histograms(struct symbol *sym)
{
	struct annotation *notes = symbol__annotation(sym);

806
	pthread_mutex_lock(&notes->lock);
807
	if (notes->src != NULL) {
808 809
		memset(notes->src->histograms, 0,
		       notes->src->nr_histograms * notes->src->sizeof_sym_hist);
810 811 812 813
		if (notes->src->cycles_hist)
			memset(notes->src->cycles_hist, 0,
				symbol__size(sym) * sizeof(struct cyc_hist));
	}
814
	pthread_mutex_unlock(&notes->lock);
815 816
}

817
static int __symbol__account_cycles(struct cyc_hist *ch,
818 819 820 821 822 823 824 825 826 827 828 829 830 831 832
				    u64 start,
				    unsigned offset, unsigned cycles,
				    unsigned have_start)
{
	/*
	 * For now we can only account one basic block per
	 * final jump. But multiple could be overlapping.
	 * Always account the longest one. So when
	 * a shorter one has been already seen throw it away.
	 *
	 * We separately always account the full cycles.
	 */
	ch[offset].num_aggr++;
	ch[offset].cycles_aggr += cycles;

833 834 835 836 837 838 839 840 841
	if (cycles > ch[offset].cycles_max)
		ch[offset].cycles_max = cycles;

	if (ch[offset].cycles_min) {
		if (cycles && cycles < ch[offset].cycles_min)
			ch[offset].cycles_min = cycles;
	} else
		ch[offset].cycles_min = cycles;

842 843 844 845 846 847 848 849 850 851 852 853 854 855
	if (!have_start && ch[offset].have_start)
		return 0;
	if (ch[offset].num) {
		if (have_start && (!ch[offset].have_start ||
				   ch[offset].start > start)) {
			ch[offset].have_start = 0;
			ch[offset].cycles = 0;
			ch[offset].num = 0;
			if (ch[offset].reset < 0xffff)
				ch[offset].reset++;
		} else if (have_start &&
			   ch[offset].start < start)
			return 0;
	}
J
Jin Yao 已提交
856 857 858 859

	if (ch[offset].num < NUM_SPARKS)
		ch[offset].cycles_spark[ch[offset].num] = cycles;

860 861 862 863 864 865 866
	ch[offset].have_start = have_start;
	ch[offset].start = start;
	ch[offset].cycles += cycles;
	ch[offset].num++;
	return 0;
}

867
/*
 * Account one sample at @addr in the histogram of event @evidx.
 *
 * Returns 0 on success, -ERANGE when @addr is outside the symbol (an address
 * equal to the end of a zero-length symbol is accepted), and -ENOMEM when no
 * histogram is available for @evidx.
 */
static int __symbol__inc_addr_samples(struct map_symbol *ms,
				      struct annotated_source *src, int evidx, u64 addr,
				      struct perf_sample *sample)
{
	struct symbol *sym = ms->sym;
	unsigned offset;
	struct sym_hist *h;

	pr_debug3("%s: addr=%#" PRIx64 "\n", __func__, ms->map->unmap_ip(ms->map, addr));

	if ((addr < sym->start || addr >= sym->end) &&
	    (addr != sym->end || sym->start != sym->end)) {
		pr_debug("%s(%d): ERANGE! sym->name=%s, start=%#" PRIx64 ", addr=%#" PRIx64 ", end=%#" PRIx64 "\n",
		       __func__, __LINE__, sym->name, sym->start, addr, sym->end);
		return -ERANGE;
	}

	offset = addr - sym->start;
	h = annotated_source__histogram(src, evidx);
	if (h == NULL) {
		pr_debug("%s(%d): ENOMEM! sym->name=%s, start=%#" PRIx64 ", addr=%#" PRIx64 ", end=%#" PRIx64 ", func: %d\n",
			 __func__, __LINE__, sym->name, sym->start, addr, sym->end, sym->type == STT_FUNC);
		return -ENOMEM;
	}

	/* Update both the whole-symbol totals and the per-offset entry. */
	h->nr_samples++;
	h->addr[offset].nr_samples++;
	h->period += sample->period;
	h->addr[offset].period += sample->period;

	pr_debug3("%#" PRIx64 " %s: period++ [addr: %#" PRIx64 ", %#" PRIx64
		  ", evidx=%d] => nr_samples: %" PRIu64 ", period: %" PRIu64 "\n",
		  sym->start, sym->name, addr, addr - sym->start, evidx,
		  h->addr[offset].nr_samples, h->addr[offset].period);
	return 0;
}

903
static struct cyc_hist *symbol__cycles_hist(struct symbol *sym)
904 905 906 907
{
	struct annotation *notes = symbol__annotation(sym);

	if (notes->src == NULL) {
908 909
		notes->src = annotated_source__new();
		if (notes->src == NULL)
910
			return NULL;
911
		goto alloc_cycles_hist;
912
	}
913 914 915 916

	if (!notes->src->cycles_hist) {
alloc_cycles_hist:
		symbol__alloc_hist_cycles(sym);
917
	}
918 919

	return notes->src->cycles_hist;
920 921
}

922
struct annotated_source *symbol__hists(struct symbol *sym, int nr_hists)
923 924 925 926 927 928 929 930 931 932 933 934 935
{
	struct annotation *notes = symbol__annotation(sym);

	if (notes->src == NULL) {
		notes->src = annotated_source__new();
		if (notes->src == NULL)
			return NULL;
		goto alloc_histograms;
	}

	if (notes->src->histograms == NULL) {
alloc_histograms:
		annotated_source__alloc_histograms(notes->src, symbol__size(sym),
936
						   nr_hists);
937 938 939 940 941
	}

	return notes->src;
}

942
/*
 * Account one sample at @addr for @evsel in the histograms of ms->sym.
 * Returns 0 when there is no symbol or no annotated_source can be obtained,
 * otherwise the result of __symbol__inc_addr_samples().
 */
static int symbol__inc_addr_samples(struct map_symbol *ms,
				    struct evsel *evsel, u64 addr,
				    struct perf_sample *sample)
{
	struct symbol *sym = ms->sym;
	struct annotated_source *src;

	if (sym == NULL)
		return 0;

	src = symbol__hists(sym, evsel->evlist->core.nr_entries);
	if (src == NULL)
		return 0;

	return __symbol__inc_addr_samples(ms, src, evsel->idx, addr, sample);
}

955 956 957
/*
 * Account @cycles for the basic block [@start, @addr] of @sym.
 *
 * A @start of 0, or one that is not below @addr, means "no start known".
 * Returns 0 when @sym is NULL, -ENOMEM when the cycles histogram cannot be
 * obtained, -ERANGE when @addr or a non-zero @start lies outside the symbol,
 * otherwise the result of __symbol__account_cycles().
 */
static int symbol__account_cycles(u64 addr, u64 start,
				  struct symbol *sym, unsigned cycles)
{
	struct cyc_hist *cycles_hist;
	unsigned offset;

	if (sym == NULL)
		return 0;
	cycles_hist = symbol__cycles_hist(sym);
	if (cycles_hist == NULL)
		return -ENOMEM;
	if (addr < sym->start || addr >= sym->end)
		return -ERANGE;

	if (start) {
		if (start < sym->start || start >= sym->end)
			return -ERANGE;
		if (start >= addr)
			start = 0;
	}
	offset = addr - sym->start;
	return __symbol__account_cycles(cycles_hist,
					start ? start - sym->start : 0,
					offset, cycles,
					!!start);
}

int addr_map_symbol__account_cycles(struct addr_map_symbol *ams,
				    struct addr_map_symbol *start,
				    unsigned cycles)
{
986
	u64 saddr = 0;
987 988 989 990 991 992 993 994 995 996 997 998 999
	int err;

	if (!cycles)
		return 0;

	/*
	 * Only set start when IPC can be computed. We can only
	 * compute it when the basic block is completely in a single
	 * function.
	 * Special case the case when the jump is elsewhere, but
	 * it starts on the function start.
	 */
	if (start &&
1000 1001 1002
		(start->ms.sym == ams->ms.sym ||
		 (ams->ms.sym &&
		   start->addr == ams->ms.sym->start + ams->ms.map->start)))
1003 1004
		saddr = start->al_addr;
	if (saddr == 0)
1005
		pr_debug2("BB with bad start: addr %"PRIx64" start %"PRIx64" sym %"PRIx64" saddr %"PRIx64"\n",
1006 1007
			ams->addr,
			start ? start->addr : 0,
1008
			ams->ms.sym ? ams->ms.sym->start + ams->ms.map->start : 0,
1009
			saddr);
1010
	err = symbol__account_cycles(ams->al_addr, saddr, ams->ms.sym, cycles);
1011 1012 1013 1014 1015
	if (err)
		pr_debug2("account_cycles failed %d\n", err);
	return err;
}

1016 1017 1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029 1030
/*
 * Count the offsets in the inclusive range [@start, @end] that have an
 * entry in notes->offsets[].
 */
static unsigned annotation__count_insn(struct annotation *notes, u64 start, u64 end)
{
	unsigned count = 0;
	u64 pos = start;

	while (pos <= end) {
		if (notes->offsets[pos])
			count++;
		pos++;
	}

	return count;
}

/*
 * Compute the IPC of the basic block [@start, @end] from @ch and store it in
 * every line of the block that has no IPC yet. When at least one line was
 * filled, the block is added to the hit_cycles, hit_insn and cover_insn
 * totals in @notes.
 */
static void annotation__count_and_fill(struct annotation *notes, u64 start, u64 end, struct cyc_hist *ch)
{
	unsigned n_insn;
	unsigned int cover_insn = 0;
	u64 offset;
	float ipc;

	n_insn = annotation__count_insn(notes, start, end);
	if (!n_insn || !ch->num || !ch->cycles)
		return;

	/* Instructions divided by the average cycles per execution. */
	ipc = n_insn / ((double)ch->cycles / (double)ch->num);

	/* Hide data when there are too many overlaps. */
	if (ch->reset >= 0x7fff)
		return;

	for (offset = start; offset <= end; offset++) {
		struct annotation_line *al = notes->offsets[offset];

		if (al && al->ipc == 0.0) {
			al->ipc = ipc;
			cover_insn++;
		}
	}

	if (cover_insn) {
		notes->hit_cycles += ch->cycles;
		notes->hit_insn += n_insn * ch->num;
		notes->cover_insn += cover_insn;
	}
}

void annotation__compute_ipc(struct annotation *notes, size_t size)
{
1061
	s64 offset;
1062 1063 1064 1065

	if (!notes->src || !notes->src->cycles_hist)
		return;

1066 1067 1068 1069 1070
	notes->total_insn = annotation__count_insn(notes, 0, size - 1);
	notes->hit_cycles = 0;
	notes->hit_insn = 0;
	notes->cover_insn = 0;

1071
	pthread_mutex_lock(&notes->lock);
1072
	for (offset = size - 1; offset >= 0; --offset) {
1073 1074 1075 1076 1077 1078 1079 1080 1081
		struct cyc_hist *ch;

		ch = &notes->src->cycles_hist[offset];
		if (ch && ch->cycles) {
			struct annotation_line *al;

			if (ch->have_start)
				annotation__count_and_fill(notes, ch->start, offset, ch);
			al = notes->offsets[offset];
1082
			if (al && ch->num_aggr) {
1083
				al->cycles = ch->cycles_aggr / ch->num_aggr;
1084 1085 1086
				al->cycles_max = ch->cycles_max;
				al->cycles_min = ch->cycles_min;
			}
1087 1088 1089 1090 1091 1092
			notes->have_cycles = true;
		}
	}
	pthread_mutex_unlock(&notes->lock);
}

1093
int addr_map_symbol__inc_samples(struct addr_map_symbol *ams, struct perf_sample *sample,
1094
				 struct evsel *evsel)
1095
{
1096
	return symbol__inc_addr_samples(&ams->ms, evsel, ams->al_addr, sample);
1097 1098
}

1099
/* Account @sample for @evsel at address @ip in the symbol of hist entry @he. */
int hist_entry__inc_addr_samples(struct hist_entry *he, struct perf_sample *sample,
				 struct evsel *evsel, u64 ip)
{
	return symbol__inc_addr_samples(&he->ms, evsel, ip, sample);
}

1105
static void disasm_line__init_ins(struct disasm_line *dl, struct arch *arch, struct map_symbol *ms)
1106
{
1107
	dl->ins.ops = ins__find(arch, dl->ins.name);
1108

1109
	if (!dl->ins.ops)
1110 1111
		return;

1112
	if (dl->ins.ops->parse && dl->ins.ops->parse(arch, &dl->ops, ms) < 0)
1113
		dl->ins.ops = NULL;
1114 1115
}

1116
/*
 * Split a disassembly @line into the instruction mnemonic and its operands.
 *
 * On success returns 0, stores a newly allocated copy of the mnemonic in
 * *@namep (owned by the caller) and points *@rawp at the trimmed operand
 * text inside @line.
 *
 * Returns -1 when @line holds only whitespace or when the mnemonic cannot be
 * duplicated. In the latter case *@namep is NULL, *@rawp is left untouched
 * and @line is restored to its original contents.
 */
static int disasm_line__parse(char *line, const char **namep, char **rawp)
{
	char saved, *end, *name = skip_spaces(line);

	if (name[0] == '\0')
		return -1;

	/* Find the end of the mnemonic. */
	end = name + 1;
	while (end[0] != '\0' && !isspace(end[0]))
		++end;

	/* Temporarily terminate the mnemonic so that it can be duplicated. */
	saved = end[0];
	end[0] = '\0';
	*namep = strdup(name);
	end[0] = saved;

	if (*namep == NULL)
		return -1;

	*rawp = strim(end);

	return 0;
}

1144
struct annotate_args {
1145 1146 1147
	struct arch		  *arch;
	struct map_symbol	  ms;
	struct evsel		  *evsel;
1148
	struct annotation_options *options;
1149 1150 1151
	s64			  offset;
	char			  *line;
	int			  line_nr;
1152 1153
};

1154 1155 1156
static void annotation_line__init(struct annotation_line *al,
				  struct annotate_args *args,
				  int nr)
1157
{
1158 1159 1160 1161 1162
	al->offset = args->offset;
	al->line = strdup(args->line);
	al->line_nr = args->line_nr;
	al->data_nr = nr;
}
1163

1164 1165
static void annotation_line__exit(struct annotation_line *al)
{
1166
	free_srcline(al->path);
1167 1168 1169
	zfree(&al->line);
}

1170
static size_t disasm_line_size(int nr)
1171 1172 1173
{
	struct annotation_line *al;

1174
	return (sizeof(struct disasm_line) + (sizeof(al->data[0]) * nr));
1175 1176 1177 1178 1179 1180
}

/*
 * Allocating the disasm annotation line data with
 * following structure:
 *
1181 1182 1183
 *    -------------------------------------------
 *    struct disasm_line | struct annotation_line
 *    -------------------------------------------
1184 1185 1186 1187
 *
 * We have 'struct annotation_line' member as last member
 * of 'struct disasm_line' to have an easy access.
 */
1188
static struct disasm_line *disasm_line__new(struct annotate_args *args)
1189
{
1190
	struct disasm_line *dl = NULL;
1191
	int nr = 1;
1192

1193
	if (evsel__is_group_event(args->evsel))
1194
		nr = args->evsel->core.nr_members;
1195

1196 1197 1198
	dl = zalloc(disasm_line_size(nr));
	if (!dl)
		return NULL;
1199

1200 1201 1202
	annotation_line__init(&dl->al, args, nr);
	if (dl->al.line == NULL)
		goto out_delete;
1203

1204 1205 1206 1207 1208
	if (args->offset != -1) {
		if (disasm_line__parse(dl->al.line, &dl->ins.name, &dl->ops.raw) < 0)
			goto out_free_line;

		disasm_line__init_ins(dl, args->arch, &args->ms);
1209 1210
	}

1211
	return dl;
1212 1213

out_free_line:
1214
	zfree(&dl->al.line);
1215
out_delete:
1216
	free(dl);
1217
	return NULL;
1218 1219
}

1220
void disasm_line__free(struct disasm_line *dl)
1221
{
1222 1223
	if (dl->ins.ops && dl->ins.ops->free)
		dl->ins.ops->free(&dl->ops);
1224 1225
	else
		ins__delete(&dl->ops);
1226
	zfree(&dl->ins.name);
1227 1228
	annotation_line__exit(&dl->al);
	free(dl);
1229 1230
}

1231
int disasm_line__scnprintf(struct disasm_line *dl, char *bf, size_t size, bool raw, int max_ins_name)
1232
{
1233
	if (raw || !dl->ins.ops)
1234
		return scnprintf(bf, size, "%-*s %s", max_ins_name, dl->ins.name, dl->ops.raw);
1235

1236
	return ins__scnprintf(&dl->ins, bf, size, &dl->ops, max_ins_name);
1237 1238
}

1239
static void annotation_line__add(struct annotation_line *al, struct list_head *head)
1240
{
1241
	list_add_tail(&al->node, head);
1242 1243
}

1244 1245
struct annotation_line *
annotation_line__next(struct annotation_line *pos, struct list_head *head)
1246
{
1247 1248
	list_for_each_entry_continue(pos, head, node)
		if (pos->offset >= 0)
1249 1250 1251 1252 1253
			return pos;

	return NULL;
}

1254 1255 1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295 1296 1297 1298 1299 1300 1301 1302 1303 1304 1305 1306 1307 1308 1309 1310 1311 1312 1313 1314 1315 1316 1317 1318 1319 1320 1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 1333 1334 1335
/* Pick the color of the address column from the coverage of @br. */
static const char *annotate__address_color(struct block_range *br)
{
	double cov = block_range__coverage(br);

	/* Negative coverage: use the default address color. */
	if (cov < 0)
		return PERF_COLOR_MAGENTA;

	/* mark red for >75% coverage */
	if (cov > 0.75)
		return PERF_COLOR_RED;

	/* mark dull for <1% coverage */
	if (cov < 0.01)
		return PERF_COLOR_NORMAL;

	return PERF_COLOR_MAGENTA;
}

/* Pick the color of the instruction text from the coverage of @br. */
static const char *annotate__asm_color(struct block_range *br)
{
	double cov = block_range__coverage(br);

	/* mark dull for <1% coverage */
	if (cov >= 0 && cov < 0.01)
		return PERF_COLOR_NORMAL;

	return PERF_COLOR_BLUE;
}

/*
 * Print the branch statistics of @br as a trailing "# ..." comment when
 * @addr is the start of a branch target and/or the end of a branch.
 * Percentages of 0.1% or less are not printed.
 */
static void annotate__branch_printf(struct block_range *br, u64 addr)
{
	bool emit_comment = true;

	if (!br)
		return;

	if (br->is_target && br->start == addr) {
		struct block_range *branch = br;

		/*
		 * Find matching branch to our target. block_range__next()
		 * returns NULL once the last range has been reached, so stop
		 * there instead of dereferencing it.
		 */
		while (branch && !branch->is_branch)
			branch = block_range__next(branch);

		if (branch) {
			double p = 100 *(double)br->entry / branch->coverage;

			if (p > 0.1) {
				if (emit_comment) {
					emit_comment = false;
					printf("\t#");
				}

				/*
				 * The percentage of coverage joined at this target in relation
				 * to the next branch.
				 */
				printf(" +%.2f%%", p);
			}
		}
	}

	if (br->is_branch && br->end == addr) {
		double p = 100*(double)br->taken / br->coverage;

		if (p > 0.1) {
			if (emit_comment) {
				emit_comment = false;
				printf("\t#");
			}

			/*
			 * The percentage of coverage leaving at this branch, and
			 * its prediction ratio.
			 */
			printf(" -%.2f%% (p:%.2f%%)", p, 100*(double)br->pred  / br->taken);
		}
	}
}

1336
/*
 * Print the address (@start plus the line offset), the disassembled text and
 * the branch statistics of @dl to stdout, colored by block range coverage.
 * Always returns 0.
 */
static int disasm_line__print(struct disasm_line *dl, u64 start, int addr_fmt_width)
{
	const u64 addr = start + dl->al.offset;
	struct block_range *br = block_range__find(addr);
	const char *addr_color = annotate__address_color(br);
	const char *asm_color = annotate__asm_color(br);

	color_fprintf(stdout, addr_color, "  %*" PRIx64 ":", addr_fmt_width, addr);
	color_fprintf(stdout, asm_color, "%s", dl->al.line);
	annotate__branch_printf(br, addr);

	return 0;
}

/*
 * Print one annotation line to stdout.
 *
 * Returns 0 when the line was printed, 1 when @max_lines is set and @printed
 * has already reached it, and -1 when the line was skipped: an instruction
 * whose highest percentage is below @min_pcnt, or a non-instruction line
 * while @queue is set.
 *
 * When an instruction line is printed and @queue is not NULL, the lines from
 * @queue up to (but excluding) @al are printed first.
 */
static int
annotation_line__print(struct annotation_line *al, struct symbol *sym, u64 start,
		       struct evsel *evsel, u64 len, int min_pcnt, int printed,
		       int max_lines, struct annotation_line *queue, int addr_fmt_width,
		       int percent_type)
{
	struct disasm_line *dl = container_of(al, struct disasm_line, al);
	static const char *prev_line;
	static const char *prev_color;
	bool limit_reached = max_lines && printed >= max_lines;
	struct annotation *notes;
	double max_percent = 0.0;
	const char *color;
	int i, nr_percent;

	/* Not an instruction: print the text with an empty percentage column. */
	if (al->offset == -1) {
		int width;

		if (limit_reached)
			return 1;

		if (queue)
			return -1;

		width = symbol_conf.show_total_period ? 12 : 8;
		if (evsel__is_group_event(evsel))
			width *= evsel->core.nr_members;

		if (al->line[0] == '\0')
			printf(" %*s:\n", width, " ");
		else
			printf(" %*s:     %*s %s\n", width, " ", addr_fmt_width, " ", al->line);

		return 0;
	}

	notes = symbol__annotation(sym);

	for (i = 0; i < al->data_nr; i++) {
		double percent = annotation_data__percent(&al->data[i], percent_type);

		if (percent > max_percent)
			max_percent = percent;
	}

	/* At least one percentage column is always printed. */
	nr_percent = al->data_nr > 1 ? al->data_nr : 1;

	if (max_percent < min_pcnt)
		return -1;

	if (limit_reached)
		return 1;

	if (queue != NULL) {
		list_for_each_entry_from(queue, &notes->src->source, node) {
			if (queue == al)
				break;
			annotation_line__print(queue, sym, start, evsel, len,
					       0, 0, 1, NULL, addr_fmt_width,
					       percent_type);
		}
	}

	color = get_percent_color(max_percent);

	/*
	 * Also color the filename and line if needed, with
	 * the same color than the percentage. Don't print it
	 * twice for close colored addr with the same filename:line
	 */
	if (al->path &&
	    (!prev_line || strcmp(prev_line, al->path) || color != prev_color)) {
		color_fprintf(stdout, color, " %s", al->path);
		prev_line = al->path;
		prev_color = color;
	}

	for (i = 0; i < nr_percent; i++) {
		struct annotation_data *data = &al->data[i];
		double percent = annotation_data__percent(data, percent_type);

		color = get_percent_color(percent);

		if (symbol_conf.show_total_period) {
			color_fprintf(stdout, color, " %11" PRIu64,
				      data->he.period);
		} else if (symbol_conf.show_nr_samples) {
			color_fprintf(stdout, color, " %7" PRIu64,
				      data->he.nr_samples);
		} else {
			color_fprintf(stdout, color, " %7.2f", percent);
		}
	}

	printf(" : ");

	disasm_line__print(dl, start, addr_fmt_width);
	printf("\n");

	return 0;
}

1451 1452 1453 1454 1455 1456 1457 1458 1459 1460 1461 1462 1463 1464 1465 1466 1467 1468 1469 1470
/*
 * symbol__parse_objdump_line() parses objdump output (with -d --no-show-raw)
 * which looks like following
 *
 *  0000000000415500 <_init>:
 *    415500:       sub    $0x8,%rsp
 *    415504:       mov    0x2f5ad5(%rip),%rax        # 70afe0 <_DYNAMIC+0x2f8>
 *    41550b:       test   %rax,%rax
 *    41550e:       je     415515 <_init+0x15>
 *    415510:       callq  416e70 <__gmon_start__@plt>
 *    415515:       add    $0x8,%rsp
 *    415519:       retq
 *
 * it will be parsed and saved into struct disasm_line as
 *  <offset>       <name>  <ops.raw>
 *
 * The offset will be a relative offset from the start of the symbol and -1
 * means that it's not a disassembly line so should be treated differently.
 * The ops.raw part will be parsed further according to type of the instruction.
 */
1471
static int symbol__parse_objdump_line(struct symbol *sym,
1472
				      struct annotate_args *args,
1473
				      char *parsed_line, int *line_nr)
1474
{
1475
	struct map *map = args->ms.map;
1476
	struct annotation *notes = symbol__annotation(sym);
1477
	struct disasm_line *dl;
1478
	char *tmp;
1479
	s64 line_ip, offset = -1;
1480
	regmatch_t match[2];
1481

1482
	/* /filename:linenr ? Save line number and ignore. */
1483 1484
	if (regexec(&file_lineno, parsed_line, 2, match, 0) == 0) {
		*line_nr = atoi(parsed_line + match[1].rm_so);
1485 1486 1487
		return 0;
	}

1488 1489 1490
	/* Process hex address followed by ':'. */
	line_ip = strtoull(parsed_line, &tmp, 16);
	if (parsed_line != tmp && tmp[0] == ':' && tmp[1] != '\0') {
1491 1492 1493 1494
		u64 start = map__rip_2objdump(map, sym->start),
		    end = map__rip_2objdump(map, sym->end);

		offset = line_ip - start;
1495
		if ((u64)line_ip < start || (u64)line_ip >= end)
1496
			offset = -1;
1497
		else
1498
			parsed_line = tmp + 1;
N
Namhyung Kim 已提交
1499
	}
1500

1501 1502 1503
	args->offset  = offset;
	args->line    = parsed_line;
	args->line_nr = *line_nr;
1504
	args->ms.sym  = sym;
1505 1506

	dl = disasm_line__new(args);
1507
	(*line_nr)++;
1508

1509
	if (dl == NULL)
1510
		return -1;
1511

1512
	if (!disasm_line__has_local_offset(dl)) {
1513 1514
		dl->ops.target.offset = dl->ops.target.addr -
					map__rip_2objdump(map, sym->start);
1515 1516
		dl->ops.target.offset_avail = true;
	}
1517

1518 1519
	/* kcore has no symbols, so add the call target symbol */
	if (dl->ins.ops && ins__is_call(&dl->ins) && !dl->ops.target.sym) {
1520 1521
		struct addr_map_symbol target = {
			.addr = dl->ops.target.addr,
1522
			.ms = { .map = map, },
1523 1524
		};

1525
		if (!maps__find_ams(args->ms.maps, &target) &&
1526 1527
		    target.ms.sym->start == target.al_addr)
			dl->ops.target.sym = target.ms.sym;
1528 1529
	}

1530
	annotation_line__add(&dl->al, &notes->src->source);
1531 1532 1533 1534

	return 0;
}

1535 1536 1537 1538 1539
/* Compile, at load time, the regex matching objdump's "/filename:linenr" lines. */
static __attribute__((constructor)) void symbol__init_regexpr(void)
{
	static const char pattern[] = "^/[^:]+:([0-9]+)";

	regcomp(&file_lineno, pattern, REG_EXTENDED);
}

1540 1541 1542 1543 1544 1545 1546
static void delete_last_nop(struct symbol *sym)
{
	struct annotation *notes = symbol__annotation(sym);
	struct list_head *list = &notes->src->source;
	struct disasm_line *dl;

	while (!list_empty(list)) {
1547
		dl = list_entry(list->prev, struct disasm_line, al.node);
1548

1549 1550
		if (dl->ins.ops) {
			if (dl->ins.ops != &nop_ops)
1551 1552
				return;
		} else {
1553 1554 1555
			if (!strstr(dl->al.line, " nop ") &&
			    !strstr(dl->al.line, " nopl ") &&
			    !strstr(dl->al.line, " nopw "))
1556 1557 1558
				return;
		}

1559
		list_del_init(&dl->al.node);
1560 1561 1562 1563
		disasm_line__free(dl);
	}
}

1564
int symbol__strerror_disassemble(struct map_symbol *ms, int errnum, char *buf, size_t buflen)
1565
{
1566
	struct dso *dso = ms->map->dso;
1567 1568 1569 1570 1571 1572 1573 1574 1575 1576 1577 1578 1579 1580

	BUG_ON(buflen == 0);

	if (errnum >= 0) {
		str_error_r(errnum, buf, buflen);
		return 0;
	}

	switch (errnum) {
	case SYMBOL_ANNOTATE_ERRNO__NO_VMLINUX: {
		char bf[SBUILD_ID_SIZE + 15] = " with build id ";
		char *build_id_msg = NULL;

		if (dso->has_build_id) {
J
Jiri Olsa 已提交
1581 1582
			build_id__sprintf(dso->bid.data,
					  sizeof(dso->bid.data), bf + 15);
1583 1584 1585 1586 1587 1588 1589 1590 1591 1592 1593
			build_id_msg = bf;
		}
		scnprintf(buf, buflen,
			  "No vmlinux file%s\nwas found in the path.\n\n"
			  "Note that annotation using /proc/kcore requires CAP_SYS_RAWIO capability.\n\n"
			  "Please use:\n\n"
			  "  perf buildid-cache -vu vmlinux\n\n"
			  "or:\n\n"
			  "  --vmlinux vmlinux\n", build_id_msg ?: "");
	}
		break;
1594 1595 1596
	case SYMBOL_ANNOTATE_ERRNO__NO_LIBOPCODES_FOR_BPF:
		scnprintf(buf, buflen, "Please link with binutils's libopcode to enable BPF annotation");
		break;
1597 1598 1599 1600 1601 1602
	case SYMBOL_ANNOTATE_ERRNO__ARCH_INIT_REGEXP:
		scnprintf(buf, buflen, "Problems with arch specific instruction name regular expressions.");
		break;
	case SYMBOL_ANNOTATE_ERRNO__ARCH_INIT_CPUID_PARSING:
		scnprintf(buf, buflen, "Problems while parsing the CPUID in the arch specific initialization.");
		break;
1603 1604 1605 1606 1607 1608 1609
	case SYMBOL_ANNOTATE_ERRNO__BPF_INVALID_FILE:
		scnprintf(buf, buflen, "Invalid BPF file: %s.", dso->long_name);
		break;
	case SYMBOL_ANNOTATE_ERRNO__BPF_MISSING_BTF:
		scnprintf(buf, buflen, "The %s BPF file has no BTF section, compile with -g or use pahole -J.",
			  dso->long_name);
		break;
1610 1611 1612 1613 1614 1615 1616 1617
	default:
		scnprintf(buf, buflen, "Internal error: Invalid %d error code\n", errnum);
		break;
	}

	return 0;
}

1618
static int dso__disassemble_filename(struct dso *dso, char *filename, size_t filename_size)
1619
{
1620 1621
	char linkname[PATH_MAX];
	char *build_id_filename;
1622
	char *build_id_path = NULL;
1623
	char *pos;
1624
	int len;
1625

1626 1627
	if (dso->symtab_type == DSO_BINARY_TYPE__KALLSYMS &&
	    !dso__is_kcore(dso))
1628
		return SYMBOL_ANNOTATE_ERRNO__NO_VMLINUX;
1629

1630
	build_id_filename = dso__build_id_filename(dso, NULL, 0, false);
1631 1632 1633
	if (build_id_filename) {
		__symbol__join_symfs(filename, filename_size, build_id_filename);
		free(build_id_filename);
1634
	} else {
1635 1636
		if (dso->has_build_id)
			return ENOMEM;
1637
		goto fallback;
1638 1639
	}

1640 1641
	build_id_path = strdup(filename);
	if (!build_id_path)
1642
		return ENOMEM;
1643

1644 1645 1646 1647 1648 1649 1650 1651
	/*
	 * old style build-id cache has name of XX/XXXXXXX.. while
	 * new style has XX/XXXXXXX../{elf,kallsyms,vdso}.
	 * extract the build-id part of dirname in the new style only.
	 */
	pos = strrchr(build_id_path, '/');
	if (pos && strlen(pos) < SBUILD_ID_SIZE - 2)
		dirname(build_id_path);
1652

1653 1654 1655 1656 1657 1658 1659 1660 1661 1662
	if (dso__is_kcore(dso))
		goto fallback;

	len = readlink(build_id_path, linkname, sizeof(linkname) - 1);
	if (len < 0)
		goto fallback;

	linkname[len] = '\0';
	if (strstr(linkname, DSO__NAME_KALLSYMS) ||
		access(filename, R_OK)) {
1663 1664 1665 1666 1667 1668
fallback:
		/*
		 * If we don't have build-ids or the build-id file isn't in the
		 * cache, or is just a kallsyms file, well, lets hope that this
		 * DSO is the same as when 'perf record' ran.
		 */
1669
		__symbol__join_symfs(filename, filename_size, dso->long_name);
1670 1671
	}

1672
	free(build_id_path);
1673 1674 1675
	return 0;
}

1676 1677 1678 1679 1680 1681 1682 1683 1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700
#if defined(HAVE_LIBBFD_SUPPORT) && defined(HAVE_LIBBPF_SUPPORT)
#define PACKAGE "perf"
#include <bfd.h>
#include <dis-asm.h>

static int symbol__disassemble_bpf(struct symbol *sym,
				   struct annotate_args *args)
{
	struct annotation *notes = symbol__annotation(sym);
	struct annotation_options *opts = args->options;
	struct bpf_prog_info_linear *info_linear;
	struct bpf_prog_linfo *prog_linfo = NULL;
	struct bpf_prog_info_node *info_node;
	int len = sym->end - sym->start;
	disassembler_ftype disassemble;
	struct map *map = args->ms.map;
	struct disassemble_info info;
	struct dso *dso = map->dso;
	int pc = 0, count, sub_id;
	struct btf *btf = NULL;
	char tpath[PATH_MAX];
	size_t buf_size;
	int nr_skip = 0;
	char *buf;
	bfd *bfdf;
1701
	int ret;
1702 1703 1704
	FILE *s;

	if (dso->binary_type != DSO_BINARY_TYPE__BPF_PROG_INFO)
1705
		return SYMBOL_ANNOTATE_ERRNO__BPF_INVALID_FILE;
1706

1707 1708
	pr_debug("%s: handling sym %s addr %" PRIx64 " len %" PRIx64 "\n", __func__,
		  sym->name, sym->start, sym->end - sym->start);
1709 1710 1711 1712 1713 1714 1715 1716 1717

	memset(tpath, 0, sizeof(tpath));
	perf_exe(tpath, sizeof(tpath));

	bfdf = bfd_openr(tpath, NULL);
	assert(bfdf);
	assert(bfd_check_format(bfdf, bfd_object));

	s = open_memstream(&buf, &buf_size);
1718 1719
	if (!s) {
		ret = errno;
1720
		goto out;
1721
	}
1722 1723 1724 1725 1726 1727 1728 1729
	init_disassemble_info(&info, s,
			      (fprintf_ftype) fprintf);

	info.arch = bfd_get_arch(bfdf);
	info.mach = bfd_get_mach(bfdf);

	info_node = perf_env__find_bpf_prog_info(dso->bpf_prog.env,
						 dso->bpf_prog.id);
1730
	if (!info_node) {
1731
		ret = SYMBOL_ANNOTATE_ERRNO__BPF_MISSING_BTF;
1732
		goto out;
1733
	}
1734 1735 1736
	info_linear = info_node->info_linear;
	sub_id = dso->bpf_prog.sub_id;

1737
	info.buffer = (void *)(uintptr_t)(info_linear->info.jited_prog_insns);
1738 1739 1740 1741 1742 1743 1744 1745 1746 1747 1748 1749 1750 1751 1752 1753 1754 1755 1756 1757 1758 1759 1760 1761 1762 1763 1764 1765 1766 1767 1768 1769 1770 1771 1772
	info.buffer_length = info_linear->info.jited_prog_len;

	if (info_linear->info.nr_line_info)
		prog_linfo = bpf_prog_linfo__new(&info_linear->info);

	if (info_linear->info.btf_id) {
		struct btf_node *node;

		node = perf_env__find_btf(dso->bpf_prog.env,
					  info_linear->info.btf_id);
		if (node)
			btf = btf__new((__u8 *)(node->data),
				       node->data_size);
	}

	disassemble_init_for_target(&info);

#ifdef DISASM_FOUR_ARGS_SIGNATURE
	disassemble = disassembler(info.arch,
				   bfd_big_endian(bfdf),
				   info.mach,
				   bfdf);
#else
	disassemble = disassembler(bfdf);
#endif
	assert(disassemble);

	fflush(s);
	do {
		const struct bpf_line_info *linfo = NULL;
		struct disasm_line *dl;
		size_t prev_buf_size;
		const char *srcline;
		u64 addr;

1773
		addr = pc + ((u64 *)(uintptr_t)(info_linear->info.jited_ksyms))[sub_id];
1774 1775 1776 1777 1778 1779 1780 1781 1782 1783 1784 1785 1786 1787 1788 1789 1790 1791 1792 1793 1794 1795 1796 1797 1798 1799 1800 1801 1802 1803 1804 1805 1806 1807 1808 1809 1810 1811 1812 1813 1814 1815 1816 1817 1818 1819 1820 1821 1822 1823 1824 1825 1826 1827 1828 1829
		count = disassemble(pc, &info);

		if (prog_linfo)
			linfo = bpf_prog_linfo__lfind_addr_func(prog_linfo,
								addr, sub_id,
								nr_skip);

		if (linfo && btf) {
			srcline = btf__name_by_offset(btf, linfo->line_off);
			nr_skip++;
		} else
			srcline = NULL;

		fprintf(s, "\n");
		prev_buf_size = buf_size;
		fflush(s);

		if (!opts->hide_src_code && srcline) {
			args->offset = -1;
			args->line = strdup(srcline);
			args->line_nr = 0;
			args->ms.sym  = sym;
			dl = disasm_line__new(args);
			if (dl) {
				annotation_line__add(&dl->al,
						     &notes->src->source);
			}
		}

		args->offset = pc;
		args->line = buf + prev_buf_size;
		args->line_nr = 0;
		args->ms.sym  = sym;
		dl = disasm_line__new(args);
		if (dl)
			annotation_line__add(&dl->al, &notes->src->source);

		pc += count;
	} while (count > 0 && pc < len);

	ret = 0;
out:
	free(prog_linfo);
	free(btf);
	fclose(s);
	bfd_close(bfdf);
	return ret;
}
#else // defined(HAVE_LIBBFD_SUPPORT) && defined(HAVE_LIBBPF_SUPPORT)
/*
 * Variant built when HAVE_LIBBFD_SUPPORT and HAVE_LIBBPF_SUPPORT are not both
 * defined: nothing is disassembled and the caller is told that BPF annotation
 * is not available in this build.
 */
static int symbol__disassemble_bpf(struct symbol *sym __maybe_unused,
				   struct annotate_args *args __maybe_unused)
{
	return SYMBOL_ANNOTATE_ERRNO__NO_LIBOPCODES_FOR_BPF;
}
#endif // defined(HAVE_LIBBFD_SUPPORT) && defined(HAVE_LIBBPF_SUPPORT)

1830 1831 1832 1833 1834 1835 1836 1837 1838 1839 1840 1841 1842 1843 1844 1845 1846 1847
/*
 * Disassembly of BPF images is not supported yet: add a single placeholder
 * line to the source list of @sym. Always returns 0.
 */
static int
symbol__disassemble_bpf_image(struct symbol *sym,
			      struct annotate_args *args)
{
	struct annotation *notes = symbol__annotation(sym);
	/*
	 * disasm_line__new() duplicates the text, so a local buffer is
	 * enough and there is no allocation here that could fail.
	 */
	char placeholder[] = "to be implemented";
	struct disasm_line *dl;

	args->offset = -1;
	args->line = placeholder;
	args->line_nr = 0;
	dl = disasm_line__new(args);
	if (dl)
		annotation_line__add(&dl->al, &notes->src->source);

	/* Do not leave a pointer to the local buffer behind. */
	args->line = NULL;
	return 0;
}

1848 1849 1850 1851 1852 1853 1854 1855 1856 1857 1858 1859 1860 1861 1862 1863 1864 1865 1866 1867 1868 1869 1870 1871 1872 1873 1874 1875 1876 1877 1878 1879 1880 1881 1882 1883 1884 1885 1886 1887 1888 1889 1890 1891 1892 1893 1894 1895 1896
/*
 * Return @line with every tab replaced by spaces up to the next multiple of
 * 8 columns. When @line contains no tab it is returned unchanged. Otherwise
 * a new buffer is allocated, *@storage is freed and replaced by it and
 * *@storage_len is set to the size of the new buffer. NULL is returned if
 * the allocation fails, in which case @storage is left untouched.
 */
static char *expand_tabs(char *line, char **storage, size_t *storage_len)
{
	const size_t line_len = strlen(line);
	size_t num_tabs = 0, capacity, in, out = 0;
	char *expanded;

	for (in = 0; in < line_len; in++) {
		if (line[in] == '\t')
			num_tabs++;
	}

	if (num_tabs == 0)
		return line;

	/*
	 * Room for the line and its '\0'; each tab may grow into 8 spaces,
	 * i.e. 7 more characters than the tab itself.
	 */
	capacity = line_len + 1 + (num_tabs * 7);

	expanded = malloc(capacity);
	if (expanded == NULL) {
		pr_err("Failure allocating memory for tab expansion\n");
		return NULL;
	}

	for (in = 0; in < line_len; in++) {
		if (line[in] != '\t') {
			expanded[out++] = line[in];
			continue;
		}

		/* A tab is at least one space, then pad to the next stop. */
		do {
			expanded[out++] = ' ';
		} while (out % 8 != 0);
	}
	expanded[out] = '\0';

	/* @line may point into *storage, so only free it after the copy. */
	free(*storage);
	*storage = expanded;
	*storage_len = capacity;
	return expanded;
}

1909
static int symbol__disassemble(struct symbol *sym, struct annotate_args *args)
1910
{
1911
	struct annotation_options *opts = args->options;
1912
	struct map *map = args->ms.map;
1913
	struct dso *dso = map->dso;
1914
	char *command;
1915 1916 1917 1918
	FILE *file;
	char symfs_filename[PATH_MAX];
	struct kcore_extract kce;
	bool delete_extract = false;
1919
	bool decomp = false;
1920 1921
	int lineno = 0;
	int nline;
1922 1923
	char *line;
	size_t line_len;
1924 1925 1926 1927 1928 1929 1930 1931 1932
	const char *objdump_argv[] = {
		"/bin/sh",
		"-c",
		NULL, /* Will be the objdump command to run. */
		"--",
		NULL, /* Will be the symfs path. */
		NULL,
	};
	struct child_process objdump_process;
1933 1934 1935 1936 1937
	int err = dso__disassemble_filename(dso, symfs_filename, sizeof(symfs_filename));

	if (err)
		return err;

1938
	pr_debug("%s: filename=%s, sym=%s, start=%#" PRIx64 ", end=%#" PRIx64 "\n", __func__,
1939
		 symfs_filename, sym->name, map->unmap_ip(map, sym->start),
1940 1941 1942 1943 1944
		 map->unmap_ip(map, sym->end));

	pr_debug("annotating [%p] %30s : [%p] %30s\n",
		 dso, dso->long_name, sym, sym->name);

1945 1946
	if (dso->binary_type == DSO_BINARY_TYPE__BPF_PROG_INFO) {
		return symbol__disassemble_bpf(sym, args);
1947 1948
	} else if (dso->binary_type == DSO_BINARY_TYPE__BPF_IMAGE) {
		return symbol__disassemble_bpf_image(sym, args);
1949
	} else if (dso__is_kcore(dso)) {
1950 1951 1952
		kce.kcore_filename = symfs_filename;
		kce.addr = map__rip_2objdump(map, sym->start);
		kce.offs = sym->start;
1953
		kce.len = sym->end - sym->start;
1954 1955 1956 1957 1958
		if (!kcore_extract__create(&kce)) {
			delete_extract = true;
			strlcpy(symfs_filename, kce.extract_filename,
				sizeof(symfs_filename));
		}
1959
	} else if (dso__needs_decompress(dso)) {
1960
		char tmp[KMOD_DECOMP_LEN];
1961

1962 1963
		if (dso__decompress_kmodule_path(dso, symfs_filename,
						 tmp, sizeof(tmp)) < 0)
1964
			return -1;
1965

1966
		decomp = true;
1967
		strcpy(symfs_filename, tmp);
1968 1969
	}

1970
	err = asprintf(&command,
1971
		 "%s %s%s --start-address=0x%016" PRIx64
1972
		 " --stop-address=0x%016" PRIx64
1973
		 " -l -d %s %s %s %c%s%c %s%s -C \"$1\"",
1974
		 opts->objdump_path ?: "objdump",
1975 1976
		 opts->disassembler_style ? "-M " : "",
		 opts->disassembler_style ?: "",
1977
		 map__rip_2objdump(map, sym->start),
1978
		 map__rip_2objdump(map, sym->end),
1979
		 opts->show_asm_raw ? "" : "--no-show-raw-insn",
1980 1981 1982 1983 1984 1985 1986
		 opts->annotate_src ? "-S" : "",
		 opts->prefix ? "--prefix " : "",
		 opts->prefix ? '"' : ' ',
		 opts->prefix ?: "",
		 opts->prefix ? '"' : ' ',
		 opts->prefix_strip ? "--prefix-strip=" : "",
		 opts->prefix_strip ?: "");
1987

1988 1989 1990 1991 1992
	if (err < 0) {
		pr_err("Failure allocating memory for the command to run\n");
		goto out_remove_tmp;
	}

1993 1994
	pr_debug("Executing: %s\n", command);

1995 1996
	objdump_argv[2] = command;
	objdump_argv[4] = symfs_filename;
1997

1998 1999 2000 2001 2002 2003 2004 2005
	/* Create a pipe to read from for stdout */
	memset(&objdump_process, 0, sizeof(objdump_process));
	objdump_process.argv = objdump_argv;
	objdump_process.out = -1;
	if (start_command(&objdump_process)) {
		pr_err("Failure starting to run %s\n", command);
		err = -1;
		goto out_free_command;
2006 2007
	}

2008
	file = fdopen(objdump_process.out, "r");
2009
	if (!file) {
2010
		pr_err("Failure creating FILE stream for %s\n", command);
2011 2012 2013 2014
		/*
		 * If we were using debug info should retry with
		 * original binary.
		 */
2015 2016
		err = -1;
		goto out_close_stdout;
2017
	}
2018

2019 2020 2021 2022
	/* Storage for getline. */
	line = NULL;
	line_len = 0;

2023 2024
	nline = 0;
	while (!feof(file)) {
2025
		const char *match;
2026
		char *expanded_line;
2027

2028 2029 2030
		if (getline(&line, &line_len, file) < 0 || !line)
			break;

2031 2032 2033 2034 2035
		/* Skip lines containing "filename:" */
		match = strstr(line, symfs_filename);
		if (match && match[strlen(symfs_filename)] == ':')
			continue;

2036 2037 2038 2039 2040
		expanded_line = strim(line);
		expanded_line = expand_tabs(expanded_line, &line, &line_len);
		if (!expanded_line)
			break;

2041 2042
		/*
		 * The source code line number (lineno) needs to be kept in
2043
		 * across calls to symbol__parse_objdump_line(), so that it
2044 2045 2046
		 * can associate it with the instructions till the next one.
		 * See disasm_line__new() and struct disasm_line::line_nr.
		 */
2047 2048
		if (symbol__parse_objdump_line(sym, args, expanded_line,
					       &lineno) < 0)
2049
			break;
2050 2051
		nline++;
	}
2052
	free(line);
2053

2054 2055 2056 2057 2058 2059
	err = finish_command(&objdump_process);
	if (err)
		pr_err("Error running %s\n", command);

	if (nline == 0) {
		err = -1;
2060
		pr_err("No output from %s\n", command);
2061
	}
2062

2063 2064 2065 2066 2067 2068 2069
	/*
	 * kallsyms does not have symbol sizes so there may a nop at the end.
	 * Remove it.
	 */
	if (dso__is_kcore(dso))
		delete_last_nop(sym);

2070
	fclose(file);
2071 2072 2073 2074

out_close_stdout:
	close(objdump_process.out);

2075 2076
out_free_command:
	free(command);
2077

2078
out_remove_tmp:
2079
	if (decomp)
2080
		unlink(symfs_filename);
2081

2082 2083
	if (delete_extract)
		kcore_extract__delete(&kce);
2084

2085
	return err;
2086 2087
}

2088
/*
 * Sum the samples and periods recorded in @sym_hist for the offsets in
 * [@offset, @end) and store them in @data, together with the percentages
 * relative to the symbol (local) and to the whole hists (global). A
 * percentage is only written when its denominator is non-zero.
 */
static void calc_percent(struct sym_hist *sym_hist,
			 struct hists *hists,
			 struct annotation_data *data,
			 s64 offset, s64 end)
{
	unsigned int hits = 0;
	u64 period = 0;

	for (; offset < end; ++offset) {
		hits   += sym_hist->addr[offset].nr_samples;
		period += sym_hist->addr[offset].period;
	}

	if (sym_hist->nr_samples) {
		data->he.period     = period;
		data->he.nr_samples = hits;
		data->percent[PERCENT_HITS_LOCAL] = 100.0 * hits / sym_hist->nr_samples;
	}

	if (hists->stats.nr_non_filtered_samples)
		data->percent[PERCENT_HITS_GLOBAL] = 100.0 * hits / hists->stats.nr_non_filtered_samples;

	if (sym_hist->period)
		data->percent[PERCENT_PERIOD_LOCAL] = 100.0 * period / sym_hist->period;

	if (hists->stats.total_period)
		data->percent[PERCENT_PERIOD_GLOBAL] = 100.0 * period / hists->stats.total_period;
}

2118
/*
 * Compute the percentages of every instruction line in @notes for each
 * event of the group led by @leader. A line covers the offsets from its own
 * offset up to the next instruction line, or up to @len for the last one.
 */
static void annotation__calc_percent(struct annotation *notes,
				     struct evsel *leader, s64 len)
{
	struct annotation_line *al, *next;
	struct evsel *evsel;

	list_for_each_entry(al, &notes->src->source, node) {
		s64 end = len;
		int i = 0;

		if (al->offset == -1)
			continue;

		next = annotation_line__next(al, &notes->src->source);
		if (next)
			end = next->offset;

		for_each_group_evsel(evsel, leader) {
			struct sym_hist *sym_hist;
			struct annotation_data *data;

			BUG_ON(i >= al->data_nr);

			sym_hist = annotation__histogram(notes, evsel->idx);
			data = &al->data[i];
			i++;

			calc_percent(sym_hist, evsel__hists(evsel), data, al->offset, end);
		}
	}
}

2149
void symbol__calc_percent(struct symbol *sym, struct evsel *evsel)
2150 2151 2152
{
	struct annotation *notes = symbol__annotation(sym);

2153
	annotation__calc_percent(notes, evsel, symbol__size(sym));
2154 2155
}

2156
int symbol__annotate(struct map_symbol *ms, struct evsel *evsel,
2157
		     struct annotation_options *options, struct arch **parch)
2158
{
2159
	struct symbol *sym = ms->sym;
2160
	struct annotation *notes = symbol__annotation(sym);
2161
	struct annotate_args args = {
2162
		.evsel		= evsel,
2163
		.options	= options,
2164
	};
2165
	struct perf_env *env = evsel__env(evsel);
2166
	const char *arch_name = perf_env__arch(env);
2167 2168 2169 2170
	struct arch *arch;
	int err;

	if (!arch_name)
2171
		return errno;
2172

2173
	args.arch = arch = arch__find(arch_name);
2174
	if (arch == NULL)
2175
		return ENOTSUP;
2176 2177 2178 2179 2180

	if (parch)
		*parch = arch;

	if (arch->init) {
2181
		err = arch->init(arch, env ? env->cpuid : NULL);
2182 2183 2184 2185 2186 2187
		if (err) {
			pr_err("%s: failed to initialize %s arch priv area\n", __func__, arch->name);
			return err;
		}
	}

2188 2189
	args.ms = *ms;
	notes->start = map__rip_2objdump(ms->map, sym->start);
2190

2191
	return symbol__disassemble(sym, &args);
2192 2193
}

2194 2195
static void insert_source_line(struct rb_root *root, struct annotation_line *al,
			       struct annotation_options *opts)
2196
{
2197
	struct annotation_line *iter;
2198 2199
	struct rb_node **p = &root->rb_node;
	struct rb_node *parent = NULL;
2200
	int i, ret;
2201 2202 2203

	while (*p != NULL) {
		parent = *p;
2204
		iter = rb_entry(parent, struct annotation_line, rb_node);
2205

2206
		ret = strcmp(iter->path, al->path);
2207
		if (ret == 0) {
2208 2209
			for (i = 0; i < al->data_nr; i++) {
				iter->data[i].percent_sum += annotation_data__percent(&al->data[i],
2210
										      opts->percent_type);
2211
			}
2212 2213 2214 2215 2216 2217 2218 2219 2220
			return;
		}

		if (ret < 0)
			p = &(*p)->rb_left;
		else
			p = &(*p)->rb_right;
	}

2221 2222
	for (i = 0; i < al->data_nr; i++) {
		al->data[i].percent_sum = annotation_data__percent(&al->data[i],
2223
								   opts->percent_type);
2224
	}
2225

2226 2227
	rb_link_node(&al->rb_node, parent, p);
	rb_insert_color(&al->rb_node, root);
2228 2229
}

2230
static int cmp_source_line(struct annotation_line *a, struct annotation_line *b)
2231 2232 2233
{
	int i;

2234 2235
	for (i = 0; i < a->data_nr; i++) {
		if (a->data[i].percent_sum == b->data[i].percent_sum)
2236
			continue;
2237
		return a->data[i].percent_sum > b->data[i].percent_sum;
2238 2239 2240 2241 2242
	}

	return 0;
}

2243
static void __resort_source_line(struct rb_root *root, struct annotation_line *al)
2244
{
2245
	struct annotation_line *iter;
2246 2247 2248 2249 2250
	struct rb_node **p = &root->rb_node;
	struct rb_node *parent = NULL;

	while (*p != NULL) {
		parent = *p;
2251
		iter = rb_entry(parent, struct annotation_line, rb_node);
2252

2253
		if (cmp_source_line(al, iter))
2254 2255 2256 2257 2258
			p = &(*p)->rb_left;
		else
			p = &(*p)->rb_right;
	}

2259 2260
	rb_link_node(&al->rb_node, parent, p);
	rb_insert_color(&al->rb_node, root);
2261 2262
}

2263 2264
static void resort_source_line(struct rb_root *dest_root, struct rb_root *src_root)
{
2265
	struct annotation_line *al;
2266 2267 2268 2269 2270 2271
	struct rb_node *node;

	node = rb_first(src_root);
	while (node) {
		struct rb_node *next;

2272
		al = rb_entry(node, struct annotation_line, rb_node);
2273 2274 2275
		next = rb_next(node);
		rb_erase(node, src_root);

2276
		__resort_source_line(dest_root, al);
2277 2278 2279 2280
		node = next;
	}
}

2281 2282
static void print_summary(struct rb_root *root, const char *filename)
{
2283
	struct annotation_line *al;
2284 2285 2286 2287 2288 2289 2290 2291 2292 2293 2294 2295
	struct rb_node *node;

	printf("\nSorted summary for file %s\n", filename);
	printf("----------------------------------------------\n\n");

	if (RB_EMPTY_ROOT(root)) {
		printf(" Nothing higher than %1.1f%%\n", MIN_GREEN);
		return;
	}

	node = rb_first(root);
	while (node) {
2296
		double percent, percent_max = 0.0;
2297 2298
		const char *color;
		char *path;
2299
		int i;
2300

2301
		al = rb_entry(node, struct annotation_line, rb_node);
2302 2303
		for (i = 0; i < al->data_nr; i++) {
			percent = al->data[i].percent_sum;
2304 2305 2306 2307 2308 2309 2310
			color = get_percent_color(percent);
			color_fprintf(stdout, color, " %7.2f", percent);

			if (percent > percent_max)
				percent_max = percent;
		}

2311
		path = al->path;
2312
		color = get_percent_color(percent_max);
2313
		color_fprintf(stdout, color, " %s\n", path);
2314 2315 2316 2317 2318

		node = rb_next(node);
	}
}

2319
static void symbol__annotate_hits(struct symbol *sym, struct evsel *evsel)
2320 2321
{
	struct annotation *notes = symbol__annotation(sym);
2322
	struct sym_hist *h = annotation__histogram(notes, evsel->idx);
2323
	u64 len = symbol__size(sym), offset;
2324 2325

	for (offset = 0; offset < len; ++offset)
2326
		if (h->addr[offset].nr_samples != 0)
2327
			printf("%*" PRIx64 ": %" PRIu64 "\n", BITS_PER_LONG / 2,
2328
			       sym->start + offset, h->addr[offset].nr_samples);
2329
	printf("%*s: %" PRIu64 "\n", BITS_PER_LONG / 2, "h->nr_samples", h->nr_samples);
2330 2331
}

2332 2333 2334 2335 2336 2337 2338 2339 2340 2341 2342 2343 2344
/*
 * Return the number of hex digits needed to print the address of the last
 * line in @lines that has an offset (offset != -1), or 0 if there is none.
 */
static int annotated_source__addr_fmt_width(struct list_head *lines, u64 start)
{
	struct annotation_line *line;
	char bf[32];

	list_for_each_entry_reverse(line, lines, node) {
		if (line->offset == -1)
			continue;

		return scnprintf(bf, sizeof(bf), "%" PRIx64, start + line->offset);
	}

	return 0;
}

2345
int symbol__annotate_printf(struct map_symbol *ms, struct evsel *evsel,
2346
			    struct annotation_options *opts)
2347
{
2348 2349
	struct map *map = ms->map;
	struct symbol *sym = ms->sym;
2350
	struct dso *dso = map->dso;
2351 2352
	char *filename;
	const char *d_filename;
2353
	const char *evsel_name = evsel__name(evsel);
2354
	struct annotation *notes = symbol__annotation(sym);
2355
	struct sym_hist *h = annotation__histogram(notes, evsel->idx);
2356
	struct annotation_line *pos, *queue = NULL;
2357
	u64 start = map__rip_2objdump(map, sym->start);
2358
	int printed = 2, queue_len = 0, addr_fmt_width;
2359
	int more = 0;
2360
	bool context = opts->context;
2361
	u64 len;
2362
	int width = symbol_conf.show_total_period ? 12 : 8;
2363
	int graph_dotted_len;
2364
	char buf[512];
2365

2366 2367 2368 2369
	filename = strdup(dso->long_name);
	if (!filename)
		return -ENOMEM;

2370
	if (opts->full_path)
2371 2372 2373 2374
		d_filename = filename;
	else
		d_filename = basename(filename);

2375
	len = symbol__size(sym);
2376

2377
	if (evsel__is_group_event(evsel)) {
2378
		width *= evsel->core.nr_members;
2379
		evsel__group_desc(evsel, buf, sizeof(buf));
2380 2381
		evsel_name = buf;
	}
2382

2383 2384
	graph_dotted_len = printf(" %-*.*s|	Source code & Disassembly of %s for %s (%" PRIu64 " samples, "
				  "percent: %s)\n",
2385 2386
				  width, width, symbol_conf.show_total_period ? "Period" :
				  symbol_conf.show_nr_samples ? "Samples" : "Percent",
2387 2388
				  d_filename, evsel_name, h->nr_samples,
				  percent_type_str(opts->percent_type));
2389

2390
	printf("%-*.*s----\n",
2391
	       graph_dotted_len, graph_dotted_len, graph_dotted_line);
2392

2393
	if (verbose > 0)
2394
		symbol__annotate_hits(sym, evsel);
2395

2396 2397
	addr_fmt_width = annotated_source__addr_fmt_width(&notes->src->source, start);

2398 2399 2400
	list_for_each_entry(pos, &notes->src->source, node) {
		int err;

2401 2402 2403 2404 2405
		if (context && queue == NULL) {
			queue = pos;
			queue_len = 0;
		}

2406
		err = annotation_line__print(pos, sym, start, evsel, len,
2407
					     opts->min_pcnt, printed, opts->max_lines,
2408
					     queue, addr_fmt_width, opts->percent_type);
2409 2410

		switch (err) {
2411 2412
		case 0:
			++printed;
2413 2414 2415 2416 2417
			if (context) {
				printed += queue_len;
				queue = NULL;
				queue_len = 0;
			}
2418 2419 2420 2421
			break;
		case 1:
			/* filtered by max_lines */
			++more;
2422
			break;
2423 2424
		case -1:
		default:
2425 2426 2427 2428 2429 2430 2431
			/*
			 * Filtered by min_pcnt or non IP lines when
			 * context != 0
			 */
			if (!context)
				break;
			if (queue_len == context)
2432
				queue = list_entry(queue->node.next, typeof(*queue), node);
2433 2434
			else
				++queue_len;
2435 2436 2437 2438
			break;
		}
	}

2439 2440
	free(filename);

2441 2442
	return more;
}
2443

2444 2445 2446 2447 2448 2449 2450 2451 2452 2453 2454 2455 2456 2457 2458 2459 2460 2461 2462 2463 2464 2465 2466 2467 2468 2469 2470 2471 2472 2473 2474 2475 2476 2477 2478 2479 2480 2481 2482 2483 2484
/* Percent-colour callback for FILE output: intentionally does nothing. */
static void FILE__set_percent_color(void *fp __maybe_unused,
				    double percent __maybe_unused,
				    bool current __maybe_unused)
{
}

/* Jump-count colour callback for FILE output: ignores its arguments, returns 0. */
static int FILE__set_jumps_percent_color(void *fp __maybe_unused,
					 int nr __maybe_unused, bool current __maybe_unused)
{
	return 0;
}

/* Colour callback for FILE output: ignores its arguments and returns 0. */
static int FILE__set_color(void *fp __maybe_unused, int color __maybe_unused)
{
	return 0;
}

/* printf-style callback for FILE output: formats straight into the stream @fp. */
static void FILE__printf(void *fp, const char *fmt, ...)
{
	va_list ap;

	va_start(ap, fmt);
	vfprintf(fp, fmt, ap);
	va_end(ap);
}

/*
 * Graph callback for FILE output: write the arrow glyph matching the
 * *ARROW_CHAR code in @graph to @fp, or "?" for any other value.
 */
static void FILE__write_graph(void *fp, int graph)
{
	const char *s;

	if (graph == DARROW_CHAR)
		s = "↓";
	else if (graph == UARROW_CHAR)
		s = "↑";
	else if (graph == LARROW_CHAR)
		s = "←";
	else if (graph == RARROW_CHAR)
		s = "→";
	else
		s = "?";

	fputs(s, fp);
}

2485 2486
static int symbol__annotate_fprintf2(struct symbol *sym, FILE *fp,
				     struct annotation_options *opts)
2487 2488
{
	struct annotation *notes = symbol__annotation(sym);
2489
	struct annotation_write_ops wops = {
2490 2491 2492 2493 2494 2495 2496 2497 2498 2499 2500 2501 2502
		.first_line		 = true,
		.obj			 = fp,
		.set_color		 = FILE__set_color,
		.set_percent_color	 = FILE__set_percent_color,
		.set_jumps_percent_color = FILE__set_jumps_percent_color,
		.printf			 = FILE__printf,
		.write_graph		 = FILE__write_graph,
	};
	struct annotation_line *al;

	list_for_each_entry(al, &notes->src->source, node) {
		if (annotation_line__filter(al, notes))
			continue;
2503
		annotation_line__write(al, notes, &wops, opts);
2504
		fputc('\n', fp);
2505
		wops.first_line = false;
2506 2507 2508 2509 2510
	}

	return 0;
}

2511
int map_symbol__annotation_dump(struct map_symbol *ms, struct evsel *evsel,
2512
				struct annotation_options *opts)
2513
{
2514
	const char *ev_name = evsel__name(evsel);
2515 2516 2517 2518 2519 2520 2521 2522 2523 2524 2525 2526
	char buf[1024];
	char *filename;
	int err = -1;
	FILE *fp;

	if (asprintf(&filename, "%s.annotation", ms->sym->name) < 0)
		return -1;

	fp = fopen(filename, "w");
	if (fp == NULL)
		goto out_free_filename;

2527
	if (evsel__is_group_event(evsel)) {
2528
		evsel__group_desc(evsel, buf, sizeof(buf));
2529 2530 2531 2532 2533
		ev_name = buf;
	}

	fprintf(fp, "%s() %s\nEvent: %s\n\n",
		ms->sym->name, ms->map->dso->long_name, ev_name);
2534
	symbol__annotate_fprintf2(ms->sym, fp, opts);
2535 2536 2537 2538 2539 2540 2541 2542

	fclose(fp);
	err = 0;
out_free_filename:
	free(filename);
	return err;
}

2543 2544 2545 2546 2547
void symbol__annotate_zero_histogram(struct symbol *sym, int evidx)
{
	struct annotation *notes = symbol__annotation(sym);
	struct sym_hist *h = annotation__histogram(notes, evidx);

2548
	memset(h, 0, notes->src->sizeof_sym_hist);
2549 2550
}

2551
void symbol__annotate_decay_histogram(struct symbol *sym, int evidx)
2552 2553 2554
{
	struct annotation *notes = symbol__annotation(sym);
	struct sym_hist *h = annotation__histogram(notes, evidx);
2555
	int len = symbol__size(sym), offset;
2556

2557
	h->nr_samples = 0;
2558
	for (offset = 0; offset < len; ++offset) {
2559
		h->addr[offset].nr_samples = h->addr[offset].nr_samples * 7 / 8;
2560
		h->nr_samples += h->addr[offset].nr_samples;
2561 2562 2563
	}
}

2564
void annotated_source__purge(struct annotated_source *as)
2565
{
2566
	struct annotation_line *al, *n;
2567

2568
	list_for_each_entry_safe(al, n, &as->source, node) {
2569
		list_del_init(&al->node);
2570
		disasm_line__free(disasm_line(al));
2571 2572 2573
	}
}

2574 2575 2576 2577
static size_t disasm_line__fprintf(struct disasm_line *dl, FILE *fp)
{
	size_t printed;

2578 2579
	if (dl->al.offset == -1)
		return fprintf(fp, "%s\n", dl->al.line);
2580

2581
	printed = fprintf(fp, "%#" PRIx64 " %s", dl->al.offset, dl->ins.name);
2582

2583
	if (dl->ops.raw[0] != '\0') {
2584
		printed += fprintf(fp, "%.*s %s\n", 6 - (int)printed, " ",
2585
				   dl->ops.raw);
2586 2587 2588 2589 2590 2591 2592 2593 2594 2595
	}

	return printed + fprintf(fp, "\n");
}

size_t disasm__fprintf(struct list_head *head, FILE *fp)
{
	struct disasm_line *pos;
	size_t printed = 0;

2596
	list_for_each_entry(pos, head, al.node)
2597 2598 2599 2600 2601
		printed += disasm_line__fprintf(pos, fp);

	return printed;
}

2602
bool disasm_line__is_valid_local_jump(struct disasm_line *dl, struct symbol *sym)
2603 2604
{
	if (!dl || !dl->ins.ops || !ins__is_jump(&dl->ins) ||
2605
	    !disasm_line__has_local_offset(dl) || dl->ops.target.offset < 0 ||
2606 2607 2608 2609 2610 2611 2612 2613 2614 2615 2616 2617 2618 2619 2620 2621 2622 2623 2624 2625
	    dl->ops.target.offset >= (s64)symbol__size(sym))
		return false;

	return true;
}

/*
 * For every offset of @sym that holds a valid local jump, bump jump_sources
 * on the line the jump targets and keep notes->max_jump_sources up to date.
 */
void annotation__mark_jump_targets(struct annotation *notes, struct symbol *sym)
{
	u64 size = symbol__size(sym);
	u64 offset;

	/* PLT symbols contain external offsets */
	if (strstr(sym->name, "@plt"))
		return;

	for (offset = 0; offset < size; ++offset) {
		struct disasm_line *dl = disasm_line(notes->offsets[offset]);
		struct annotation_line *target;

		if (!disasm_line__is_valid_local_jump(dl, sym))
			continue;

		target = notes->offsets[dl->ops.target.offset];

		/*
		 * FIXME: Oops, no jump target? Buggy disassembler? Or do we
		 * have to adjust to the previous offset?
		 */
		if (target == NULL)
			continue;

		target->jump_sources++;
		if (target->jump_sources > notes->max_jump_sources)
			notes->max_jump_sources = target->jump_sources;
	}
}

2643 2644 2645 2646 2647
/*
 * Walk the source lines once to number them (idx / idx_asm), record the
 * longest line length and fill notes->offsets[] for lines whose offset is
 * below @size.
 */
void annotation__set_offsets(struct annotation *notes, s64 size)
{
	struct annotation_line *al;

	notes->max_line_len = 0;
	notes->nr_entries = 0;
	notes->nr_asm_entries = 0;

	list_for_each_entry(al, &notes->src->source, node) {
		size_t line_len = strlen(al->line);

		if (line_len > notes->max_line_len)
			notes->max_line_len = line_len;

		al->idx = notes->nr_entries++;

		if (al->offset == -1) {
			al->idx_asm = -1;
			continue;
		}

		al->idx_asm = notes->nr_asm_entries++;
		/*
		 * FIXME: short term bandaid to cope with assembly
		 * routines that comes with labels in the same column
		 * as the address in objdump, sigh.
		 *
		 * E.g. copy_user_generic_unrolled
		 */
		if (al->offset < size)
			notes->offsets[al->offset] = al;
	}
}

2673 2674 2675 2676 2677 2678 2679 2680 2681
/*
 * Column width used for a jump-source count of @n: 5 once n reaches 100,
 * 2 when n / 10 is non-zero, 1 otherwise.
 */
static inline int width_jumps(int n)
{
	if (n >= 100)
		return 5;

	return (n / 10) != 0 ? 2 : 1;
}

2682 2683 2684 2685 2686 2687 2688 2689 2690 2691 2692 2693 2694 2695 2696 2697 2698
/* Length of the longest instruction name among lines that have an offset. */
static int annotation__max_ins_name(struct annotation *notes)
{
	struct annotation_line *al;
	int widest = 0;

	list_for_each_entry(al, &notes->src->source, node) {
		int len;

		if (al->offset != -1) {
			len = strlen(disasm_line(al)->ins.name);
			if (len > widest)
				widest = len;
		}
	}

	return widest;
}

2699 2700 2701 2702 2703 2704
/*
 * Seed notes->widths: the address columns from the hex width of the symbol
 * size and end address, the jumps column from max_jump_sources and the
 * instruction-name column from the longest instruction name.
 */
void annotation__init_column_widths(struct annotation *notes, struct symbol *sym)
{
	notes->widths.min_addr = hex_width(symbol__size(sym));
	notes->widths.target = notes->widths.min_addr;
	notes->widths.addr = notes->widths.target;

	notes->widths.max_addr = hex_width(sym->end);
	notes->widths.jumps = width_jumps(notes->max_jump_sources);
	notes->widths.max_ins_name = annotation__max_ins_name(notes);
}

2708 2709 2710 2711 2712 2713 2714 2715 2716 2717 2718 2719 2720
/*
 * Recompute the target/addr widths from the current options: min_addr when
 * offsets are shown, max_addr otherwise, plus room for the jump count when
 * show_nr_jumps is set.
 */
void annotation__update_column_widths(struct annotation *notes)
{
	notes->widths.target = notes->options->use_offset ? notes->widths.min_addr
							  : notes->widths.max_addr;

	notes->widths.addr = notes->widths.target;

	if (notes->options->show_nr_jumps)
		notes->widths.addr += notes->widths.jumps + 1;
}

2721
static void annotation__calc_lines(struct annotation *notes, struct map *map,
2722 2723
				   struct rb_root *root,
				   struct annotation_options *opts)
2724 2725 2726 2727 2728 2729 2730 2731
{
	struct annotation_line *al;
	struct rb_root tmp_root = RB_ROOT;

	list_for_each_entry(al, &notes->src->source, node) {
		double percent_max = 0.0;
		int i;

2732
		for (i = 0; i < al->data_nr; i++) {
2733
			double percent;
2734

2735
			percent = annotation_data__percent(&al->data[i],
2736
							   opts->percent_type);
2737

2738 2739
			if (percent > percent_max)
				percent_max = percent;
2740 2741 2742 2743 2744
		}

		if (percent_max <= 0.5)
			continue;

2745 2746
		al->path = get_srcline(map->dso, notes->start + al->offset, NULL,
				       false, true, notes->start + al->offset);
2747
		insert_source_line(&tmp_root, al, opts);
2748 2749 2750 2751 2752
	}

	resort_source_line(root, &tmp_root);
}

2753
static void symbol__calc_lines(struct map_symbol *ms, struct rb_root *root,
2754
			       struct annotation_options *opts)
2755
{
2756
	struct annotation *notes = symbol__annotation(ms->sym);
2757

2758
	annotation__calc_lines(notes, ms->map, root, opts);
2759 2760
}

2761
int symbol__tty_annotate2(struct map_symbol *ms, struct evsel *evsel,
2762
			  struct annotation_options *opts)
2763
{
2764 2765
	struct dso *dso = ms->map->dso;
	struct symbol *sym = ms->sym;
2766
	struct rb_root source_line = RB_ROOT;
2767
	struct hists *hists = evsel__hists(evsel);
2768
	char buf[1024];
2769

2770
	if (symbol__annotate2(ms, evsel, opts, NULL) < 0)
2771 2772
		return -1;

2773 2774
	if (opts->print_lines) {
		srcline_full_filename = opts->full_path;
2775
		symbol__calc_lines(ms, &source_line, opts);
2776 2777 2778
		print_summary(&source_line, dso->long_name);
	}

2779
	hists__scnprintf_title(hists, buf, sizeof(buf));
2780 2781
	fprintf(stdout, "%s, [percent: %s]\n%s() %s\n",
		buf, percent_type_str(opts->percent_type), sym->name, dso->long_name);
2782
	symbol__annotate_fprintf2(sym, stdout, opts);
2783 2784 2785 2786 2787 2788

	annotated_source__purge(symbol__annotation(sym)->src);

	return 0;
}

2789
int symbol__tty_annotate(struct map_symbol *ms, struct evsel *evsel,
2790
			 struct annotation_options *opts)
2791
{
2792 2793
	struct dso *dso = ms->map->dso;
	struct symbol *sym = ms->sym;
2794 2795
	struct rb_root source_line = RB_ROOT;

2796
	if (symbol__annotate(ms, evsel, opts, NULL) < 0)
2797 2798
		return -1;

2799 2800
	symbol__calc_percent(sym, evsel);

2801 2802
	if (opts->print_lines) {
		srcline_full_filename = opts->full_path;
2803
		symbol__calc_lines(ms, &source_line, opts);
2804
		print_summary(&source_line, dso->long_name);
2805 2806
	}

2807
	symbol__annotate_printf(ms, evsel, opts);
2808

2809
	annotated_source__purge(symbol__annotation(sym)->src);
2810

2811 2812
	return 0;
}
2813

2814 2815
bool ui__has_annotation(void)
{
2816
	return use_browser == 1 && perf_hpp_list.sym;
2817
}
2818

2819

2820
static double annotation_line__max_percent(struct annotation_line *al,
2821 2822
					   struct annotation *notes,
					   unsigned int percent_type)
2823 2824 2825 2826 2827
{
	double percent_max = 0.0;
	int i;

	for (i = 0; i < notes->nr_events; i++) {
2828 2829 2830
		double percent;

		percent = annotation_data__percent(&al->data[i],
2831
						   percent_type);
2832 2833 2834

		if (percent > percent_max)
			percent_max = percent;
2835 2836 2837 2838 2839
	}

	return percent_max;
}

2840 2841 2842 2843 2844 2845 2846
static void disasm_line__write(struct disasm_line *dl, struct annotation *notes,
			       void *obj, char *bf, size_t size,
			       void (*obj__printf)(void *obj, const char *fmt, ...),
			       void (*obj__write_graph)(void *obj, int graph))
{
	if (dl->ins.ops && dl->ins.ops->scnprintf) {
		if (ins__is_jump(&dl->ins)) {
2847
			bool fwd;
2848

2849 2850 2851
			if (dl->ops.target.outside)
				goto call_like;
			fwd = dl->ops.target.offset > dl->al.offset;
2852 2853 2854
			obj__write_graph(obj, fwd ? DARROW_CHAR : UARROW_CHAR);
			obj__printf(obj, " ");
		} else if (ins__is_call(&dl->ins)) {
2855
call_like:
2856 2857 2858 2859 2860 2861 2862 2863 2864 2865 2866 2867
			obj__write_graph(obj, RARROW_CHAR);
			obj__printf(obj, " ");
		} else if (ins__is_ret(&dl->ins)) {
			obj__write_graph(obj, LARROW_CHAR);
			obj__printf(obj, " ");
		} else {
			obj__printf(obj, "  ");
		}
	} else {
		obj__printf(obj, "  ");
	}

2868
	disasm_line__scnprintf(dl, bf, size, !notes->options->use_offset, notes->widths.max_ins_name);
2869 2870
}

2871 2872 2873 2874 2875 2876 2877 2878 2879 2880 2881 2882 2883 2884 2885 2886
/*
 * Format "(Average IPC: x, IPC Coverage: y%)" into @bf.  Each value is
 * reported as 0 when its divisor (hit_cycles / total_insn) is zero.
 */
static void ipc_coverage_string(char *bf, int size, struct annotation *notes)
{
	double ipc = notes->hit_cycles ?
		     notes->hit_insn / ((double)notes->hit_cycles) : 0.0;
	double coverage = notes->total_insn ?
			  notes->cover_insn * 100.0 / ((double)notes->total_insn) : 0.0;

	scnprintf(bf, size, "(Average IPC: %.2f, IPC Coverage: %.1f%%)",
		  ipc, coverage);
}

2887 2888
static void __annotation_line__write(struct annotation_line *al, struct annotation *notes,
				     bool first_line, bool current_entry, bool change_color, int width,
2889
				     void *obj, unsigned int percent_type,
2890 2891 2892 2893 2894 2895
				     int  (*obj__set_color)(void *obj, int color),
				     void (*obj__set_percent_color)(void *obj, double percent, bool current),
				     int  (*obj__set_jumps_percent_color)(void *obj, int nr, bool current),
				     void (*obj__printf)(void *obj, const char *fmt, ...),
				     void (*obj__write_graph)(void *obj, int graph))

2896
{
2897
	double percent_max = annotation_line__max_percent(al, notes, percent_type);
2898 2899
	int pcnt_width = annotation__pcnt_width(notes),
	    cycles_width = annotation__cycles_width(notes);
2900
	bool show_title = false;
2901 2902
	char bf[256];
	int printed;
2903 2904 2905 2906 2907 2908 2909 2910 2911 2912 2913 2914 2915

	if (first_line && (al->offset == -1 || percent_max == 0.0)) {
		if (notes->have_cycles) {
			if (al->ipc == 0.0 && al->cycles == 0)
				show_title = true;
		} else
			show_title = true;
	}

	if (al->offset != -1 && percent_max != 0.0) {
		int i;

		for (i = 0; i < notes->nr_events; i++) {
2916 2917
			double percent;

2918
			percent = annotation_data__percent(&al->data[i], percent_type);
2919 2920

			obj__set_percent_color(obj, percent, current_entry);
2921
			if (symbol_conf.show_total_period) {
2922
				obj__printf(obj, "%11" PRIu64 " ", al->data[i].he.period);
2923
			} else if (symbol_conf.show_nr_samples) {
2924
				obj__printf(obj, "%6" PRIu64 " ",
2925
						   al->data[i].he.nr_samples);
2926
			} else {
2927
				obj__printf(obj, "%6.2f ", percent);
2928 2929 2930 2931 2932 2933
			}
		}
	} else {
		obj__set_percent_color(obj, 0, current_entry);

		if (!show_title)
2934
			obj__printf(obj, "%-*s", pcnt_width, " ");
2935
		else {
2936
			obj__printf(obj, "%-*s", pcnt_width,
2937
					   symbol_conf.show_total_period ? "Period" :
2938
					   symbol_conf.show_nr_samples ? "Samples" : "Percent");
2939 2940 2941 2942 2943 2944 2945 2946 2947 2948 2949
		}
	}

	if (notes->have_cycles) {
		if (al->ipc)
			obj__printf(obj, "%*.2f ", ANNOTATION__IPC_WIDTH - 1, al->ipc);
		else if (!show_title)
			obj__printf(obj, "%*s", ANNOTATION__IPC_WIDTH, " ");
		else
			obj__printf(obj, "%*s ", ANNOTATION__IPC_WIDTH - 1, "IPC");

2950 2951 2952
		if (!notes->options->show_minmax_cycle) {
			if (al->cycles)
				obj__printf(obj, "%*" PRIu64 " ",
2953
					   ANNOTATION__CYCLES_WIDTH - 1, al->cycles);
2954 2955 2956 2957 2958 2959 2960 2961 2962 2963 2964 2965 2966 2967 2968 2969 2970 2971 2972 2973 2974 2975 2976 2977 2978 2979 2980 2981
			else if (!show_title)
				obj__printf(obj, "%*s",
					    ANNOTATION__CYCLES_WIDTH, " ");
			else
				obj__printf(obj, "%*s ",
					    ANNOTATION__CYCLES_WIDTH - 1,
					    "Cycle");
		} else {
			if (al->cycles) {
				char str[32];

				scnprintf(str, sizeof(str),
					"%" PRIu64 "(%" PRIu64 "/%" PRIu64 ")",
					al->cycles, al->cycles_min,
					al->cycles_max);

				obj__printf(obj, "%*s ",
					    ANNOTATION__MINMAX_CYCLES_WIDTH - 1,
					    str);
			} else if (!show_title)
				obj__printf(obj, "%*s",
					    ANNOTATION__MINMAX_CYCLES_WIDTH,
					    " ");
			else
				obj__printf(obj, "%*s ",
					    ANNOTATION__MINMAX_CYCLES_WIDTH - 1,
					    "Cycle(min/max)");
		}
2982 2983 2984 2985 2986

		if (show_title && !*al->line) {
			ipc_coverage_string(bf, sizeof(bf), notes);
			obj__printf(obj, "%*s", ANNOTATION__AVG_IPC_WIDTH, bf);
		}
2987 2988 2989
	}

	obj__printf(obj, " ");
2990 2991 2992 2993 2994 2995 2996 2997 2998 2999 3000 3001 3002 3003 3004 3005 3006 3007 3008 3009

	if (!*al->line)
		obj__printf(obj, "%-*s", width - pcnt_width - cycles_width, " ");
	else if (al->offset == -1) {
		if (al->line_nr && notes->options->show_linenr)
			printed = scnprintf(bf, sizeof(bf), "%-*d ", notes->widths.addr + 1, al->line_nr);
		else
			printed = scnprintf(bf, sizeof(bf), "%-*s  ", notes->widths.addr, " ");
		obj__printf(obj, bf);
		obj__printf(obj, "%-*s", width - printed - pcnt_width - cycles_width + 1, al->line);
	} else {
		u64 addr = al->offset;
		int color = -1;

		if (!notes->options->use_offset)
			addr += notes->start;

		if (!notes->options->use_offset) {
			printed = scnprintf(bf, sizeof(bf), "%" PRIx64 ": ", addr);
		} else {
3010 3011
			if (al->jump_sources &&
			    notes->options->offset_level >= ANNOTATION__OFFSET_JUMP_TARGETS) {
3012 3013 3014 3015 3016 3017 3018 3019 3020 3021
				if (notes->options->show_nr_jumps) {
					int prev;
					printed = scnprintf(bf, sizeof(bf), "%*d ",
							    notes->widths.jumps,
							    al->jump_sources);
					prev = obj__set_jumps_percent_color(obj, al->jump_sources,
									    current_entry);
					obj__printf(obj, bf);
					obj__set_color(obj, prev);
				}
3022
print_addr:
3023 3024
				printed = scnprintf(bf, sizeof(bf), "%*" PRIx64 ": ",
						    notes->widths.target, addr);
3025 3026 3027 3028 3029
			} else if (ins__is_call(&disasm_line(al)->ins) &&
				   notes->options->offset_level >= ANNOTATION__OFFSET_CALL) {
				goto print_addr;
			} else if (notes->options->offset_level == ANNOTATION__MAX_OFFSET_LEVEL) {
				goto print_addr;
3030 3031 3032 3033 3034 3035 3036 3037 3038 3039 3040 3041 3042 3043 3044 3045 3046
			} else {
				printed = scnprintf(bf, sizeof(bf), "%-*s  ",
						    notes->widths.addr, " ");
			}
		}

		if (change_color)
			color = obj__set_color(obj, HE_COLORSET_ADDR);
		obj__printf(obj, bf);
		if (change_color)
			obj__set_color(obj, color);

		disasm_line__write(disasm_line(al), notes, obj, bf, sizeof(bf), obj__printf, obj__write_graph);

		obj__printf(obj, "%-*s", width - pcnt_width - cycles_width - 3 - printed, bf);
	}

3047 3048
}

3049
void annotation_line__write(struct annotation_line *al, struct annotation *notes,
3050 3051
			    struct annotation_write_ops *wops,
			    struct annotation_options *opts)
3052
{
3053 3054 3055 3056 3057 3058
	__annotation_line__write(al, notes, wops->first_line, wops->current_entry,
				 wops->change_color, wops->width, wops->obj,
				 opts->percent_type,
				 wops->set_color, wops->set_percent_color,
				 wops->set_jumps_percent_color, wops->printf,
				 wops->write_graph);
3059 3060
}

3061
int symbol__annotate2(struct map_symbol *ms, struct evsel *evsel,
3062 3063
		      struct annotation_options *options, struct arch **parch)
{
3064
	struct symbol *sym = ms->sym;
3065 3066 3067 3068 3069 3070
	struct annotation *notes = symbol__annotation(sym);
	size_t size = symbol__size(sym);
	int nr_pcnt = 1, err;

	notes->offsets = zalloc(size * sizeof(struct annotation_line *));
	if (notes->offsets == NULL)
3071
		return ENOMEM;
3072

3073
	if (evsel__is_group_event(evsel))
3074
		nr_pcnt = evsel->core.nr_members;
3075

3076
	err = symbol__annotate(ms, evsel, options, parch);
3077 3078 3079 3080 3081 3082 3083 3084 3085 3086 3087 3088 3089 3090
	if (err)
		goto out_free_offsets;

	notes->options = options;

	symbol__calc_percent(sym, evsel);

	annotation__set_offsets(notes, size);
	annotation__mark_jump_targets(notes, sym);
	annotation__compute_ipc(notes, size);
	annotation__init_column_widths(notes, sym);
	notes->nr_events = nr_pcnt;

	annotation__update_column_widths(notes);
3091
	sym->annotate2 = true;
3092 3093 3094 3095 3096

	return 0;

out_free_offsets:
	zfree(&notes->offsets);
3097
	return err;
3098
}
3099

3100
static int annotation__config(const char *var, const char *value, void *data)
3101
{
3102
	struct annotation_options *opt = data;
3103 3104 3105 3106

	if (!strstarts(var, "annotate."))
		return 0;

3107 3108 3109 3110 3111 3112 3113 3114 3115 3116 3117 3118 3119 3120 3121 3122 3123 3124 3125 3126 3127 3128 3129
	if (!strcmp(var, "annotate.offset_level")) {
		perf_config_u8(&opt->offset_level, "offset_level", value);

		if (opt->offset_level > ANNOTATION__MAX_OFFSET_LEVEL)
			opt->offset_level = ANNOTATION__MAX_OFFSET_LEVEL;
		else if (opt->offset_level < ANNOTATION__MIN_OFFSET_LEVEL)
			opt->offset_level = ANNOTATION__MIN_OFFSET_LEVEL;
	} else if (!strcmp(var, "annotate.hide_src_code")) {
		opt->hide_src_code = perf_config_bool("hide_src_code", value);
	} else if (!strcmp(var, "annotate.jump_arrows")) {
		opt->jump_arrows = perf_config_bool("jump_arrows", value);
	} else if (!strcmp(var, "annotate.show_linenr")) {
		opt->show_linenr = perf_config_bool("show_linenr", value);
	} else if (!strcmp(var, "annotate.show_nr_jumps")) {
		opt->show_nr_jumps = perf_config_bool("show_nr_jumps", value);
	} else if (!strcmp(var, "annotate.show_nr_samples")) {
		symbol_conf.show_nr_samples = perf_config_bool("show_nr_samples",
								value);
	} else if (!strcmp(var, "annotate.show_total_period")) {
		symbol_conf.show_total_period = perf_config_bool("show_total_period",
								value);
	} else if (!strcmp(var, "annotate.use_offset")) {
		opt->use_offset = perf_config_bool("use_offset", value);
3130 3131
	} else if (!strcmp(var, "annotate.disassembler_style")) {
		opt->disassembler_style = value;
3132
	} else {
3133
		pr_debug("%s variable unknown, ignoring...", var);
3134
	}
3135

3136 3137 3138
	return 0;
}

3139
void annotation_config__init(struct annotation_options *opt)
3140
{
3141
	perf_config(annotation__config, opt);
3142
}
3143 3144 3145 3146 3147 3148 3149 3150 3151 3152 3153 3154 3155 3156 3157 3158 3159 3160 3161 3162 3163 3164 3165 3166 3167 3168 3169 3170 3171 3172 3173 3174 3175 3176 3177 3178 3179 3180 3181 3182 3183 3184 3185 3186 3187 3188 3189 3190 3191 3192 3193 3194

/*
 * Map a ("period" | "hits", "local" | "global") pair to the matching
 * PERCENT_* value.  Returns (unsigned int) -1 for any other combination.
 */
static unsigned int parse_percent_type(char *str1, char *str2)
{
	if (strcmp("period", str1) == 0) {
		if (strcmp("local", str2) == 0)
			return PERCENT_PERIOD_LOCAL;
		if (strcmp("global", str2) == 0)
			return PERCENT_PERIOD_GLOBAL;
	} else if (strcmp("hits", str1) == 0) {
		if (strcmp("local", str2) == 0)
			return PERCENT_HITS_LOCAL;
		if (strcmp("global", str2) == 0)
			return PERCENT_HITS_GLOBAL;
	}

	return (unsigned int) -1;
}

/*
 * Option callback: parse "<a>-<b>" where the two halves are a percent source
 * ("period"/"hits") and a scope ("local"/"global") in either order, and store
 * the resulting type in the annotation_options behind opt->value.
 *
 * Returns 0 on success, -1 if the string is not recognised, -ENOMEM if it
 * cannot be duplicated.
 */
int annotate_parse_percent_type(const struct option *opt, const char *_str,
				int unset __maybe_unused)
{
	struct annotation_options *opts = opt->value;
	char *first, *second;
	int err = -1;

	first = strdup(_str);
	if (first == NULL)
		return -ENOMEM;

	second = strchr(first, '-');
	if (second != NULL) {
		unsigned int type;

		/* Split in place at the dash. */
		*second++ = 0;

		type = parse_percent_type(first, second);
		if (type == (unsigned int) -1)
			type = parse_percent_type(second, first);

		if (type != (unsigned int) -1) {
			opts->percent_type = type;
			err = 0;
		}
	}

	free(first);
	return err;
}
3195 3196 3197 3198 3199 3200 3201 3202 3203

/*
 * Validate option combinations: prefix_strip is only accepted together with
 * prefix.  Returns 0 when the arguments are consistent, -1 after logging an
 * error otherwise.
 */
int annotate_check_args(struct annotation_options *args)
{
	if (!args->prefix_strip || args->prefix)
		return 0;

	pr_err("--prefix-strip requires --prefix\n");
	return -1;
}