symbol.c 62.6 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13
#define _GNU_SOURCE
#include <ctype.h>
#include <dirent.h>
#include <errno.h>
#include <libgen.h>
#include <stdlib.h>
#include <stdio.h>
#include <string.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <sys/param.h>
#include <fcntl.h>
#include <unistd.h>
14
#include <inttypes.h>
15
#include "build-id.h"
16
#include "debug.h"
17
#include "symbol.h"
18
#include "strlist.h"
19 20 21 22

#include <libelf.h>
#include <gelf.h>
#include <elf.h>
23
#include <limits.h>
24
#include <sys/utsname.h>
P
Peter Zijlstra 已提交
25

26 27 28 29
#ifndef KSYM_NAME_LEN
#define KSYM_NAME_LEN 128
#endif

30 31 32 33
#ifndef NT_GNU_BUILD_ID
#define NT_GNU_BUILD_ID 3
#endif

34
static bool dso__build_id_equal(const struct dso *dso, u8 *build_id);
35
static int elf_read_build_id(Elf *elf, void *bf, size_t size);
36
static void dsos__add(struct list_head *head, struct dso *dso);
37
static struct map *map__new2(u64 start, struct dso *dso, enum map_type type);
38
static int dso__load_kernel_sym(struct dso *dso, struct map *map,
39
				symbol_filter_t filter);
40
static int dso__load_guest_kernel_sym(struct dso *dso, struct map *map,
41
			symbol_filter_t filter);
42 43
static int vmlinux_path__nr_entries;
static char **vmlinux_path;
44

45
struct symbol_conf symbol_conf = {
46
	.exclude_other	  = true,
47 48
	.use_modules	  = true,
	.try_vmlinux_path = true,
49
	.annotate_src	  = true,
50
	.symfs            = "",
51 52
};

53
int dso__name_len(const struct dso *dso)
54 55
{
	if (verbose)
56
		return dso->long_name_len;
57

58
	return dso->short_name_len;
59 60
}

61
bool dso__loaded(const struct dso *dso, enum map_type type)
62
{
63
	return dso->loaded & (1 << type);
64 65
}

66
bool dso__sorted_by_name(const struct dso *dso, enum map_type type)
67
{
68
	return dso->sorted_by_name & (1 << type);
69 70
}

71
static void dso__set_sorted_by_name(struct dso *dso, enum map_type type)
72
{
73
	dso->sorted_by_name |= (1 << type);
74 75
}

76
bool symbol_type__is_a(char symbol_type, enum map_type map_type)
77
{
78 79
	symbol_type = toupper(symbol_type);

80 81 82
	switch (map_type) {
	case MAP__FUNCTION:
		return symbol_type == 'T' || symbol_type == 'W';
83
	case MAP__VARIABLE:
84
		return symbol_type == 'D';
85 86 87 88 89
	default:
		return false;
	}
}

90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175
/* Number of consecutive '_' characters at the very beginning of @str. */
static int prefix_underscores_count(const char *str)
{
	return strspn(str, "_");
}

#define SYMBOL_A 0
#define SYMBOL_B 1

/*
 * Pick which of two symbols to keep; callers use it for symbols that share
 * a start address.  Returns SYMBOL_A to keep @syma or SYMBOL_B to keep
 * @symb.  The criteria are tried in order and the first one that tells the
 * two symbols apart wins.
 */
static int choose_best_symbol(struct symbol *syma, struct symbol *symb)
{
	s64 a, b;

	/* 1) a symbol covering some bytes beats a zero length one */
	a = syma->end - syma->start;
	b = symb->end - symb->start;
	if (a > 0 && b == 0)
		return SYMBOL_A;
	if (b > 0 && a == 0)
		return SYMBOL_B;

	/* 2) a non weak symbol beats a weak one */
	a = syma->binding == STB_WEAK;
	b = symb->binding == STB_WEAK;
	if (a != b)
		return a ? SYMBOL_B : SYMBOL_A;

	/* 3) a global symbol beats a non global one */
	a = syma->binding == STB_GLOBAL;
	b = symb->binding == STB_GLOBAL;
	if (a != b)
		return a ? SYMBOL_A : SYMBOL_B;

	/* 4) fewer leading underscores win */
	a = prefix_underscores_count(syma->name);
	b = prefix_underscores_count(symb->name);
	if (a != b)
		return a < b ? SYMBOL_A : SYMBOL_B;

	/* 5) last resort: the longest name wins, ties go to @syma */
	return strlen(symb->name) > strlen(syma->name) ? SYMBOL_B : SYMBOL_A;
}

/*
 * Walk @symbols in tree order and, whenever two neighbouring symbols share
 * the same start address, keep only the one preferred by
 * choose_best_symbol().  The discarded symbol is unlinked from the tree and
 * released with symbol__delete() so that it is not leaked.
 */
static void symbols__fixup_duplicate(struct rb_root *symbols)
{
	struct rb_node *nd;
	struct symbol *curr, *next;

	nd = rb_first(symbols);

	while (nd) {
		curr = rb_entry(nd, struct symbol, rb_node);
again:
		nd = rb_next(&curr->rb_node);
		if (!nd)
			break;

		/* Only convert the node once it is known to be valid */
		next = rb_entry(nd, struct symbol, rb_node);

		if (curr->start != next->start)
			continue;

		if (choose_best_symbol(curr, next) == SYMBOL_A) {
			rb_erase(&next->rb_node, symbols);
			symbol__delete(next);
			/* curr stays, compare it with its new successor */
			goto again;
		} else {
			/* fetch the successor before curr leaves the tree */
			nd = rb_next(&curr->rb_node);
			rb_erase(&curr->rb_node, symbols);
			symbol__delete(curr);
		}
	}
}

176
static void symbols__fixup_end(struct rb_root *symbols)
177
{
178
	struct rb_node *nd, *prevnd = rb_first(symbols);
179
	struct symbol *curr, *prev;
180 181 182 183

	if (prevnd == NULL)
		return;

184 185
	curr = rb_entry(prevnd, struct symbol, rb_node);

186
	for (nd = rb_next(prevnd); nd; nd = rb_next(nd)) {
187 188
		prev = curr;
		curr = rb_entry(nd, struct symbol, rb_node);
189

190
		if (prev->end == prev->start && prev->end != curr->start)
191 192
			prev->end = curr->start - 1;
	}
193 194 195 196

	/* Last entry */
	if (curr->end == curr->start)
		curr->end = roundup(curr->start, 4096);
197 198
}

199
static void __map_groups__fixup_end(struct map_groups *mg, enum map_type type)
200 201
{
	struct map *prev, *curr;
202
	struct rb_node *nd, *prevnd = rb_first(&mg->maps[type]);
203 204 205 206 207 208 209 210 211 212

	if (prevnd == NULL)
		return;

	curr = rb_entry(prevnd, struct map, rb_node);

	for (nd = rb_next(prevnd); nd; nd = rb_next(nd)) {
		prev = curr;
		curr = rb_entry(nd, struct map, rb_node);
		prev->end = curr->start - 1;
213
	}
214 215 216 217 218

	/*
	 * We still haven't the actual symbols, so guess the
	 * last map final address.
	 */
219
	curr->end = ~0ULL;
220 221
}

222
static void map_groups__fixup_end(struct map_groups *mg)
223 224 225
{
	int i;
	for (i = 0; i < MAP__NR_TYPES; ++i)
226
		__map_groups__fixup_end(mg, i);
227 228
}

229 230
/*
 * Allocate a zeroed symbol called @name that starts at @start and covers
 * @len bytes (->end is inclusive; with a zero @len, ->end equals ->start).
 *
 * A single allocation holds symbol_conf.priv_size bytes, then the struct
 * symbol, then the name.  The returned pointer is the struct symbol, i.e.
 * it points priv_size bytes past the beginning of the allocation, which is
 * why symbol__delete() has to be used to release it.
 *
 * Returns NULL when the allocation fails.
 */
static struct symbol *symbol__new(u64 start, u64 len, u8 binding,
				  const char *name)
{
	const size_t namelen = strlen(name) + 1;	/* with the final NUL */
	struct symbol *sym;
	void *area = calloc(1, (symbol_conf.priv_size +
				sizeof(*sym) + namelen));

	if (area == NULL)
		return NULL;

	/* skip the private area */
	sym = area + symbol_conf.priv_size;

	sym->start = start;
	if (len)
		sym->end = start + len - 1;
	else
		sym->end = start;
	sym->binding = binding;
	sym->namelen = namelen - 1;

	pr_debug4("%s: %s %#" PRIx64 "-%#" PRIx64 "\n",
		  __func__, name, start, sym->end);
	memcpy(sym->name, name, namelen);

	return sym;
}

253
void symbol__delete(struct symbol *sym)
254
{
255
	free(((void *)sym) - symbol_conf.priv_size);
256 257
}

258
static size_t symbol__fprintf(struct symbol *sym, FILE *fp)
259
{
260
	return fprintf(fp, " %" PRIx64 "-%" PRIx64 " %c %s\n",
261 262 263 264
		       sym->start, sym->end,
		       sym->binding == STB_GLOBAL ? 'g' :
		       sym->binding == STB_LOCAL  ? 'l' : 'w',
		       sym->name);
265 266
}

267
void dso__set_long_name(struct dso *dso, char *name)
268
{
269 270
	if (name == NULL)
		return;
271 272
	dso->long_name = name;
	dso->long_name_len = strlen(name);
273 274
}

275
static void dso__set_short_name(struct dso *dso, const char *name)
276 277 278
{
	if (name == NULL)
		return;
279 280
	dso->short_name = name;
	dso->short_name_len = strlen(name);
281 282
}

283
static void dso__set_basename(struct dso *dso)
284
{
285
	dso__set_short_name(dso, basename(dso->long_name));
286 287
}

288
struct dso *dso__new(const char *name)
289
{
290
	struct dso *dso = calloc(1, sizeof(*dso) + strlen(name) + 1);
291

292
	if (dso != NULL) {
293
		int i;
294 295 296
		strcpy(dso->name, name);
		dso__set_long_name(dso, dso->name);
		dso__set_short_name(dso, dso->name);
297
		for (i = 0; i < MAP__NR_TYPES; ++i)
298 299 300 301 302 303 304
			dso->symbols[i] = dso->symbol_names[i] = RB_ROOT;
		dso->symtab_type = SYMTAB__NOT_FOUND;
		dso->loaded = 0;
		dso->sorted_by_name = 0;
		dso->has_build_id = 0;
		dso->kernel = DSO_TYPE_USER;
		INIT_LIST_HEAD(&dso->node);
305 306
	}

307
	return dso;
308 309
}

310
static void symbols__delete(struct rb_root *symbols)
311 312
{
	struct symbol *pos;
313
	struct rb_node *next = rb_first(symbols);
314 315 316 317

	while (next) {
		pos = rb_entry(next, struct symbol, rb_node);
		next = rb_next(&pos->rb_node);
318
		rb_erase(&pos->rb_node, symbols);
319
		symbol__delete(pos);
320 321 322
	}
}

323
void dso__delete(struct dso *dso)
324
{
325 326
	int i;
	for (i = 0; i < MAP__NR_TYPES; ++i)
327 328 329 330 331 332
		symbols__delete(&dso->symbols[i]);
	if (dso->sname_alloc)
		free((char *)dso->short_name);
	if (dso->lname_alloc)
		free(dso->long_name);
	free(dso);
333 334
}

335
void dso__set_build_id(struct dso *dso, void *build_id)
336
{
337 338
	memcpy(dso->build_id, build_id, sizeof(dso->build_id));
	dso->has_build_id = 1;
339 340
}

341
static void symbols__insert(struct rb_root *symbols, struct symbol *sym)
342
{
343
	struct rb_node **p = &symbols->rb_node;
344
	struct rb_node *parent = NULL;
345
	const u64 ip = sym->start;
346 347 348 349 350 351 352 353 354 355 356
	struct symbol *s;

	while (*p != NULL) {
		parent = *p;
		s = rb_entry(parent, struct symbol, rb_node);
		if (ip < s->start)
			p = &(*p)->rb_left;
		else
			p = &(*p)->rb_right;
	}
	rb_link_node(&sym->rb_node, parent, p);
357
	rb_insert_color(&sym->rb_node, symbols);
358 359
}

360
/*
 * Look up in @symbols the symbol whose [start, end] range contains @ip.
 * Returns NULL when there is none or when @symbols is NULL.
 */
static struct symbol *symbols__find(struct rb_root *symbols, u64 ip)
{
	struct rb_node *n = symbols ? symbols->rb_node : NULL;

	while (n != NULL) {
		struct symbol *s = rb_entry(n, struct symbol, rb_node);

		if (ip < s->start) {
			n = n->rb_left;
			continue;
		}
		if (ip > s->end) {
			n = n->rb_right;
			continue;
		}
		return s;
	}

	return NULL;
}

383 384 385 386 387
/*
 * Node of a tree of symbols ordered by name.  symbols__insert_by_name()
 * obtains it from a struct symbol pointer with container_of(), so every
 * symbol inserted there has to be the 'sym' member of such a node.
 * NOTE(review): presumably the rb_node lives in the symbol_conf.priv_size
 * bytes that symbol__new() reserves in front of each symbol -- confirm.
 */
struct symbol_name_rb_node {
	struct rb_node	rb_node;
	struct symbol	sym;
};

388
static void symbols__insert_by_name(struct rb_root *symbols, struct symbol *sym)
389
{
390
	struct rb_node **p = &symbols->rb_node;
391
	struct rb_node *parent = NULL;
392 393 394
	struct symbol_name_rb_node *symn, *s;

	symn = container_of(sym, struct symbol_name_rb_node, sym);
395 396 397 398 399 400 401 402 403 404

	while (*p != NULL) {
		parent = *p;
		s = rb_entry(parent, struct symbol_name_rb_node, rb_node);
		if (strcmp(sym->name, s->sym.name) < 0)
			p = &(*p)->rb_left;
		else
			p = &(*p)->rb_right;
	}
	rb_link_node(&symn->rb_node, parent, p);
405
	rb_insert_color(&symn->rb_node, symbols);
406 407
}

408 409
static void symbols__sort_by_name(struct rb_root *symbols,
				  struct rb_root *source)
410 411 412 413 414
{
	struct rb_node *nd;

	for (nd = rb_first(source); nd; nd = rb_next(nd)) {
		struct symbol *pos = rb_entry(nd, struct symbol, rb_node);
415
		symbols__insert_by_name(symbols, pos);
416 417 418
	}
}

419 420
static struct symbol *symbols__find_by_name(struct rb_root *symbols,
					    const char *name)
421 422 423
{
	struct rb_node *n;

424
	if (symbols == NULL)
425 426
		return NULL;

427
	n = symbols->rb_node;
428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446

	while (n) {
		struct symbol_name_rb_node *s;
		int cmp;

		s = rb_entry(n, struct symbol_name_rb_node, rb_node);
		cmp = strcmp(name, s->sym.name);

		if (cmp < 0)
			n = n->rb_left;
		else if (cmp > 0)
			n = n->rb_right;
		else
			return &s->sym;
	}

	return NULL;
}

447
/* Find, among the symbols of @type in @dso, the one that contains @addr. */
struct symbol *dso__find_symbol(struct dso *dso,
				enum map_type type, u64 addr)
{
	struct rb_root *symbols = &dso->symbols[type];

	return symbols__find(symbols, addr);
}

453
struct symbol *dso__find_symbol_by_name(struct dso *dso, enum map_type type,
454 455
					const char *name)
{
456
	return symbols__find_by_name(&dso->symbol_names[type], name);
457 458
}

459
void dso__sort_by_name(struct dso *dso, enum map_type type)
460
{
461 462 463
	dso__set_sorted_by_name(dso, type);
	return symbols__sort_by_name(&dso->symbol_names[type],
				     &dso->symbols[type]);
464 465
}

466
/*
 * Format @len bytes of @build_id as lowercase hexadecimal into @bf.
 *
 * @bf must have room for 2 * @len + 1 characters.  It always ends up NUL
 * terminated, including when @len is zero or negative, in which case it
 * holds the empty string.
 *
 * Returns the number of build-id bytes that were formatted.
 */
int build_id__sprintf(const u8 *build_id, int len, char *bf)
{
	char *bid = bf;
	const u8 *raw = build_id;
	int i;

	/* sprintf() below never runs when there is nothing to format */
	*bid = '\0';

	for (i = 0; i < len; ++i) {
		sprintf(bid, "%02x", *raw);
		++raw;
		bid += 2;
	}

	return raw - build_id;
}

481
size_t dso__fprintf_buildid(struct dso *dso, FILE *fp)
482 483 484
{
	char sbuild_id[BUILD_ID_SIZE * 2 + 1];

485
	build_id__sprintf(dso->build_id, sizeof(dso->build_id), sbuild_id);
486 487 488
	return fprintf(fp, "%s", sbuild_id);
}

489 490
size_t dso__fprintf_symbols_by_name(struct dso *dso,
				    enum map_type type, FILE *fp)
491 492 493 494 495
{
	size_t ret = 0;
	struct rb_node *nd;
	struct symbol_name_rb_node *pos;

496
	for (nd = rb_first(&dso->symbol_names[type]); nd; nd = rb_next(nd)) {
497 498 499 500 501 502 503
		pos = rb_entry(nd, struct symbol_name_rb_node, rb_node);
		fprintf(fp, "%s\n", pos->sym.name);
	}

	return ret;
}

504
size_t dso__fprintf(struct dso *dso, enum map_type type, FILE *fp)
505 506
{
	struct rb_node *nd;
507
	size_t ret = fprintf(fp, "dso: %s (", dso->short_name);
508

509 510
	if (dso->short_name != dso->long_name)
		ret += fprintf(fp, "%s, ", dso->long_name);
511
	ret += fprintf(fp, "%s, %sloaded, ", map_type__name[type],
512 513
		       dso->loaded ? "" : "NOT ");
	ret += dso__fprintf_buildid(dso, fp);
514
	ret += fprintf(fp, ")\n");
515
	for (nd = rb_first(&dso->symbols[type]); nd; nd = rb_next(nd)) {
516 517
		struct symbol *pos = rb_entry(nd, struct symbol, rb_node);
		ret += symbol__fprintf(pos, fp);
518 519 520 521 522
	}

	return ret;
}

523 524
/*
 * Read @filename line by line and call @process_symbol for each symbol.
 *
 * A line is taken to be a hexadecimal address, one separator character,
 * one type character, one separator character and the symbol name.  Lines
 * too short for that are skipped.
 *
 * @arg is passed through untouched to @process_symbol.
 *
 * Returns 0 on success, -1 when the file cannot be opened or a name is
 * KSYM_NAME_LEN characters or longer, or the first non-zero value returned
 * by @process_symbol, which also stops the parsing.
 */
int kallsyms__parse(const char *filename, void *arg,
		    int (*process_symbol)(void *arg, const char *name,
					  char type, u64 start, u64 end))
{
	char *line = NULL;
	size_t n;
	int err = 0;
	FILE *file = fopen(filename, "r");

	if (file == NULL)
		return -1;

	while (!feof(file)) {
		u64 start;
		int line_len, pos, name_len;
		char symbol_type;
		char *symbol_name;

		line_len = getline(&line, &n, file);
		if (line_len < 0 || !line)
			break;

		line[--line_len] = '\0'; /* \n */

		/* address, then skip the separator that follows it */
		pos = hex2u64(line, &start) + 1;
		if (pos + 2 >= line_len)
			continue;

		symbol_type = line[pos];
		/* type character and the separator that follows it */
		pos += 2;
		symbol_name = line + pos;
		name_len = line_len - pos;

		if (name_len >= KSYM_NAME_LEN) {
			err = -1;
			break;
		}

		/*
		 * module symbols are not sorted so we add all
		 * symbols with zero length and rely on
		 * symbols__fixup_end() to fix it up.
		 */
		err = process_symbol(arg, symbol_name,
				     symbol_type, start, start);
		if (err)
			break;
	}

	free(line);
	fclose(file);
	return err;
}

584 585 586 587 588
/*
 * Context that dso__load_all_kallsyms() hands to
 * map__process_kallsym_symbol() through the opaque argument of
 * kallsyms__parse().
 */
struct process_kallsyms_args {
	struct map *map;	/* map->type selects which symbols are kept */
	struct dso *dso;	/* symbols go into dso->symbols[map->type] */
};

589 590 591 592 593 594 595 596
/*
 * Translate a kallsyms type letter into an ELF symbol binding: 'W' is
 * STB_WEAK, any other uppercase letter is STB_GLOBAL, everything else is
 * STB_LOCAL.
 */
static u8 kallsyms2elf_type(char type)
{
	if (type == 'W')
		return STB_WEAK;

	/* <ctype.h> functions must not be given a negative plain char */
	return isupper((unsigned char)type) ? STB_GLOBAL : STB_LOCAL;
}

597
/*
 * kallsyms__parse() callback: when @type matches the type of the map in
 * @arg (a struct process_kallsyms_args), create a symbol for the
 * [@start, @end] range and insert it into the symbols of the dso in @arg.
 *
 * Returns 0, or -ENOMEM when the symbol cannot be allocated.
 */
static int map__process_kallsym_symbol(void *arg, const char *name,
				       char type, u64 start, u64 end)
{
	struct process_kallsyms_args *a = arg;
	struct symbol *sym;

	if (!symbol_type__is_a(type, a->map->type))
		return 0;

	sym = symbol__new(start, end - start + 1,
			  kallsyms2elf_type(type), name);
	if (sym == NULL)
		return -ENOMEM;

	/*
	 * We will pass the symbols to the filter later, in
	 * map__split_kallsyms, when we have split the maps per module
	 */
	symbols__insert(&a->dso->symbols[a->map->type], sym);

	return 0;
}

/*
 * Loads the function entries in /proc/kallsyms into kernel_map->dso,
 * so that we can in the next step set the symbol ->end address and then
 * call kernel_maps__split_kallsyms.
 */
625
static int dso__load_all_kallsyms(struct dso *dso, const char *filename,
626
				  struct map *map)
627
{
628
	struct process_kallsyms_args args = { .map = map, .dso = dso, };
629
	return kallsyms__parse(filename, &args, map__process_kallsym_symbol);
630 631
}

632 633 634 635 636
/*
 * Split the symbols into maps, making sure there are no overlaps, i.e. the
 * kernel range is broken in several maps, named [kernel].N, as we don't have
 * the original ELF section names vmlinux have.
 */
637
static int dso__split_kallsyms(struct dso *dso, struct map *map,
638
			       symbol_filter_t filter)
639
{
640
	struct map_groups *kmaps = map__kmap(map)->kmaps;
641
	struct machine *machine = kmaps->machine;
642
	struct map *curr_map = map;
643
	struct symbol *pos;
644
	int count = 0, moved = 0;	
645
	struct rb_root *root = &dso->symbols[map->type];
646
	struct rb_node *next = rb_first(root);
647 648 649 650 651 652 653 654 655 656
	int kernel_range = 0;

	while (next) {
		char *module;

		pos = rb_entry(next, struct symbol, rb_node);
		next = rb_next(&pos->rb_node);

		module = strchr(pos->name, '\t');
		if (module) {
657
			if (!symbol_conf.use_modules)
658 659
				goto discard_symbol;

660 661
			*module++ = '\0';

662
			if (strcmp(curr_map->dso->short_name, module)) {
663
				if (curr_map != map &&
664
				    dso->kernel == DSO_TYPE_GUEST_KERNEL &&
665
				    machine__is_default_guest(machine)) {
666 667 668 669 670 671 672 673 674 675 676 677 678
					/*
					 * We assume all symbols of a module are
					 * continuous in * kallsyms, so curr_map
					 * points to a module and all its
					 * symbols are in its kmap. Mark it as
					 * loaded.
					 */
					dso__set_loaded(curr_map->dso,
							curr_map->type);
				}

				curr_map = map_groups__find_by_name(kmaps,
							map->type, module);
679
				if (curr_map == NULL) {
680
					pr_debug("%s/proc/{kallsyms,modules} "
681
					         "inconsistency while looking "
682
						 "for \"%s\" module!\n",
683
						 machine->root_dir, module);
684 685
					curr_map = map;
					goto discard_symbol;
686
				}
687

688
				if (curr_map->dso->loaded &&
689
				    !machine__is_default_guest(machine))
690
					goto discard_symbol;
691
			}
692 693 694 695
			/*
			 * So that we look just like we get from .ko files,
			 * i.e. not prelinked, relative to map->start.
			 */
696 697 698
			pos->start = curr_map->map_ip(curr_map, pos->start);
			pos->end   = curr_map->map_ip(curr_map, pos->end);
		} else if (curr_map != map) {
699
			char dso_name[PATH_MAX];
700
			struct dso *ndso;
701

702 703 704 705 706
			if (count == 0) {
				curr_map = map;
				goto filter_symbol;
			}

707
			if (dso->kernel == DSO_TYPE_GUEST_KERNEL)
708 709 710 711 712 713 714
				snprintf(dso_name, sizeof(dso_name),
					"[guest.kernel].%d",
					kernel_range++);
			else
				snprintf(dso_name, sizeof(dso_name),
					"[kernel].%d",
					kernel_range++);
715

716 717
			ndso = dso__new(dso_name);
			if (ndso == NULL)
718 719
				return -1;

720
			ndso->kernel = dso->kernel;
721

722
			curr_map = map__new2(pos->start, ndso, map->type);
723
			if (curr_map == NULL) {
724
				dso__delete(ndso);
725 726
				return -1;
			}
727

728
			curr_map->map_ip = curr_map->unmap_ip = identity__map_ip;
729
			map_groups__insert(kmaps, curr_map);
730 731
			++kernel_range;
		}
732
filter_symbol:
733
		if (filter && filter(curr_map, pos)) {
734
discard_symbol:		rb_erase(&pos->rb_node, root);
735
			symbol__delete(pos);
736
		} else {
737 738 739
			if (curr_map != map) {
				rb_erase(&pos->rb_node, root);
				symbols__insert(&curr_map->dso->symbols[curr_map->type], pos);
740 741 742
				++moved;
			} else
				++count;
743
		}
744 745
	}

746
	if (curr_map != map &&
747
	    dso->kernel == DSO_TYPE_GUEST_KERNEL &&
748
	    machine__is_default_guest(kmaps->machine)) {
749 750 751
		dso__set_loaded(curr_map->dso, curr_map->type);
	}

752
	return count + moved;
753
}
754

755 756 757 758 759 760 761 762 763 764 765 766 767 768 769 770 771 772
/*
 * Tell whether @filename resolves, through realpath(), to
 * @restricted_filename while symbol_conf.kptr_restrict is set.  Returns
 * false when kptr_restrict is not set or when realpath() fails.
 */
static bool symbol__restricted_filename(const char *filename,
					const char *restricted_filename)
{
	char *resolved;
	bool restricted;

	if (!symbol_conf.kptr_restrict)
		return false;

	resolved = realpath(filename, NULL);
	if (resolved == NULL)
		return false;

	restricted = strcmp(resolved, restricted_filename) == 0;
	free(resolved);

	return restricted;
}

773
/*
 * Load the symbols of @dso from the kallsyms file @filename: parse the
 * file, drop duplicates, fix up the symbol ends, record the symtab type
 * and finally split the symbols into maps.
 *
 * Returns -1 when @filename is restricted (see
 * symbol__restricted_filename()) or cannot be loaded, else whatever
 * dso__split_kallsyms() returns.
 */
int dso__load_kallsyms(struct dso *dso, const char *filename,
		       struct map *map, symbol_filter_t filter)
{
	struct rb_root *symbols;

	if (symbol__restricted_filename(filename, "/proc/kallsyms"))
		return -1;

	if (dso__load_all_kallsyms(dso, filename, map) < 0)
		return -1;

	symbols = &dso->symbols[map->type];
	symbols__fixup_duplicate(symbols);
	symbols__fixup_end(symbols);

	dso->symtab_type = dso->kernel == DSO_TYPE_GUEST_KERNEL ?
			   SYMTAB__GUEST_KALLSYMS : SYMTAB__KALLSYMS;

	return dso__split_kallsyms(dso, map, filter);
}

793
static int dso__load_perf_map(struct dso *dso, struct map *map,
794
			      symbol_filter_t filter)
795 796 797 798 799 800
{
	char *line = NULL;
	size_t n;
	FILE *file;
	int nr_syms = 0;

801
	file = fopen(dso->long_name, "r");
802 803 804 805
	if (file == NULL)
		goto out_failure;

	while (!feof(file)) {
806
		u64 start, size;
807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826 827 828 829 830
		struct symbol *sym;
		int line_len, len;

		line_len = getline(&line, &n, file);
		if (line_len < 0)
			break;

		if (!line)
			goto out_failure;

		line[--line_len] = '\0'; /* \n */

		len = hex2u64(line, &start);

		len++;
		if (len + 2 >= line_len)
			continue;

		len += hex2u64(line + len, &size);

		len++;
		if (len + 2 >= line_len)
			continue;

831
		sym = symbol__new(start, size, STB_GLOBAL, line + len);
832 833 834 835

		if (sym == NULL)
			goto out_delete_line;

836
		if (filter && filter(map, sym))
837
			symbol__delete(sym);
838
		else {
839
			symbols__insert(&dso->symbols[map->type], sym);
840 841 842 843 844 845 846 847 848 849 850 851 852 853 854
			nr_syms++;
		}
	}

	free(line);
	fclose(file);

	return nr_syms;

out_delete_line:
	free(line);
out_failure:
	return -1;
}

855 856 857
/**
 * elf_symtab__for_each_symbol - iterate thru all the symbols
 *
 * @syms: symbol table data, handed to gelf_getsym()
 * @nr_syms: number of symbols to visit, @idx goes from 0 to @nr_syms - 1
 * @idx: uint32_t idx
 * @sym: GElf_Sym iterator, filled by gelf_getsym() for each @idx
 */
#define elf_symtab__for_each_symbol(syms, nr_syms, idx, sym) \
	for (idx = 0, gelf_getsym(syms, idx, &sym);\
	     idx < (nr_syms); \
	     idx++, gelf_getsym(syms, idx, &sym))
866 867 868 869 870 871 872 873 874 875

/* Symbol type (STT_*) extracted from the st_info field of @sym. */
static inline uint8_t elf_sym__type(const GElf_Sym *sym)
{
	const uint8_t type = GELF_ST_TYPE(sym->st_info);

	return type;
}

static inline int elf_sym__is_function(const GElf_Sym *sym)
{
	return elf_sym__type(sym) == STT_FUNC &&
	       sym->st_name != 0 &&
876
	       sym->st_shndx != SHN_UNDEF;
877 878
}

879 880 881 882 883 884 885
/* True when @sym is a named STT_OBJECT symbol that is not undefined. */
static inline bool elf_sym__is_object(const GElf_Sym *sym)
{
	if (elf_sym__type(sym) != STT_OBJECT)
		return false;

	return sym->st_name != 0 && sym->st_shndx != SHN_UNDEF;
}

886 887 888 889 890 891 892 893 894 895 896 897 898 899 900 901 902 903 904 905
/*
 * Non-zero when @sym is a named STT_NOTYPE symbol that is neither
 * undefined nor absolute.
 */
static inline int elf_sym__is_label(const GElf_Sym *sym)
{
	if (elf_sym__type(sym) != STT_NOTYPE || sym->st_name == 0)
		return 0;

	return sym->st_shndx != SHN_UNDEF && sym->st_shndx != SHN_ABS;
}

/* Name of section @shdr: the string at offset sh_name inside @secstrs. */
static inline const char *elf_sec__name(const GElf_Shdr *shdr,
					const Elf_Data *secstrs)
{
	const char *name = secstrs->d_buf + shdr->sh_name;

	return name;
}

/* Non-zero when the name of section @shdr contains "text". */
static inline int elf_sec__is_text(const GElf_Shdr *shdr,
					const Elf_Data *secstrs)
{
	const char *sec_name = elf_sec__name(shdr, secstrs);

	return strstr(sec_name, "text") != NULL;
}

906 907 908 909 910 911
/* True when the name of section @shdr contains "data". */
static inline bool elf_sec__is_data(const GElf_Shdr *shdr,
				    const Elf_Data *secstrs)
{
	const char *sec_name = elf_sec__name(shdr, secstrs);

	return strstr(sec_name, "data") != NULL;
}

912 913 914 915 916 917 918 919
/* Name of symbol @sym: the string at offset st_name inside @symstrs. */
static inline const char *elf_sym__name(const GElf_Sym *sym,
					const Elf_Data *symstrs)
{
	const char *name = symstrs->d_buf + sym->st_name;

	return name;
}

/*
 * Find the section of @elf called @name.
 *
 * @ep:  ELF header of @elf, its e_shstrndx locates the section names
 * @shp: filled with the header of each section visited, so on success it
 *       holds the header of the section found
 * @idx: when not NULL, receives the 1-based position of the section found
 *       in the elf_nextscn() iteration
 *
 * Returns the section, or NULL when no section has that name.  Sections
 * whose name cannot be retrieved are skipped.
 */
static Elf_Scn *elf_section_by_name(Elf *elf, GElf_Ehdr *ep,
				    GElf_Shdr *shp, const char *name,
				    size_t *idx)
{
	Elf_Scn *sec = NULL;
	size_t cnt = 1;

	while ((sec = elf_nextscn(elf, sec)) != NULL) {
		char *str;

		gelf_getshdr(sec, shp);
		str = elf_strptr(elf, ep->e_shstrndx, shp->sh_name);
		/* elf_strptr() returns NULL on error, never strcmp() that */
		if (str && !strcmp(name, str)) {
			if (idx)
				*idx = cnt;
			break;
		}
		++cnt;
	}

	return sec;
}

941 942 943 944 945 946 947 948 949 950
/*
 * Iterate over the @nr_entries relocation entries of @reldata: for each
 * @idx, @pos is set to what gelf_getrel()/gelf_getrela() returns when asked
 * to read entry @idx into @pos_mem.
 */
#define elf_section__for_each_rel(reldata, pos, pos_mem, idx, nr_entries) \
	for (idx = 0, pos = gelf_getrel(reldata, 0, &pos_mem); \
	     idx < nr_entries; \
	     ++idx, pos = gelf_getrel(reldata, idx, &pos_mem))

#define elf_section__for_each_rela(reldata, pos, pos_mem, idx, nr_entries) \
	for (idx = 0, pos = gelf_getrela(reldata, 0, &pos_mem); \
	     idx < nr_entries; \
	     ++idx, pos = gelf_getrela(reldata, idx, &pos_mem))

951 952 953 954 955 956 957
/*
 * We need to check if we have a .dynsym, so that we can handle the
 * .plt, synthesizing its symbols, that aren't on the symtabs (be it
 * .dynsym or .symtab).
 * And always look at the original dso, not at debuginfo packages, that
 * have the PLT data stripped out (shdr_rel_plt.sh_type == SHT_NOBITS).
 */
958
static int dso__synthesize_plt_symbols(struct  dso *dso, struct map *map,
959
				       symbol_filter_t filter)
960 961 962
{
	uint32_t nr_rel_entries, idx;
	GElf_Sym sym;
963
	u64 plt_offset;
964 965
	GElf_Shdr shdr_plt;
	struct symbol *f;
966
	GElf_Shdr shdr_rel_plt, shdr_dynsym;
967
	Elf_Data *reldata, *syms, *symstrs;
968 969 970
	Elf_Scn *scn_plt_rel, *scn_symstrs, *scn_dynsym;
	size_t dynsym_idx;
	GElf_Ehdr ehdr;
971
	char sympltname[1024];
972 973
	Elf *elf;
	int nr = 0, symidx, fd, err = 0;
974
	char name[PATH_MAX];
975

976
	snprintf(name, sizeof(name), "%s%s",
977
		 symbol_conf.symfs, dso->long_name);
978
	fd = open(name, O_RDONLY);
979 980 981
	if (fd < 0)
		goto out;

982
	elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
983 984 985 986 987 988 989 990 991 992
	if (elf == NULL)
		goto out_close;

	if (gelf_getehdr(elf, &ehdr) == NULL)
		goto out_elf_end;

	scn_dynsym = elf_section_by_name(elf, &ehdr, &shdr_dynsym,
					 ".dynsym", &dynsym_idx);
	if (scn_dynsym == NULL)
		goto out_elf_end;
993

994
	scn_plt_rel = elf_section_by_name(elf, &ehdr, &shdr_rel_plt,
995 996
					  ".rela.plt", NULL);
	if (scn_plt_rel == NULL) {
997
		scn_plt_rel = elf_section_by_name(elf, &ehdr, &shdr_rel_plt,
998 999
						  ".rel.plt", NULL);
		if (scn_plt_rel == NULL)
1000
			goto out_elf_end;
1001 1002
	}

1003 1004
	err = -1;

1005
	if (shdr_rel_plt.sh_link != dynsym_idx)
1006
		goto out_elf_end;
1007

1008 1009
	if (elf_section_by_name(elf, &ehdr, &shdr_plt, ".plt", NULL) == NULL)
		goto out_elf_end;
1010 1011

	/*
1012
	 * Fetch the relocation section to find the idxes to the GOT
1013 1014 1015 1016
	 * and the symbols in the .dynsym they refer to.
	 */
	reldata = elf_getdata(scn_plt_rel, NULL);
	if (reldata == NULL)
1017
		goto out_elf_end;
1018 1019 1020

	syms = elf_getdata(scn_dynsym, NULL);
	if (syms == NULL)
1021
		goto out_elf_end;
1022

1023
	scn_symstrs = elf_getscn(elf, shdr_dynsym.sh_link);
1024
	if (scn_symstrs == NULL)
1025
		goto out_elf_end;
1026 1027 1028

	symstrs = elf_getdata(scn_symstrs, NULL);
	if (symstrs == NULL)
1029
		goto out_elf_end;
1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045

	nr_rel_entries = shdr_rel_plt.sh_size / shdr_rel_plt.sh_entsize;
	plt_offset = shdr_plt.sh_offset;

	if (shdr_rel_plt.sh_type == SHT_RELA) {
		GElf_Rela pos_mem, *pos;

		elf_section__for_each_rela(reldata, pos, pos_mem, idx,
					   nr_rel_entries) {
			symidx = GELF_R_SYM(pos->r_info);
			plt_offset += shdr_plt.sh_entsize;
			gelf_getsym(syms, symidx, &sym);
			snprintf(sympltname, sizeof(sympltname),
				 "%s@plt", elf_sym__name(&sym, symstrs));

			f = symbol__new(plt_offset, shdr_plt.sh_entsize,
1046
					STB_GLOBAL, sympltname);
1047
			if (!f)
1048
				goto out_elf_end;
1049

1050 1051 1052
			if (filter && filter(map, f))
				symbol__delete(f);
			else {
1053
				symbols__insert(&dso->symbols[map->type], f);
1054 1055
				++nr;
			}
1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067
		}
	} else if (shdr_rel_plt.sh_type == SHT_REL) {
		GElf_Rel pos_mem, *pos;
		elf_section__for_each_rel(reldata, pos, pos_mem, idx,
					  nr_rel_entries) {
			symidx = GELF_R_SYM(pos->r_info);
			plt_offset += shdr_plt.sh_entsize;
			gelf_getsym(syms, symidx, &sym);
			snprintf(sympltname, sizeof(sympltname),
				 "%s@plt", elf_sym__name(&sym, symstrs));

			f = symbol__new(plt_offset, shdr_plt.sh_entsize,
1068
					STB_GLOBAL, sympltname);
1069
			if (!f)
1070
				goto out_elf_end;
1071

1072 1073 1074
			if (filter && filter(map, f))
				symbol__delete(f);
			else {
1075
				symbols__insert(&dso->symbols[map->type], f);
1076 1077
				++nr;
			}
1078 1079 1080
		}
	}

1081 1082 1083 1084 1085 1086 1087 1088 1089
	err = 0;
out_elf_end:
	elf_end(elf);
out_close:
	close(fd);

	if (err == 0)
		return nr;
out:
1090
	pr_debug("%s: problems reading %s PLT info.\n",
1091
		 __func__, dso->long_name);
1092
	return 0;
1093 1094
}

1095
/*
 * Tell whether @sym is of the kind stored in maps of @type: functions for
 * MAP__FUNCTION, objects for MAP__VARIABLE, nothing for any other type.
 */
static bool elf_sym__is_a(GElf_Sym *sym, enum map_type type)
{
	if (type == MAP__FUNCTION)
		return elf_sym__is_function(sym);

	if (type == MAP__VARIABLE)
		return elf_sym__is_object(sym);

	return false;
}

1107 1108
/*
 * Tell whether section @shdr is of the kind that matches maps of @type:
 * text sections for MAP__FUNCTION, data sections for MAP__VARIABLE,
 * nothing for any other type.
 */
static bool elf_sec__is_a(GElf_Shdr *shdr, Elf_Data *secstrs,
			  enum map_type type)
{
	if (type == MAP__FUNCTION)
		return elf_sec__is_text(shdr, secstrs);

	if (type == MAP__VARIABLE)
		return elf_sec__is_data(shdr, secstrs);

	return false;
}

1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138
/*
 * Find the section of @elf whose [sh_addr, sh_addr + sh_size) range holds
 * @addr.  Returns its 1-based position in the elf_nextscn() iteration, or
 * (size_t)-1 when no section matches.
 */
static size_t elf_addr_to_index(Elf *elf, GElf_Addr addr)
{
	Elf_Scn *sec = NULL;
	GElf_Shdr shdr;
	size_t cnt;

	for (cnt = 1; (sec = elf_nextscn(elf, sec)) != NULL; ++cnt) {
		gelf_getshdr(sec, &shdr);

		if (addr < shdr.sh_addr)
			continue;

		if (addr < (shdr.sh_addr + shdr.sh_size))
			return cnt;
	}

	return -1;
}

1139
/*
 * Load the symbols found in the ELF image open on @fd into @dso.
 *
 * @name is only used in debug messages.  @filter, when set, may reject
 * individual symbols.  When @want_symtab is non-zero only a ".symtab"
 * section is accepted; otherwise ".dynsym" is used as a fallback.  For
 * kernel dsos (or when @kmodule is non-zero) symbols living outside ".text"
 * are routed to per-section maps/dsos that are created on demand.
 *
 * Returns the number of symbols inserted, or -1 on error.  The caller keeps
 * ownership of @fd; it is not closed here.
 *
 * Malformed images are rejected rather than crashing: a zero sh_entsize,
 * an unreadable ".opd" section, and ".opd" descriptors lying outside the
 * section data are all handled explicitly.
 */
static int dso__load_sym(struct dso *dso, struct map *map, const char *name,
			 int fd, symbol_filter_t filter, int kmodule,
			 int want_symtab)
{
	struct kmap *kmap = dso->kernel ? map__kmap(map) : NULL;
	struct map *curr_map = map;
	struct dso *curr_dso = dso;
	Elf_Data *symstrs, *secstrs;
	uint32_t nr_syms;
	int err = -1;
	uint32_t idx;
	GElf_Ehdr ehdr;
	GElf_Shdr shdr, opdshdr;
	Elf_Data *syms, *opddata = NULL;
	GElf_Sym sym;
	Elf_Scn *sec, *sec_strndx, *opdsec;
	Elf *elf;
	int nr = 0;
	size_t opdidx = 0;

	elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
	if (elf == NULL) {
		pr_debug("%s: cannot read %s ELF file.\n", __func__, name);
		goto out_close;
	}

	if (gelf_getehdr(elf, &ehdr) == NULL) {
		pr_debug("%s: cannot get elf header.\n", __func__);
		goto out_elf_end;
	}

	/* Always reject images with a mismatched build-id: */
	if (dso->has_build_id) {
		u8 build_id[BUILD_ID_SIZE];

		if (elf_read_build_id(elf, build_id, BUILD_ID_SIZE) < 0)
			goto out_elf_end;

		if (!dso__build_id_equal(dso, build_id))
			goto out_elf_end;
	}

	sec = elf_section_by_name(elf, &ehdr, &shdr, ".symtab", NULL);
	if (sec == NULL) {
		if (want_symtab)
			goto out_elf_end;

		sec = elf_section_by_name(elf, &ehdr, &shdr, ".dynsym", NULL);
		if (sec == NULL)
			goto out_elf_end;
	}

	/* Only look at opdshdr when the ".opd" lookup actually succeeded. */
	opdsec = elf_section_by_name(elf, &ehdr, &opdshdr, ".opd", &opdidx);
	if (opdsec && opdshdr.sh_type != SHT_PROGBITS)
		opdsec = NULL;
	if (opdsec) {
		opddata = elf_rawdata(opdsec, NULL);
		/* Descriptors cannot be resolved without the section data. */
		if (opddata == NULL)
			goto out_elf_end;
	}

	syms = elf_getdata(sec, NULL);
	if (syms == NULL)
		goto out_elf_end;

	sec = elf_getscn(elf, shdr.sh_link);
	if (sec == NULL)
		goto out_elf_end;

	symstrs = elf_getdata(sec, NULL);
	if (symstrs == NULL)
		goto out_elf_end;

	sec_strndx = elf_getscn(elf, ehdr.e_shstrndx);
	if (sec_strndx == NULL)
		goto out_elf_end;

	secstrs = elf_getdata(sec_strndx, NULL);
	if (secstrs == NULL)
		goto out_elf_end;

	/* A zero entry size would make the division below trap. */
	if (shdr.sh_entsize == 0)
		goto out_elf_end;

	nr_syms = shdr.sh_size / shdr.sh_entsize;

	memset(&sym, 0, sizeof(sym));
	if (dso->kernel == DSO_TYPE_USER) {
		dso->adjust_symbols = (ehdr.e_type == ET_EXEC ||
				elf_section_by_name(elf, &ehdr, &shdr,
						     ".gnu.prelink_undo",
						     NULL) != NULL);
	} else {
		dso->adjust_symbols = 0;
	}
	elf_symtab__for_each_symbol(syms, nr_syms, idx, sym) {
		struct symbol *f;
		const char *elf_name = elf_sym__name(&sym, symstrs);
		char *demangled = NULL;
		int is_label = elf_sym__is_label(&sym);
		const char *section_name;

		if (kmap && kmap->ref_reloc_sym && kmap->ref_reloc_sym->name &&
		    strcmp(elf_name, kmap->ref_reloc_sym->name) == 0)
			kmap->ref_reloc_sym->unrelocated_addr = sym.st_value;

		if (!is_label && !elf_sym__is_a(&sym, map->type))
			continue;

		/* Reject ARM ELF "mapping symbols": these aren't unique and
		 * don't identify functions, so will confuse the profile
		 * output: */
		if (ehdr.e_machine == EM_ARM) {
			if (!strcmp(elf_name, "$a") ||
			    !strcmp(elf_name, "$d") ||
			    !strcmp(elf_name, "$t"))
				continue;
		}

		/*
		 * Symbols in ".opd" hold the address of a descriptor whose
		 * first 64-bit word is the real address: translate them.
		 */
		if (opdsec && sym.st_shndx == opdidx) {
			u32 offset = sym.st_value - opdshdr.sh_addr;
			u64 *opd;

			/* Skip descriptors that lie outside the section data */
			if (opddata->d_size < sizeof(*opd) ||
			    offset > opddata->d_size - sizeof(*opd))
				continue;

			opd = opddata->d_buf + offset;
			sym.st_value = *opd;
			sym.st_shndx = elf_addr_to_index(elf, sym.st_value);
		}

		sec = elf_getscn(elf, sym.st_shndx);
		if (!sec)
			goto out_elf_end;

		gelf_getshdr(sec, &shdr);

		if (is_label && !elf_sec__is_a(&shdr, secstrs, map->type))
			continue;

		section_name = elf_sec__name(&shdr, secstrs);

		/* On ARM, symbols for thumb functions have 1 added to
		 * the symbol address as a flag - remove it */
		if ((ehdr.e_machine == EM_ARM) &&
		    (map->type == MAP__FUNCTION) &&
		    (sym.st_value & 1))
			--sym.st_value;

		if (dso->kernel != DSO_TYPE_USER || kmodule) {
			char dso_name[PATH_MAX];

			if (strcmp(section_name,
				   (curr_dso->short_name +
				    dso->short_name_len)) == 0)
				goto new_symbol;

			if (strcmp(section_name, ".text") == 0) {
				curr_map = map;
				curr_dso = dso;
				goto new_symbol;
			}

			snprintf(dso_name, sizeof(dso_name),
				 "%s%s", dso->short_name, section_name);

			/*
			 * kmap is only set for kernel dsos; a @kmodule load of
			 * a user dso has no map group to put the section in.
			 */
			if (kmap == NULL)
				goto out_elf_end;

			curr_map = map_groups__find_by_name(kmap->kmaps, map->type, dso_name);
			if (curr_map == NULL) {
				u64 start = sym.st_value;

				if (kmodule)
					start += map->start + shdr.sh_offset;

				curr_dso = dso__new(dso_name);
				if (curr_dso == NULL)
					goto out_elf_end;
				curr_dso->kernel = dso->kernel;
				curr_dso->long_name = dso->long_name;
				curr_dso->long_name_len = dso->long_name_len;
				curr_map = map__new2(start, curr_dso,
						     map->type);
				if (curr_map == NULL) {
					dso__delete(curr_dso);
					goto out_elf_end;
				}
				curr_map->map_ip = identity__map_ip;
				curr_map->unmap_ip = identity__map_ip;
				curr_dso->symtab_type = dso->symtab_type;
				map_groups__insert(kmap->kmaps, curr_map);
				dsos__add(&dso->node, curr_dso);
				dso__set_loaded(curr_dso, map->type);
			} else
				curr_dso = curr_map->dso;

			goto new_symbol;
		}

		if (curr_dso->adjust_symbols) {
			pr_debug4("%s: adjusting symbol: st_value: %#" PRIx64 " "
				  "sh_addr: %#" PRIx64 " sh_offset: %#" PRIx64 "\n", __func__,
				  (u64)sym.st_value, (u64)shdr.sh_addr,
				  (u64)shdr.sh_offset);
			sym.st_value -= shdr.sh_addr - shdr.sh_offset;
		}
		/*
		 * We need to figure out if the object was created from C++ sources
		 * DWARF DW_compile_unit has this, but we don't always have access
		 * to it...
		 */
		demangled = bfd_demangle(NULL, elf_name, DMGL_PARAMS | DMGL_ANSI);
		if (demangled != NULL)
			elf_name = demangled;
new_symbol:
		f = symbol__new(sym.st_value, sym.st_size,
				GELF_ST_BIND(sym.st_info), elf_name);
		/* demangled is still NULL when we jumped here directly */
		free(demangled);
		if (!f)
			goto out_elf_end;

		if (filter && filter(curr_map, f))
			symbol__delete(f);
		else {
			symbols__insert(&curr_dso->symbols[curr_map->type], f);
			nr++;
		}
	}

	/*
	 * For misannotated, zeroed, ASM function sizes.
	 */
	if (nr > 0) {
		symbols__fixup_duplicate(&dso->symbols[map->type]);
		symbols__fixup_end(&dso->symbols[map->type]);
		if (kmap) {
			/*
			 * We need to fixup this here too because we create new
			 * maps here, for things like vsyscall sections.
			 */
			__map_groups__fixup_end(kmap->kmaps, map->type);
		}
	}
	err = nr;
out_elf_end:
	elf_end(elf);
out_close:
	return err;
}

1376
/*
 * Compare the build-id stored in @dso with @build_id, which must hold at
 * least sizeof(dso->build_id) bytes.  Returns true when they are identical.
 */
static bool dso__build_id_equal(const struct dso *dso, u8 *build_id)
{
	const int diff = memcmp(dso->build_id, build_id,
				sizeof(dso->build_id));

	return diff == 0;
}

1381
bool __dsos__read_build_ids(struct list_head *head, bool with_hits)
1382
{
1383
	bool have_build_id = false;
1384 1385
	struct dso *pos;

1386 1387 1388
	list_for_each_entry(pos, head, node) {
		if (with_hits && !pos->hit)
			continue;
1389 1390 1391 1392
		if (pos->has_build_id) {
			have_build_id = true;
			continue;
		}
1393 1394 1395 1396 1397
		if (filename__read_build_id(pos->long_name, pos->build_id,
					    sizeof(pos->build_id)) > 0) {
			have_build_id	  = true;
			pos->has_build_id = true;
		}
1398
	}
1399

1400
	return have_build_id;
1401 1402
}

1403 1404 1405 1406 1407
/*
 * Round n up to the next multiple of 4, the alignment used for the name
 * and descriptor fields of a note.
 */
#define NOTE_ALIGN(n) (((n) + 3) & ~3U)

1408
/*
 * Extract the GNU build-id note from @elf into @bf.
 *
 * The note is looked up in ".note.gnu.build-id" first and in ".notes" as a
 * fallback.  Up to @size bytes of the descriptor are copied and the rest of
 * @bf is zero filled; @size must be at least BUILD_ID_SIZE.
 *
 * Returns the 4-byte aligned descriptor size on success, -1 when @elf is
 * not an ELF object, has no such note, or the note data is truncated.
 *
 * Every header, name and descriptor is checked against the end of the
 * section data before being read, so a malformed note cannot make us read
 * past the section.
 */
static int elf_read_build_id(Elf *elf, void *bf, size_t size)
{
	int err = -1;
	GElf_Ehdr ehdr;
	GElf_Shdr shdr;
	Elf_Data *data;
	Elf_Scn *sec;
	const char *ptr, *end;

	if (size < BUILD_ID_SIZE)
		goto out;

	if (elf_kind(elf) != ELF_K_ELF)
		goto out;

	if (gelf_getehdr(elf, &ehdr) == NULL) {
		pr_err("%s: cannot get elf header.\n", __func__);
		goto out;
	}

	sec = elf_section_by_name(elf, &ehdr, &shdr,
				  ".note.gnu.build-id", NULL);
	if (sec == NULL) {
		sec = elf_section_by_name(elf, &ehdr, &shdr,
					  ".notes", NULL);
		if (sec == NULL)
			goto out;
	}

	data = elf_getdata(sec, NULL);
	if (data == NULL || data->d_buf == NULL)
		goto out;

	ptr = data->d_buf;
	end = ptr + data->d_size;
	while ((size_t)(end - ptr) >= sizeof(GElf_Nhdr)) {
		const GElf_Nhdr *nhdr = (const GElf_Nhdr *)ptr;
		size_t namesz = NOTE_ALIGN(nhdr->n_namesz),
		       descsz = NOTE_ALIGN(nhdr->n_descsz);
		const char *name;

		ptr += sizeof(*nhdr);
		if (namesz > (size_t)(end - ptr))
			break;
		name = ptr;
		ptr += namesz;

		if (nhdr->n_type == NT_GNU_BUILD_ID &&
		    nhdr->n_namesz == sizeof("GNU") &&
		    memcmp(name, "GNU", sizeof("GNU")) == 0) {
			size_t avail = end - ptr;
			size_t sz = descsz < size ? descsz : size;

			/* Never copy more than the section really holds */
			if (sz > avail)
				sz = avail;
			memcpy(bf, ptr, sz);
			memset((char *)bf + sz, 0, size - sz);
			err = descsz;
			break;
		}

		if (descsz > (size_t)(end - ptr))
			break;
		ptr += descsz;
	}

out:
	return err;
}

/*
 * Open @filename as an ELF object and read its build-id into @bf, which
 * must be at least BUILD_ID_SIZE bytes (@size).
 *
 * Returns what elf_read_build_id() returns, or -1 when the buffer is too
 * small or the file cannot be opened or parsed.
 */
int filename__read_build_id(const char *filename, void *bf, size_t size)
{
	Elf *elf;
	int fd, ret;

	if (size < BUILD_ID_SIZE)
		return -1;

	fd = open(filename, O_RDONLY);
	if (fd < 0)
		return -1;

	elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
	if (elf != NULL) {
		ret = elf_read_build_id(elf, bf, size);
		elf_end(elf);
	} else {
		pr_debug2("%s: cannot read %s ELF file.\n", __func__, filename);
		ret = -1;
	}

	close(fd);
	return ret;
}

1497 1498 1499 1500 1501 1502 1503 1504 1505 1506 1507 1508 1509 1510
int sysfs__read_build_id(const char *filename, void *build_id, size_t size)
{
	int fd, err = -1;

	if (size < BUILD_ID_SIZE)
		goto out;

	fd = open(filename, O_RDONLY);
	if (fd < 0)
		goto out;

	while (1) {
		char bf[BUFSIZ];
		GElf_Nhdr nhdr;
1511
		size_t namesz, descsz;
1512 1513 1514 1515

		if (read(fd, &nhdr, sizeof(nhdr)) != sizeof(nhdr))
			break;

1516 1517
		namesz = NOTE_ALIGN(nhdr.n_namesz);
		descsz = NOTE_ALIGN(nhdr.n_descsz);
1518 1519
		if (nhdr.n_type == NT_GNU_BUILD_ID &&
		    nhdr.n_namesz == sizeof("GNU")) {
1520
			if (read(fd, bf, namesz) != (ssize_t)namesz)
1521 1522
				break;
			if (memcmp(bf, "GNU", sizeof("GNU")) == 0) {
1523 1524 1525
				size_t sz = min(descsz, size);
				if (read(fd, build_id, sz) == (ssize_t)sz) {
					memset(build_id + sz, 0, size - sz);
1526 1527 1528
					err = 0;
					break;
				}
1529
			} else if (read(fd, bf, descsz) != (ssize_t)descsz)
1530 1531 1532 1533 1534 1535 1536 1537 1538 1539 1540 1541
				break;
		} else {
			int n = namesz + descsz;
			if (read(fd, bf, n) != n)
				break;
		}
	}
	close(fd);
out:
	return err;
}

1542
char dso__symtab_origin(const struct dso *dso)
1543 1544
{
	static const char origin[] = {
1545 1546 1547 1548 1549 1550 1551 1552 1553 1554
		[SYMTAB__KALLSYMS]	      = 'k',
		[SYMTAB__JAVA_JIT]	      = 'j',
		[SYMTAB__BUILD_ID_CACHE]      = 'B',
		[SYMTAB__FEDORA_DEBUGINFO]    = 'f',
		[SYMTAB__UBUNTU_DEBUGINFO]    = 'u',
		[SYMTAB__BUILDID_DEBUGINFO]   = 'b',
		[SYMTAB__SYSTEM_PATH_DSO]     = 'd',
		[SYMTAB__SYSTEM_PATH_KMODULE] = 'K',
		[SYMTAB__GUEST_KALLSYMS]      =  'g',
		[SYMTAB__GUEST_KMODULE]	      =  'G',
1555 1556
	};

1557
	if (dso == NULL || dso->symtab_type == SYMTAB__NOT_FOUND)
1558
		return '!';
1559
	return origin[dso->symtab_type];
1560 1561
}

1562
/*
 * Load the symbols of @dso for the map type of @map.
 *
 * Kernel and guest kernel dsos are handed to their dedicated loaders.
 * A dso named "/tmp/perf-*" is loaded through dso__load_perf_map(), but
 * only when the file is owned by root or by the current effective user.
 * Everything else is searched in a list of candidate images (build-id
 * cache, distro debuginfo locations, the dso itself, ...), first
 * requiring a full symtab and then, failing that, accepting .dynsym too.
 *
 * Returns the number of symbols loaded (PLT symbols included), 0 when
 * nothing was found for a " (deleted)" dso, or a negative value on error.
 *
 * The candidate path buffer is allocated only once it is needed, so the
 * early returns of the perf map branch no longer leak it.
 */
int dso__load(struct dso *dso, struct map *map, symbol_filter_t filter)
{
	int size = PATH_MAX;
	char *name;
	int ret = -1;
	int fd;
	struct machine *machine;
	const char *root_dir;
	int want_symtab;

	dso__set_loaded(dso, map->type);

	if (dso->kernel == DSO_TYPE_KERNEL)
		return dso__load_kernel_sym(dso, map, filter);
	else if (dso->kernel == DSO_TYPE_GUEST_KERNEL)
		return dso__load_guest_kernel_sym(dso, map, filter);

	if (map->groups && map->groups->machine)
		machine = map->groups->machine;
	else
		machine = NULL;

	dso->adjust_symbols = 0;

	if (strncmp(dso->name, "/tmp/perf-", 10) == 0) {
		struct stat st;

		if (lstat(dso->name, &st) < 0)
			return -1;

		if (st.st_uid && (st.st_uid != geteuid())) {
			pr_warning("File %s not owned by current user or root, "
				"ignoring it.\n", dso->name);
			return -1;
		}

		ret = dso__load_perf_map(dso, map, filter);
		dso->symtab_type = ret > 0 ? SYMTAB__JAVA_JIT :
					      SYMTAB__NOT_FOUND;
		return ret;
	}

	name = malloc(size);
	if (!name)
		return -1;

	/* Iterate over candidate debug images.
	 * On the first pass, only load images if they have a full symtab.
	 * Failing that, do a second pass where we accept .dynsym also
	 */
	want_symtab = 1;
restart:
	for (dso->symtab_type = SYMTAB__BUILD_ID_CACHE;
	     dso->symtab_type != SYMTAB__NOT_FOUND;
	     dso->symtab_type++) {
		switch (dso->symtab_type) {
		case SYMTAB__BUILD_ID_CACHE:
			/* skip the locally configured cache if a symfs is given */
			if (symbol_conf.symfs[0] ||
			    (dso__build_id_filename(dso, name, size) == NULL)) {
				continue;
			}
			break;
		case SYMTAB__FEDORA_DEBUGINFO:
			snprintf(name, size, "%s/usr/lib/debug%s.debug",
				 symbol_conf.symfs, dso->long_name);
			break;
		case SYMTAB__UBUNTU_DEBUGINFO:
			snprintf(name, size, "%s/usr/lib/debug%s",
				 symbol_conf.symfs, dso->long_name);
			break;
		case SYMTAB__BUILDID_DEBUGINFO: {
			char build_id_hex[BUILD_ID_SIZE * 2 + 1];

			if (!dso->has_build_id)
				continue;

			build_id__sprintf(dso->build_id,
					  sizeof(dso->build_id),
					  build_id_hex);
			snprintf(name, size,
				 "%s/usr/lib/debug/.build-id/%.2s/%s.debug",
				 symbol_conf.symfs, build_id_hex, build_id_hex + 2);
			}
			break;
		case SYMTAB__SYSTEM_PATH_DSO:
			snprintf(name, size, "%s%s",
			     symbol_conf.symfs, dso->long_name);
			break;
		case SYMTAB__GUEST_KMODULE:
			if (map->groups && machine)
				root_dir = machine->root_dir;
			else
				root_dir = "";
			snprintf(name, size, "%s%s%s", symbol_conf.symfs,
				 root_dir, dso->long_name);
			break;

		case SYMTAB__SYSTEM_PATH_KMODULE:
			snprintf(name, size, "%s%s", symbol_conf.symfs,
				 dso->long_name);
			break;
		default:;
		}

		/* Name is now the name of the next image to try */
		fd = open(name, O_RDONLY);
		if (fd < 0)
			continue;

		ret = dso__load_sym(dso, map, name, fd, filter, 0,
				    want_symtab);
		close(fd);

		/*
		 * Some people seem to have debuginfo files _WITHOUT_ debug
		 * info!?!?
		 */
		if (!ret)
			continue;

		if (ret > 0) {
			int nr_plt = dso__synthesize_plt_symbols(dso, map,
								 filter);
			if (nr_plt > 0)
				ret += nr_plt;
			break;
		}
	}

	/*
	 * If we wanted a full symtab but no image had one,
	 * relax our requirements and repeat the search.
	 */
	if (ret <= 0 && want_symtab) {
		want_symtab = 0;
		goto restart;
	}

	free(name);
	if (ret < 0 && strstr(dso->name, " (deleted)") != NULL)
		return 0;
	return ret;
}

1707
struct map *map_groups__find_by_name(struct map_groups *mg,
1708
				     enum map_type type, const char *name)
1709 1710 1711
{
	struct rb_node *nd;

1712
	for (nd = rb_first(&mg->maps[type]); nd; nd = rb_next(nd)) {
1713 1714
		struct map *map = rb_entry(nd, struct map, rb_node);

1715
		if (map->dso && strcmp(map->dso->short_name, name) == 0)
1716 1717 1718 1719 1720 1721
			return map;
	}

	return NULL;
}

1722 1723
static int dso__kernel_module_get_build_id(struct dso *dso,
					   const char *root_dir)
1724 1725 1726 1727 1728 1729
{
	char filename[PATH_MAX];
	/*
	 * kernel module short names are of the form "[module]" and
	 * we need just "module" here.
	 */
1730
	const char *name = dso->short_name + 1;
1731 1732

	snprintf(filename, sizeof(filename),
1733 1734
		 "%s/sys/module/%.*s/notes/.note.gnu.build-id",
		 root_dir, (int)strlen(name) - 1, name);
1735

1736 1737 1738
	if (sysfs__read_build_id(filename, dso->build_id,
				 sizeof(dso->build_id)) == 0)
		dso->has_build_id = true;
1739 1740 1741 1742

	return 0;
}

1743
static int map_groups__set_modules_path_dir(struct map_groups *mg,
1744
				const char *dir_name)
1745
{
1746
	struct dirent *dent;
1747
	DIR *dir = opendir(dir_name);
1748
	int ret = 0;
1749

1750
	if (!dir) {
1751
		pr_debug("%s: cannot open %s dir\n", __func__, dir_name);
1752 1753
		return -1;
	}
1754

1755 1756
	while ((dent = readdir(dir)) != NULL) {
		char path[PATH_MAX];
1757 1758 1759 1760 1761 1762
		struct stat st;

		/*sshfs might return bad dent->d_type, so we have to stat*/
		sprintf(path, "%s/%s", dir_name, dent->d_name);
		if (stat(path, &st))
			continue;
1763

1764
		if (S_ISDIR(st.st_mode)) {
1765 1766 1767 1768 1769
			if (!strcmp(dent->d_name, ".") ||
			    !strcmp(dent->d_name, ".."))
				continue;

			snprintf(path, sizeof(path), "%s/%s",
1770
				 dir_name, dent->d_name);
1771
			ret = map_groups__set_modules_path_dir(mg, path);
1772 1773
			if (ret < 0)
				goto out;
1774 1775 1776 1777
		} else {
			char *dot = strrchr(dent->d_name, '.'),
			     dso_name[PATH_MAX];
			struct map *map;
1778
			char *long_name;
1779 1780 1781 1782 1783 1784

			if (dot == NULL || strcmp(dot, ".ko"))
				continue;
			snprintf(dso_name, sizeof(dso_name), "[%.*s]",
				 (int)(dot - dent->d_name), dent->d_name);

1785
			strxfrchar(dso_name, '-', '_');
1786 1787
			map = map_groups__find_by_name(mg, MAP__FUNCTION,
						       dso_name);
1788 1789 1790 1791
			if (map == NULL)
				continue;

			snprintf(path, sizeof(path), "%s/%s",
1792
				 dir_name, dent->d_name);
1793

1794
			long_name = strdup(path);
1795 1796 1797 1798
			if (long_name == NULL) {
				ret = -1;
				goto out;
			}
1799
			dso__set_long_name(map->dso, long_name);
1800
			map->dso->lname_alloc = 1;
1801
			dso__kernel_module_get_build_id(map->dso, "");
1802 1803
		}
	}
1804

1805
out:
1806
	closedir(dir);
1807
	return ret;
1808
}
1809

1810
/*
 * Read the kernel release from <root_dir>/proc/version: the word that
 * follows "Linux version " on its first line.
 *
 * Returns a malloc()ed string the caller must free(), or NULL when the
 * file cannot be opened or read, the prefix is missing, or memory runs
 * out.
 */
static char *get_kernel_version(const char *root_dir)
{
	char version[PATH_MAX];
	FILE *file;
	char *name, *tmp;
	const char *prefix = "Linux version ";

	/* Bounded: root_dir is caller supplied and may be long */
	snprintf(version, sizeof(version), "%s/proc/version", root_dir);
	file = fopen(version, "r");
	if (!file)
		return NULL;

	tmp = fgets(version, sizeof(version), file);
	fclose(file);
	/* On failure the buffer content must not be parsed */
	if (!tmp)
		return NULL;

	name = strstr(version, prefix);
	if (!name)
		return NULL;
	name += strlen(prefix);
	tmp = strchr(name, ' ');
	if (tmp)
		*tmp = '\0';

	return strdup(name);
}

1837
static int machine__set_modules_path(struct machine *machine)
1838 1839
{
	char *version;
1840
	char modules_path[PATH_MAX];
1841

1842
	version = get_kernel_version(machine->root_dir);
1843
	if (!version)
1844
		return -1;
1845

1846
	snprintf(modules_path, sizeof(modules_path), "%s/lib/modules/%s/kernel",
1847
		 machine->root_dir, version);
1848
	free(version);
1849

1850
	return map_groups__set_modules_path_dir(&machine->kmaps, modules_path);
1851 1852
}

1853 1854 1855 1856 1857
/*
 * Constructor variant for modules (where we know from /proc/modules where
 * they are loaded) and for vmlinux, where only after we load all the
 * symbols we'll know where it starts and ends.
 */
1858
static struct map *map__new2(u64 start, struct dso *dso, enum map_type type)
1859
{
1860 1861 1862
	struct map *map = calloc(1, (sizeof(*map) +
				     (dso->kernel ? sizeof(struct kmap) : 0)));
	if (map != NULL) {
1863
		/*
1864
		 * ->end will be filled after we load all the symbols
1865
		 */
1866
		map__init(map, type, start, 0, 0, dso);
1867
	}
1868

1869
	return map;
1870 1871
}

1872
/*
 * Find or create the kernel dso named @filename in @machine, create a
 * function map for it starting at @start and insert that map in the
 * kernel maps of the machine.
 *
 * Returns the new map, or NULL when the dso or the map cannot be
 * allocated.
 */
struct map *machine__new_module(struct machine *machine, u64 start,
				const char *filename)
{
	struct dso *dso = __dsos__findnew(&machine->kernel_dsos, filename);
	struct map *map;

	if (dso == NULL)
		return NULL;

	map = map__new2(start, dso, MAP__FUNCTION);
	if (map == NULL)
		return NULL;

	dso->symtab_type = machine__is_host(machine) ?
				SYMTAB__SYSTEM_PATH_KMODULE :
				SYMTAB__GUEST_KMODULE;

	map_groups__insert(&machine->kmaps, map);
	return map;
}

1893
static int machine__create_modules(struct machine *machine)
1894 1895 1896
{
	char *line = NULL;
	size_t n;
1897
	FILE *file;
1898
	struct map *map;
1899 1900 1901
	const char *modules;
	char path[PATH_MAX];

1902
	if (machine__is_default_guest(machine))
1903 1904
		modules = symbol_conf.default_guest_modules;
	else {
1905
		sprintf(path, "%s/proc/modules", machine->root_dir);
1906 1907
		modules = path;
	}
1908

1909 1910 1911
	if (symbol__restricted_filename(path, "/proc/modules"))
		return -1;

1912
	file = fopen(modules, "r");
1913 1914
	if (file == NULL)
		return -1;
1915

1916 1917 1918 1919 1920
	while (!feof(file)) {
		char name[PATH_MAX];
		u64 start;
		char *sep;
		int line_len;
1921

1922 1923 1924 1925 1926 1927 1928 1929 1930 1931 1932 1933 1934 1935 1936 1937 1938 1939 1940 1941 1942 1943
		line_len = getline(&line, &n, file);
		if (line_len < 0)
			break;

		if (!line)
			goto out_failure;

		line[--line_len] = '\0'; /* \n */

		sep = strrchr(line, 'x');
		if (sep == NULL)
			continue;

		hex2u64(sep + 1, &start);

		sep = strchr(line, ' ');
		if (sep == NULL)
			continue;

		*sep = '\0';

		snprintf(name, sizeof(name), "[%s]", line);
1944
		map = machine__new_module(machine, start, name);
1945
		if (map == NULL)
1946
			goto out_delete_line;
1947
		dso__kernel_module_get_build_id(map->dso, machine->root_dir);
1948
	}
1949 1950 1951 1952

	free(line);
	fclose(file);

1953
	return machine__set_modules_path(machine);
1954 1955 1956 1957 1958

out_delete_line:
	free(line);
out_failure:
	return -1;
1959 1960
}

1961
/*
 * Load the symbols of @dso from the vmlinux image @vmlinux, looked up
 * below symbol_conf.symfs.
 *
 * Once the file could be opened, the long name of @dso is set to @vmlinux
 * (the string is not copied here) and the dso is marked as loaded, even
 * if reading the symbols fails afterwards.
 *
 * Returns what dso__load_sym() returns, or -1 when the file cannot be
 * opened.
 */
int dso__load_vmlinux(struct dso *dso, struct map *map,
		      const char *vmlinux, symbol_filter_t filter)
{
	char symfs_vmlinux[PATH_MAX];
	int nr_syms, fd;

	snprintf(symfs_vmlinux, sizeof(symfs_vmlinux), "%s%s",
		 symbol_conf.symfs, vmlinux);

	fd = open(symfs_vmlinux, O_RDONLY);
	if (fd < 0)
		return -1;

	dso__set_long_name(dso, (char *)vmlinux);
	dso__set_loaded(dso, map->type);

	nr_syms = dso__load_sym(dso, map, symfs_vmlinux, fd, filter, 0, 0);
	close(fd);

	if (nr_syms > 0)
		pr_debug("Using %s for symbols\n", symfs_vmlinux);

	return nr_syms;
}

1984
int dso__load_vmlinux_path(struct dso *dso, struct map *map,
1985
			   symbol_filter_t filter)
1986 1987
{
	int i, err = 0;
1988
	char *filename;
1989 1990

	pr_debug("Looking at the vmlinux_path (%d entries long)\n",
1991 1992
		 vmlinux_path__nr_entries + 1);

1993
	filename = dso__build_id_filename(dso, NULL, 0);
1994
	if (filename != NULL) {
1995
		err = dso__load_vmlinux(dso, map, filename, filter);
1996
		if (err > 0) {
1997
			dso__set_long_name(dso, filename);
1998 1999 2000 2001
			goto out;
		}
		free(filename);
	}
2002 2003

	for (i = 0; i < vmlinux_path__nr_entries; ++i) {
2004
		err = dso__load_vmlinux(dso, map, vmlinux_path[i], filter);
2005
		if (err > 0) {
2006
			dso__set_long_name(dso, strdup(vmlinux_path[i]));
2007 2008 2009
			break;
		}
	}
2010
out:
2011 2012 2013
	return err;
}

2014
static int dso__load_kernel_sym(struct dso *dso, struct map *map,
2015
				symbol_filter_t filter)
2016
{
2017
	int err;
2018 2019
	const char *kallsyms_filename = NULL;
	char *kallsyms_allocated_filename = NULL;
2020
	/*
2021 2022
	 * Step 1: if the user specified a kallsyms or vmlinux filename, use
	 * it and only it, reporting errors to the user if it cannot be used.
2023 2024 2025 2026 2027 2028 2029 2030 2031 2032 2033 2034
	 *
	 * For instance, try to analyse an ARM perf.data file _without_ a
	 * build-id, or if the user specifies the wrong path to the right
	 * vmlinux file, obviously we can't fallback to another vmlinux (a
	 * x86_86 one, on the machine where analysis is being performed, say),
	 * or worse, /proc/kallsyms.
	 *
	 * If the specified file _has_ a build-id and there is a build-id
	 * section in the perf.data file, we will still do the expected
	 * validation in dso__load_vmlinux and will bail out if they don't
	 * match.
	 */
2035 2036 2037 2038 2039
	if (symbol_conf.kallsyms_name != NULL) {
		kallsyms_filename = symbol_conf.kallsyms_name;
		goto do_kallsyms;
	}

2040
	if (symbol_conf.vmlinux_name != NULL) {
2041
		err = dso__load_vmlinux(dso, map,
2042
					symbol_conf.vmlinux_name, filter);
2043
		if (err > 0) {
2044
			dso__set_long_name(dso,
2045 2046 2047 2048
					   strdup(symbol_conf.vmlinux_name));
			goto out_fixup;
		}
		return err;
2049
	}
2050 2051

	if (vmlinux_path != NULL) {
2052
		err = dso__load_vmlinux_path(dso, map, filter);
2053 2054
		if (err > 0)
			goto out_fixup;
2055 2056
	}

2057 2058 2059 2060
	/* do not try local files if a symfs was given */
	if (symbol_conf.symfs[0] != 0)
		return -1;

2061 2062 2063 2064 2065
	/*
	 * Say the kernel DSO was created when processing the build-id header table,
	 * we have a build-id, so check if it is the same as the running kernel,
	 * using it if it is.
	 */
2066
	if (dso->has_build_id) {
2067
		u8 kallsyms_build_id[BUILD_ID_SIZE];
2068
		char sbuild_id[BUILD_ID_SIZE * 2 + 1];
2069 2070

		if (sysfs__read_build_id("/sys/kernel/notes", kallsyms_build_id,
2071
					 sizeof(kallsyms_build_id)) == 0) {
2072
			if (dso__build_id_equal(dso, kallsyms_build_id)) {
2073
				kallsyms_filename = "/proc/kallsyms";
2074
				goto do_kallsyms;
2075
			}
2076
		}
2077 2078 2079 2080
		/*
		 * Now look if we have it on the build-id cache in
		 * $HOME/.debug/[kernel.kallsyms].
		 */
2081
		build_id__sprintf(dso->build_id, sizeof(dso->build_id),
2082 2083 2084 2085
				  sbuild_id);

		if (asprintf(&kallsyms_allocated_filename,
			     "%s/.debug/[kernel.kallsyms]/%s",
2086 2087
			     getenv("HOME"), sbuild_id) == -1) {
			pr_err("Not enough memory for kallsyms file lookup\n");
2088
			return -1;
2089
		}
2090

2091 2092
		kallsyms_filename = kallsyms_allocated_filename;

2093
		if (access(kallsyms_filename, F_OK)) {
2094 2095
			pr_err("No kallsyms or vmlinux with build-id %s "
			       "was found\n", sbuild_id);
2096
			free(kallsyms_allocated_filename);
2097
			return -1;
2098
		}
2099 2100 2101 2102 2103
	} else {
		/*
		 * Last resort, if we don't have a build-id and couldn't find
		 * any vmlinux file, try the running kernel kallsyms table.
		 */
2104 2105
		kallsyms_filename = "/proc/kallsyms";
	}
2106

2107
do_kallsyms:
2108
	err = dso__load_kallsyms(dso, kallsyms_filename, map, filter);
2109 2110
	if (err > 0)
		pr_debug("Using %s for symbols\n", kallsyms_filename);
2111
	free(kallsyms_allocated_filename);
2112 2113

	if (err > 0) {
2114
out_fixup:
2115
		if (kallsyms_filename != NULL)
2116
			dso__set_long_name(dso, strdup("[kernel.kallsyms]"));
2117 2118
		map__fixup_start(map);
		map__fixup_end(map);
2119
	}
2120

2121 2122 2123
	return err;
}

2124 2125
/*
 * Load the symbols of a guest kernel @dso.
 *
 * For the default guest the vmlinux given by the user is used, and only
 * it, else the guest kallsyms file given by the user.  For any other
 * guest <root_dir>/proc/kallsyms of its machine is used.
 *
 * Returns the number of symbols loaded, or a value <= 0 on failure; -1
 * when @map has no groups or no symbol source was configured for the
 * default guest.
 *
 * The kallsyms path is built with a bounded snprintf(), since root_dir
 * may be long.
 */
static int dso__load_guest_kernel_sym(struct dso *dso, struct map *map,
				      symbol_filter_t filter)
{
	int err;
	const char *kallsyms_filename = NULL;
	struct machine *machine;
	char path[PATH_MAX];

	if (!map->groups) {
		pr_debug("Guest kernel map hasn't the point to groups\n");
		return -1;
	}
	machine = map->groups->machine;

	if (machine__is_default_guest(machine)) {
		/*
		 * if the user specified a vmlinux filename, use it and only
		 * it, reporting errors to the user if it cannot be used.
		 * Or use file guest_kallsyms inputted by user on commandline
		 */
		if (symbol_conf.default_guest_vmlinux_name != NULL) {
			err = dso__load_vmlinux(dso, map,
				symbol_conf.default_guest_vmlinux_name, filter);
			goto out_try_fixup;
		}

		kallsyms_filename = symbol_conf.default_guest_kallsyms;
		if (!kallsyms_filename)
			return -1;
	} else {
		snprintf(path, sizeof(path), "%s/proc/kallsyms",
			 machine->root_dir);
		kallsyms_filename = path;
	}

	err = dso__load_kallsyms(dso, kallsyms_filename, map, filter);
	if (err > 0)
		pr_debug("Using %s for symbols\n", kallsyms_filename);

out_try_fixup:
	if (err > 0) {
		/* Only rename the dso when kallsyms was the source */
		if (kallsyms_filename != NULL) {
			machine__mmap_name(machine, path, sizeof(path));
			dso__set_long_name(dso, strdup(path));
		}
		map__fixup_start(map);
		map__fixup_end(map);
	}

	return err;
}
2174

2175
static void dsos__add(struct list_head *head, struct dso *dso)
2176
{
2177
	list_add_tail(&dso->node, head);
2178 2179
}

2180
static struct dso *dsos__find(struct list_head *head, const char *name)
2181 2182 2183
{
	struct dso *pos;

2184
	list_for_each_entry(pos, head, node)
2185
		if (strcmp(pos->long_name, name) == 0)
2186 2187 2188 2189
			return pos;
	return NULL;
}

2190
/*
 * Look @name up on the dso list @head; when it is not there yet, create
 * the dso, add it to the list and set its base name.
 *
 * Returns the dso, or NULL when a new one cannot be allocated.
 */
struct dso *__dsos__findnew(struct list_head *head, const char *name)
{
	struct dso *dso = dsos__find(head, name);

	if (dso != NULL)
		return dso;

	dso = dso__new(name);
	if (dso == NULL)
		return NULL;

	dsos__add(head, dso);
	dso__set_basename(dso);

	return dso;
}

2205
size_t __dsos__fprintf(struct list_head *head, FILE *fp)
2206 2207
{
	struct dso *pos;
2208
	size_t ret = 0;
2209

2210 2211 2212
	list_for_each_entry(pos, head, node) {
		int i;
		for (i = 0; i < MAP__NR_TYPES; ++i)
2213
			ret += dso__fprintf(pos, i, fp);
2214
	}
2215 2216

	return ret;
2217 2218
}

2219
size_t machines__fprintf_dsos(struct rb_root *machines, FILE *fp)
2220
{
2221
	struct rb_node *nd;
2222
	size_t ret = 0;
2223

2224
	for (nd = rb_first(machines); nd; nd = rb_next(nd)) {
2225
		struct machine *pos = rb_entry(nd, struct machine, rb_node);
2226 2227
		ret += __dsos__fprintf(&pos->kernel_dsos, fp);
		ret += __dsos__fprintf(&pos->user_dsos, fp);
2228
	}
2229 2230

	return ret;
2231 2232
}

2233 2234
static size_t __dsos__fprintf_buildid(struct list_head *head, FILE *fp,
				      bool with_hits)
2235 2236 2237 2238
{
	struct dso *pos;
	size_t ret = 0;

2239
	list_for_each_entry(pos, head, node) {
2240 2241
		if (with_hits && !pos->hit)
			continue;
2242
		ret += dso__fprintf_buildid(pos, fp);
2243
		ret += fprintf(fp, " %s\n", pos->long_name);
2244 2245 2246 2247
	}
	return ret;
}

2248 2249
size_t machine__fprintf_dsos_buildid(struct machine *machine, FILE *fp,
				     bool with_hits)
2250
{
2251 2252
	return __dsos__fprintf_buildid(&machine->kernel_dsos, fp, with_hits) +
	       __dsos__fprintf_buildid(&machine->user_dsos, fp, with_hits);
2253 2254
}

2255 2256
size_t machines__fprintf_dsos_buildid(struct rb_root *machines,
				      FILE *fp, bool with_hits)
2257
{
2258 2259 2260
	struct rb_node *nd;
	size_t ret = 0;

2261
	for (nd = rb_first(machines); nd; nd = rb_next(nd)) {
2262
		struct machine *pos = rb_entry(nd, struct machine, rb_node);
2263
		ret += machine__fprintf_dsos_buildid(pos, fp, with_hits);
2264 2265
	}
	return ret;
2266 2267
}

2268 2269 2270
static struct dso*
dso__kernel_findnew(struct machine *machine, const char *name,
		    const char *short_name, int dso_type)
2271
{
2272 2273 2274 2275
	/*
	 * The kernel dso could be created by build_id processing.
	 */
	struct dso *dso = __dsos__findnew(&machine->kernel_dsos, name);
2276

2277 2278 2279 2280
	/*
	 * We need to run this in all cases, since during the build_id
	 * processing we had no idea this was the kernel dso.
	 */
2281
	if (dso != NULL) {
2282 2283
		dso__set_short_name(dso, short_name);
		dso->kernel = dso_type;
2284 2285
	}

2286
	return dso;
2287 2288
}

2289
void dso__read_running_kernel_build_id(struct dso *dso, struct machine *machine)
2290
{
2291 2292
	char path[PATH_MAX];

2293
	if (machine__is_default_guest(machine))
2294
		return;
2295
	sprintf(path, "%s/sys/kernel/notes", machine->root_dir);
2296 2297 2298
	if (sysfs__read_build_id(path, dso->build_id,
				 sizeof(dso->build_id)) == 0)
		dso->has_build_id = true;
2299 2300
}

2301
static struct dso *machine__get_kernel(struct machine *machine)
2302
{
2303 2304
	const char *vmlinux_name = NULL;
	struct dso *kernel;
2305

2306
	if (machine__is_host(machine)) {
2307
		vmlinux_name = symbol_conf.vmlinux_name;
2308 2309 2310 2311 2312 2313
		if (!vmlinux_name)
			vmlinux_name = "[kernel.kallsyms]";

		kernel = dso__kernel_findnew(machine, vmlinux_name,
					     "[kernel]",
					     DSO_TYPE_KERNEL);
2314
	} else {
2315 2316
		char bf[PATH_MAX];

2317
		if (machine__is_default_guest(machine))
2318
			vmlinux_name = symbol_conf.default_guest_vmlinux_name;
2319 2320 2321 2322 2323 2324 2325
		if (!vmlinux_name)
			vmlinux_name = machine__mmap_name(machine, bf,
							  sizeof(bf));

		kernel = dso__kernel_findnew(machine, vmlinux_name,
					     "[guest.kernel]",
					     DSO_TYPE_GUEST_KERNEL);
2326
	}
2327

2328
	if (kernel != NULL && (!kernel->has_build_id))
2329
		dso__read_running_kernel_build_id(kernel, machine);
2330

2331 2332 2333
	return kernel;
}

2334 2335 2336 2337 2338
/*
 * State handed to the symbol__in_kernel() callback through its void *arg:
 * ->start receives the start address of the symbol the callback accepts.
 */
struct process_args {
	u64 start;
};

static int symbol__in_kernel(void *arg, const char *name,
2339
			     char type __used, u64 start, u64 end __used)
2340 2341 2342 2343 2344 2345 2346 2347 2348 2349 2350 2351 2352 2353 2354 2355 2356 2357 2358 2359 2360 2361 2362 2363 2364 2365 2366 2367
{
	struct process_args *args = arg;

	if (strchr(name, '['))
		return 0;

	args->start = start;
	return 1;
}

/* Figure out the start address of kernel map from /proc/kallsyms */
static u64 machine__get_kernel_start_addr(struct machine *machine)
{
	const char *filename;
	char path[PATH_MAX];
	struct process_args args;

	if (machine__is_host(machine)) {
		filename = "/proc/kallsyms";
	} else {
		if (machine__is_default_guest(machine))
			filename = (char *)symbol_conf.default_guest_kallsyms;
		else {
			sprintf(path, "%s/proc/kallsyms", machine->root_dir);
			filename = path;
		}
	}

2368 2369 2370
	if (symbol__restricted_filename(filename, "/proc/kallsyms"))
		return 0;

2371 2372 2373 2374 2375 2376
	if (kallsyms__parse(filename, &args, symbol__in_kernel) <= 0)
		return 0;

	return args.start;
}

2377
int __machine__create_kernel_maps(struct machine *machine, struct dso *kernel)
2378
{
2379
	enum map_type type;
2380
	u64 start = machine__get_kernel_start_addr(machine);
2381

2382
	for (type = 0; type < MAP__NR_TYPES; ++type) {
2383 2384
		struct kmap *kmap;

2385 2386
		machine->vmlinux_maps[type] = map__new2(start, kernel, type);
		if (machine->vmlinux_maps[type] == NULL)
2387
			return -1;
2388

2389 2390 2391 2392 2393 2394 2395
		machine->vmlinux_maps[type]->map_ip =
			machine->vmlinux_maps[type]->unmap_ip =
				identity__map_ip;
		kmap = map__kmap(machine->vmlinux_maps[type]);
		kmap->kmaps = &machine->kmaps;
		map_groups__insert(&machine->kmaps,
				   machine->vmlinux_maps[type]);
2396 2397 2398
	}

	return 0;
2399 2400
}

2401
void machine__destroy_kernel_maps(struct machine *machine)
2402 2403 2404 2405 2406 2407
{
	enum map_type type;

	for (type = 0; type < MAP__NR_TYPES; ++type) {
		struct kmap *kmap;

2408
		if (machine->vmlinux_maps[type] == NULL)
2409 2410
			continue;

2411 2412 2413
		kmap = map__kmap(machine->vmlinux_maps[type]);
		map_groups__remove(&machine->kmaps,
				   machine->vmlinux_maps[type]);
2414 2415 2416 2417 2418 2419 2420 2421 2422 2423 2424 2425 2426
		if (kmap->ref_reloc_sym) {
			/*
			 * ref_reloc_sym is shared among all maps, so free just
			 * on one of them.
			 */
			if (type == MAP__FUNCTION) {
				free((char *)kmap->ref_reloc_sym->name);
				kmap->ref_reloc_sym->name = NULL;
				free(kmap->ref_reloc_sym);
			}
			kmap->ref_reloc_sym = NULL;
		}

2427 2428
		map__delete(machine->vmlinux_maps[type]);
		machine->vmlinux_maps[type] = NULL;
2429 2430 2431
	}
}

2432
int machine__create_kernel_maps(struct machine *machine)
2433
{
2434
	struct dso *kernel = machine__get_kernel(machine);
2435 2436

	if (kernel == NULL ||
2437
	    __machine__create_kernel_maps(machine, kernel) < 0)
2438 2439
		return -1;

2440
	if (symbol_conf.use_modules && machine__create_modules(machine) < 0)
2441 2442 2443 2444
		pr_debug("Problems creating module maps, continuing anyway...\n");
	/*
	 * Now that we have all the maps created, just set the ->end of them:
	 */
2445
	map_groups__fixup_end(&machine->kmaps);
2446 2447 2448
	return 0;
}

2449 2450 2451 2452 2453 2454 2455 2456 2457 2458 2459 2460 2461 2462 2463 2464 2465 2466 2467 2468 2469 2470 2471 2472 2473 2474 2475 2476
/*
 * Free every entry of the vmlinux_path table and the table itself, leaving
 * it empty: vmlinux_path is NULL and vmlinux_path__nr_entries is 0.
 */
static void vmlinux_path__exit(void)
{
	while (--vmlinux_path__nr_entries >= 0) {
		free(vmlinux_path[vmlinux_path__nr_entries]);
		vmlinux_path[vmlinux_path__nr_entries] = NULL;
	}
	/*
	 * The loop above stops with the counter at -1; put it back to 0 so a
	 * later vmlinux_path__init() does not start filling slot -1.
	 */
	vmlinux_path__nr_entries = 0;

	free(vmlinux_path);
	vmlinux_path = NULL;
}

static int vmlinux_path__init(void)
{
	struct utsname uts;
	char bf[PATH_MAX];

	vmlinux_path = malloc(sizeof(char *) * 5);
	if (vmlinux_path == NULL)
		return -1;

	vmlinux_path[vmlinux_path__nr_entries] = strdup("vmlinux");
	if (vmlinux_path[vmlinux_path__nr_entries] == NULL)
		goto out_fail;
	++vmlinux_path__nr_entries;
	vmlinux_path[vmlinux_path__nr_entries] = strdup("/boot/vmlinux");
	if (vmlinux_path[vmlinux_path__nr_entries] == NULL)
		goto out_fail;
	++vmlinux_path__nr_entries;
2477 2478 2479 2480 2481 2482 2483 2484

	/* only try running kernel version if no symfs was given */
	if (symbol_conf.symfs[0] != 0)
		return 0;

	if (uname(&uts) < 0)
		return -1;

2485 2486 2487 2488 2489 2490 2491 2492 2493 2494 2495 2496 2497 2498 2499 2500 2501 2502 2503 2504 2505 2506 2507 2508
	snprintf(bf, sizeof(bf), "/boot/vmlinux-%s", uts.release);
	vmlinux_path[vmlinux_path__nr_entries] = strdup(bf);
	if (vmlinux_path[vmlinux_path__nr_entries] == NULL)
		goto out_fail;
	++vmlinux_path__nr_entries;
	snprintf(bf, sizeof(bf), "/lib/modules/%s/build/vmlinux", uts.release);
	vmlinux_path[vmlinux_path__nr_entries] = strdup(bf);
	if (vmlinux_path[vmlinux_path__nr_entries] == NULL)
		goto out_fail;
	++vmlinux_path__nr_entries;
	snprintf(bf, sizeof(bf), "/usr/lib/debug/lib/modules/%s/vmlinux",
		 uts.release);
	vmlinux_path[vmlinux_path__nr_entries] = strdup(bf);
	if (vmlinux_path[vmlinux_path__nr_entries] == NULL)
		goto out_fail;
	++vmlinux_path__nr_entries;

	return 0;

out_fail:
	vmlinux_path__exit();
	return -1;
}

2509
size_t machine__fprintf_vmlinux_path(struct machine *machine, FILE *fp)
2510 2511 2512
{
	int i;
	size_t printed = 0;
2513
	struct dso *kdso = machine->vmlinux_maps[MAP__FUNCTION]->dso;
2514 2515 2516 2517 2518 2519

	if (kdso->has_build_id) {
		char filename[PATH_MAX];
		if (dso__build_id_filename(kdso, filename, sizeof(filename)))
			printed += fprintf(fp, "[0] %s\n", filename);
	}
2520 2521

	for (i = 0; i < vmlinux_path__nr_entries; ++i)
2522 2523
		printed += fprintf(fp, "[%d] %s\n",
				   i + kdso->has_build_id, vmlinux_path[i]);
2524 2525 2526 2527

	return printed;
}

2528 2529 2530 2531 2532 2533 2534 2535 2536 2537 2538 2539 2540 2541
/*
 * Create *@list from @list_str with strlist__new(). A NULL @list_str
 * leaves *@list untouched and counts as success.
 *
 * Returns 0 on success; on a strlist__new() failure an error naming
 * @list_name is printed and -1 is returned.
 */
static int setup_list(struct strlist **list, const char *list_str,
		      const char *list_name)
{
	if (list_str != NULL) {
		*list = strlist__new(true, list_str);
		if (*list == NULL) {
			pr_err("problems parsing %s list\n", list_name);
			return -1;
		}
	}

	return 0;
}

2542 2543 2544 2545 2546 2547 2548 2549 2550 2551 2552 2553 2554 2555 2556 2557 2558 2559 2560
/*
 * Report whether /proc/sys/kernel/kptr_restrict holds a non-zero value.
 *
 * The file is only consulted when the effective uid is not 0. Returns false
 * for euid 0, when the file cannot be opened, or when nothing can be read
 * from it.
 */
static bool symbol__read_kptr_restrict(void)
{
	bool restricted = false;
	char line[8];
	FILE *fp;

	if (geteuid() == 0)
		return false;

	fp = fopen("/proc/sys/kernel/kptr_restrict", "r");
	if (fp == NULL)
		return false;

	if (fgets(line, sizeof(line), fp) != NULL)
		restricted = atoi(line) != 0;

	fclose(fp);

	return restricted;
}

2561
int symbol__init(void)
2562
{
2563 2564
	const char *symfs;

2565 2566 2567
	if (symbol_conf.initialized)
		return 0;

2568 2569
	symbol_conf.priv_size = ALIGN(symbol_conf.priv_size, sizeof(u64));

2570
	elf_version(EV_CURRENT);
2571 2572 2573
	if (symbol_conf.sort_by_name)
		symbol_conf.priv_size += (sizeof(struct symbol_name_rb_node) -
					  sizeof(struct symbol));
2574

2575
	if (symbol_conf.try_vmlinux_path && vmlinux_path__init() < 0)
2576 2577
		return -1;

2578 2579 2580 2581 2582
	if (symbol_conf.field_sep && *symbol_conf.field_sep == '.') {
		pr_err("'.' is the only non valid --field-separator argument\n");
		return -1;
	}

2583 2584 2585 2586 2587 2588 2589 2590 2591 2592 2593 2594
	if (setup_list(&symbol_conf.dso_list,
		       symbol_conf.dso_list_str, "dso") < 0)
		return -1;

	if (setup_list(&symbol_conf.comm_list,
		       symbol_conf.comm_list_str, "comm") < 0)
		goto out_free_dso_list;

	if (setup_list(&symbol_conf.sym_list,
		       symbol_conf.sym_list_str, "symbol") < 0)
		goto out_free_comm_list;

2595 2596 2597 2598 2599 2600 2601 2602 2603 2604 2605 2606
	/*
	 * A path to symbols of "/" is identical to ""
	 * reset here for simplicity.
	 */
	symfs = realpath(symbol_conf.symfs, NULL);
	if (symfs == NULL)
		symfs = symbol_conf.symfs;
	if (strcmp(symfs, "/") == 0)
		symbol_conf.symfs = "";
	if (symfs != symbol_conf.symfs)
		free((void *)symfs);

2607 2608
	symbol_conf.kptr_restrict = symbol__read_kptr_restrict();

2609
	symbol_conf.initialized = true;
2610
	return 0;
2611 2612 2613 2614 2615 2616

out_free_dso_list:
	strlist__delete(symbol_conf.dso_list);
out_free_comm_list:
	strlist__delete(symbol_conf.comm_list);
	return -1;
2617 2618
}

2619 2620
/*
 * Undo symbol__init(): delete the symbol, dso and comm filter lists, free
 * the vmlinux search path and mark the subsystem as uninitialized. Does
 * nothing when symbol__init() has not completed.
 */
void symbol__exit(void)
{
	if (symbol_conf.initialized) {
		strlist__delete(symbol_conf.sym_list);
		strlist__delete(symbol_conf.dso_list);
		strlist__delete(symbol_conf.comm_list);
		vmlinux_path__exit();

		symbol_conf.comm_list = NULL;
		symbol_conf.dso_list = NULL;
		symbol_conf.sym_list = NULL;
		symbol_conf.initialized = false;
	}
}

2631
/*
 * Find or create the machine for @pid in @machines and create its kernel
 * maps.
 *
 * Returns -1 when machines__findnew() returns NULL, otherwise the result of
 * machine__create_kernel_maps().
 */
int machines__create_kernel_maps(struct rb_root *machines, pid_t pid)
{
	struct machine *machine = machines__findnew(machines, pid);

	return machine != NULL ? machine__create_kernel_maps(machine) : -1;
}
2640 2641 2642 2643 2644 2645 2646 2647 2648 2649 2650 2651 2652 2653 2654 2655 2656 2657 2658 2659 2660 2661 2662 2663 2664 2665 2666 2667 2668 2669 2670 2671 2672 2673 2674 2675 2676 2677 2678 2679 2680 2681 2682

/*
 * Convert one hexadecimal digit character (0-9, a-f, A-F) to its value.
 *
 * Returns 0..15, or -1 when @ch is not a hexadecimal digit.
 */
static int hex(char ch)
{
	int digit = -1;

	if (ch >= '0' && ch <= '9')
		digit = ch - '0';
	else if (ch >= 'a' && ch <= 'f')
		digit = 10 + (ch - 'a');
	else if (ch >= 'A' && ch <= 'F')
		digit = 10 + (ch - 'A');

	return digit;
}

/*
 * Parse the leading run of hexadecimal digits of @ptr into *@long_val,
 * most significant digit first. *@long_val is 0 when @ptr does not start
 * with a hex digit.
 *
 * Returns the number of characters consumed.
 */
int hex2u64(const char *ptr, u64 *long_val)
{
	const char *cur;

	*long_val = 0;

	for (cur = ptr; *cur != '\0'; cur++) {
		const int nibble = hex(*cur);

		if (nibble < 0)
			break;

		*long_val = (*long_val << 4) | nibble;
	}

	return cur - ptr;
}

/*
 * Replace, in place, every occurrence of @from in the string @s with @to.
 *
 * A @from of '\0' leaves the string untouched: strchr() would match the
 * terminating NUL, and overwriting it would unterminate the string and send
 * the scan past the end of the buffer.
 *
 * Returns @s.
 */
char *strxfrchar(char *s, char from, char to)
{
	char *p = s;

	if (from == '\0')
		return s;

	while ((p = strchr(p, from)) != NULL)
		*p++ = to;

	return s;
}
2683

2684
int machines__create_guest_kernel_maps(struct rb_root *machines)
2685 2686 2687 2688 2689 2690 2691 2692 2693 2694
{
	int ret = 0;
	struct dirent **namelist = NULL;
	int i, items = 0;
	char path[PATH_MAX];
	pid_t pid;

	if (symbol_conf.default_guest_vmlinux_name ||
	    symbol_conf.default_guest_modules ||
	    symbol_conf.default_guest_kallsyms) {
2695
		machines__create_kernel_maps(machines, DEFAULT_GUEST_KERNEL_ID);
2696 2697 2698 2699 2700 2701 2702 2703 2704 2705 2706 2707 2708 2709 2710 2711 2712 2713 2714 2715
	}

	if (symbol_conf.guestmount) {
		items = scandir(symbol_conf.guestmount, &namelist, NULL, NULL);
		if (items <= 0)
			return -ENOENT;
		for (i = 0; i < items; i++) {
			if (!isdigit(namelist[i]->d_name[0])) {
				/* Filter out . and .. */
				continue;
			}
			pid = atoi(namelist[i]->d_name);
			sprintf(path, "%s/%s/proc/kallsyms",
				symbol_conf.guestmount,
				namelist[i]->d_name);
			ret = access(path, R_OK);
			if (ret) {
				pr_debug("Can't access file %s\n", path);
				goto failure;
			}
2716
			machines__create_kernel_maps(machines, pid);
2717 2718 2719 2720 2721 2722 2723
		}
failure:
		free(namelist);
	}

	return ret;
}
2724

2725
void machines__destroy_guest_kernel_maps(struct rb_root *machines)
2726
{
2727
	struct rb_node *next = rb_first(machines);
2728 2729 2730 2731 2732

	while (next) {
		struct machine *pos = rb_entry(next, struct machine, rb_node);

		next = rb_next(&pos->rb_node);
2733
		rb_erase(&pos->rb_node, machines);
2734 2735 2736 2737
		machine__delete(pos);
	}
}

2738
/*
 * Load the symbols of @machine's vmlinux map of the given @type from the
 * kallsyms file @filename.
 *
 * When dso__load_kallsyms() returns a positive value the dso is marked as
 * loaded for @type and the map ends of that type are fixed up. Returns the
 * dso__load_kallsyms() result unchanged.
 */
int machine__load_kallsyms(struct machine *machine, const char *filename,
			   enum map_type type, symbol_filter_t filter)
{
	struct map *map = machine->vmlinux_maps[type];
	int ret = dso__load_kallsyms(map->dso, filename, map, filter);

	if (ret <= 0)
		return ret;

	dso__set_loaded(map->dso, type);

	/*
	 * /proc/kallsyms lists the kernel in several sections with modules
	 * in between, so the end of every section has to be fixed up.
	 */
	__map_groups__fixup_end(&machine->kmaps, type);

	return ret;
}

2757
int machine__load_vmlinux_path(struct machine *machine, enum map_type type,
2758 2759
			       symbol_filter_t filter)
{
2760
	struct map *map = machine->vmlinux_maps[type];
2761 2762 2763 2764 2765 2766 2767 2768 2769
	int ret = dso__load_vmlinux_path(map->dso, map, filter);

	if (ret > 0) {
		dso__set_loaded(map->dso, type);
		map__reloc_vmlinux(map);
	}

	return ret;
}