symbol.c 30.6 KB
Newer Older
1 2
#include "util.h"
#include "../perf.h"
3
#include "string.h"
4
#include "symbol.h"
5
#include "thread.h"
6

7 8
#include "debug.h"

9 10 11
#include <libelf.h>
#include <gelf.h>
#include <elf.h>
12
#include <limits.h>
13
#include <sys/utsname.h>
P
Peter Zijlstra 已提交
14

15 16 17 18 19 20 21
/*
 * Where the symbol table of a dso came from.
 *
 * dso__load() steps through the values from DSO__ORIG_FEDORA up to
 * DSO__ORIG_DSO by incrementing ->origin, so the relative order of those
 * enumerators is significant.  dso__symtab_origin() maps every value except
 * DSO__ORIG_NOT_FOUND to a one-letter tag.
 */
enum dso_origin {
	DSO__ORIG_KERNEL = 0,	/* 'k' */
	DSO__ORIG_JAVA_JIT,	/* 'j': /tmp/perf-* map file */
	DSO__ORIG_FEDORA,	/* 'f': /usr/lib/debug<path>.debug */
	DSO__ORIG_UBUNTU,	/* 'u': /usr/lib/debug<path> */
	DSO__ORIG_BUILDID,	/* 'b': /usr/lib/debug/.build-id/xx/yyyy.debug */
	DSO__ORIG_DSO,		/* 'd': the dso file itself */
	DSO__ORIG_KMODULE,	/* 'K' */
	DSO__ORIG_NOT_FOUND,	/* reported as '!' */
};

26 27
static void dsos__add(struct dso *dso);
static struct dso *dsos__find(const char *name);
28 29
static struct map *map__new2(u64 start, struct dso *dso);
static void kernel_maps__insert(struct map *map);
30 31
static int dso__load_kernel_sym(struct dso *self, struct map *map,
				symbol_filter_t filter);
32
unsigned int symbol__priv_size;
33

34 35
static struct rb_root kernel_maps;

36
static void dso__fixup_sym_end(struct dso *self)
37 38
{
	struct rb_node *nd, *prevnd = rb_first(&self->syms);
39
	struct symbol *curr, *prev;
40 41 42 43

	if (prevnd == NULL)
		return;

44 45
	curr = rb_entry(prevnd, struct symbol, rb_node);

46
	for (nd = rb_next(prevnd); nd; nd = rb_next(nd)) {
47 48
		prev = curr;
		curr = rb_entry(nd, struct symbol, rb_node);
49 50 51 52

		if (prev->end == prev->start)
			prev->end = curr->start - 1;
	}
53 54 55 56

	/* Last entry */
	if (curr->end == curr->start)
		curr->end = roundup(curr->start, 4096);
57 58
}

59
static void kernel_maps__fixup_end(void)
60 61 62 63 64 65 66 67 68 69 70 71 72
{
	struct map *prev, *curr;
	struct rb_node *nd, *prevnd = rb_first(&kernel_maps);

	if (prevnd == NULL)
		return;

	curr = rb_entry(prevnd, struct map, rb_node);

	for (nd = rb_next(prevnd); nd; nd = rb_next(nd)) {
		prev = curr;
		curr = rb_entry(nd, struct map, rb_node);
		prev->end = curr->start - 1;
73
	}
74 75
}

76
/*
 * Allocate a symbol named @name covering [@start, @start + @len - 1]; when
 * @len is 0 the end is set equal to @start.
 *
 * The allocation is laid out as: symbol__priv_size zeroed private bytes,
 * then struct symbol, then a copy of @name.  The returned pointer addresses
 * the struct symbol, so it must be released with symbol__delete(), not
 * free().  Returns NULL when the allocation fails.
 */
static struct symbol *symbol__new(u64 start, u64 len, const char *name)
{
	size_t namelen = strlen(name) + 1;
	struct symbol *self = calloc(1, (symbol__priv_size +
					 sizeof(*self) + namelen));
	if (!self)
		return NULL;

	/* calloc() already zeroed the private area: just step over it. */
	self = ((void *)self) + symbol__priv_size;

	self->start = start;
	self->end   = len ? start + len - 1 : start;

	pr_debug3("%s: %s %#Lx-%#Lx\n", __func__, name, start, self->end);

	memcpy(self->name, name, namelen);

	return self;
}

98
static void symbol__delete(struct symbol *self)
99
{
100
	free(((void *)self) - symbol__priv_size);
101 102 103 104
}

static size_t symbol__fprintf(struct symbol *self, FILE *fp)
{
105
	return fprintf(fp, " %llx-%llx %s\n",
106 107 108
		       self->start, self->end, self->name);
}

109 110 111 112 113 114 115 116 117 118 119
/*
 * Point ->long_name at @name (the string is not copied) and cache its
 * length in ->long_name_len.
 */
static void dso__set_long_name(struct dso *self, char *name)
{
	const size_t len = strlen(name);

	self->long_name_len = len;
	self->long_name = name;
}

/* Make ->short_name the basename() of the current ->long_name. */
static void dso__set_basename(struct dso *self)
{
	char *base = basename(self->long_name);

	self->short_name = base;
}

120
struct dso *dso__new(const char *name)
121 122 123 124 125
{
	struct dso *self = malloc(sizeof(*self) + strlen(name) + 1);

	if (self != NULL) {
		strcpy(self->name, name);
126
		dso__set_long_name(self, self->name);
127
		self->short_name = self->name;
128
		self->syms = RB_ROOT;
P
Peter Zijlstra 已提交
129
		self->find_symbol = dso__find_symbol;
130
		self->slen_calculated = 0;
131
		self->origin = DSO__ORIG_NOT_FOUND;
132 133
		self->loaded = 0;
		self->has_build_id = 0;
134 135 136 137 138 139 140 141 142 143 144 145 146
	}

	return self;
}

/* Remove every symbol from @self's tree and free it. */
static void dso__delete_symbols(struct dso *self)
{
	struct symbol *pos;
	struct rb_node *next = rb_first(&self->syms);

	while (next) {
		pos = rb_entry(next, struct symbol, rb_node);
		/* Fetch the successor before the node is erased. */
		next = rb_next(&pos->rb_node);
		rb_erase(&pos->rb_node, &self->syms);
		symbol__delete(pos);
	}
}

void dso__delete(struct dso *self)
{
	dso__delete_symbols(self);
155 156
	if (self->long_name != self->name)
		free(self->long_name);
157 158 159
	free(self);
}

160 161 162 163 164 165
/*
 * Copy sizeof(self->build_id) bytes from @build_id into @self and flag the
 * dso as having a build-id.
 */
void dso__set_build_id(struct dso *self, void *build_id)
{
	const size_t id_size = sizeof(self->build_id);

	self->has_build_id = 1;
	memcpy(self->build_id, build_id, id_size);
}

166 167 168 169
static void dso__insert_symbol(struct dso *self, struct symbol *sym)
{
	struct rb_node **p = &self->syms.rb_node;
	struct rb_node *parent = NULL;
170
	const u64 ip = sym->start;
171 172 173 174 175 176 177 178 179 180 181 182 183 184
	struct symbol *s;

	while (*p != NULL) {
		parent = *p;
		s = rb_entry(parent, struct symbol, rb_node);
		if (ip < s->start)
			p = &(*p)->rb_left;
		else
			p = &(*p)->rb_right;
	}
	rb_link_node(&sym->rb_node, parent, p);
	rb_insert_color(&sym->rb_node, &self->syms);
}

185
/*
 * Look up the symbol of @self whose [start, end] range contains @ip.
 * Returns NULL when @self is NULL or no symbol covers @ip.
 */
struct symbol *dso__find_symbol(struct dso *self, u64 ip)
{
	struct rb_node *n;

	if (self == NULL)
		return NULL;

	n = self->syms.rb_node;

	while (n) {
		struct symbol *s = rb_entry(n, struct symbol, rb_node);

		if (ip < s->start)
			n = n->rb_left;
		else if (ip > s->end)
			n = n->rb_right;
		else
			return s;
	}

	return NULL;
}

208
/*
 * Format the @len bytes at @self as lowercase hex into @bf, two characters
 * per byte plus a terminating NUL, so @bf must hold 2 * @len + 1 bytes.
 * Nothing is written when @len is not positive.
 *
 * Returns the number of bytes converted.
 */
int build_id__sprintf(u8 *self, int len, char *bf)
{
	char *bid = bf;
	u8 *raw = self;
	int i;

	for (i = 0; i < len; ++i) {
		sprintf(bid, "%02x", *raw);
		++raw;
		bid += 2;
	}

	return raw - self;
}

223
size_t dso__fprintf_buildid(struct dso *self, FILE *fp)
224 225 226 227
{
	char sbuild_id[BUILD_ID_SIZE * 2 + 1];

	build_id__sprintf(self->build_id, sizeof(self->build_id), sbuild_id);
228 229 230 231 232 233 234 235 236 237
	return fprintf(fp, "%s", sbuild_id);
}

size_t dso__fprintf(struct dso *self, FILE *fp)
{
	struct rb_node *nd;
	size_t ret = fprintf(fp, "dso: %s (", self->short_name);

	ret += dso__fprintf_buildid(self, fp);
	ret += fprintf(fp, ")\n");
238

239 240 241 242 243 244 245 246
	for (nd = rb_first(&self->syms); nd; nd = rb_next(nd)) {
		struct symbol *pos = rb_entry(nd, struct symbol, rb_node);
		ret += symbol__fprintf(pos, fp);
	}

	return ret;
}

247 248 249 250 251
/*
 * Loads the function entries in /proc/kallsyms into kernel_map->dso,
 * so that we can in the next step set the symbol ->end address and then
 * call kernel_maps__split_kallsyms.
 */
252
static int kernel_maps__load_all_kallsyms(void)
253 254 255 256 257 258 259 260 261
{
	char *line = NULL;
	size_t n;
	FILE *file = fopen("/proc/kallsyms", "r");

	if (file == NULL)
		goto out_failure;

	while (!feof(file)) {
262
		u64 start;
263 264 265
		struct symbol *sym;
		int line_len, len;
		char symbol_type;
266
		char *symbol_name;
267 268 269 270 271 272 273 274 275 276

		line_len = getline(&line, &n, file);
		if (line_len < 0)
			break;

		if (!line)
			goto out_failure;

		line[--line_len] = '\0'; /* \n */

277
		len = hex2u64(line, &start);
278 279 280 281 282 283 284 285 286 287 288

		len++;
		if (len + 2 >= line_len)
			continue;

		symbol_type = toupper(line[len]);
		/*
		 * We're interested only in code ('T'ext)
		 */
		if (symbol_type != 'T' && symbol_type != 'W')
			continue;
289 290

		symbol_name = line + len + 2;
291 292 293
		/*
		 * Will fix up the end later, when we have all symbols sorted.
		 */
294
		sym = symbol__new(start, 0, symbol_name);
295

296 297 298
		if (sym == NULL)
			goto out_delete_line;

299 300 301 302 303
		/*
		 * We will pass the symbols to the filter later, in
		 * kernel_maps__split_kallsyms, when we have split the
		 * maps per module
		 */
304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322
		dso__insert_symbol(kernel_map->dso, sym);
	}

	free(line);
	fclose(file);

	return 0;

out_delete_line:
	free(line);
out_failure:
	return -1;
}

/*
 * Split the symbols into maps, making sure there are no overlaps, i.e. the
 * kernel range is broken in several maps, named [kernel].N, as we don't have
 * the original ELF section names vmlinux have.
 */
323
static int kernel_maps__split_kallsyms(symbol_filter_t filter)
324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340
{
	struct map *map = kernel_map;
	struct symbol *pos;
	int count = 0;
	struct rb_node *next = rb_first(&kernel_map->dso->syms);
	int kernel_range = 0;

	while (next) {
		char *module;

		pos = rb_entry(next, struct symbol, rb_node);
		next = rb_next(&pos->rb_node);

		module = strchr(pos->name, '\t');
		if (module) {
			*module++ = '\0';

341 342 343
			if (strcmp(map->dso->name, module)) {
				map = kernel_maps__find_by_dso_name(module);
				if (!map) {
344 345
					pr_err("/proc/{kallsyms,modules} "
					       "inconsistency!\n");
346 347 348
					return -1;
				}
			}
349 350 351 352 353 354 355 356 357 358 359 360 361
			/*
			 * So that we look just like we get from .ko files,
			 * i.e. not prelinked, relative to map->start.
			 */
			pos->start = map->map_ip(map, pos->start);
			pos->end   = map->map_ip(map, pos->end);
		} else if (map != kernel_map) {
			char dso_name[PATH_MAX];
			struct dso *dso;

			snprintf(dso_name, sizeof(dso_name), "[kernel].%d",
				 kernel_range++);

362
			dso = dso__new(dso_name);
363 364 365 366 367 368 369 370
			if (dso == NULL)
				return -1;

			map = map__new2(pos->start, dso);
			if (map == NULL) {
				dso__delete(dso);
				return -1;
			}
371

372
			map->map_ip = map->unmap_ip = identity__map_ip;
373 374 375
			kernel_maps__insert(map);
			++kernel_range;
		}
376

377 378
		if (filter && filter(map, pos)) {
			rb_erase(&pos->rb_node, &kernel_map->dso->syms);
379
			symbol__delete(pos);
380 381 382 383 384
		} else {
			if (map != kernel_map) {
				rb_erase(&pos->rb_node, &kernel_map->dso->syms);
				dso__insert_symbol(map->dso, pos);
			}
385 386
			count++;
		}
387 388
	}

389
	return count;
390
}
391

392

393
/*
 * Load kernel symbols from /proc/kallsyms: read them all into
 * kernel_map->dso, fix up the symbol end addresses, mark the dso as
 * DSO__ORIG_KERNEL and split the symbols into per-range/per-module maps.
 *
 * Returns kernel_maps__split_kallsyms()'s result, or -1 when kallsyms could
 * not be loaded.
 */
static int kernel_maps__load_kallsyms(symbol_filter_t filter)
{
	if (kernel_maps__load_all_kallsyms())
		return -1;

	dso__fixup_sym_end(kernel_map->dso);
	kernel_map->dso->origin = DSO__ORIG_KERNEL;

	return kernel_maps__split_kallsyms(filter);
}

404
size_t kernel_maps__fprintf(FILE *fp)
405
{
406
	size_t printed = fprintf(fp, "Kernel maps:\n");
407 408 409 410 411
	struct rb_node *nd;

	for (nd = rb_first(&kernel_maps); nd; nd = rb_next(nd)) {
		struct map *pos = rb_entry(nd, struct map, rb_node);

412
		printed += fprintf(fp, "Map:");
413
		printed += map__fprintf(pos, fp);
414
		if (verbose > 1) {
415 416 417
			printed += dso__fprintf(pos->dso, fp);
			printed += fprintf(fp, "--\n");
		}
418 419
	}

420
	return printed + fprintf(fp, "END kernel maps\n");
421 422
}

423
static int dso__load_perf_map(struct dso *self, struct map *map,
424
			      symbol_filter_t filter)
425 426 427 428 429 430
{
	char *line = NULL;
	size_t n;
	FILE *file;
	int nr_syms = 0;

431
	file = fopen(self->long_name, "r");
432 433 434 435
	if (file == NULL)
		goto out_failure;

	while (!feof(file)) {
436
		u64 start, size;
437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460
		struct symbol *sym;
		int line_len, len;

		line_len = getline(&line, &n, file);
		if (line_len < 0)
			break;

		if (!line)
			goto out_failure;

		line[--line_len] = '\0'; /* \n */

		len = hex2u64(line, &start);

		len++;
		if (len + 2 >= line_len)
			continue;

		len += hex2u64(line + len, &size);

		len++;
		if (len + 2 >= line_len)
			continue;

461
		sym = symbol__new(start, size, line + len);
462 463 464 465

		if (sym == NULL)
			goto out_delete_line;

466
		if (filter && filter(map, sym))
467
			symbol__delete(sym);
468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484
		else {
			dso__insert_symbol(self, sym);
			nr_syms++;
		}
	}

	free(line);
	fclose(file);

	return nr_syms;

out_delete_line:
	free(line);
out_failure:
	return -1;
}

485 486 487 488
/**
 * elf_symtab__for_each_symbol - iterate thru all the symbols
 *
 * @syms: Elf_Data of the symbol table section to iterate
 * @nr_syms: number of entries in @syms
 * @idx: uint32_t idx
 * @sym: GElf_Sym iterator, filled by gelf_getsym() for entry @idx
 *
 * Note that gelf_getsym() is also invoked once with @idx == @nr_syms when
 * the loop terminates.
 */
#define elf_symtab__for_each_symbol(syms, nr_syms, idx, sym) \
	for (idx = 0, gelf_getsym(syms, idx, &sym);\
	     idx < nr_syms; \
	     idx++, gelf_getsym(syms, idx, &sym))
496 497 498 499 500 501 502 503 504 505

/* Extract the symbol type (STT_*) encoded in @sym's st_info field. */
static inline uint8_t elf_sym__type(const GElf_Sym *sym)
{
	const uint8_t type = GELF_ST_TYPE(sym->st_info);

	return type;
}

static inline int elf_sym__is_function(const GElf_Sym *sym)
{
	return elf_sym__type(sym) == STT_FUNC &&
	       sym->st_name != 0 &&
506
	       sym->st_shndx != SHN_UNDEF;
507 508
}

509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528
/*
 * True for a named STT_NOTYPE symbol whose section index is neither
 * SHN_UNDEF nor SHN_ABS.
 */
static inline int elf_sym__is_label(const GElf_Sym *sym)
{
	if (elf_sym__type(sym) != STT_NOTYPE)
		return 0;

	if (sym->st_name == 0)
		return 0;

	if (sym->st_shndx == SHN_UNDEF || sym->st_shndx == SHN_ABS)
		return 0;

	return 1;
}

/*
 * Name of the section described by @shdr: the string found sh_name bytes
 * into the @secstrs data buffer.
 */
static inline const char *elf_sec__name(const GElf_Shdr *shdr,
					const Elf_Data *secstrs)
{
	const char *strtab = secstrs->d_buf;

	return strtab + shdr->sh_name;
}

/* True when the section's name contains the substring "text". */
static inline int elf_sec__is_text(const GElf_Shdr *shdr,
					const Elf_Data *secstrs)
{
	const char *sec_name = elf_sec__name(shdr, secstrs);

	if (strstr(sec_name, "text") == NULL)
		return 0;

	return 1;
}

529 530 531 532 533 534 535 536
/*
 * Name of @sym: the string found st_name bytes into the @symstrs data
 * buffer.
 */
static inline const char *elf_sym__name(const GElf_Sym *sym,
					const Elf_Data *symstrs)
{
	const char *strtab = symstrs->d_buf;

	return strtab + sym->st_name;
}

/*
 * Find the section of @elf called @name.
 *
 * @ep:  ELF header of @elf, used for the section name string table index
 * @shp: scratch section header; on success it holds the header of the
 *       section that was found
 * @idx: if not NULL, receives the 1-based position of the section in the
 *       elf_nextscn() walk
 *
 * Sections whose header or name cannot be read are skipped rather than
 * compared.  Returns the section, or NULL when none matches.
 */
static Elf_Scn *elf_section_by_name(Elf *elf, GElf_Ehdr *ep,
				    GElf_Shdr *shp, const char *name,
				    size_t *idx)
{
	Elf_Scn *sec = NULL;
	size_t cnt = 1;

	while ((sec = elf_nextscn(elf, sec)) != NULL) {
		char *str = NULL;

		if (gelf_getshdr(sec, shp) != NULL)
			str = elf_strptr(elf, ep->e_shstrndx, shp->sh_name);

		/* elf_strptr() returns NULL on error: never strcmp() that. */
		if (str != NULL && !strcmp(name, str)) {
			if (idx)
				*idx = cnt;
			break;
		}
		++cnt;
	}

	return sec;
}

558 559 560 561 562 563 564 565 566 567
/*
 * Iterate over the first @nr_entries REL entries of @reldata.  On each pass
 * @pos holds the value gelf_getrel() returned for entry @idx, with @pos_mem
 * as the storage handed to it.  gelf_getrel() is also called once with
 * @idx == @nr_entries when the loop terminates.
 */
#define elf_section__for_each_rel(reldata, pos, pos_mem, idx, nr_entries) \
	for (idx = 0, pos = gelf_getrel(reldata, 0, &pos_mem); \
	     idx < nr_entries; \
	     ++idx, pos = gelf_getrel(reldata, idx, &pos_mem))

/*
 * Counterpart of elf_section__for_each_rel for RELA entries, fetched with
 * gelf_getrela().
 */
#define elf_section__for_each_rela(reldata, pos, pos_mem, idx, nr_entries) \
	for (idx = 0, pos = gelf_getrela(reldata, 0, &pos_mem); \
	     idx < nr_entries; \
	     ++idx, pos = gelf_getrela(reldata, idx, &pos_mem))

568 569 570 571 572 573 574
/*
 * We need to check if we have a .dynsym, so that we can handle the
 * .plt, synthesizing its symbols, that aren't on the symtabs (be it
 * .dynsym or .symtab).
 * And always look at the original dso, not at debuginfo packages, that
 * have the PLT data stripped out (shdr_rel_plt.sh_type == SHT_NOBITS).
 */
575 576
static int dso__synthesize_plt_symbols(struct  dso *self, struct map *map,
				       symbol_filter_t filter)
577 578 579
{
	uint32_t nr_rel_entries, idx;
	GElf_Sym sym;
580
	u64 plt_offset;
581 582
	GElf_Shdr shdr_plt;
	struct symbol *f;
583
	GElf_Shdr shdr_rel_plt, shdr_dynsym;
584
	Elf_Data *reldata, *syms, *symstrs;
585 586 587
	Elf_Scn *scn_plt_rel, *scn_symstrs, *scn_dynsym;
	size_t dynsym_idx;
	GElf_Ehdr ehdr;
588
	char sympltname[1024];
589 590 591
	Elf *elf;
	int nr = 0, symidx, fd, err = 0;

592
	fd = open(self->long_name, O_RDONLY);
593 594 595
	if (fd < 0)
		goto out;

596
	elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
597 598 599 600 601 602 603 604 605 606
	if (elf == NULL)
		goto out_close;

	if (gelf_getehdr(elf, &ehdr) == NULL)
		goto out_elf_end;

	scn_dynsym = elf_section_by_name(elf, &ehdr, &shdr_dynsym,
					 ".dynsym", &dynsym_idx);
	if (scn_dynsym == NULL)
		goto out_elf_end;
607

608
	scn_plt_rel = elf_section_by_name(elf, &ehdr, &shdr_rel_plt,
609 610
					  ".rela.plt", NULL);
	if (scn_plt_rel == NULL) {
611
		scn_plt_rel = elf_section_by_name(elf, &ehdr, &shdr_rel_plt,
612 613
						  ".rel.plt", NULL);
		if (scn_plt_rel == NULL)
614
			goto out_elf_end;
615 616
	}

617 618
	err = -1;

619
	if (shdr_rel_plt.sh_link != dynsym_idx)
620
		goto out_elf_end;
621

622 623
	if (elf_section_by_name(elf, &ehdr, &shdr_plt, ".plt", NULL) == NULL)
		goto out_elf_end;
624 625

	/*
626
	 * Fetch the relocation section to find the idxes to the GOT
627 628 629 630
	 * and the symbols in the .dynsym they refer to.
	 */
	reldata = elf_getdata(scn_plt_rel, NULL);
	if (reldata == NULL)
631
		goto out_elf_end;
632 633 634

	syms = elf_getdata(scn_dynsym, NULL);
	if (syms == NULL)
635
		goto out_elf_end;
636

637
	scn_symstrs = elf_getscn(elf, shdr_dynsym.sh_link);
638
	if (scn_symstrs == NULL)
639
		goto out_elf_end;
640 641 642

	symstrs = elf_getdata(scn_symstrs, NULL);
	if (symstrs == NULL)
643
		goto out_elf_end;
644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659

	nr_rel_entries = shdr_rel_plt.sh_size / shdr_rel_plt.sh_entsize;
	plt_offset = shdr_plt.sh_offset;

	if (shdr_rel_plt.sh_type == SHT_RELA) {
		GElf_Rela pos_mem, *pos;

		elf_section__for_each_rela(reldata, pos, pos_mem, idx,
					   nr_rel_entries) {
			symidx = GELF_R_SYM(pos->r_info);
			plt_offset += shdr_plt.sh_entsize;
			gelf_getsym(syms, symidx, &sym);
			snprintf(sympltname, sizeof(sympltname),
				 "%s@plt", elf_sym__name(&sym, symstrs));

			f = symbol__new(plt_offset, shdr_plt.sh_entsize,
660
					sympltname);
661
			if (!f)
662
				goto out_elf_end;
663

664 665 666 667 668 669
			if (filter && filter(map, f))
				symbol__delete(f);
			else {
				dso__insert_symbol(self, f);
				++nr;
			}
670 671 672 673 674 675 676 677 678 679 680 681
		}
	} else if (shdr_rel_plt.sh_type == SHT_REL) {
		GElf_Rel pos_mem, *pos;
		elf_section__for_each_rel(reldata, pos, pos_mem, idx,
					  nr_rel_entries) {
			symidx = GELF_R_SYM(pos->r_info);
			plt_offset += shdr_plt.sh_entsize;
			gelf_getsym(syms, symidx, &sym);
			snprintf(sympltname, sizeof(sympltname),
				 "%s@plt", elf_sym__name(&sym, symstrs));

			f = symbol__new(plt_offset, shdr_plt.sh_entsize,
682
					sympltname);
683
			if (!f)
684
				goto out_elf_end;
685

686 687 688 689 690 691
			if (filter && filter(map, f))
				symbol__delete(f);
			else {
				dso__insert_symbol(self, f);
				++nr;
			}
692 693 694
		}
	}

695 696 697 698 699 700 701 702 703
	err = 0;
out_elf_end:
	elf_end(elf);
out_close:
	close(fd);

	if (err == 0)
		return nr;
out:
704 705
	pr_warning("%s: problems reading %s PLT info.\n",
		   __func__, self->long_name);
706
	return 0;
707 708
}

709 710
/*
 * Load function and text-label symbols from the ELF file open on @fd.
 *
 * @self/@map: dso being loaded and the map it is reached through
 * @name:      file name, used only in error messages
 * @filter:    optional callback; symbols it returns non-zero for are dropped
 * @kernel/@kmodule: when either is set, symbols living in a section other
 *             than ".text" go to a separate dso/map named
 *             "<short_name><section>", created on first use; demangling and
 *             address adjustment are skipped for such files
 *
 * .symtab is used when present, .dynsym otherwise.  @fd is not closed here.
 *
 * Returns the number of symbols inserted, or -1 on error (including a
 * symbol table section with a zero sh_entsize).
 */
static int dso__load_sym(struct dso *self, struct map *map, const char *name,
			 int fd, symbol_filter_t filter, int kernel,
			 int kmodule)
{
	struct map *curr_map = map;
	struct dso *curr_dso = self;
	size_t dso_name_len = strlen(self->short_name);
	Elf_Data *symstrs, *secstrs;
	uint32_t nr_syms;
	int err = -1;
	uint32_t idx;
	GElf_Ehdr ehdr;
	GElf_Shdr shdr;
	Elf_Data *syms;
	GElf_Sym sym;
	Elf_Scn *sec, *sec_strndx;
	Elf *elf;
	int nr = 0;

	elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
	if (elf == NULL) {
		pr_err("%s: cannot read %s ELF file.\n", __func__, name);
		goto out_close;
	}

	if (gelf_getehdr(elf, &ehdr) == NULL) {
		pr_err("%s: cannot get elf header.\n", __func__);
		goto out_elf_end;
	}

	sec = elf_section_by_name(elf, &ehdr, &shdr, ".symtab", NULL);
	if (sec == NULL) {
		sec = elf_section_by_name(elf, &ehdr, &shdr, ".dynsym", NULL);
		if (sec == NULL)
			goto out_elf_end;
	}

	syms = elf_getdata(sec, NULL);
	if (syms == NULL)
		goto out_elf_end;

	sec = elf_getscn(elf, shdr.sh_link);
	if (sec == NULL)
		goto out_elf_end;

	symstrs = elf_getdata(sec, NULL);
	if (symstrs == NULL)
		goto out_elf_end;

	sec_strndx = elf_getscn(elf, ehdr.e_shstrndx);
	if (sec_strndx == NULL)
		goto out_elf_end;

	secstrs = elf_getdata(sec_strndx, NULL);
	if (secstrs == NULL)
		goto out_elf_end;

	/* A malformed header must not make us divide by zero. */
	if (shdr.sh_entsize == 0)
		goto out_elf_end;

	nr_syms = shdr.sh_size / shdr.sh_entsize;

	memset(&sym, 0, sizeof(sym));
	if (!kernel) {
		self->adjust_symbols = (ehdr.e_type == ET_EXEC ||
				elf_section_by_name(elf, &ehdr, &shdr,
						     ".gnu.prelink_undo",
						     NULL) != NULL);
	} else self->adjust_symbols = 0;

	elf_symtab__for_each_symbol(syms, nr_syms, idx, sym) {
		struct symbol *f;
		const char *elf_name;
		char *demangled = NULL;
		int is_label = elf_sym__is_label(&sym);
		const char *section_name;

		if (!is_label && !elf_sym__is_function(&sym))
			continue;

		sec = elf_getscn(elf, sym.st_shndx);
		if (!sec)
			goto out_elf_end;

		gelf_getshdr(sec, &shdr);

		if (is_label && !elf_sec__is_text(&shdr, secstrs))
			continue;

		elf_name = elf_sym__name(&sym, symstrs);
		section_name = elf_sec__name(&shdr, secstrs);

		if (kernel || kmodule) {
			char dso_name[PATH_MAX];

			/*
			 * Per-section dsos are named short_name + section,
			 * so skipping dso_name_len characters leaves the
			 * section the current dso stands for.
			 */
			if (strcmp(section_name,
				   curr_dso->short_name + dso_name_len) == 0)
				goto new_symbol;

			if (strcmp(section_name, ".text") == 0) {
				curr_map = map;
				curr_dso = self;
				goto new_symbol;
			}

			snprintf(dso_name, sizeof(dso_name),
				 "%s%s", self->short_name, section_name);

			curr_map = kernel_maps__find_by_dso_name(dso_name);
			if (curr_map == NULL) {
				u64 start = sym.st_value;

				if (kmodule)
					start += map->start + shdr.sh_offset;

				curr_dso = dso__new(dso_name);
				if (curr_dso == NULL)
					goto out_elf_end;
				curr_map = map__new2(start, curr_dso);
				if (curr_map == NULL) {
					dso__delete(curr_dso);
					goto out_elf_end;
				}
				curr_map->map_ip = identity__map_ip;
				curr_map->unmap_ip = identity__map_ip;
				curr_dso->origin = DSO__ORIG_KERNEL;
				kernel_maps__insert(curr_map);
				dsos__add(curr_dso);
			} else
				curr_dso = curr_map->dso;

			goto new_symbol;
		}

		if (curr_dso->adjust_symbols) {
			pr_debug2("adjusting symbol: st_value: %Lx sh_addr: "
				  "%Lx sh_offset: %Lx\n", (u64)sym.st_value,
				  (u64)shdr.sh_addr, (u64)shdr.sh_offset);
			sym.st_value -= shdr.sh_addr - shdr.sh_offset;
		}
		/*
		 * We need to figure out if the object was created from C++ sources
		 * DWARF DW_compile_unit has this, but we don't always have access
		 * to it...
		 */
		demangled = bfd_demangle(NULL, elf_name, DMGL_PARAMS | DMGL_ANSI);
		if (demangled != NULL)
			elf_name = demangled;
new_symbol:
		f = symbol__new(sym.st_value, sym.st_size, elf_name);
		/* symbol__new() copied the name; NULL when not demangled. */
		free(demangled);
		if (!f)
			goto out_elf_end;

		if (filter && filter(curr_map, f))
			symbol__delete(f);
		else {
			dso__insert_symbol(curr_dso, f);
			nr++;
		}
	}

	/*
	 * For misannotated, zeroed, ASM function sizes.
	 */
	if (nr > 0)
		dso__fixup_sym_end(self);
	err = nr;
out_elf_end:
	elf_end(elf);
out_close:
	return err;
}

880 881 882 883 884
/*
 * True when the first sizeof(self->build_id) bytes at @build_id are
 * identical to @self's build-id.
 */
static bool dso__build_id_equal(const struct dso *self, u8 *build_id)
{
	const size_t id_size = sizeof(self->build_id);

	return !memcmp(self->build_id, build_id, id_size);
}

885
bool dsos__read_build_ids(void)
886
{
887
	bool have_build_id = false;
888 889
	struct dso *pos;

890 891 892 893 894 895
	list_for_each_entry(pos, &dsos, node)
		if (filename__read_build_id(pos->long_name, pos->build_id,
					    sizeof(pos->build_id)) > 0) {
			have_build_id	  = true;
			pos->has_build_id = true;
		}
896

897
	return have_build_id;
898 899
}

900 901 902 903 904
/*
 * Round @n up to the next multiple of 4, the alignment used for the name
 * and descriptor fields of an ELF note.
 */
#define NOTE_ALIGN(n) (((n) + 3) & ~3U)

905
int filename__read_build_id(const char *filename, void *bf, size_t size)
906
{
907
	int fd, err = -1;
908 909
	GElf_Ehdr ehdr;
	GElf_Shdr shdr;
910
	Elf_Data *data;
911
	Elf_Scn *sec;
912
	void *ptr;
913 914
	Elf *elf;

915 916 917 918
	if (size < BUILD_ID_SIZE)
		goto out;

	fd = open(filename, O_RDONLY);
919 920 921
	if (fd < 0)
		goto out;

922
	elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
923
	if (elf == NULL) {
924
		pr_debug2("%s: cannot read %s ELF file.\n", __func__, filename);
925 926 927 928
		goto out_close;
	}

	if (gelf_getehdr(elf, &ehdr) == NULL) {
929
		pr_err("%s: cannot get elf header.\n", __func__);
930 931 932
		goto out_elf_end;
	}

933 934
	sec = elf_section_by_name(elf, &ehdr, &shdr,
				  ".note.gnu.build-id", NULL);
935 936 937 938 939 940
	if (sec == NULL) {
		sec = elf_section_by_name(elf, &ehdr, &shdr,
					  ".notes", NULL);
		if (sec == NULL)
			goto out_elf_end;
	}
941

942 943
	data = elf_getdata(sec, NULL);
	if (data == NULL)
944
		goto out_elf_end;
945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965

	ptr = data->d_buf;
	while (ptr < (data->d_buf + data->d_size)) {
		GElf_Nhdr *nhdr = ptr;
		int namesz = NOTE_ALIGN(nhdr->n_namesz),
		    descsz = NOTE_ALIGN(nhdr->n_descsz);
		const char *name;

		ptr += sizeof(*nhdr);
		name = ptr;
		ptr += namesz;
		if (nhdr->n_type == NT_GNU_BUILD_ID &&
		    nhdr->n_namesz == sizeof("GNU")) {
			if (memcmp(name, "GNU", sizeof("GNU")) == 0) {
				memcpy(bf, ptr, BUILD_ID_SIZE);
				err = BUILD_ID_SIZE;
				break;
			}
		}
		ptr += descsz;
	}
966 967 968 969 970 971 972 973
out_elf_end:
	elf_end(elf);
out_close:
	close(fd);
out:
	return err;
}

974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992
int sysfs__read_build_id(const char *filename, void *build_id, size_t size)
{
	int fd, err = -1;

	if (size < BUILD_ID_SIZE)
		goto out;

	fd = open(filename, O_RDONLY);
	if (fd < 0)
		goto out;

	while (1) {
		char bf[BUFSIZ];
		GElf_Nhdr nhdr;
		int namesz, descsz;

		if (read(fd, &nhdr, sizeof(nhdr)) != sizeof(nhdr))
			break;

993 994
		namesz = NOTE_ALIGN(nhdr.n_namesz);
		descsz = NOTE_ALIGN(nhdr.n_descsz);
995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017
		if (nhdr.n_type == NT_GNU_BUILD_ID &&
		    nhdr.n_namesz == sizeof("GNU")) {
			if (read(fd, bf, namesz) != namesz)
				break;
			if (memcmp(bf, "GNU", sizeof("GNU")) == 0) {
				if (read(fd, build_id,
				    BUILD_ID_SIZE) == BUILD_ID_SIZE) {
					err = 0;
					break;
				}
			} else if (read(fd, bf, descsz) != descsz)
				break;
		} else {
			int n = namesz + descsz;
			if (read(fd, bf, n) != n)
				break;
		}
	}
	close(fd);
out:
	return err;
}

1018 1019 1020 1021 1022 1023 1024 1025 1026
/*
 * One-character tag for where @self's symbol table came from.  Returns '!'
 * when @self is NULL or its origin is DSO__ORIG_NOT_FOUND.
 */
char dso__symtab_origin(const struct dso *self)
{
	static const char origin[] = {
		[DSO__ORIG_KERNEL] =   'k',
		[DSO__ORIG_JAVA_JIT] = 'j',
		[DSO__ORIG_FEDORA] =   'f',
		[DSO__ORIG_UBUNTU] =   'u',
		[DSO__ORIG_BUILDID] =  'b',
		[DSO__ORIG_DSO] =      'd',
		[DSO__ORIG_KMODULE] =  'K',
	};

	/* NOT_FOUND has no slot in the table, so filter it out first. */
	if (self == NULL || self->origin == DSO__ORIG_NOT_FOUND)
		return '!';
	return origin[self->origin];
}

1035
/*
 * Load the symbols of @self, marking it as loaded.
 *
 * Kernel dsos are handed to dso__load_kernel_sym().  A dso whose name starts
 * with "/tmp/perf-" is read with dso__load_perf_map().  Anything else is
 * looked for, in this order, at:
 *   /usr/lib/debug<long_name>.debug
 *   /usr/lib/debug<long_name>
 *   /usr/lib/debug/.build-id/xx/yyyy.debug (when the dso file has a build-id)
 *   <long_name>
 * ->origin records which candidate is being tried.  When @self has a
 * build-id, candidates with a missing or different build-id are skipped.
 * A candidate yielding zero symbols makes the search go on; PLT symbols are
 * synthesized once a candidate yielded some.
 *
 * Returns the number of symbols loaded.  A negative result is turned into 0
 * when the dso name contains " (deleted)"; otherwise it is returned as is.
 */
int dso__load(struct dso *self, struct map *map, symbol_filter_t filter)
{
	int size = PATH_MAX;
	char *name;
	u8 build_id[BUILD_ID_SIZE];
	int ret = -1;
	int fd;

	self->loaded = 1;

	if (self->kernel)
		return dso__load_kernel_sym(self, map, filter);

	name = malloc(size);
	if (!name)
		return -1;

	self->adjust_symbols = 0;

	if (strncmp(self->name, "/tmp/perf-", 10) == 0) {
		ret = dso__load_perf_map(self, map, filter);
		self->origin = ret > 0 ? DSO__ORIG_JAVA_JIT :
					 DSO__ORIG_NOT_FOUND;
		/* The path buffer is not needed on this route. */
		free(name);
		return ret;
	}

	self->origin = DSO__ORIG_FEDORA - 1;

more:
	do {
		self->origin++;
		switch (self->origin) {
		case DSO__ORIG_FEDORA:
			snprintf(name, size, "/usr/lib/debug%s.debug",
				 self->long_name);
			break;
		case DSO__ORIG_UBUNTU:
			snprintf(name, size, "/usr/lib/debug%s",
				 self->long_name);
			break;
		case DSO__ORIG_BUILDID:
			/*
			 * Only a positive result means build_id was filled
			 * in; -1 must not be taken for success.
			 */
			if (filename__read_build_id(self->long_name, build_id,
						    sizeof(build_id)) > 0) {
				char build_id_hex[BUILD_ID_SIZE * 2 + 1];

				build_id__sprintf(build_id, sizeof(build_id),
						  build_id_hex);
				snprintf(name, size,
					 "/usr/lib/debug/.build-id/%.2s/%s.debug",
					build_id_hex, build_id_hex + 2);
				if (self->has_build_id)
					goto compare_build_id;
				break;
			}
			self->origin++;
			/* Fall thru */
		case DSO__ORIG_DSO:
			snprintf(name, size, "%s", self->long_name);
			break;

		default:
			goto out;
		}

		if (self->has_build_id) {
			if (filename__read_build_id(name, build_id,
						    sizeof(build_id)) < 0)
				goto more;
compare_build_id:
			if (!dso__build_id_equal(self, build_id))
				goto more;
		}

		fd = open(name, O_RDONLY);
	} while (fd < 0);

	ret = dso__load_sym(self, map, name, fd, filter, 0, 0);
	close(fd);

	/*
	 * Some people seem to have debuginfo files _WITHOUT_ debug info!?!?
	 */
	if (!ret)
		goto more;

	if (ret > 0) {
		int nr_plt = dso__synthesize_plt_symbols(self, map, filter);
		if (nr_plt > 0)
			ret += nr_plt;
	}
out:
	free(name);
	if (ret < 0 && strstr(self->name, " (deleted)") != NULL)
		return 0;
	return ret;
}

1132 1133 1134
struct map *kernel_map;

static void kernel_maps__insert(struct map *map)
1135
{
1136 1137
	maps__insert(&kernel_maps, map);
}
1138

1139 1140
/*
 * Resolve @ip to a symbol through the kernel maps.
 *
 * @mapp: if not NULL, receives the map found for @ip (NULL when none)
 *
 * @ip is translated with the map's ->map_ip() before the symbol lookup.
 * Returns NULL when no map covers @ip or the lookup finds nothing.
 */
struct symbol *kernel_maps__find_symbol(u64 ip, struct map **mapp,
					symbol_filter_t filter)
{
	struct map *map = maps__find(&kernel_maps, ip);

	if (mapp)
		*mapp = map;

	if (map) {
		ip = map->map_ip(map, ip);
		return map__find_symbol(map, ip, filter);
	}

	return NULL;
}

/*
 * Walk kernel_maps in order and return the first map whose dso is called
 * @name, or NULL when there is none.  Maps without a dso are ignored.
 */
struct map *kernel_maps__find_by_dso_name(const char *name)
{
	struct rb_node *node = rb_first(&kernel_maps);

	while (node != NULL) {
		struct map *candidate = rb_entry(node, struct map, rb_node);

		if (candidate->dso != NULL &&
		    !strcmp(candidate->dso->name, name))
			return candidate;

		node = rb_next(node);
	}

	return NULL;
}

1169
static int dsos__set_modules_path_dir(char *dirname)
1170
{
1171 1172
	struct dirent *dent;
	DIR *dir = opendir(dirname);
1173

1174
	if (!dir) {
1175
		pr_err("%s: cannot open %s dir\n", __func__, dirname);
1176 1177
		return -1;
	}
1178

1179 1180 1181 1182 1183 1184 1185 1186 1187 1188
	while ((dent = readdir(dir)) != NULL) {
		char path[PATH_MAX];

		if (dent->d_type == DT_DIR) {
			if (!strcmp(dent->d_name, ".") ||
			    !strcmp(dent->d_name, ".."))
				continue;

			snprintf(path, sizeof(path), "%s/%s",
				 dirname, dent->d_name);
1189
			if (dsos__set_modules_path_dir(path) < 0)
1190 1191 1192 1193 1194
				goto failure;
		} else {
			char *dot = strrchr(dent->d_name, '.'),
			     dso_name[PATH_MAX];
			struct map *map;
1195
			char *long_name;
1196 1197 1198 1199 1200 1201

			if (dot == NULL || strcmp(dot, ".ko"))
				continue;
			snprintf(dso_name, sizeof(dso_name), "[%.*s]",
				 (int)(dot - dent->d_name), dent->d_name);

1202
			strxfrchar(dso_name, '-', '_');
1203 1204 1205 1206 1207 1208 1209
			map = kernel_maps__find_by_dso_name(dso_name);
			if (map == NULL)
				continue;

			snprintf(path, sizeof(path), "%s/%s",
				 dirname, dent->d_name);

1210 1211
			long_name = strdup(path);
			if (long_name == NULL)
1212
				goto failure;
1213
			dso__set_long_name(map->dso, long_name);
1214 1215
		}
	}
1216

1217
	return 0;
1218 1219 1220 1221
failure:
	closedir(dir);
	return -1;
}
1222

1223
static int dsos__set_modules_path(void)
1224 1225 1226
{
	struct utsname uts;
	char modules_path[PATH_MAX];
1227

1228 1229
	if (uname(&uts) < 0)
		return -1;
1230

1231 1232
	snprintf(modules_path, sizeof(modules_path), "/lib/modules/%s/kernel",
		 uts.release);
1233

1234
	return dsos__set_modules_path_dir(modules_path);
1235 1236
}

1237 1238 1239 1240 1241 1242
/*
 * Constructor variant for modules (where we know from /proc/modules where
 * they are loaded) and for vmlinux, where only after we load all the
 * symbols we'll know where it starts and ends.
 *
 * Returns a map for @dso initialised with map__init(self, @start, 0, 0,
 * @dso), or NULL when the allocation fails.
 */
static struct map *map__new2(u64 start, struct dso *dso)
{
	struct map *self = malloc(sizeof(*self));

	if (self != NULL) {
		/*
		 * ->end will be filled after we load all the symbols
		 */
		map__init(self, start, 0, 0, dso);
	}

	return self;
}

1256
static int kernel_maps__create_module_maps(void)
1257 1258 1259 1260 1261
{
	char *line = NULL;
	size_t n;
	FILE *file = fopen("/proc/modules", "r");
	struct map *map;
1262

1263 1264
	if (file == NULL)
		return -1;
1265

1266 1267 1268 1269 1270 1271
	while (!feof(file)) {
		char name[PATH_MAX];
		u64 start;
		struct dso *dso;
		char *sep;
		int line_len;
1272

1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294
		line_len = getline(&line, &n, file);
		if (line_len < 0)
			break;

		if (!line)
			goto out_failure;

		line[--line_len] = '\0'; /* \n */

		sep = strrchr(line, 'x');
		if (sep == NULL)
			continue;

		hex2u64(sep + 1, &start);

		sep = strchr(line, ' ');
		if (sep == NULL)
			continue;

		*sep = '\0';

		snprintf(name, sizeof(name), "[%s]", line);
1295
		dso = dso__new(name);
1296 1297 1298 1299 1300 1301 1302 1303

		if (dso == NULL)
			goto out_delete_line;

		map = map__new2(start, dso);
		if (map == NULL) {
			dso__delete(dso);
			goto out_delete_line;
1304
		}
1305

1306 1307 1308 1309 1310 1311
		snprintf(name, sizeof(name),
			 "/sys/module/%s/notes/.note.gnu.build-id", line);
		if (sysfs__read_build_id(name, dso->build_id,
					 sizeof(dso->build_id)) == 0)
			dso->has_build_id = true;

1312 1313 1314
		dso->origin = DSO__ORIG_KMODULE;
		kernel_maps__insert(map);
		dsos__add(dso);
1315
	}
1316 1317 1318 1319

	free(line);
	fclose(file);

1320 1321 1322 1323 1324 1325 1326
	/*
	 * Now that we have all sorted out, just set the ->end of all
	 * maps:
	 */
	kernel_maps__fixup_end();

	return dsos__set_modules_path();
1327 1328 1329 1330 1331

out_delete_line:
	free(line);
out_failure:
	return -1;
1332 1333
}

1334
/*
 * Open @vmlinux read-only and load its symbols into @self / @map through
 * dso__load_sym().  @self is marked as loaded whether or not the open
 * succeeds.
 *
 * Returns -1 if the file cannot be opened, otherwise whatever
 * dso__load_sym() returns.
 */
static int dso__load_vmlinux(struct dso *self, struct map *map,
			     const char *vmlinux, symbol_filter_t filter)
{
	int fd, ret;

	fd = open(vmlinux, O_RDONLY);

	/* Set unconditionally, even when the open above failed */
	self->loaded = 1;

	if (fd < 0)
		return -1;

	/* Note: the name handed to the loader is ->long_name, not @vmlinux */
	ret = dso__load_sym(self, map, self->long_name, fd, filter, 1, 0);
	close(fd);

	return ret;
}

1351 1352
/*
 * Load the kernel symbols: first from the file named by self->name via
 * dso__load_vmlinux(); if that yields a result <= 0, fall back to
 * kernel_maps__load_kallsyms().  On a positive result the start and end of
 * @map are fixed up.
 *
 * Returns the result of whichever loader ran last.
 */
static int dso__load_kernel_sym(struct dso *self, struct map *map,
				symbol_filter_t filter)
{
	int ret = dso__load_vmlinux(self, map, self->name, filter);

	if (ret <= 0)
		ret = kernel_maps__load_kallsyms(filter);

	/* Nothing loaded (or an error): leave the map boundaries alone */
	if (ret <= 0)
		return ret;

	map__fixup_start(map);
	map__fixup_end(map);

	return ret;
}

1367 1368 1369
LIST_HEAD(dsos);
struct dso	*vdso;

1370
/* Name given to dso__new() when kernel_maps__create_kernel_map() creates the kernel dso. */
const char	*vmlinux_name = "vmlinux";
1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 1386

/* Append @dso to the tail of the global dsos list. */
static void dsos__add(struct dso *dso)
{
	list_add_tail(&dso->node, &dsos);
}

static struct dso *dsos__find(const char *name)
{
	struct dso *pos;

	list_for_each_entry(pos, &dsos, node)
		if (strcmp(pos->name, name) == 0)
			return pos;
	return NULL;
}

1387
/*
 * Return the dso called @name from the global dsos list, creating it when
 * it is not there yet.  A newly created dso is added to the list and then
 * has its basename set.
 *
 * Returns NULL only if a new dso was needed and dso__new() failed.
 */
struct dso *dsos__findnew(const char *name)
{
	struct dso *dso = dsos__find(name);

	/* Already known: hand back the existing entry */
	if (dso != NULL)
		return dso;

	dso = dso__new(name);
	if (dso == NULL)
		return NULL;

	dsos__add(dso);
	dso__set_basename(dso);

	return dso;
}

void dsos__fprintf(FILE *fp)
{
	struct dso *pos;

	list_for_each_entry(pos, &dsos, node)
		dso__fprintf(pos, fp);
}

1410 1411 1412 1413 1414 1415 1416
/*
 * For every dso in the global dsos list, print its build-id (through
 * dso__fprintf_buildid()) followed by a space, its long name and a newline.
 *
 * Returns the sum of the values returned by the individual print calls.
 */
size_t dsos__fprintf_buildid(FILE *fp)
{
	size_t printed = 0;
	struct dso *iter;

	list_for_each_entry(iter, &dsos, node) {
		printed += dso__fprintf_buildid(iter, fp);
		printed += fprintf(fp, " %s\n", iter->long_name);
	}

	return printed;
}

1422
static int kernel_maps__create_kernel_map(void)
1423
{
1424
	struct dso *kernel = dso__new(vmlinux_name);
1425

1426
	if (kernel == NULL)
1427 1428 1429 1430 1431 1432 1433
		return -1;

	kernel_map = map__new2(0, kernel);
	if (kernel_map == NULL)
		goto out_delete_kernel_dso;

	kernel_map->map_ip = kernel_map->unmap_ip = identity__map_ip;
1434 1435

	kernel->short_name = "[kernel]";
1436
	kernel->kernel = 1;
1437
	vdso = dso__new("[vdso]");
1438 1439
	if (vdso == NULL)
		goto out_delete_kernel_map;
1440 1441 1442 1443

	if (sysfs__read_build_id("/sys/kernel/notes", kernel->build_id,
				 sizeof(kernel->build_id)) == 0)
		kernel->has_build_id = true;
1444

1445
	kernel_maps__insert(kernel_map);
1446
	dsos__add(kernel);
1447 1448
	dsos__add(vdso);

1449 1450 1451 1452 1453 1454 1455 1456
	return 0;

out_delete_kernel_map:
	map__delete(kernel_map);
	kernel_map = NULL;
out_delete_kernel_dso:
	dso__delete(kernel);
	return -1;
1457 1458
}

1459
/*
 * Set up the kernel map and, when @use_modules is true, the module maps.
 *
 * Failing to create the module maps only produces a warning.  Returns -1
 * solely when the kernel map itself cannot be created, 0 otherwise.
 */
int kernel_maps__init(bool use_modules)
{
	if (kernel_maps__create_kernel_map() < 0)
		return -1;

	if (!use_modules)
		return 0;

	/* Best effort: carry on without module information */
	if (kernel_maps__create_module_maps() < 0)
		pr_warning("Failed to load list of modules in use, "
			   "continuing...\n");

	return 0;
}

1471
void symbol__init(unsigned int priv_size)
1472 1473
{
	elf_version(EV_CURRENT);
1474
	symbol__priv_size = priv_size;
1475
}