symbol.c 31.4 KB
Newer Older
1 2
#include "util.h"
#include "../perf.h"
3
#include "string.h"
4
#include "symbol.h"
5
#include "thread.h"
6

7 8
#include "debug.h"

9 10 11
#include <libelf.h>
#include <gelf.h>
#include <elf.h>
12
#include <limits.h>
13
#include <sys/utsname.h>
P
Peter Zijlstra 已提交
14

15 16 17 18 19 20 21
/*
 * Where the symbols of a dso were obtained from.
 *
 * The relative order of FEDORA..DSO matters: dso__load() starts at
 * DSO__ORIG_FEDORA - 1 and increments ->origin to try each location in turn.
 * dso__symtab_origin() maps every value except NOT_FOUND to a one letter tag.
 */
enum dso_origin {
	DSO__ORIG_KERNEL = 0,
	DSO__ORIG_JAVA_JIT,
	DSO__ORIG_FEDORA,
	DSO__ORIG_UBUNTU,
	DSO__ORIG_BUILDID,
	DSO__ORIG_DSO,
	DSO__ORIG_KMODULE,
	DSO__ORIG_NOT_FOUND,
};

26 27
static void dsos__add(struct dso *dso);
static struct dso *dsos__find(const char *name);
28 29
static struct map *map__new2(u64 start, struct dso *dso);
static void kernel_maps__insert(struct map *map);
30 31
static int dso__load_kernel_sym(struct dso *self, struct map *map,
				symbol_filter_t filter);
32
unsigned int symbol__priv_size;
33

34 35
static struct rb_root kernel_maps;

36
static void dso__fixup_sym_end(struct dso *self)
37 38
{
	struct rb_node *nd, *prevnd = rb_first(&self->syms);
39
	struct symbol *curr, *prev;
40 41 42 43

	if (prevnd == NULL)
		return;

44 45
	curr = rb_entry(prevnd, struct symbol, rb_node);

46
	for (nd = rb_next(prevnd); nd; nd = rb_next(nd)) {
47 48
		prev = curr;
		curr = rb_entry(nd, struct symbol, rb_node);
49 50 51 52

		if (prev->end == prev->start)
			prev->end = curr->start - 1;
	}
53 54 55 56

	/* Last entry */
	if (curr->end == curr->start)
		curr->end = roundup(curr->start, 4096);
57 58
}

59
static void kernel_maps__fixup_end(void)
60 61 62 63 64 65 66 67 68 69 70 71 72
{
	struct map *prev, *curr;
	struct rb_node *nd, *prevnd = rb_first(&kernel_maps);

	if (prevnd == NULL)
		return;

	curr = rb_entry(prevnd, struct map, rb_node);

	for (nd = rb_next(prevnd); nd; nd = rb_next(nd)) {
		prev = curr;
		curr = rb_entry(nd, struct map, rb_node);
		prev->end = curr->start - 1;
73
	}
74 75
}

76
/*
 * Allocate a symbol named @name covering [@start, @start + @len - 1].
 *
 * A single zeroed allocation holds, in this order: symbol__priv_size bytes
 * of private area, the struct symbol itself and a copy of @name.  The
 * returned pointer points at the struct symbol, past the private area, so it
 * must be released with symbol__delete(), not free().
 *
 * A @len of 0 yields end == start.
 *
 * Returns NULL if the allocation fails.
 */
static struct symbol *symbol__new(u64 start, u64 len, const char *name)
{
	size_t namelen = strlen(name) + 1;
	struct symbol *self = calloc(1, (symbol__priv_size +
					 sizeof(*self) + namelen));
	if (!self)
		return NULL;

	/* calloc() already zeroed the private area, just step over it. */
	if (symbol__priv_size)
		self = ((void *)self) + symbol__priv_size;

	self->start = start;
	self->end   = len ? start + len - 1 : start;

	pr_debug3("%s: %s %#Lx-%#Lx\n", __func__, name, start, self->end);

	memcpy(self->name, name, namelen);

	return self;
}

98
static void symbol__delete(struct symbol *self)
99
{
100
	free(((void *)self) - symbol__priv_size);
101 102 103 104
}

static size_t symbol__fprintf(struct symbol *self, FILE *fp)
{
105
	return fprintf(fp, " %llx-%llx %s\n",
106 107 108
		       self->start, self->end, self->name);
}

109 110
/*
 * Make @name the long name of @self and cache its length.
 *
 * The pointer is stored as is, not copied.  dso__delete() frees ->long_name
 * whenever it differs from the embedded ->name, so a @name other than
 * self->name has to be heap allocated.  A NULL @name is ignored.
 */
static void dso__set_long_name(struct dso *self, char *name)
{
	if (name == NULL)
		return;
	self->long_name = name;
	self->long_name_len = strlen(name);
}

/* Set ->short_name to basename() of the current ->long_name. */
static void dso__set_basename(struct dso *self)
{
	char *path = self->long_name;

	self->short_name = basename(path);
}

122
struct dso *dso__new(const char *name)
123 124 125 126 127
{
	struct dso *self = malloc(sizeof(*self) + strlen(name) + 1);

	if (self != NULL) {
		strcpy(self->name, name);
128
		dso__set_long_name(self, self->name);
129
		self->short_name = self->name;
130
		self->syms = RB_ROOT;
P
Peter Zijlstra 已提交
131
		self->find_symbol = dso__find_symbol;
132
		self->slen_calculated = 0;
133
		self->origin = DSO__ORIG_NOT_FOUND;
134 135
		self->loaded = 0;
		self->has_build_id = 0;
136 137 138 139 140 141 142 143 144 145 146 147 148
	}

	return self;
}

/* Unlink and free every symbol in the ->syms tree of @self. */
static void dso__delete_symbols(struct dso *self)
{
	struct symbol *pos;
	struct rb_node *next = rb_first(&self->syms);

	while (next) {
		pos = rb_entry(next, struct symbol, rb_node);
		/* Fetch the successor before the node is erased and freed. */
		next = rb_next(&pos->rb_node);
		rb_erase(&pos->rb_node, &self->syms);
		symbol__delete(pos);
	}
}

void dso__delete(struct dso *self)
{
	dso__delete_symbols(self);
157 158
	if (self->long_name != self->name)
		free(self->long_name);
159 160 161
	free(self);
}

162 163 164 165 166 167
/*
 * Copy sizeof(self->build_id) bytes from @build_id into @self and flag the
 * dso as having a build id.
 */
void dso__set_build_id(struct dso *self, void *build_id)
{
	const size_t nbytes = sizeof(self->build_id);

	self->has_build_id = 1;
	memcpy(self->build_id, build_id, nbytes);
}

168 169 170 171
static void dso__insert_symbol(struct dso *self, struct symbol *sym)
{
	struct rb_node **p = &self->syms.rb_node;
	struct rb_node *parent = NULL;
172
	const u64 ip = sym->start;
173 174 175 176 177 178 179 180 181 182 183 184 185 186
	struct symbol *s;

	while (*p != NULL) {
		parent = *p;
		s = rb_entry(parent, struct symbol, rb_node);
		if (ip < s->start)
			p = &(*p)->rb_left;
		else
			p = &(*p)->rb_right;
	}
	rb_link_node(&sym->rb_node, parent, p);
	rb_insert_color(&sym->rb_node, &self->syms);
}

187
/*
 * Look up the symbol of @self whose [start, end] range contains @ip.
 * Returns NULL when @self is NULL or no symbol covers @ip.
 */
struct symbol *dso__find_symbol(struct dso *self, u64 ip)
{
	struct rb_node *n;

	if (self == NULL)
		return NULL;

	n = self->syms.rb_node;

	while (n) {
		struct symbol *s = rb_entry(n, struct symbol, rb_node);

		if (ip < s->start)
			n = n->rb_left;
		else if (ip > s->end)
			n = n->rb_right;
		else
			return s;
	}

	return NULL;
}

210
/*
 * Format the @len bytes at @self as lowercase hex into @bf.
 *
 * @bf must have room for 2 * @len + 1 bytes.  It is always NUL terminated,
 * including when @len is zero or negative, in which case it becomes the
 * empty string.
 *
 * Returns the number of input bytes that were formatted.
 */
int build_id__sprintf(u8 *self, int len, char *bf)
{
	char *bid = bf;
	u8 *raw = self;
	int i;

	/* The loop only terminates @bf if it runs at least once. */
	*bid = '\0';

	for (i = 0; i < len; ++i) {
		sprintf(bid, "%02x", *raw);
		++raw;
		bid += 2;
	}

	return raw - self;
}

225
size_t dso__fprintf_buildid(struct dso *self, FILE *fp)
226 227 228 229
{
	char sbuild_id[BUILD_ID_SIZE * 2 + 1];

	build_id__sprintf(self->build_id, sizeof(self->build_id), sbuild_id);
230 231 232 233 234 235 236 237 238 239
	return fprintf(fp, "%s", sbuild_id);
}

size_t dso__fprintf(struct dso *self, FILE *fp)
{
	struct rb_node *nd;
	size_t ret = fprintf(fp, "dso: %s (", self->short_name);

	ret += dso__fprintf_buildid(self, fp);
	ret += fprintf(fp, ")\n");
240

241 242 243 244 245 246 247 248
	for (nd = rb_first(&self->syms); nd; nd = rb_next(nd)) {
		struct symbol *pos = rb_entry(nd, struct symbol, rb_node);
		ret += symbol__fprintf(pos, fp);
	}

	return ret;
}

249 250 251 252 253
/*
 * Loads the function entries in /proc/kallsyms into kernel_map->dso,
 * so that we can in the next step set the symbol ->end address and then
 * call kernel_maps__split_kallsyms.
 */
254
static int kernel_maps__load_all_kallsyms(void)
255 256 257 258 259 260 261 262 263
{
	char *line = NULL;
	size_t n;
	FILE *file = fopen("/proc/kallsyms", "r");

	if (file == NULL)
		goto out_failure;

	while (!feof(file)) {
264
		u64 start;
265 266 267
		struct symbol *sym;
		int line_len, len;
		char symbol_type;
268
		char *symbol_name;
269 270 271 272 273 274 275 276 277 278

		line_len = getline(&line, &n, file);
		if (line_len < 0)
			break;

		if (!line)
			goto out_failure;

		line[--line_len] = '\0'; /* \n */

279
		len = hex2u64(line, &start);
280 281 282 283 284 285 286 287 288 289 290

		len++;
		if (len + 2 >= line_len)
			continue;

		symbol_type = toupper(line[len]);
		/*
		 * We're interested only in code ('T'ext)
		 */
		if (symbol_type != 'T' && symbol_type != 'W')
			continue;
291 292

		symbol_name = line + len + 2;
293 294 295
		/*
		 * Will fix up the end later, when we have all symbols sorted.
		 */
296
		sym = symbol__new(start, 0, symbol_name);
297

298 299 300
		if (sym == NULL)
			goto out_delete_line;

301 302 303 304 305
		/*
		 * We will pass the symbols to the filter later, in
		 * kernel_maps__split_kallsyms, when we have split the
		 * maps per module
		 */
306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324
		dso__insert_symbol(kernel_map->dso, sym);
	}

	free(line);
	fclose(file);

	return 0;

out_delete_line:
	free(line);
out_failure:
	return -1;
}

/*
 * Split the symbols into maps, making sure there are no overlaps, i.e. the
 * kernel range is broken in several maps, named [kernel].N, as we don't have
 * the original ELF section names vmlinux have.
 */
325
static int kernel_maps__split_kallsyms(symbol_filter_t filter)
326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342
{
	struct map *map = kernel_map;
	struct symbol *pos;
	int count = 0;
	struct rb_node *next = rb_first(&kernel_map->dso->syms);
	int kernel_range = 0;

	while (next) {
		char *module;

		pos = rb_entry(next, struct symbol, rb_node);
		next = rb_next(&pos->rb_node);

		module = strchr(pos->name, '\t');
		if (module) {
			*module++ = '\0';

343 344 345
			if (strcmp(map->dso->name, module)) {
				map = kernel_maps__find_by_dso_name(module);
				if (!map) {
346 347
					pr_err("/proc/{kallsyms,modules} "
					       "inconsistency!\n");
348 349 350
					return -1;
				}
			}
351 352 353 354 355 356 357 358 359 360 361 362 363
			/*
			 * So that we look just like we get from .ko files,
			 * i.e. not prelinked, relative to map->start.
			 */
			pos->start = map->map_ip(map, pos->start);
			pos->end   = map->map_ip(map, pos->end);
		} else if (map != kernel_map) {
			char dso_name[PATH_MAX];
			struct dso *dso;

			snprintf(dso_name, sizeof(dso_name), "[kernel].%d",
				 kernel_range++);

364
			dso = dso__new(dso_name);
365 366 367 368 369 370 371 372
			if (dso == NULL)
				return -1;

			map = map__new2(pos->start, dso);
			if (map == NULL) {
				dso__delete(dso);
				return -1;
			}
373

374
			map->map_ip = map->unmap_ip = identity__map_ip;
375 376 377
			kernel_maps__insert(map);
			++kernel_range;
		}
378

379 380
		if (filter && filter(map, pos)) {
			rb_erase(&pos->rb_node, &kernel_map->dso->syms);
381
			symbol__delete(pos);
382 383 384 385 386
		} else {
			if (map != kernel_map) {
				rb_erase(&pos->rb_node, &kernel_map->dso->syms);
				dso__insert_symbol(map->dso, pos);
			}
387 388
			count++;
		}
389 390
	}

391
	return count;
392
}
393

394

395
/*
 * Load the kernel symbols from /proc/kallsyms: read all entries into
 * kernel_map->dso, fix up the symbol end addresses, mark the dso as
 * DSO__ORIG_KERNEL and split the symbols into per module maps.
 *
 * Returns the result of kernel_maps__split_kallsyms(), or -1 if reading
 * kallsyms failed.
 */
static int kernel_maps__load_kallsyms(symbol_filter_t filter)
{
	if (kernel_maps__load_all_kallsyms())
		return -1;

	dso__fixup_sym_end(kernel_map->dso);
	kernel_map->dso->origin = DSO__ORIG_KERNEL;

	return kernel_maps__split_kallsyms(filter);
}

406
size_t kernel_maps__fprintf(FILE *fp)
407
{
408
	size_t printed = fprintf(fp, "Kernel maps:\n");
409 410 411 412 413
	struct rb_node *nd;

	for (nd = rb_first(&kernel_maps); nd; nd = rb_next(nd)) {
		struct map *pos = rb_entry(nd, struct map, rb_node);

414
		printed += fprintf(fp, "Map:");
415
		printed += map__fprintf(pos, fp);
416
		if (verbose > 1) {
417 418 419
			printed += dso__fprintf(pos->dso, fp);
			printed += fprintf(fp, "--\n");
		}
420 421
	}

422
	return printed + fprintf(fp, "END kernel maps\n");
423 424
}

425
static int dso__load_perf_map(struct dso *self, struct map *map,
426
			      symbol_filter_t filter)
427 428 429 430 431 432
{
	char *line = NULL;
	size_t n;
	FILE *file;
	int nr_syms = 0;

433
	file = fopen(self->long_name, "r");
434 435 436 437
	if (file == NULL)
		goto out_failure;

	while (!feof(file)) {
438
		u64 start, size;
439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462
		struct symbol *sym;
		int line_len, len;

		line_len = getline(&line, &n, file);
		if (line_len < 0)
			break;

		if (!line)
			goto out_failure;

		line[--line_len] = '\0'; /* \n */

		len = hex2u64(line, &start);

		len++;
		if (len + 2 >= line_len)
			continue;

		len += hex2u64(line + len, &size);

		len++;
		if (len + 2 >= line_len)
			continue;

463
		sym = symbol__new(start, size, line + len);
464 465 466 467

		if (sym == NULL)
			goto out_delete_line;

468
		if (filter && filter(map, sym))
469
			symbol__delete(sym);
470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486
		else {
			dso__insert_symbol(self, sym);
			nr_syms++;
		}
	}

	free(line);
	fclose(file);

	return nr_syms;

out_delete_line:
	free(line);
out_failure:
	return -1;
}

487 488 489 490
/**
 * elf_symtab__for_each_symbol - iterate thru all the symbols
 *
 * @syms: Elf_Data of the symbol table to iterate
 * @nr_syms: number of entries in @syms
 * @idx: uint32_t idx
 * @sym: GElf_Sym iterator, refilled by gelf_getsym() on every step
 */
#define elf_symtab__for_each_symbol(syms, nr_syms, idx, sym) \
	for (idx = 0, gelf_getsym(syms, idx, &sym);\
	     idx < nr_syms; \
	     idx++, gelf_getsym(syms, idx, &sym))
498 499 500 501 502 503 504 505 506 507

/* Extract the symbol type bits from the st_info field of @sym. */
static inline uint8_t elf_sym__type(const GElf_Sym *sym)
{
	const uint8_t type = GELF_ST_TYPE(sym->st_info);

	return type;
}

static inline int elf_sym__is_function(const GElf_Sym *sym)
{
	return elf_sym__type(sym) == STT_FUNC &&
	       sym->st_name != 0 &&
508
	       sym->st_shndx != SHN_UNDEF;
509 510
}

511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530
/*
 * True if @sym is a named STT_NOTYPE symbol whose section index is neither
 * SHN_UNDEF nor SHN_ABS.
 */
static inline int elf_sym__is_label(const GElf_Sym *sym)
{
	if (elf_sym__type(sym) != STT_NOTYPE)
		return 0;

	if (sym->st_name == 0)
		return 0;

	return sym->st_shndx != SHN_UNDEF && sym->st_shndx != SHN_ABS;
}

/* Return the name of section @shdr, read from the string data @secstrs. */
static inline const char *elf_sec__name(const GElf_Shdr *shdr,
					const Elf_Data *secstrs)
{
	const char *strtab = secstrs->d_buf;

	return strtab + shdr->sh_name;
}

/* True if the name of section @shdr contains the substring "text". */
static inline int elf_sec__is_text(const GElf_Shdr *shdr,
					const Elf_Data *secstrs)
{
	const char *sec_name = elf_sec__name(shdr, secstrs);

	return strstr(sec_name, "text") != NULL;
}

531 532 533 534 535 536 537 538
/* Return the name of symbol @sym, read from the string data @symstrs. */
static inline const char *elf_sym__name(const GElf_Sym *sym,
					const Elf_Data *symstrs)
{
	const char *strtab = symstrs->d_buf;

	return strtab + sym->st_name;
}

/*
 * Find the section of @elf called @name.
 *
 * @ep:   ELF header of @elf, provides the section name string table index
 * @shp:  scratch section header; holds the header of the match on success
 * @idx:  if not NULL, receives the 1-based position of the match among the
 *        sections returned by elf_nextscn()
 *
 * Sections whose header or name cannot be read are skipped instead of being
 * handed to strcmp() as a NULL pointer.
 *
 * Returns the matching section, or NULL if there is none.
 */
static Elf_Scn *elf_section_by_name(Elf *elf, GElf_Ehdr *ep,
				    GElf_Shdr *shp, const char *name,
				    size_t *idx)
{
	Elf_Scn *sec = NULL;
	size_t cnt = 1;

	while ((sec = elf_nextscn(elf, sec)) != NULL) {
		const char *str = NULL;

		if (gelf_getshdr(sec, shp) != NULL)
			str = elf_strptr(elf, ep->e_shstrndx, shp->sh_name);

		if (str != NULL && !strcmp(name, str)) {
			if (idx)
				*idx = cnt;
			break;
		}
		++cnt;
	}

	return sec;
}

560 561 562 563 564 565 566 567 568 569
/*
 * Iterate over the @nr_entries REL entries in @reldata.  On every step @pos
 * is set to the result of gelf_getrel() for entry @idx, using @pos_mem as
 * its storage.
 */
#define elf_section__for_each_rel(reldata, pos, pos_mem, idx, nr_entries) \
	for (idx = 0, pos = gelf_getrel(reldata, idx, &pos_mem); \
	     idx < nr_entries; \
	     ++idx, pos = gelf_getrel(reldata, idx, &pos_mem))

/* Same as elf_section__for_each_rel, for RELA entries (gelf_getrela()). */
#define elf_section__for_each_rela(reldata, pos, pos_mem, idx, nr_entries) \
	for (idx = 0, pos = gelf_getrela(reldata, idx, &pos_mem); \
	     idx < nr_entries; \
	     ++idx, pos = gelf_getrela(reldata, idx, &pos_mem))

570 571 572 573 574 575 576
/*
 * We need to check if we have a .dynsym, so that we can handle the
 * .plt, synthesizing its symbols, that aren't on the symtabs (be it
 * .dynsym or .symtab).
 * And always look at the original dso, not at debuginfo packages, that
 * have the PLT data stripped out (shdr_rel_plt.sh_type == SHT_NOBITS).
 */
577 578
static int dso__synthesize_plt_symbols(struct  dso *self, struct map *map,
				       symbol_filter_t filter)
579 580 581
{
	uint32_t nr_rel_entries, idx;
	GElf_Sym sym;
582
	u64 plt_offset;
583 584
	GElf_Shdr shdr_plt;
	struct symbol *f;
585
	GElf_Shdr shdr_rel_plt, shdr_dynsym;
586
	Elf_Data *reldata, *syms, *symstrs;
587 588 589
	Elf_Scn *scn_plt_rel, *scn_symstrs, *scn_dynsym;
	size_t dynsym_idx;
	GElf_Ehdr ehdr;
590
	char sympltname[1024];
591 592 593
	Elf *elf;
	int nr = 0, symidx, fd, err = 0;

594
	fd = open(self->long_name, O_RDONLY);
595 596 597
	if (fd < 0)
		goto out;

598
	elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
599 600 601 602 603 604 605 606 607 608
	if (elf == NULL)
		goto out_close;

	if (gelf_getehdr(elf, &ehdr) == NULL)
		goto out_elf_end;

	scn_dynsym = elf_section_by_name(elf, &ehdr, &shdr_dynsym,
					 ".dynsym", &dynsym_idx);
	if (scn_dynsym == NULL)
		goto out_elf_end;
609

610
	scn_plt_rel = elf_section_by_name(elf, &ehdr, &shdr_rel_plt,
611 612
					  ".rela.plt", NULL);
	if (scn_plt_rel == NULL) {
613
		scn_plt_rel = elf_section_by_name(elf, &ehdr, &shdr_rel_plt,
614 615
						  ".rel.plt", NULL);
		if (scn_plt_rel == NULL)
616
			goto out_elf_end;
617 618
	}

619 620
	err = -1;

621
	if (shdr_rel_plt.sh_link != dynsym_idx)
622
		goto out_elf_end;
623

624 625
	if (elf_section_by_name(elf, &ehdr, &shdr_plt, ".plt", NULL) == NULL)
		goto out_elf_end;
626 627

	/*
628
	 * Fetch the relocation section to find the idxes to the GOT
629 630 631 632
	 * and the symbols in the .dynsym they refer to.
	 */
	reldata = elf_getdata(scn_plt_rel, NULL);
	if (reldata == NULL)
633
		goto out_elf_end;
634 635 636

	syms = elf_getdata(scn_dynsym, NULL);
	if (syms == NULL)
637
		goto out_elf_end;
638

639
	scn_symstrs = elf_getscn(elf, shdr_dynsym.sh_link);
640
	if (scn_symstrs == NULL)
641
		goto out_elf_end;
642 643 644

	symstrs = elf_getdata(scn_symstrs, NULL);
	if (symstrs == NULL)
645
		goto out_elf_end;
646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661

	nr_rel_entries = shdr_rel_plt.sh_size / shdr_rel_plt.sh_entsize;
	plt_offset = shdr_plt.sh_offset;

	if (shdr_rel_plt.sh_type == SHT_RELA) {
		GElf_Rela pos_mem, *pos;

		elf_section__for_each_rela(reldata, pos, pos_mem, idx,
					   nr_rel_entries) {
			symidx = GELF_R_SYM(pos->r_info);
			plt_offset += shdr_plt.sh_entsize;
			gelf_getsym(syms, symidx, &sym);
			snprintf(sympltname, sizeof(sympltname),
				 "%s@plt", elf_sym__name(&sym, symstrs));

			f = symbol__new(plt_offset, shdr_plt.sh_entsize,
662
					sympltname);
663
			if (!f)
664
				goto out_elf_end;
665

666 667 668 669 670 671
			if (filter && filter(map, f))
				symbol__delete(f);
			else {
				dso__insert_symbol(self, f);
				++nr;
			}
672 673 674 675 676 677 678 679 680 681 682 683
		}
	} else if (shdr_rel_plt.sh_type == SHT_REL) {
		GElf_Rel pos_mem, *pos;
		elf_section__for_each_rel(reldata, pos, pos_mem, idx,
					  nr_rel_entries) {
			symidx = GELF_R_SYM(pos->r_info);
			plt_offset += shdr_plt.sh_entsize;
			gelf_getsym(syms, symidx, &sym);
			snprintf(sympltname, sizeof(sympltname),
				 "%s@plt", elf_sym__name(&sym, symstrs));

			f = symbol__new(plt_offset, shdr_plt.sh_entsize,
684
					sympltname);
685
			if (!f)
686
				goto out_elf_end;
687

688 689 690 691 692 693
			if (filter && filter(map, f))
				symbol__delete(f);
			else {
				dso__insert_symbol(self, f);
				++nr;
			}
694 695 696
		}
	}

697 698 699 700 701 702 703 704 705
	err = 0;
out_elf_end:
	elf_end(elf);
out_close:
	close(fd);

	if (err == 0)
		return nr;
out:
706 707
	pr_warning("%s: problems reading %s PLT info.\n",
		   __func__, self->long_name);
708
	return 0;
709 710
}

711 712
/*
 * Load the function and text label symbols of the ELF file open on @fd.
 *
 * @self:    dso the symbols belong to
 * @map:     map associated with @self
 * @name:    file name, used in error messages only
 * @fd:      open descriptor of the ELF file; it is NOT closed here
 * @filter:  optional callback, symbols for which it returns non-zero are
 *           discarded
 * @kernel:  non-zero when loading the kernel image
 * @kmodule: non-zero when loading a kernel module
 *
 * .symtab is used if present, .dynsym otherwise.  For @kernel / @kmodule,
 * symbols living in a section other than ".text" are put in a separate
 * dso/map named "<short_name><section>", created on first use.  For other
 * objects the symbol value is adjusted when ->adjust_symbols is set, and the
 * name is demangled if possible.
 *
 * Returns the number of symbols added, or -1 on error.
 */
static int dso__load_sym(struct dso *self, struct map *map, const char *name,
			 int fd, symbol_filter_t filter, int kernel,
			 int kmodule)
{
	struct map *curr_map = map;
	struct dso *curr_dso = self;
	size_t dso_name_len = strlen(self->short_name);
	Elf_Data *symstrs, *secstrs;
	uint32_t nr_syms;
	int err = -1;
	uint32_t idx;
	GElf_Ehdr ehdr;
	GElf_Shdr shdr;
	Elf_Data *syms;
	GElf_Sym sym;
	Elf_Scn *sec, *sec_strndx;
	Elf *elf;
	int nr = 0;

	elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
	if (elf == NULL) {
		pr_err("%s: cannot read %s ELF file.\n", __func__, name);
		goto out_close;
	}

	if (gelf_getehdr(elf, &ehdr) == NULL) {
		pr_err("%s: cannot get elf header.\n", __func__);
		goto out_elf_end;
	}

	sec = elf_section_by_name(elf, &ehdr, &shdr, ".symtab", NULL);
	if (sec == NULL) {
		sec = elf_section_by_name(elf, &ehdr, &shdr, ".dynsym", NULL);
		if (sec == NULL)
			goto out_elf_end;
	}

	syms = elf_getdata(sec, NULL);
	if (syms == NULL)
		goto out_elf_end;

	/* String table holding the symbol names. */
	sec = elf_getscn(elf, shdr.sh_link);
	if (sec == NULL)
		goto out_elf_end;

	symstrs = elf_getdata(sec, NULL);
	if (symstrs == NULL)
		goto out_elf_end;

	/* String table holding the section names. */
	sec_strndx = elf_getscn(elf, ehdr.e_shstrndx);
	if (sec_strndx == NULL)
		goto out_elf_end;

	secstrs = elf_getdata(sec_strndx, NULL);
	if (secstrs == NULL)
		goto out_elf_end;

	/* A zero entry size would make the division below trap. */
	if (shdr.sh_entsize == 0)
		goto out_elf_end;

	nr_syms = shdr.sh_size / shdr.sh_entsize;

	memset(&sym, 0, sizeof(sym));
	if (!kernel) {
		self->adjust_symbols = (ehdr.e_type == ET_EXEC ||
				elf_section_by_name(elf, &ehdr, &shdr,
						     ".gnu.prelink_undo",
						     NULL) != NULL);
	} else
		self->adjust_symbols = 0;

	elf_symtab__for_each_symbol(syms, nr_syms, idx, sym) {
		struct symbol *f;
		const char *elf_name;
		char *demangled = NULL;
		int is_label = elf_sym__is_label(&sym);
		const char *section_name;

		if (!is_label && !elf_sym__is_function(&sym))
			continue;

		sec = elf_getscn(elf, sym.st_shndx);
		if (!sec)
			goto out_elf_end;

		gelf_getshdr(sec, &shdr);

		/* Labels are only of interest inside text sections. */
		if (is_label && !elf_sec__is_text(&shdr, secstrs))
			continue;

		elf_name = elf_sym__name(&sym, symstrs);
		section_name = elf_sec__name(&shdr, secstrs);

		if (kernel || kmodule) {
			char dso_name[PATH_MAX];

			/*
			 * Same section as the previous symbol: the current
			 * dso name is "<short_name><section>", so compare
			 * against the part after the short name.
			 */
			if (strcmp(section_name,
				   curr_dso->short_name + dso_name_len) == 0)
				goto new_symbol;

			if (strcmp(section_name, ".text") == 0) {
				curr_map = map;
				curr_dso = self;
				goto new_symbol;
			}

			snprintf(dso_name, sizeof(dso_name),
				 "%s%s", self->short_name, section_name);

			curr_map = kernel_maps__find_by_dso_name(dso_name);
			if (curr_map == NULL) {
				u64 start = sym.st_value;

				if (kmodule)
					start += map->start + shdr.sh_offset;

				curr_dso = dso__new(dso_name);
				if (curr_dso == NULL)
					goto out_elf_end;
				curr_map = map__new2(start, curr_dso);
				if (curr_map == NULL) {
					dso__delete(curr_dso);
					goto out_elf_end;
				}
				curr_map->map_ip = identity__map_ip;
				curr_map->unmap_ip = identity__map_ip;
				curr_dso->origin = DSO__ORIG_KERNEL;
				kernel_maps__insert(curr_map);
				dsos__add(curr_dso);
			} else
				curr_dso = curr_map->dso;

			goto new_symbol;
		}

		if (curr_dso->adjust_symbols) {
			pr_debug2("adjusting symbol: st_value: %Lx sh_addr: "
				  "%Lx sh_offset: %Lx\n", (u64)sym.st_value,
				  (u64)shdr.sh_addr, (u64)shdr.sh_offset);
			sym.st_value -= shdr.sh_addr - shdr.sh_offset;
		}
		/*
		 * We need to figure out if the object was created from C++ sources
		 * DWARF DW_compile_unit has this, but we don't always have access
		 * to it...
		 */
		demangled = bfd_demangle(NULL, elf_name, DMGL_PARAMS | DMGL_ANSI);
		if (demangled != NULL)
			elf_name = demangled;
new_symbol:
		f = symbol__new(sym.st_value, sym.st_size, elf_name);
		/* symbol__new() copied the name; NULL on the kernel path. */
		free(demangled);
		if (!f)
			goto out_elf_end;

		if (filter && filter(curr_map, f))
			symbol__delete(f);
		else {
			dso__insert_symbol(curr_dso, f);
			nr++;
		}
	}

	/*
	 * For misannotated, zeroed, ASM function sizes.
	 */
	if (nr > 0)
		dso__fixup_sym_end(self);
	err = nr;
out_elf_end:
	elf_end(elf);
out_close:
	return err;
}

882 883 884 885 886
/*
 * True if the first sizeof(self->build_id) bytes at @build_id match the
 * build id stored in @self.
 */
static bool dso__build_id_equal(const struct dso *self, u8 *build_id)
{
	const size_t nbytes = sizeof(self->build_id);

	return !memcmp(self->build_id, build_id, nbytes);
}

887
bool dsos__read_build_ids(void)
888
{
889
	bool have_build_id = false;
890 891
	struct dso *pos;

892 893 894 895 896 897
	list_for_each_entry(pos, &dsos, node)
		if (filename__read_build_id(pos->long_name, pos->build_id,
					    sizeof(pos->build_id)) > 0) {
			have_build_id	  = true;
			pos->has_build_id = true;
		}
898

899
	return have_build_id;
900 901
}

902 903 904 905 906
/*
 * Round an offset up to the next multiple of 4, the alignment used for the
 * name and descriptor data of a note.
 */
#define NOTE_ALIGN(n) (((n) + 3) & ~3U)

907
int filename__read_build_id(const char *filename, void *bf, size_t size)
908
{
909
	int fd, err = -1;
910 911
	GElf_Ehdr ehdr;
	GElf_Shdr shdr;
912
	Elf_Data *data;
913
	Elf_Scn *sec;
914
	void *ptr;
915 916
	Elf *elf;

917 918 919 920
	if (size < BUILD_ID_SIZE)
		goto out;

	fd = open(filename, O_RDONLY);
921 922 923
	if (fd < 0)
		goto out;

924
	elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
925
	if (elf == NULL) {
926
		pr_debug2("%s: cannot read %s ELF file.\n", __func__, filename);
927 928 929 930
		goto out_close;
	}

	if (gelf_getehdr(elf, &ehdr) == NULL) {
931
		pr_err("%s: cannot get elf header.\n", __func__);
932 933 934
		goto out_elf_end;
	}

935 936
	sec = elf_section_by_name(elf, &ehdr, &shdr,
				  ".note.gnu.build-id", NULL);
937 938 939 940 941 942
	if (sec == NULL) {
		sec = elf_section_by_name(elf, &ehdr, &shdr,
					  ".notes", NULL);
		if (sec == NULL)
			goto out_elf_end;
	}
943

944 945
	data = elf_getdata(sec, NULL);
	if (data == NULL)
946
		goto out_elf_end;
947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965 966 967

	ptr = data->d_buf;
	while (ptr < (data->d_buf + data->d_size)) {
		GElf_Nhdr *nhdr = ptr;
		int namesz = NOTE_ALIGN(nhdr->n_namesz),
		    descsz = NOTE_ALIGN(nhdr->n_descsz);
		const char *name;

		ptr += sizeof(*nhdr);
		name = ptr;
		ptr += namesz;
		if (nhdr->n_type == NT_GNU_BUILD_ID &&
		    nhdr->n_namesz == sizeof("GNU")) {
			if (memcmp(name, "GNU", sizeof("GNU")) == 0) {
				memcpy(bf, ptr, BUILD_ID_SIZE);
				err = BUILD_ID_SIZE;
				break;
			}
		}
		ptr += descsz;
	}
968 969 970 971 972 973 974 975
out_elf_end:
	elf_end(elf);
out_close:
	close(fd);
out:
	return err;
}

976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993 994
int sysfs__read_build_id(const char *filename, void *build_id, size_t size)
{
	int fd, err = -1;

	if (size < BUILD_ID_SIZE)
		goto out;

	fd = open(filename, O_RDONLY);
	if (fd < 0)
		goto out;

	while (1) {
		char bf[BUFSIZ];
		GElf_Nhdr nhdr;
		int namesz, descsz;

		if (read(fd, &nhdr, sizeof(nhdr)) != sizeof(nhdr))
			break;

995 996
		namesz = NOTE_ALIGN(nhdr.n_namesz);
		descsz = NOTE_ALIGN(nhdr.n_descsz);
997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019
		if (nhdr.n_type == NT_GNU_BUILD_ID &&
		    nhdr.n_namesz == sizeof("GNU")) {
			if (read(fd, bf, namesz) != namesz)
				break;
			if (memcmp(bf, "GNU", sizeof("GNU")) == 0) {
				if (read(fd, build_id,
				    BUILD_ID_SIZE) == BUILD_ID_SIZE) {
					err = 0;
					break;
				}
			} else if (read(fd, bf, descsz) != descsz)
				break;
		} else {
			int n = namesz + descsz;
			if (read(fd, bf, n) != n)
				break;
		}
	}
	close(fd);
out:
	return err;
}

1020 1021 1022 1023 1024 1025 1026 1027 1028
/*
 * Return the one character tag for the place the symbols of @self came
 * from, or '!' when @self is NULL or its origin is DSO__ORIG_NOT_FOUND.
 */
char dso__symtab_origin(const struct dso *self)
{
	static const char origin[] = {
		[DSO__ORIG_KERNEL] =   'k',
		[DSO__ORIG_JAVA_JIT] = 'j',
		[DSO__ORIG_FEDORA] =   'f',
		[DSO__ORIG_UBUNTU] =   'u',
		[DSO__ORIG_BUILDID] =  'b',
		[DSO__ORIG_DSO] =      'd',
		[DSO__ORIG_KMODULE] =  'K',
	};

	if (self == NULL || self->origin == DSO__ORIG_NOT_FOUND)
		return '!';
	return origin[self->origin];
}

1037
/*
 * Load the symbols of @self.
 *
 * Kernel dsos are handed to dso__load_kernel_sym() and dsos whose name
 * starts with "/tmp/perf-" to dso__load_perf_map().  For everything else
 * the candidate files are tried in enum dso_origin order:
 *
 *   /usr/lib/debug<long_name>.debug
 *   /usr/lib/debug<long_name>
 *   /usr/lib/debug/.build-id/xx/yyyy.debug   (only if the dso has a build id)
 *   <long_name>
 *
 * When @self already carries a build id, a candidate is only used if its
 * build id matches.  A candidate that opens but yields no symbols is skipped
 * and the next one is tried.  PLT symbols are synthesized on success.
 *
 * Returns the number of symbols loaded, or -1 on failure.  A failure for a
 * dso whose name contains " (deleted)" is reported as 0 instead.
 */
int dso__load(struct dso *self, struct map *map, symbol_filter_t filter)
{
	int size = PATH_MAX;
	char *name;
	u8 build_id[BUILD_ID_SIZE];
	int ret = -1;
	int fd;

	self->loaded = 1;

	if (self->kernel)
		return dso__load_kernel_sym(self, map, filter);

	self->adjust_symbols = 0;

	/* Handled before @name is allocated, this path never needs it. */
	if (strncmp(self->name, "/tmp/perf-", 10) == 0) {
		ret = dso__load_perf_map(self, map, filter);
		self->origin = ret > 0 ? DSO__ORIG_JAVA_JIT :
					 DSO__ORIG_NOT_FOUND;
		return ret;
	}

	name = malloc(size);
	if (!name)
		return -1;

	/* The loop increments ->origin before using it. */
	self->origin = DSO__ORIG_FEDORA - 1;

more:
	do {
		self->origin++;
		switch (self->origin) {
		case DSO__ORIG_FEDORA:
			snprintf(name, size, "/usr/lib/debug%s.debug",
				 self->long_name);
			break;
		case DSO__ORIG_UBUNTU:
			snprintf(name, size, "/usr/lib/debug%s",
				 self->long_name);
			break;
		case DSO__ORIG_BUILDID:
			/*
			 * filename__read_build_id() returns -1 on failure,
			 * so the result must be compared against 0; build_id
			 * is only valid for a positive return.
			 */
			if (filename__read_build_id(self->long_name, build_id,
						    sizeof(build_id)) > 0) {
				char build_id_hex[BUILD_ID_SIZE * 2 + 1];

				build_id__sprintf(build_id, sizeof(build_id),
						  build_id_hex);
				snprintf(name, size,
					 "/usr/lib/debug/.build-id/%.2s/%s.debug",
					build_id_hex, build_id_hex + 2);
				/* build_id is already read, just compare. */
				if (self->has_build_id)
					goto compare_build_id;
				break;
			}
			self->origin++;
			/* Fall thru */
		case DSO__ORIG_DSO:
			snprintf(name, size, "%s", self->long_name);
			break;

		default:
			goto out;
		}

		if (self->has_build_id) {
			if (filename__read_build_id(name, build_id,
						    sizeof(build_id)) < 0)
				goto more;
compare_build_id:
			if (!dso__build_id_equal(self, build_id))
				goto more;
		}

		fd = open(name, O_RDONLY);
	} while (fd < 0);

	ret = dso__load_sym(self, map, name, fd, filter, 0, 0);
	close(fd);

	/*
	 * Some people seem to have debuginfo files _WITHOUT_ debug info!?!?
	 */
	if (!ret)
		goto more;

	if (ret > 0) {
		int nr_plt = dso__synthesize_plt_symbols(self, map, filter);
		if (nr_plt > 0)
			ret += nr_plt;
	}
out:
	free(name);
	if (ret < 0 && strstr(self->name, " (deleted)") != NULL)
		return 0;
	return ret;
}

1134 1135 1136
struct map *kernel_map;

static void kernel_maps__insert(struct map *map)
1137
{
1138 1139
	maps__insert(&kernel_maps, map);
}
1140

1141 1142
/*
 * Resolve @ip to a symbol using the kernel maps.
 *
 * The map found for @ip (NULL if there is none) is stored in *@mapp when
 * @mapp is not NULL.  @ip is translated with the map's ->map_ip() before the
 * symbol lookup; @filter is passed through to map__find_symbol().
 *
 * Returns the symbol, or NULL if no map covers @ip or the lookup fails.
 */
struct symbol *kernel_maps__find_symbol(u64 ip, struct map **mapp,
					symbol_filter_t filter)
{
	struct map *map = maps__find(&kernel_maps, ip);

	if (mapp)
		*mapp = map;

	if (map) {
		ip = map->map_ip(map, ip);
		return map__find_symbol(map, ip, filter);
	}

	return NULL;
}

/*
 * Scan kernel_maps in tree order and return the first map whose dso is
 * called exactly @name, or NULL if there is no such map.
 */
struct map *kernel_maps__find_by_dso_name(const char *name)
{
	struct rb_node *node = rb_first(&kernel_maps);

	while (node != NULL) {
		struct map *candidate = rb_entry(node, struct map, rb_node);

		if (candidate->dso != NULL &&
		    !strcmp(candidate->dso->name, name))
			return candidate;

		node = rb_next(node);
	}

	return NULL;
}

1171
static int dsos__set_modules_path_dir(char *dirname)
1172
{
1173 1174
	struct dirent *dent;
	DIR *dir = opendir(dirname);
1175

1176
	if (!dir) {
1177
		pr_err("%s: cannot open %s dir\n", __func__, dirname);
1178 1179
		return -1;
	}
1180

1181 1182 1183 1184 1185 1186 1187 1188 1189 1190
	while ((dent = readdir(dir)) != NULL) {
		char path[PATH_MAX];

		if (dent->d_type == DT_DIR) {
			if (!strcmp(dent->d_name, ".") ||
			    !strcmp(dent->d_name, ".."))
				continue;

			snprintf(path, sizeof(path), "%s/%s",
				 dirname, dent->d_name);
1191
			if (dsos__set_modules_path_dir(path) < 0)
1192 1193 1194 1195 1196
				goto failure;
		} else {
			char *dot = strrchr(dent->d_name, '.'),
			     dso_name[PATH_MAX];
			struct map *map;
1197
			char *long_name;
1198 1199 1200 1201 1202 1203

			if (dot == NULL || strcmp(dot, ".ko"))
				continue;
			snprintf(dso_name, sizeof(dso_name), "[%.*s]",
				 (int)(dot - dent->d_name), dent->d_name);

1204
			strxfrchar(dso_name, '-', '_');
1205 1206 1207 1208 1209 1210 1211
			map = kernel_maps__find_by_dso_name(dso_name);
			if (map == NULL)
				continue;

			snprintf(path, sizeof(path), "%s/%s",
				 dirname, dent->d_name);

1212 1213
			long_name = strdup(path);
			if (long_name == NULL)
1214
				goto failure;
1215
			dso__set_long_name(map->dso, long_name);
1216 1217
		}
	}
1218

1219
	return 0;
1220 1221 1222 1223
failure:
	closedir(dir);
	return -1;
}
1224

1225
static int dsos__set_modules_path(void)
1226 1227 1228
{
	struct utsname uts;
	char modules_path[PATH_MAX];
1229

1230 1231
	if (uname(&uts) < 0)
		return -1;
1232

1233 1234
	snprintf(modules_path, sizeof(modules_path), "/lib/modules/%s/kernel",
		 uts.release);
1235

1236
	return dsos__set_modules_path_dir(modules_path);
1237 1238
}

1239 1240 1241 1242 1243 1244
/*
 * Constructor variant for modules (where we know from /proc/modules where
 * they are loaded) and for vmlinux, where only after we load all the
 * symbols we'll know where it starts and ends.
 */
static struct map *map__new2(u64 start, struct dso *dso)
{
	struct map *map = malloc(sizeof(*map));

	if (map == NULL)
		return NULL;

	/*
	 * ->end will be filled after we load all the symbols
	 */
	map__init(map, start, 0, 0, dso);

	return map;
}

1258
static int kernel_maps__create_module_maps(void)
1259 1260 1261 1262 1263
{
	char *line = NULL;
	size_t n;
	FILE *file = fopen("/proc/modules", "r");
	struct map *map;
1264

1265 1266
	if (file == NULL)
		return -1;
1267

1268 1269 1270 1271 1272 1273
	while (!feof(file)) {
		char name[PATH_MAX];
		u64 start;
		struct dso *dso;
		char *sep;
		int line_len;
1274

1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295 1296
		line_len = getline(&line, &n, file);
		if (line_len < 0)
			break;

		if (!line)
			goto out_failure;

		line[--line_len] = '\0'; /* \n */

		sep = strrchr(line, 'x');
		if (sep == NULL)
			continue;

		hex2u64(sep + 1, &start);

		sep = strchr(line, ' ');
		if (sep == NULL)
			continue;

		*sep = '\0';

		snprintf(name, sizeof(name), "[%s]", line);
1297
		dso = dso__new(name);
1298 1299 1300 1301 1302 1303 1304 1305

		if (dso == NULL)
			goto out_delete_line;

		map = map__new2(start, dso);
		if (map == NULL) {
			dso__delete(dso);
			goto out_delete_line;
1306
		}
1307

1308 1309 1310 1311 1312 1313
		snprintf(name, sizeof(name),
			 "/sys/module/%s/notes/.note.gnu.build-id", line);
		if (sysfs__read_build_id(name, dso->build_id,
					 sizeof(dso->build_id)) == 0)
			dso->has_build_id = true;

1314 1315 1316
		dso->origin = DSO__ORIG_KMODULE;
		kernel_maps__insert(map);
		dsos__add(dso);
1317
	}
1318 1319 1320 1321

	free(line);
	fclose(file);

1322 1323 1324 1325 1326 1327 1328
	/*
	 * Now that we have all sorted out, just set the ->end of all
	 * maps:
	 */
	kernel_maps__fixup_end();

	return dsos__set_modules_path();
1329 1330 1331 1332 1333

out_delete_line:
	free(line);
out_failure:
	return -1;
1334 1335
}

1336
/*
 * Load symbols for @self from the file named @vmlinux.
 *
 * When @self already has a build-id, the file's build-id is read first and
 * the file is rejected (return -1) if it has none or if it differs.  The
 * file is then opened read-only, @self is marked as loaded and the result of
 * dso__load_sym() is returned.  Returns -1 if the file cannot be opened.
 */
static int dso__load_vmlinux(struct dso *self, struct map *map,
			     const char *vmlinux, symbol_filter_t filter)
{
	int fd, ret;

	if (self->has_build_id) {
		u8 build_id[BUILD_ID_SIZE];

		if (filename__read_build_id(vmlinux, build_id,
					    sizeof(build_id)) < 0) {
			pr_debug("No build_id in %s, ignoring it\n", vmlinux);
			return -1;
		}

		if (!dso__build_id_equal(self, build_id)) {
			char expected_build_id[BUILD_ID_SIZE * 2 + 1];
			char vmlinux_build_id[BUILD_ID_SIZE * 2 + 1];

			build_id__sprintf(self->build_id,
					  sizeof(self->build_id),
					  expected_build_id);
			build_id__sprintf(build_id, sizeof(build_id),
					  vmlinux_build_id);
			pr_debug("build_id in %s is %s while expected is %s, "
				 "ignoring it\n", vmlinux, vmlinux_build_id,
				 expected_build_id);
			return -1;
		}
	}

	fd = open(vmlinux, O_RDONLY);
	if (fd < 0)
		return -1;

	self->loaded = 1;
	ret = dso__load_sym(self, map, self->long_name, fd, filter, 1, 0);

	close(fd);

	return ret;
}

1377 1378
/*
 * Load kernel symbols for @self: try the vmlinux file named self->name
 * first and, if that yields nothing (<= 0), fall back to
 * kernel_maps__load_kallsyms().  When the fallback succeeds the dso's long
 * name becomes "[kernel.kallsyms]".  On any success (> 0) the start and end
 * of @map are fixed up.  Returns the value of whichever loader ran last.
 */
static int dso__load_kernel_sym(struct dso *self, struct map *map,
				symbol_filter_t filter)
{
	int ret = dso__load_vmlinux(self, map, self->name, filter);

	if (ret <= 0) {
		ret = kernel_maps__load_kallsyms(filter);
		if (ret <= 0)
			return ret;

		/* NOTE(review): strdup() result is passed on unchecked */
		dso__set_long_name(self, strdup("[kernel.kallsyms]"));
	}

	map__fixup_start(map);
	map__fixup_end(map);

	return ret;
}

1396 1397 1398
LIST_HEAD(dsos);
struct dso	*vdso;

1399
/* Name passed to dso__new() for the kernel dso in kernel_maps__create_kernel_map(). */
const char	*vmlinux_name = "vmlinux";
1400 1401 1402 1403 1404 1405 1406 1407 1408 1409 1410 1411 1412 1413 1414 1415

/* Append @dso at the tail of the dsos list. */
static void dsos__add(struct dso *dso)
{
	struct list_head *entry = &dso->node;

	list_add_tail(entry, &dsos);
}

static struct dso *dsos__find(const char *name)
{
	struct dso *pos;

	list_for_each_entry(pos, &dsos, node)
		if (strcmp(pos->name, name) == 0)
			return pos;
	return NULL;
}

1416
/*
 * Look @name up in the dsos list; if it is not there, create a new dso with
 * that name, add it to the list and set its basename.  Returns the found or
 * newly created dso, or NULL if dso__new() fails.
 */
struct dso *dsos__findnew(const char *name)
{
	struct dso *dso = dsos__find(name);

	if (dso != NULL)
		return dso;

	dso = dso__new(name);
	if (dso == NULL)
		return NULL;

	dsos__add(dso);
	dso__set_basename(dso);

	return dso;
}

void dsos__fprintf(FILE *fp)
{
	struct dso *pos;

	list_for_each_entry(pos, &dsos, node)
		dso__fprintf(pos, fp);
}

1439 1440 1441 1442 1443 1444 1445
/*
 * For every entry of the dsos list, print its build-id through
 * dso__fprintf_buildid() followed by " <long_name>\n".  Returns the sum of
 * the values returned by the individual print calls.
 */
size_t dsos__fprintf_buildid(FILE *fp)
{
	size_t printed = 0;
	struct dso *iter;

	list_for_each_entry(iter, &dsos, node) {
		printed += dso__fprintf_buildid(iter, fp);
		printed += fprintf(fp, " %s\n", iter->long_name);
	}

	return printed;
}

1451
static int kernel_maps__create_kernel_map(void)
1452
{
1453
	struct dso *kernel = dso__new(vmlinux_name);
1454

1455
	if (kernel == NULL)
1456 1457 1458 1459 1460 1461 1462
		return -1;

	kernel_map = map__new2(0, kernel);
	if (kernel_map == NULL)
		goto out_delete_kernel_dso;

	kernel_map->map_ip = kernel_map->unmap_ip = identity__map_ip;
1463 1464

	kernel->short_name = "[kernel]";
1465
	kernel->kernel = 1;
1466
	vdso = dso__new("[vdso]");
1467 1468
	if (vdso == NULL)
		goto out_delete_kernel_map;
1469 1470 1471 1472

	if (sysfs__read_build_id("/sys/kernel/notes", kernel->build_id,
				 sizeof(kernel->build_id)) == 0)
		kernel->has_build_id = true;
1473

1474
	kernel_maps__insert(kernel_map);
1475
	dsos__add(kernel);
1476 1477
	dsos__add(vdso);

1478 1479 1480 1481 1482 1483 1484 1485
	return 0;

out_delete_kernel_map:
	map__delete(kernel_map);
	kernel_map = NULL;
out_delete_kernel_dso:
	dso__delete(kernel);
	return -1;
1486 1487
}

1488
/*
 * Set up the kernel map and, when @use_modules is true, the module maps.
 * Failing to create the kernel map is fatal (-1); failing to create the
 * module maps only produces a warning and 0 is still returned.
 */
int kernel_maps__init(bool use_modules)
{
	if (kernel_maps__create_kernel_map() < 0)
		return -1;

	if (!use_modules)
		return 0;

	if (kernel_maps__create_module_maps() < 0)
		pr_warning("Failed to load list of modules in use, "
			   "continuing...\n");

	return 0;
}

1500
void symbol__init(unsigned int priv_size)
1501 1502
{
	elf_version(EV_CURRENT);
1503
	symbol__priv_size = priv_size;
1504
}