elf.c 24.7 KB
Newer Older
1
// SPDX-License-Identifier: GPL-2.0-or-later
2 3 4 5 6 7 8 9 10 11
/*
 * elf.c - ELF access library
 *
 * Adapted from kpatch (https://github.com/dynup/kpatch):
 * Copyright (C) 2013-2015 Josh Poimboeuf <jpoimboe@redhat.com>
 * Copyright (C) 2014 Seth Jennings <sjenning@redhat.com>
 */

#include <sys/types.h>
#include <sys/stat.h>
12
#include <sys/mman.h>
13 14 15 16 17
#include <fcntl.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
18
#include <errno.h>
19
#include <objtool/builtin.h>
20

21 22
#include <objtool/elf.h>
#include <objtool/warn.h>
23

24 25
#define MAX_NAME_LEN 128

26 27 28 29 30
static inline u32 str_hash(const char *str)
{
	return jhash(str, strlen(str), 0);
}

31 32
#define __elf_table(name)	(elf->name##_hash)
#define __elf_bits(name)	(elf->name##_bits)
33

34 35
#define elf_hash_add(name, node, key) \
	hlist_add_head(node, &__elf_table(name)[hash_min(key, __elf_bits(name))])
36

37 38
#define elf_hash_for_each_possible(name, obj, member, key) \
	hlist_for_each_entry(obj, &__elf_table(name)[hash_min(key, __elf_bits(name))], member)
39

40 41 42 43 44 45 46 47 48 49 50 51
#define elf_alloc_hash(name, size) \
({ \
	__elf_bits(name) = max(10, ilog2(size)); \
	__elf_table(name) = mmap(NULL, sizeof(struct hlist_head) << __elf_bits(name), \
				 PROT_READ|PROT_WRITE, \
				 MAP_PRIVATE|MAP_ANON, -1, 0); \
	if (__elf_table(name) == (void *)-1L) { \
		WARN("mmap fail " #name); \
		__elf_table(name) = NULL; \
	} \
	__elf_table(name); \
})
52

53
static bool symbol_to_offset(struct rb_node *a, const struct rb_node *b)
54 55 56 57 58
{
	struct symbol *sa = rb_entry(a, struct symbol, node);
	struct symbol *sb = rb_entry(b, struct symbol, node);

	if (sa->offset < sb->offset)
59
		return true;
60
	if (sa->offset > sb->offset)
61
		return false;
62 63

	if (sa->len < sb->len)
64
		return true;
65
	if (sa->len > sb->len)
66
		return false;
67 68 69

	sa->alias = sb;

70
	return false;
71 72 73 74 75 76 77 78 79
}

static int symbol_by_offset(const void *key, const struct rb_node *node)
{
	const struct symbol *s = rb_entry(node, struct symbol, node);
	const unsigned long *o = key;

	if (*o < s->offset)
		return -1;
80
	if (*o >= s->offset + s->len)
81 82 83 84 85
		return 1;

	return 0;
}

86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110
struct symbol_hole {
	unsigned long key;
	const struct symbol *sym;
};

/*
 * Find !section symbol where @offset is after it.
 */
static int symbol_hole_by_offset(const void *key, const struct rb_node *node)
{
	const struct symbol *s = rb_entry(node, struct symbol, node);
	struct symbol_hole *sh = (void *)key;

	if (sh->key < s->offset)
		return -1;

	if (sh->key >= s->offset + s->len) {
		if (s->type != STT_SECTION)
			sh->sym = s;
		return 1;
	}

	return 0;
}

111
struct section *find_section_by_name(const struct elf *elf, const char *name)
112 113 114
{
	struct section *sec;

115
	elf_hash_for_each_possible(section_name, sec, name_hash, str_hash(name)) {
116 117
		if (!strcmp(sec->name, name))
			return sec;
118
	}
119 120 121 122 123 124 125 126 127

	return NULL;
}

static struct section *find_section_by_index(struct elf *elf,
					     unsigned int idx)
{
	struct section *sec;

128
	elf_hash_for_each_possible(section, sec, hash, idx) {
129 130
		if (sec->idx == idx)
			return sec;
131
	}
132 133 134 135 136 137 138 139

	return NULL;
}

static struct symbol *find_symbol_by_index(struct elf *elf, unsigned int idx)
{
	struct symbol *sym;

140
	elf_hash_for_each_possible(symbol, sym, hash, idx) {
141 142
		if (sym->idx == idx)
			return sym;
143
	}
144 145 146 147 148 149

	return NULL;
}

struct symbol *find_symbol_by_offset(struct section *sec, unsigned long offset)
{
150
	struct rb_node *node;
151

152
	rb_for_each(node, &offset, &sec->symbol_tree, symbol_by_offset) {
153 154 155 156 157
		struct symbol *s = rb_entry(node, struct symbol, node);

		if (s->offset == offset && s->type != STT_SECTION)
			return s;
	}
158 159 160 161 162 163

	return NULL;
}

struct symbol *find_func_by_offset(struct section *sec, unsigned long offset)
{
164
	struct rb_node *node;
165

166
	rb_for_each(node, &offset, &sec->symbol_tree, symbol_by_offset) {
167 168 169 170 171
		struct symbol *s = rb_entry(node, struct symbol, node);

		if (s->offset == offset && s->type == STT_FUNC)
			return s;
	}
172 173 174 175

	return NULL;
}

176
struct symbol *find_symbol_containing(const struct section *sec, unsigned long offset)
177
{
178
	struct rb_node *node;
179

180
	rb_for_each(node, &offset, &sec->symbol_tree, symbol_by_offset) {
181 182 183 184 185
		struct symbol *s = rb_entry(node, struct symbol, node);

		if (s->type != STT_SECTION)
			return s;
	}
186 187 188 189

	return NULL;
}

190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224
/*
 * Returns size of hole starting at @offset.
 */
int find_symbol_hole_containing(const struct section *sec, unsigned long offset)
{
	struct symbol_hole hole = {
		.key = offset,
		.sym = NULL,
	};
	struct rb_node *n;
	struct symbol *s;

	/*
	 * Find the rightmost symbol for which @offset is after it.
	 */
	n = rb_find(&hole, &sec->symbol_tree, symbol_hole_by_offset);

	/* found a symbol that contains @offset */
	if (n)
		return 0; /* not a hole */

	/* didn't find a symbol for which @offset is after it */
	if (!hole.sym)
		return 0; /* not a hole */

	/* @offset >= sym->offset + sym->len, find symbol after it */
	n = rb_next(&hole.sym->node);
	if (!n)
		return -1; /* until end of address space */

	/* hole until start of next symbol */
	s = rb_entry(n, struct symbol, node);
	return s->offset - offset;
}

225
struct symbol *find_func_containing(struct section *sec, unsigned long offset)
226 227 228
{
	struct rb_node *node;

229
	rb_for_each(node, &offset, &sec->symbol_tree, symbol_by_offset) {
230 231 232 233 234 235 236 237 238
		struct symbol *s = rb_entry(node, struct symbol, node);

		if (s->type == STT_FUNC)
			return s;
	}

	return NULL;
}

239
struct symbol *find_symbol_by_name(const struct elf *elf, const char *name)
240 241 242
{
	struct symbol *sym;

243
	elf_hash_for_each_possible(symbol_name, sym, name_hash, str_hash(name)) {
244 245
		if (!strcmp(sym->name, name))
			return sym;
246
	}
247 248 249 250

	return NULL;
}

M
Matt Helsley 已提交
251
struct reloc *find_reloc_by_dest_range(const struct elf *elf, struct section *sec,
252
				     unsigned long offset, unsigned int len)
253
{
M
Matt Helsley 已提交
254
	struct reloc *reloc, *r = NULL;
255
	unsigned long o;
256

M
Matt Helsley 已提交
257
	if (!sec->reloc)
258 259
		return NULL;

M
Matt Helsley 已提交
260
	sec = sec->reloc;
261

262
	for_offset_range(o, offset, offset + len) {
263 264
		elf_hash_for_each_possible(reloc, reloc, hash,
					   sec_offset_hash(sec, o)) {
M
Matt Helsley 已提交
265
			if (reloc->sec != sec)
266 267
				continue;

M
Matt Helsley 已提交
268 269 270
			if (reloc->offset >= offset && reloc->offset < offset + len) {
				if (!r || reloc->offset < r->offset)
					r = reloc;
271
			}
272
		}
273 274
		if (r)
			return r;
275
	}
276 277 278 279

	return NULL;
}

M
Matt Helsley 已提交
280
struct reloc *find_reloc_by_dest(const struct elf *elf, struct section *sec, unsigned long offset)
281
{
M
Matt Helsley 已提交
282
	return find_reloc_by_dest_range(elf, sec, offset, 1);
283 284 285 286 287 288 289 290 291 292
}

static int read_sections(struct elf *elf)
{
	Elf_Scn *s = NULL;
	struct section *sec;
	size_t shstrndx, sections_nr;
	int i;

	if (elf_getshdrnum(elf->elf, &sections_nr)) {
293
		WARN_ELF("elf_getshdrnum");
294 295 296 297
		return -1;
	}

	if (elf_getshdrstrndx(elf->elf, &shstrndx)) {
298
		WARN_ELF("elf_getshdrstrndx");
299 300 301
		return -1;
	}

302 303 304 305
	if (!elf_alloc_hash(section, sections_nr) ||
	    !elf_alloc_hash(section_name, sections_nr))
		return -1;

306 307 308 309 310 311 312 313
	for (i = 0; i < sections_nr; i++) {
		sec = malloc(sizeof(*sec));
		if (!sec) {
			perror("malloc");
			return -1;
		}
		memset(sec, 0, sizeof(*sec));

314
		INIT_LIST_HEAD(&sec->symbol_list);
M
Matt Helsley 已提交
315
		INIT_LIST_HEAD(&sec->reloc_list);
316 317 318

		s = elf_getscn(elf->elf, i);
		if (!s) {
319
			WARN_ELF("elf_getscn");
320 321 322 323 324 325
			return -1;
		}

		sec->idx = elf_ndxscn(s);

		if (!gelf_getshdr(s, &sec->sh)) {
326
			WARN_ELF("gelf_getshdr");
327 328 329 330 331
			return -1;
		}

		sec->name = elf_strptr(elf->elf, shstrndx, sec->sh.sh_name);
		if (!sec->name) {
332
			WARN_ELF("elf_strptr");
333 334 335
			return -1;
		}

336 337 338 339 340 341 342 343 344 345 346 347
		if (sec->sh.sh_size != 0) {
			sec->data = elf_getdata(s, NULL);
			if (!sec->data) {
				WARN_ELF("elf_getdata");
				return -1;
			}
			if (sec->data->d_off != 0 ||
			    sec->data->d_size != sec->sh.sh_size) {
				WARN("unexpected data attributes for %s",
				     sec->name);
				return -1;
			}
348
		}
349

350
		if (sec->sh.sh_flags & SHF_EXECINSTR)
351
			elf->text_size += sec->sh.sh_size;
352

353
		list_add_tail(&sec->list, &elf->sections);
354 355
		elf_hash_add(section, &sec->hash, sec->idx);
		elf_hash_add(section_name, &sec->name_hash, str_hash(sec->name));
356 357
	}

358
	if (stats) {
P
Peter Zijlstra 已提交
359
		printf("nr_sections: %lu\n", (unsigned long)sections_nr);
360 361
		printf("section_bits: %d\n", elf->section_bits);
	}
P
Peter Zijlstra 已提交
362

363 364 365 366 367 368 369 370 371
	/* sanity check, one more call to elf_nextscn() should return NULL */
	if (elf_nextscn(elf->elf, s)) {
		WARN("section entry mismatch");
		return -1;
	}

	return 0;
}

372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389
static void elf_add_symbol(struct elf *elf, struct symbol *sym)
{
	struct list_head *entry;
	struct rb_node *pnode;

	sym->type = GELF_ST_TYPE(sym->sym.st_info);
	sym->bind = GELF_ST_BIND(sym->sym.st_info);

	sym->offset = sym->sym.st_value;
	sym->len = sym->sym.st_size;

	rb_add(&sym->node, &sym->sec->symbol_tree, symbol_to_offset);
	pnode = rb_prev(&sym->node);
	if (pnode)
		entry = &rb_entry(pnode, struct symbol, node)->list;
	else
		entry = &sym->sec->symbol_list;
	list_add(&sym->list, entry);
390 391
	elf_hash_add(symbol, &sym->hash, sym->idx);
	elf_hash_add(symbol_name, &sym->name_hash, str_hash(sym->name));
392 393 394 395 396 397 398 399 400

	/*
	 * Don't store empty STT_NOTYPE symbols in the rbtree.  They
	 * can exist within a function, confusing the sorting.
	 */
	if (!sym->len)
		rb_erase(&sym->node, &sym->sec->symbol_tree);
}

401 402
static int read_symbols(struct elf *elf)
{
403
	struct section *symtab, *symtab_shndx, *sec;
404
	struct symbol *sym, *pfunc;
405
	int symbols_nr, i;
406
	char *coldstr;
407 408
	Elf_Data *shndx_data = NULL;
	Elf32_Word shndx;
409 410

	symtab = find_section_by_name(elf, ".symtab");
411 412 413 414 415 416 417
	if (symtab) {
		symtab_shndx = find_section_by_name(elf, ".symtab_shndx");
		if (symtab_shndx)
			shndx_data = symtab_shndx->data;

		symbols_nr = symtab->sh.sh_size / symtab->sh.sh_entsize;
	} else {
418 419
		/*
		 * A missing symbol table is actually possible if it's an empty
420 421 422
		 * .o file. This can happen for thunk_64.o. Make sure to at
		 * least allocate the symbol hash tables so we can do symbol
		 * lookups without crashing.
423
		 */
424
		symbols_nr = 0;
425 426
	}

427 428 429
	if (!elf_alloc_hash(symbol, symbols_nr) ||
	    !elf_alloc_hash(symbol_name, symbols_nr))
		return -1;
430 431 432 433 434 435 436 437

	for (i = 0; i < symbols_nr; i++) {
		sym = malloc(sizeof(*sym));
		if (!sym) {
			perror("malloc");
			return -1;
		}
		memset(sym, 0, sizeof(*sym));
438
		INIT_LIST_HEAD(&sym->pv_target);
439
		sym->alias = sym;
440 441 442

		sym->idx = i;

443 444 445
		if (!gelf_getsymshndx(symtab->data, shndx_data, i, &sym->sym,
				      &shndx)) {
			WARN_ELF("gelf_getsymshndx");
446 447 448 449 450 451
			goto err;
		}

		sym->name = elf_strptr(elf->elf, symtab->sh.sh_link,
				       sym->sym.st_name);
		if (!sym->name) {
452
			WARN_ELF("elf_strptr");
453 454 455
			goto err;
		}

456 457 458 459 460 461 462
		if ((sym->sym.st_shndx > SHN_UNDEF &&
		     sym->sym.st_shndx < SHN_LORESERVE) ||
		    (shndx_data && sym->sym.st_shndx == SHN_XINDEX)) {
			if (sym->sym.st_shndx != SHN_XINDEX)
				shndx = sym->sym.st_shndx;

			sym->sec = find_section_by_index(elf, shndx);
463 464 465 466 467
			if (!sym->sec) {
				WARN("couldn't find section for symbol %s",
				     sym->name);
				goto err;
			}
468
			if (GELF_ST_TYPE(sym->sym.st_info) == STT_SECTION) {
469 470 471 472 473 474
				sym->name = sym->sec->name;
				sym->sec->sym = sym;
			}
		} else
			sym->sec = find_section_by_index(elf, 0);

475
		elf_add_symbol(elf, sym);
476 477
	}

478
	if (stats) {
P
Peter Zijlstra 已提交
479
		printf("nr_symbols: %lu\n", (unsigned long)symbols_nr);
480 481
		printf("symbol_bits: %d\n", elf->symbol_bits);
	}
P
Peter Zijlstra 已提交
482

483 484 485
	/* Create parent/child links for any cold subfunctions */
	list_for_each_entry(sec, &elf->sections, list) {
		list_for_each_entry(sym, &sec->symbol_list, list) {
486 487
			char pname[MAX_NAME_LEN + 1];
			size_t pnamelen;
488 489
			if (sym->type != STT_FUNC)
				continue;
490 491 492 493 494 495 496

			if (sym->pfunc == NULL)
				sym->pfunc = sym;

			if (sym->cfunc == NULL)
				sym->cfunc = sym;

497
			coldstr = strstr(sym->name, ".cold");
498 499 500
			if (!coldstr)
				continue;

501 502 503 504 505 506 507 508 509 510
			pnamelen = coldstr - sym->name;
			if (pnamelen > MAX_NAME_LEN) {
				WARN("%s(): parent function name exceeds maximum length of %d characters",
				     sym->name, MAX_NAME_LEN);
				return -1;
			}

			strncpy(pname, sym->name, pnamelen);
			pname[pnamelen] = '\0';
			pfunc = find_symbol_by_name(elf, pname);
511 512 513 514

			if (!pfunc) {
				WARN("%s(): can't find parent function",
				     sym->name);
515
				return -1;
516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532
			}

			sym->pfunc = pfunc;
			pfunc->cfunc = sym;

			/*
			 * Unfortunately, -fnoreorder-functions puts the child
			 * inside the parent.  Remove the overlap so we can
			 * have sane assumptions.
			 *
			 * Note that pfunc->len now no longer matches
			 * pfunc->sym.st_size.
			 */
			if (sym->sec == pfunc->sec &&
			    sym->offset >= pfunc->offset &&
			    sym->offset + sym->len == pfunc->offset + pfunc->len) {
				pfunc->len -= sym->len;
533 534 535 536
			}
		}
	}

537 538 539 540 541 542 543
	return 0;

err:
	free(sym);
	return -1;
}

544 545 546 547
static struct section *elf_create_reloc_section(struct elf *elf,
						struct section *base,
						int reltype);

548 549
int elf_add_reloc(struct elf *elf, struct section *sec, unsigned long offset,
		  unsigned int type, struct symbol *sym, int addend)
550
{
551 552
	struct reloc *reloc;

553 554 555
	if (!sec->reloc && !elf_create_reloc_section(elf, sec, SHT_RELA))
		return -1;

556 557 558 559 560 561 562 563 564 565 566 567
	reloc = malloc(sizeof(*reloc));
	if (!reloc) {
		perror("malloc");
		return -1;
	}
	memset(reloc, 0, sizeof(*reloc));

	reloc->sec = sec->reloc;
	reloc->offset = offset;
	reloc->type = type;
	reloc->sym = sym;
	reloc->addend = addend;
568

569
	list_add_tail(&reloc->list, &sec->reloc->reloc_list);
570
	elf_hash_add(reloc, &reloc->hash, reloc_hash(reloc));
571

572
	sec->reloc->sh.sh_size += sec->reloc->sh.sh_entsize;
573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611
	sec->reloc->changed = true;

	return 0;
}

int elf_add_reloc_to_insn(struct elf *elf, struct section *sec,
			  unsigned long offset, unsigned int type,
			  struct section *insn_sec, unsigned long insn_off)
{
	struct symbol *sym;
	int addend;

	if (insn_sec->sym) {
		sym = insn_sec->sym;
		addend = insn_off;

	} else {
		/*
		 * The Clang assembler strips section symbols, so we have to
		 * reference the function symbol instead:
		 */
		sym = find_symbol_containing(insn_sec, insn_off);
		if (!sym) {
			/*
			 * Hack alert.  This happens when we need to reference
			 * the NOP pad insn immediately after the function.
			 */
			sym = find_symbol_containing(insn_sec, insn_off - 1);
		}

		if (!sym) {
			WARN("can't find symbol containing %s+0x%lx", insn_sec->name, insn_off);
			return -1;
		}

		addend = insn_off - sym->offset;
	}

	return elf_add_reloc(elf, sec, offset, type, sym, addend);
612 613
}

614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639
static int read_rel_reloc(struct section *sec, int i, struct reloc *reloc, unsigned int *symndx)
{
	if (!gelf_getrel(sec->data, i, &reloc->rel)) {
		WARN_ELF("gelf_getrel");
		return -1;
	}
	reloc->type = GELF_R_TYPE(reloc->rel.r_info);
	reloc->addend = 0;
	reloc->offset = reloc->rel.r_offset;
	*symndx = GELF_R_SYM(reloc->rel.r_info);
	return 0;
}

static int read_rela_reloc(struct section *sec, int i, struct reloc *reloc, unsigned int *symndx)
{
	if (!gelf_getrela(sec->data, i, &reloc->rela)) {
		WARN_ELF("gelf_getrela");
		return -1;
	}
	reloc->type = GELF_R_TYPE(reloc->rela.r_info);
	reloc->addend = reloc->rela.r_addend;
	reloc->offset = reloc->rela.r_offset;
	*symndx = GELF_R_SYM(reloc->rela.r_info);
	return 0;
}

M
Matt Helsley 已提交
640
static int read_relocs(struct elf *elf)
641 642
{
	struct section *sec;
M
Matt Helsley 已提交
643
	struct reloc *reloc;
644 645
	int i;
	unsigned int symndx;
M
Matt Helsley 已提交
646
	unsigned long nr_reloc, max_reloc = 0, tot_reloc = 0;
647

648
	if (!elf_alloc_hash(reloc, elf->text_size / 16))
649 650
		return -1;

651
	list_for_each_entry(sec, &elf->sections, list) {
652 653
		if ((sec->sh.sh_type != SHT_RELA) &&
		    (sec->sh.sh_type != SHT_REL))
654 655
			continue;

656
		sec->base = find_section_by_index(elf, sec->sh.sh_info);
657
		if (!sec->base) {
M
Matt Helsley 已提交
658
			WARN("can't find base section for reloc section %s",
659 660 661 662
			     sec->name);
			return -1;
		}

M
Matt Helsley 已提交
663
		sec->base->reloc = sec;
664

M
Matt Helsley 已提交
665
		nr_reloc = 0;
666
		for (i = 0; i < sec->sh.sh_size / sec->sh.sh_entsize; i++) {
M
Matt Helsley 已提交
667 668
			reloc = malloc(sizeof(*reloc));
			if (!reloc) {
669 670 671
				perror("malloc");
				return -1;
			}
M
Matt Helsley 已提交
672
			memset(reloc, 0, sizeof(*reloc));
673 674 675 676 677 678 679 680 681 682
			switch (sec->sh.sh_type) {
			case SHT_REL:
				if (read_rel_reloc(sec, i, reloc, &symndx))
					return -1;
				break;
			case SHT_RELA:
				if (read_rela_reloc(sec, i, reloc, &symndx))
					return -1;
				break;
			default: return -1;
683 684
			}

M
Matt Helsley 已提交
685
			reloc->sec = sec;
686 687
			reloc->idx = i;
			reloc->sym = find_symbol_by_index(elf, symndx);
M
Matt Helsley 已提交
688 689
			if (!reloc->sym) {
				WARN("can't find reloc entry symbol %d for %s",
690 691 692
				     symndx, sec->name);
				return -1;
			}
693

694
			list_add_tail(&reloc->list, &sec->reloc_list);
695
			elf_hash_add(reloc, &reloc->hash, reloc_hash(reloc));
696

M
Matt Helsley 已提交
697
			nr_reloc++;
698
		}
M
Matt Helsley 已提交
699 700
		max_reloc = max(max_reloc, nr_reloc);
		tot_reloc += nr_reloc;
P
Peter Zijlstra 已提交
701 702 703
	}

	if (stats) {
M
Matt Helsley 已提交
704 705
		printf("max_reloc: %lu\n", max_reloc);
		printf("tot_reloc: %lu\n", tot_reloc);
706
		printf("reloc_bits: %d\n", elf->reloc_bits);
707 708 709 710 711
	}

	return 0;
}

712
struct elf *elf_open_read(const char *name, int flags)
713 714
{
	struct elf *elf;
715
	Elf_Cmd cmd;
716 717 718 719 720 721 722 723

	elf_version(EV_CURRENT);

	elf = malloc(sizeof(*elf));
	if (!elf) {
		perror("malloc");
		return NULL;
	}
724
	memset(elf, 0, offsetof(struct elf, sections));
725 726 727

	INIT_LIST_HEAD(&elf->sections);

728
	elf->fd = open(name, flags);
729
	if (elf->fd == -1) {
730 731
		fprintf(stderr, "objtool: Can't open '%s': %s\n",
			name, strerror(errno));
732 733 734
		goto err;
	}

735 736 737 738 739 740 741 742
	if ((flags & O_ACCMODE) == O_RDONLY)
		cmd = ELF_C_READ_MMAP;
	else if ((flags & O_ACCMODE) == O_RDWR)
		cmd = ELF_C_RDWR;
	else /* O_WRONLY */
		cmd = ELF_C_WRITE;

	elf->elf = elf_begin(elf->fd, cmd, NULL);
743
	if (!elf->elf) {
744
		WARN_ELF("elf_begin");
745 746 747 748
		goto err;
	}

	if (!gelf_getehdr(elf->elf, &elf->ehdr)) {
749
		WARN_ELF("gelf_getehdr");
750 751 752 753 754 755 756 757 758
		goto err;
	}

	if (read_sections(elf))
		goto err;

	if (read_symbols(elf))
		goto err;

M
Matt Helsley 已提交
759
	if (read_relocs(elf))
760 761 762 763 764 765 766 767 768
		goto err;

	return elf;

err:
	elf_close(elf);
	return NULL;
}

769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794 795 796 797
static int elf_add_string(struct elf *elf, struct section *strtab, char *str)
{
	Elf_Data *data;
	Elf_Scn *s;
	int len;

	if (!strtab)
		strtab = find_section_by_name(elf, ".strtab");
	if (!strtab) {
		WARN("can't find .strtab section");
		return -1;
	}

	s = elf_getscn(elf->elf, strtab->idx);
	if (!s) {
		WARN_ELF("elf_getscn");
		return -1;
	}

	data = elf_newdata(s);
	if (!data) {
		WARN_ELF("elf_newdata");
		return -1;
	}

	data->d_buf = str;
	data->d_size = strlen(str) + 1;
	data->d_align = 1;

798 799
	len = strtab->sh.sh_size;
	strtab->sh.sh_size += data->d_size;
800 801 802 803 804
	strtab->changed = true;

	return len;
}

805
struct section *elf_create_section(struct elf *elf, const char *name,
806
				   unsigned int sh_flags, size_t entsize, int nr)
807 808 809
{
	struct section *sec, *shstrtab;
	size_t size = entsize * nr;
810
	Elf_Scn *s;
811 812 813 814 815 816 817 818 819

	sec = malloc(sizeof(*sec));
	if (!sec) {
		perror("malloc");
		return NULL;
	}
	memset(sec, 0, sizeof(*sec));

	INIT_LIST_HEAD(&sec->symbol_list);
M
Matt Helsley 已提交
820
	INIT_LIST_HEAD(&sec->reloc_list);
821 822 823 824 825 826 827 828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863

	s = elf_newscn(elf->elf);
	if (!s) {
		WARN_ELF("elf_newscn");
		return NULL;
	}

	sec->name = strdup(name);
	if (!sec->name) {
		perror("strdup");
		return NULL;
	}

	sec->idx = elf_ndxscn(s);
	sec->changed = true;

	sec->data = elf_newdata(s);
	if (!sec->data) {
		WARN_ELF("elf_newdata");
		return NULL;
	}

	sec->data->d_size = size;
	sec->data->d_align = 1;

	if (size) {
		sec->data->d_buf = malloc(size);
		if (!sec->data->d_buf) {
			perror("malloc");
			return NULL;
		}
		memset(sec->data->d_buf, 0, size);
	}

	if (!gelf_getshdr(s, &sec->sh)) {
		WARN_ELF("gelf_getshdr");
		return NULL;
	}

	sec->sh.sh_size = size;
	sec->sh.sh_entsize = entsize;
	sec->sh.sh_type = SHT_PROGBITS;
	sec->sh.sh_addralign = 1;
864
	sec->sh.sh_flags = SHF_ALLOC | sh_flags;
865

866
	/* Add section name to .shstrtab (or .strtab for Clang) */
867
	shstrtab = find_section_by_name(elf, ".shstrtab");
868 869
	if (!shstrtab)
		shstrtab = find_section_by_name(elf, ".strtab");
870
	if (!shstrtab) {
871
		WARN("can't find .shstrtab or .strtab section");
872 873
		return NULL;
	}
874 875
	sec->sh.sh_name = elf_add_string(elf, shstrtab, sec->name);
	if (sec->sh.sh_name == -1)
876 877
		return NULL;

878
	list_add_tail(&sec->list, &elf->sections);
879 880
	elf_hash_add(section, &sec->hash, sec->idx);
	elf_hash_add(section_name, &sec->name_hash, str_hash(sec->name));
881

882 883
	elf->changed = true;

884 885 886
	return sec;
}

887 888 889 890 891 892 893 894 895 896 897 898 899
static struct section *elf_create_rel_reloc_section(struct elf *elf, struct section *base)
{
	char *relocname;
	struct section *sec;

	relocname = malloc(strlen(base->name) + strlen(".rel") + 1);
	if (!relocname) {
		perror("malloc");
		return NULL;
	}
	strcpy(relocname, ".rel");
	strcat(relocname, base->name);

900
	sec = elf_create_section(elf, relocname, 0, sizeof(GElf_Rel), 0);
901 902 903 904 905 906 907 908 909 910 911 912 913 914 915 916 917
	free(relocname);
	if (!sec)
		return NULL;

	base->reloc = sec;
	sec->base = base;

	sec->sh.sh_type = SHT_REL;
	sec->sh.sh_addralign = 8;
	sec->sh.sh_link = find_section_by_name(elf, ".symtab")->idx;
	sec->sh.sh_info = base->idx;
	sec->sh.sh_flags = SHF_INFO_LINK;

	return sec;
}

static struct section *elf_create_rela_reloc_section(struct elf *elf, struct section *base)
918
{
M
Matt Helsley 已提交
919
	char *relocname;
920 921
	struct section *sec;

M
Matt Helsley 已提交
922 923
	relocname = malloc(strlen(base->name) + strlen(".rela") + 1);
	if (!relocname) {
924 925 926
		perror("malloc");
		return NULL;
	}
M
Matt Helsley 已提交
927 928
	strcpy(relocname, ".rela");
	strcat(relocname, base->name);
929

930
	sec = elf_create_section(elf, relocname, 0, sizeof(GElf_Rela), 0);
M
Matt Helsley 已提交
931
	free(relocname);
932 933 934
	if (!sec)
		return NULL;

M
Matt Helsley 已提交
935
	base->reloc = sec;
936 937 938 939 940 941 942 943 944 945 946
	sec->base = base;

	sec->sh.sh_type = SHT_RELA;
	sec->sh.sh_addralign = 8;
	sec->sh.sh_link = find_section_by_name(elf, ".symtab")->idx;
	sec->sh.sh_info = base->idx;
	sec->sh.sh_flags = SHF_INFO_LINK;

	return sec;
}

947
static struct section *elf_create_reloc_section(struct elf *elf,
948 949 950 951 952 953 954 955 956 957
					 struct section *base,
					 int reltype)
{
	switch (reltype) {
	case SHT_REL:  return elf_create_rel_reloc_section(elf, base);
	case SHT_RELA: return elf_create_rela_reloc_section(elf, base);
	default:       return NULL;
	}
}

958
static int elf_rebuild_rel_reloc_section(struct section *sec)
959
{
M
Matt Helsley 已提交
960
	struct reloc *reloc;
961
	int idx = 0;
962
	void *buf;
963

964
	/* Allocate a buffer for relocations */
965
	buf = malloc(sec->sh.sh_size);
966
	if (!buf) {
967 968 969 970
		perror("malloc");
		return -1;
	}

971
	sec->data->d_buf = buf;
972
	sec->data->d_size = sec->sh.sh_size;
973
	sec->data->d_type = ELF_T_REL;
974 975 976

	idx = 0;
	list_for_each_entry(reloc, &sec->reloc_list, list) {
977 978
		reloc->rel.r_offset = reloc->offset;
		reloc->rel.r_info = GELF_R_INFO(reloc->sym->idx, reloc->type);
979 980 981 982
		if (!gelf_update_rel(sec->data, idx, &reloc->rel)) {
			WARN_ELF("gelf_update_rel");
			return -1;
		}
983 984 985 986 987
		idx++;
	}

	return 0;
}
988

989
static int elf_rebuild_rela_reloc_section(struct section *sec)
990 991
{
	struct reloc *reloc;
992
	int idx = 0;
993
	void *buf;
994 995

	/* Allocate a buffer for relocations with addends */
996
	buf = malloc(sec->sh.sh_size);
997
	if (!buf) {
998 999 1000 1001
		perror("malloc");
		return -1;
	}

1002
	sec->data->d_buf = buf;
1003
	sec->data->d_size = sec->sh.sh_size;
1004
	sec->data->d_type = ELF_T_RELA;
1005 1006

	idx = 0;
M
Matt Helsley 已提交
1007
	list_for_each_entry(reloc, &sec->reloc_list, list) {
1008 1009 1010
		reloc->rela.r_offset = reloc->offset;
		reloc->rela.r_addend = reloc->addend;
		reloc->rela.r_info = GELF_R_INFO(reloc->sym->idx, reloc->type);
1011 1012 1013 1014
		if (!gelf_update_rela(sec->data, idx, &reloc->rela)) {
			WARN_ELF("gelf_update_rela");
			return -1;
		}
1015 1016 1017 1018 1019 1020
		idx++;
	}

	return 0;
}

1021
static int elf_rebuild_reloc_section(struct elf *elf, struct section *sec)
1022 1023
{
	switch (sec->sh.sh_type) {
1024 1025
	case SHT_REL:  return elf_rebuild_rel_reloc_section(sec);
	case SHT_RELA: return elf_rebuild_rela_reloc_section(sec);
1026 1027 1028 1029
	default:       return -1;
	}
}

1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048
int elf_write_insn(struct elf *elf, struct section *sec,
		   unsigned long offset, unsigned int len,
		   const char *insn)
{
	Elf_Data *data = sec->data;

	if (data->d_type != ELF_T_BYTE || data->d_off) {
		WARN("write to unexpected data for section: %s", sec->name);
		return -1;
	}

	memcpy(data->d_buf + offset, insn, len);
	elf_flagdata(data, ELF_C_SET, ELF_F_DIRTY);

	elf->changed = true;

	return 0;
}

1049
int elf_write_reloc(struct elf *elf, struct reloc *reloc)
1050
{
1051
	struct section *sec = reloc->sec;
1052

1053 1054 1055
	if (sec->sh.sh_type == SHT_REL) {
		reloc->rel.r_info = GELF_R_INFO(reloc->sym->idx, reloc->type);
		reloc->rel.r_offset = reloc->offset;
1056

1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 1069
		if (!gelf_update_rel(sec->data, reloc->idx, &reloc->rel)) {
			WARN_ELF("gelf_update_rel");
			return -1;
		}
	} else {
		reloc->rela.r_info = GELF_R_INFO(reloc->sym->idx, reloc->type);
		reloc->rela.r_addend = reloc->addend;
		reloc->rela.r_offset = reloc->offset;

		if (!gelf_update_rela(sec->data, reloc->idx, &reloc->rela)) {
			WARN_ELF("gelf_update_rela");
			return -1;
		}
1070 1071 1072 1073 1074 1075 1076
	}

	elf->changed = true;

	return 0;
}

1077
int elf_write(struct elf *elf)
1078 1079 1080 1081
{
	struct section *sec;
	Elf_Scn *s;

P
Peter Zijlstra 已提交
1082 1083 1084
	if (dryrun)
		return 0;

1085
	/* Update changed relocation sections and section headers: */
1086 1087 1088 1089 1090 1091 1092
	list_for_each_entry(sec, &elf->sections, list) {
		if (sec->changed) {
			s = elf_getscn(elf->elf, sec->idx);
			if (!s) {
				WARN_ELF("elf_getscn");
				return -1;
			}
1093
			if (!gelf_update_shdr(s, &sec->sh)) {
1094 1095 1096
				WARN_ELF("gelf_update_shdr");
				return -1;
			}
1097

1098 1099 1100 1101 1102 1103
			if (sec->base &&
			    elf_rebuild_reloc_section(elf, sec)) {
				WARN("elf_rebuild_reloc_section");
				return -1;
			}

1104
			sec->changed = false;
1105
			elf->changed = true;
1106 1107 1108
		}
	}

1109 1110 1111 1112
	/* Make sure the new section header entries get updated properly. */
	elf_flagelf(elf->elf, ELF_C_SET, ELF_F_DIRTY);

	/* Write all changes to the file. */
1113 1114 1115 1116 1117
	if (elf_update(elf->elf, ELF_C_WRITE) < 0) {
		WARN_ELF("elf_update");
		return -1;
	}

1118 1119
	elf->changed = false;

1120 1121 1122
	return 0;
}

1123 1124 1125 1126
void elf_close(struct elf *elf)
{
	struct section *sec, *tmpsec;
	struct symbol *sym, *tmpsym;
M
Matt Helsley 已提交
1127
	struct reloc *reloc, *tmpreloc;
1128

1129 1130 1131 1132 1133 1134
	if (elf->elf)
		elf_end(elf->elf);

	if (elf->fd > 0)
		close(elf->fd);

1135
	list_for_each_entry_safe(sec, tmpsec, &elf->sections, list) {
1136
		list_for_each_entry_safe(sym, tmpsym, &sec->symbol_list, list) {
1137
			list_del(&sym->list);
1138
			hash_del(&sym->hash);
1139 1140
			free(sym);
		}
M
Matt Helsley 已提交
1141 1142 1143 1144
		list_for_each_entry_safe(reloc, tmpreloc, &sec->reloc_list, list) {
			list_del(&reloc->list);
			hash_del(&reloc->hash);
			free(reloc);
1145 1146 1147 1148
		}
		list_del(&sec->list);
		free(sec);
	}
1149

1150 1151
	free(elf);
}