dso.c 30.5 KB
Newer Older
1
// SPDX-License-Identifier: GPL-2.0
2
#include <asm/bug.h>
3
#include <linux/kernel.h>
4
#include <linux/string.h>
5
#include <linux/zalloc.h>
6 7
#include <sys/time.h>
#include <sys/resource.h>
8 9 10
#include <sys/types.h>
#include <sys/stat.h>
#include <unistd.h>
11
#include <errno.h>
12
#include <fcntl.h>
13
#include <stdlib.h>
14 15
#include <bpf/libbpf.h>
#include "bpf-event.h"
16
#include "compress.h"
17
#include "env.h"
18
#include "namespaces.h"
19
#include "path.h"
20
#include "map.h"
21
#include "symbol.h"
22
#include "srcline.h"
23
#include "dso.h"
24
#include "dsos.h"
25
#include "machine.h"
26
#include "auxtrace.h"
27
#include "util.h" /* O_CLOEXEC for older systems */
28
#include "debug.h"
29
#include "string2.h"
30
#include "vdso.h"
31

32 33 34 35 36 37 38
/*
 * printf-style templates for the places a debuglink file is searched for.
 * Each template is expanded with two string arguments, in this order: the
 * directory of the DSO and the debuglink file name. "%.0s" consumes the
 * directory argument while printing nothing, so the first template yields
 * the debuglink name on its own.
 */
static const char * const debuglink_paths[] = {
	"%.0s%s",
	"%s/%s",
	"%s/.debug/%s",
	"/usr/lib/debug%s/%s"
};

39 40 41
char dso__symtab_origin(const struct dso *dso)
{
	static const char origin[] = {
42 43 44 45 46
		[DSO_BINARY_TYPE__KALLSYMS]			= 'k',
		[DSO_BINARY_TYPE__VMLINUX]			= 'v',
		[DSO_BINARY_TYPE__JAVA_JIT]			= 'j',
		[DSO_BINARY_TYPE__DEBUGLINK]			= 'l',
		[DSO_BINARY_TYPE__BUILD_ID_CACHE]		= 'B',
47
		[DSO_BINARY_TYPE__BUILD_ID_CACHE_DEBUGINFO]	= 'D',
48 49 50 51 52 53
		[DSO_BINARY_TYPE__FEDORA_DEBUGINFO]		= 'f',
		[DSO_BINARY_TYPE__UBUNTU_DEBUGINFO]		= 'u',
		[DSO_BINARY_TYPE__OPENEMBEDDED_DEBUGINFO]	= 'o',
		[DSO_BINARY_TYPE__BUILDID_DEBUGINFO]		= 'b',
		[DSO_BINARY_TYPE__SYSTEM_PATH_DSO]		= 'd',
		[DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE]		= 'K',
54
		[DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE_COMP]	= 'm',
55 56
		[DSO_BINARY_TYPE__GUEST_KALLSYMS]		= 'g',
		[DSO_BINARY_TYPE__GUEST_KMODULE]		= 'G',
57
		[DSO_BINARY_TYPE__GUEST_KMODULE_COMP]		= 'M',
58
		[DSO_BINARY_TYPE__GUEST_VMLINUX]		= 'V',
59 60 61 62 63 64 65
	};

	if (dso == NULL || dso->symtab_type == DSO_BINARY_TYPE__NOT_FOUND)
		return '!';
	return origin[dso->symtab_type];
}

66 67 68
int dso__read_binary_type_filename(const struct dso *dso,
				   enum dso_binary_type type,
				   char *root_dir, char *filename, size_t size)
69
{
70
	char build_id_hex[SBUILD_ID_SIZE];
71
	int ret = 0;
72
	size_t len;
73 74

	switch (type) {
75 76 77 78 79 80
	case DSO_BINARY_TYPE__DEBUGLINK:
	{
		const char *last_slash;
		char dso_dir[PATH_MAX];
		char symfile[PATH_MAX];
		unsigned int i;
81

82
		len = __symbol__join_symfs(filename, size, dso->long_name);
83 84 85
		last_slash = filename + len;
		while (last_slash != filename && *last_slash != '/')
			last_slash--;
86

87 88 89 90 91
		strncpy(dso_dir, filename, last_slash - filename);
		dso_dir[last_slash-filename] = '\0';

		if (!is_regular_file(filename)) {
			ret = -1;
92
			break;
93
		}
94

95 96 97 98 99 100 101 102 103 104 105 106 107
		ret = filename__read_debuglink(filename, symfile, PATH_MAX);
		if (ret)
			break;

		/* Check predefined locations where debug file might reside */
		ret = -1;
		for (i = 0; i < ARRAY_SIZE(debuglink_paths); i++) {
			snprintf(filename, size,
					debuglink_paths[i], dso_dir, symfile);
			if (is_regular_file(filename)) {
				ret = 0;
				break;
			}
108
		}
109

110
		break;
111
	}
112
	case DSO_BINARY_TYPE__BUILD_ID_CACHE:
113 114 115 116 117 118
		if (dso__build_id_filename(dso, filename, size, false) == NULL)
			ret = -1;
		break;

	case DSO_BINARY_TYPE__BUILD_ID_CACHE_DEBUGINFO:
		if (dso__build_id_filename(dso, filename, size, true) == NULL)
119 120 121 122
			ret = -1;
		break;

	case DSO_BINARY_TYPE__FEDORA_DEBUGINFO:
123 124
		len = __symbol__join_symfs(filename, size, "/usr/lib/debug");
		snprintf(filename + len, size - len, "%s.debug", dso->long_name);
125 126 127
		break;

	case DSO_BINARY_TYPE__UBUNTU_DEBUGINFO:
128 129
		len = __symbol__join_symfs(filename, size, "/usr/lib/debug");
		snprintf(filename + len, size - len, "%s", dso->long_name);
130 131
		break;

132 133
	case DSO_BINARY_TYPE__OPENEMBEDDED_DEBUGINFO:
	{
134
		const char *last_slash;
135 136 137 138 139 140
		size_t dir_size;

		last_slash = dso->long_name + dso->long_name_len;
		while (last_slash != dso->long_name && *last_slash != '/')
			last_slash--;

141
		len = __symbol__join_symfs(filename, size, "");
142 143 144 145 146
		dir_size = last_slash - dso->long_name + 2;
		if (dir_size > (size - len)) {
			ret = -1;
			break;
		}
147 148
		len += scnprintf(filename + len, dir_size, "%s",  dso->long_name);
		len += scnprintf(filename + len , size - len, ".debug%s",
149 150 151 152
								last_slash);
		break;
	}

153 154 155 156 157 158 159 160 161
	case DSO_BINARY_TYPE__BUILDID_DEBUGINFO:
		if (!dso->has_build_id) {
			ret = -1;
			break;
		}

		build_id__sprintf(dso->build_id,
				  sizeof(dso->build_id),
				  build_id_hex);
162 163 164
		len = __symbol__join_symfs(filename, size, "/usr/lib/debug/.build-id/");
		snprintf(filename + len, size - len, "%.2s/%s.debug",
			 build_id_hex, build_id_hex + 2);
165 166
		break;

167 168
	case DSO_BINARY_TYPE__VMLINUX:
	case DSO_BINARY_TYPE__GUEST_VMLINUX:
169
	case DSO_BINARY_TYPE__SYSTEM_PATH_DSO:
170
		__symbol__join_symfs(filename, size, dso->long_name);
171 172 173
		break;

	case DSO_BINARY_TYPE__GUEST_KMODULE:
174
	case DSO_BINARY_TYPE__GUEST_KMODULE_COMP:
175 176
		path__join3(filename, size, symbol_conf.symfs,
			    root_dir, dso->long_name);
177 178 179
		break;

	case DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE:
180
	case DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE_COMP:
181
		__symbol__join_symfs(filename, size, dso->long_name);
182 183
		break;

184 185
	case DSO_BINARY_TYPE__KCORE:
	case DSO_BINARY_TYPE__GUEST_KCORE:
186
		snprintf(filename, size, "%s", dso->long_name);
187 188
		break;

189 190 191 192
	default:
	case DSO_BINARY_TYPE__KALLSYMS:
	case DSO_BINARY_TYPE__GUEST_KALLSYMS:
	case DSO_BINARY_TYPE__JAVA_JIT:
193
	case DSO_BINARY_TYPE__BPF_PROG_INFO:
194 195 196 197 198 199 200 201
	case DSO_BINARY_TYPE__NOT_FOUND:
		ret = -1;
		break;
	}

	return ret;
}

202 203 204 205
/*
 * Compression ids are indexes into compressions[]. COMP_ID__NONE (0) is the
 * "no supported compression" value returned by is_supported_compression()
 * and the initial value of dso->comp.
 */
enum {
	COMP_ID__NONE = 0,
};

206 207 208
static const struct {
	const char *fmt;
	int (*decompress)(const char *input, int output);
209
	bool (*is_compressed)(const char *input);
210
} compressions[] = {
211
	[COMP_ID__NONE] = { .fmt = NULL, },
212
#ifdef HAVE_ZLIB_SUPPORT
213
	{ "gz", gzip_decompress_to_file, gzip_is_compressed },
214 215
#endif
#ifdef HAVE_LZMA_SUPPORT
216
	{ "xz", lzma_decompress_to_file, lzma_is_compressed },
217
#endif
218
	{ NULL, NULL, NULL },
219 220
};

221
static int is_supported_compression(const char *ext)
222 223 224
{
	unsigned i;

225
	for (i = 1; compressions[i].fmt; i++) {
226
		if (!strcmp(ext, compressions[i].fmt))
227
			return i;
228
	}
229
	return COMP_ID__NONE;
230 231
}

232
bool is_kernel_module(const char *pathname, int cpumode)
233
{
234
	struct kmod_path m;
235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253
	int mode = cpumode & PERF_RECORD_MISC_CPUMODE_MASK;

	WARN_ONCE(mode != cpumode,
		  "Internal error: passing unmasked cpumode (%x) to is_kernel_module",
		  cpumode);

	switch (mode) {
	case PERF_RECORD_MISC_USER:
	case PERF_RECORD_MISC_HYPERVISOR:
	case PERF_RECORD_MISC_GUEST_USER:
		return false;
	/* Treat PERF_RECORD_MISC_CPUMODE_UNKNOWN as kernel */
	default:
		if (kmod_path__parse(&m, pathname)) {
			pr_err("Failed to check whether %s is a kernel module or not. Assume it is.",
					pathname);
			return true;
		}
	}
254

255
	return m.kmod;
256 257 258 259 260 261 262 263
}

/* True when the DSO's symtab type is one of the compressed kmodule types. */
bool dso__needs_decompress(struct dso *dso)
{
	switch (dso->symtab_type) {
	case DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE_COMP:
	case DSO_BINARY_TYPE__GUEST_KMODULE_COMP:
		return true;
	default:
		return false;
	}
}

264 265
static int decompress_kmodule(struct dso *dso, const char *name,
			      char *pathname, size_t len)
266
{
267
	char tmpbuf[] = KMOD_DECOMP_NAME;
268 269 270 271 272
	int fd = -1;

	if (!dso__needs_decompress(dso))
		return -1;

273
	if (dso->comp == COMP_ID__NONE)
274 275
		return -1;

276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291
	/*
	 * We have proper compression id for DSO and yet the file
	 * behind the 'name' can still be plain uncompressed object.
	 *
	 * The reason is behind the logic we open the DSO object files,
	 * when we try all possible 'debug' objects until we find the
	 * data. So even if the DSO is represented by 'krava.xz' module,
	 * we can end up here opening ~/.debug/....23432432/debug' file
	 * which is not compressed.
	 *
	 * To keep this transparent, we detect this and return the file
	 * descriptor to the uncompressed file.
	 */
	if (!compressions[dso->comp].is_compressed(name))
		return open(name, O_RDONLY);

292 293 294
	fd = mkstemp(tmpbuf);
	if (fd < 0) {
		dso->load_errno = errno;
295
		return -1;
296 297
	}

298
	if (compressions[dso->comp].decompress(name, fd)) {
299 300 301 302 303
		dso->load_errno = DSO_LOAD_ERRNO__DECOMPRESSION_FAILURE;
		close(fd);
		fd = -1;
	}

304 305 306 307
	if (!pathname || (fd < 0))
		unlink(tmpbuf);

	if (pathname && (fd >= 0))
308
		strlcpy(pathname, tmpbuf, len);
309

310 311 312 313 314
	return fd;
}

/*
 * Descriptor-only variant of decompress_kmodule(): no path buffer is
 * passed, so the caller just gets the file descriptor (or -1).
 */
int dso__decompress_kmodule_fd(struct dso *dso, const char *name)
{
	int fd;

	fd = decompress_kmodule(dso, name, NULL, 0);
	return fd;
}

/*
 * Path-only variant of decompress_kmodule(): the descriptor it returns is
 * closed again and only success/failure is reported.
 *
 * Returns 0 on success, -1 on failure. Note that @pathname is filled in
 * only when a temporary decompressed file was actually created.
 */
int dso__decompress_kmodule_path(struct dso *dso, const char *name,
				 char *pathname, size_t len)
{
	int fd = decompress_kmodule(dso, name, pathname, len);

	/* do not close(-1): it would overwrite errno with EBADF */
	if (fd < 0)
		return -1;

	close(fd);
	return 0;
}

327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343
/*
 * Parses kernel module specified in @path and updates
 * @m argument like:
 *
 *    @comp - true if @path contains supported compression suffix,
 *            false otherwise
 *    @kmod - true if @path contains '.ko' suffix in right position,
 *            false otherwise
 *    @name - if (@alloc_name && @kmod) is true, it contains strdup-ed base name
 *            of the kernel module without suffixes, otherwise strudup-ed
 *            base name of @path
 *    @ext  - if (@alloc_ext && @comp) is true, it contains strdup-ed string
 *            the compression suffix
 *
 * Returns 0 if there's no strdup error, -ENOMEM otherwise.
 */
int __kmod_path__parse(struct kmod_path *m, const char *path,
344
		       bool alloc_name)
345 346 347
{
	const char *name = strrchr(path, '/');
	const char *ext  = strrchr(path, '.');
348
	bool is_simple_name = false;
349 350 351 352

	memset(m, 0x0, sizeof(*m));
	name = name ? name + 1 : path;

353 354 355 356 357 358 359 360 361 362 363 364 365
	/*
	 * '.' is also a valid character for module name. For example:
	 * [aaa.bbb] is a valid module name. '[' should have higher
	 * priority than '.ko' suffix.
	 *
	 * The kernel names are from machine__mmap_name. Such
	 * name should belong to kernel itself, not kernel module.
	 */
	if (name[0] == '[') {
		is_simple_name = true;
		if ((strncmp(name, "[kernel.kallsyms]", 17) == 0) ||
		    (strncmp(name, "[guest.kernel.kallsyms", 22) == 0) ||
		    (strncmp(name, "[vdso]", 6) == 0) ||
366 367
		    (strncmp(name, "[vdso32]", 8) == 0) ||
		    (strncmp(name, "[vdsox32]", 9) == 0) ||
368 369 370 371 372 373 374
		    (strncmp(name, "[vsyscall]", 10) == 0)) {
			m->kmod = false;

		} else
			m->kmod = true;
	}

375
	/* No extension, just return name. */
376
	if ((ext == NULL) || is_simple_name) {
377 378 379 380 381 382 383
		if (alloc_name) {
			m->name = strdup(name);
			return m->name ? 0 : -ENOMEM;
		}
		return 0;
	}

384 385
	m->comp = is_supported_compression(ext + 1);
	if (m->comp > COMP_ID__NONE)
386 387 388 389 390 391 392 393 394 395 396 397 398 399 400
		ext -= 3;

	/* Check .ko extension only if there's enough name left. */
	if (ext > name)
		m->kmod = !strncmp(ext, ".ko", 3);

	if (alloc_name) {
		if (m->kmod) {
			if (asprintf(&m->name, "[%.*s]", (int) (ext - name), name) == -1)
				return -ENOMEM;
		} else {
			if (asprintf(&m->name, "%s", name) == -1)
				return -ENOMEM;
		}

401
		strreplace(m->name, '-', '_');
402 403 404 405 406
	}

	return 0;
}

407 408 409 410 411 412 413 414 415
void dso__set_module_info(struct dso *dso, struct kmod_path *m,
			  struct machine *machine)
{
	if (machine__is_host(machine))
		dso->symtab_type = DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE;
	else
		dso->symtab_type = DSO_BINARY_TYPE__GUEST_KMODULE;

	/* _KMODULE_COMP should be next to _KMODULE */
416
	if (m->kmod && m->comp) {
417
		dso->symtab_type++;
418 419
		dso->comp = m->comp;
	}
420 421 422 423

	dso__set_short_name(dso, strdup(m->name), true);
}

424
/*
 * Bookkeeping for DSOs whose data file descriptor is currently open:
 * the list of those DSOs, the number of entries on it, and the mutex the
 * dso__data_* entry points take around opening and closing descriptors.
 */
static LIST_HEAD(dso__data_open);
static long dso__data_open_cnt;
static pthread_mutex_t dso__data_open_lock = PTHREAD_MUTEX_INITIALIZER;
430 431 432 433

static void dso__list_add(struct dso *dso)
{
	list_add_tail(&dso->data.open_entry, &dso__data_open);
434
	dso__data_open_cnt++;
435 436 437 438
}

static void dso__list_del(struct dso *dso)
{
439
	list_del_init(&dso->data.open_entry);
440 441 442
	WARN_ONCE(dso__data_open_cnt <= 0,
		  "DSO data fd counter out of bounds.");
	dso__data_open_cnt--;
443 444
}

445 446 447 448 449
/* Forward declaration: do_open() closes the first open DSO when open() hits EMFILE. */
static void close_first_dso(void);

static int do_open(char *name)
{
	int fd;
450
	char sbuf[STRERR_BUFSIZE];
451 452

	do {
453
		fd = open(name, O_RDONLY|O_CLOEXEC);
454 455 456
		if (fd >= 0)
			return fd;

457
		pr_debug("dso open failed: %s\n",
458
			 str_error_r(errno, sbuf, sizeof(sbuf)));
459 460 461 462 463 464 465 466 467
		if (!dso__data_open_cnt || errno != EMFILE)
			break;

		close_first_dso();
	} while (1);

	return -1;
}

468
static int __open_dso(struct dso *dso, struct machine *machine)
469
{
470
	int fd = -EINVAL;
471 472
	char *root_dir = (char *)"";
	char *name = malloc(PATH_MAX);
473
	bool decomp = false;
474 475 476 477 478 479 480

	if (!name)
		return -ENOMEM;

	if (machine)
		root_dir = machine->root_dir;

481
	if (dso__read_binary_type_filename(dso, dso->binary_type,
482 483
					    root_dir, name, PATH_MAX))
		goto out;
484

485 486
	if (!is_regular_file(name))
		goto out;
487

488 489 490 491 492
	if (dso__needs_decompress(dso)) {
		char newpath[KMOD_DECOMP_LEN];
		size_t len = sizeof(newpath);

		if (dso__decompress_kmodule_path(dso, name, newpath, len) < 0) {
493 494
			fd = -dso->load_errno;
			goto out;
495 496
		}

497
		decomp = true;
498 499 500
		strcpy(name, newpath);
	}

501
	fd = do_open(name);
502

503
	if (decomp)
504 505
		unlink(name);

506
out:
507 508 509 510
	free(name);
	return fd;
}

511 512
/* Forward declaration: open_dso() calls this after adding a DSO to the open list. */
static void check_data_close(void);

513 514 515 516 517 518 519
/**
 * dso_close - Open DSO data file
 * @dso: dso object
 *
 * Open @dso's data file descriptor and updates
 * list/count of open DSO objects.
 */
520 521
static int open_dso(struct dso *dso, struct machine *machine)
{
522 523 524 525 526 527 528 529
	int fd;
	struct nscookie nsc;

	if (dso->binary_type != DSO_BINARY_TYPE__BUILD_ID_CACHE)
		nsinfo__mountns_enter(dso->nsinfo, &nsc);
	fd = __open_dso(dso, machine);
	if (dso->binary_type != DSO_BINARY_TYPE__BUILD_ID_CACHE)
		nsinfo__mountns_exit(&nsc);
530

531
	if (fd >= 0) {
532
		dso__list_add(dso);
533 534 535 536 537 538
		/*
		 * Check if we crossed the allowed number
		 * of opened DSOs and close one if needed.
		 */
		check_data_close();
	}
539 540 541 542 543

	return fd;
}

static void close_data_fd(struct dso *dso)
544 545 546 547
{
	if (dso->data.fd >= 0) {
		close(dso->data.fd);
		dso->data.fd = -1;
548
		dso->data.file_size = 0;
549
		dso__list_del(dso);
550 551 552
	}
}

553 554 555 556 557 558 559
/**
 * close_dso - Close DSO data file
 * @dso: dso object
 *
 * Closes @dso's data file descriptor, if open, and updates the
 * list/count of open DSO objects. Thin wrapper around close_data_fd().
 */
static void close_dso(struct dso *dso)
{
	/* all of the work, including the "is it open" check, is in the helper */
	close_data_fd(dso);
}

565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591
/*
 * Close the DSO at the head of the open list. New entries are appended at
 * the tail, so the head is the one that has been on the list longest.
 * Callers are expected to ensure the list is not empty.
 */
static void close_first_dso(void)
{
	struct dso *oldest = list_first_entry(&dso__data_open, struct dso,
					      data.open_entry);

	close_dso(oldest);
}

/*
 * Number of DSO descriptors that may be kept open: half of the current
 * RLIMIT_NOFILE soft limit, RLIM_INFINITY if that limit is unlimited, or 1
 * when the limit cannot be queried.
 */
static rlim_t get_fd_limit(void)
{
	struct rlimit l;

	if (getrlimit(RLIMIT_NOFILE, &l) != 0) {
		pr_err("failed to get fd limit\n");
		return 1;
	}

	if (l.rlim_cur == RLIM_INFINITY)
		return l.rlim_cur;

	/* Allow half of the current open fd limit. */
	return l.rlim_cur / 2;
}

592 593 594 595 596 597 598 599
/* Cached result of get_fd_limit(); 0 means "not computed yet" (see may_cache_fd()). */
static rlim_t fd_limit;

/*
 * Used only by tests/dso-data.c to reset the environment
 * for tests. I dont expect we should change this during
 * standard runtime.
 */
void reset_fd_limit(void)
600
{
601 602
	fd_limit = 0;
}
603

604 605 606 607
static bool may_cache_fd(void)
{
	if (!fd_limit)
		fd_limit = get_fd_limit();
608

609
	if (fd_limit == RLIM_INFINITY)
610 611
		return true;

612
	return fd_limit > (rlim_t) dso__data_open_cnt;
613 614
}

615 616 617 618 619
/*
 * Close the first DSO on the open list once the number of open DSO file
 * descriptors has reached the allowed limit (normally half of
 * RLIMIT_NOFILE, see get_fd_limit()).
 */
static void check_data_close(void)
{
	if (may_cache_fd())
		return;

	close_first_dso();
}

628 629 630 631 632 633
/**
 * dso__data_close - Close DSO data file
 * @dso: dso object
 *
 * External interface to close @dso's data file descriptor.
 */
634 635
void dso__data_close(struct dso *dso)
{
636
	pthread_mutex_lock(&dso__data_open_lock);
637
	close_dso(dso);
638
	pthread_mutex_unlock(&dso__data_open_lock);
639 640
}

641
static void try_to_open_dso(struct dso *dso, struct machine *machine)
642
{
643
	enum dso_binary_type binary_type_data[] = {
644 645 646 647 648 649
		DSO_BINARY_TYPE__BUILD_ID_CACHE,
		DSO_BINARY_TYPE__SYSTEM_PATH_DSO,
		DSO_BINARY_TYPE__NOT_FOUND,
	};
	int i = 0;

650
	if (dso->data.fd >= 0)
651
		return;
652 653 654

	if (dso->binary_type != DSO_BINARY_TYPE__NOT_FOUND) {
		dso->data.fd = open_dso(dso, machine);
655
		goto out;
656
	}
657 658

	do {
659
		dso->binary_type = binary_type_data[i++];
660

661 662 663
		dso->data.fd = open_dso(dso, machine);
		if (dso->data.fd >= 0)
			goto out;
664

665
	} while (dso->binary_type != DSO_BINARY_TYPE__NOT_FOUND);
666 667 668 669 670
out:
	if (dso->data.fd >= 0)
		dso->data.status = DSO_DATA_STATUS_OK;
	else
		dso->data.status = DSO_DATA_STATUS_ERROR;
671 672 673
}

/**
674
 * dso__data_get_fd - Get dso's data file descriptor
675 676 677 678
 * @dso: dso object
 * @machine: machine object
 *
 * External interface to find dso's file, open it and
679 680
 * returns file descriptor.  It should be paired with
 * dso__data_put_fd() if it returns non-negative value.
681
 */
682
int dso__data_get_fd(struct dso *dso, struct machine *machine)
683 684 685
{
	if (dso->data.status == DSO_DATA_STATUS_ERROR)
		return -1;
686

687 688 689
	if (pthread_mutex_lock(&dso__data_open_lock) < 0)
		return -1;

690
	try_to_open_dso(dso, machine);
691 692 693

	if (dso->data.fd < 0)
		pthread_mutex_unlock(&dso__data_open_lock);
694

695
	return dso->data.fd;
696 697
}

698 699 700 701 702
/*
 * Counterpart of a successful dso__data_get_fd(): releases
 * dso__data_open_lock, which that function leaves held when it returns a
 * valid descriptor. The @dso argument is not used.
 */
void dso__data_put_fd(struct dso *dso __maybe_unused)
{
	pthread_mutex_unlock(&dso__data_open_lock);
}

703 704 705 706 707 708 709 710 711 712 713 714
/*
 * Test-and-set of a per-DSO "seen" bit.
 *
 * Returns true if the bit for @by was already set in
 * dso->data.status_seen; otherwise sets it and returns false.
 */
bool dso__data_status_seen(struct dso *dso, enum dso_data_status_seen by)
{
	u32 flag = 1 << by;
	bool already_seen = (dso->data.status_seen & flag) != 0;

	if (!already_seen)
		dso->data.status_seen |= flag;

	return already_seen;
}

715 716 717 718 719 720 721 722 723 724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739 740 741 742 743 744 745 746 747 748 749 750 751 752
/*
 * Copy up to DSO__DATA_CACHE_SIZE bytes of the JITed instructions of the
 * BPF program behind @dso, starting at @offset, into @data.
 *
 * Returns the number of bytes copied, or -1 when the program info is not
 * available (the DSO is then marked as being in error) or @offset lies at
 * or past the end of the program.
 */
static ssize_t bpf_read(struct dso *dso, u64 offset, char *data)
{
	struct bpf_prog_info_node *node;
	ssize_t chunk;
	u64 prog_len;
	u8 *insns;

	node = perf_env__find_bpf_prog_info(dso->bpf_prog.env, dso->bpf_prog.id);
	if (node == NULL || node->info_linear == NULL) {
		dso->data.status = DSO_DATA_STATUS_ERROR;
		return -1;
	}

	prog_len = node->info_linear->info.jited_prog_len;
	insns = (u8 *)(uintptr_t)node->info_linear->info.jited_prog_insns;

	if (offset >= prog_len)
		return -1;

	chunk = (ssize_t)min(prog_len - offset, (u64)DSO__DATA_CACHE_SIZE);
	memcpy(data, insns + offset, chunk);
	return chunk;
}

/*
 * Store the length of the JITed BPF program behind @dso in
 * dso->data.file_size.
 *
 * Returns 0 on success, -1 (and marks the DSO as being in error) when the
 * program info cannot be found.
 */
static int bpf_size(struct dso *dso)
{
	struct bpf_prog_info_node *node =
		perf_env__find_bpf_prog_info(dso->bpf_prog.env, dso->bpf_prog.id);

	if (node == NULL || node->info_linear == NULL) {
		dso->data.status = DSO_DATA_STATUS_ERROR;
		return -1;
	}

	dso->data.file_size = node->info_linear->info.jited_prog_len;
	return 0;
}

753
static void
754
dso_cache__free(struct dso *dso)
755
{
756
	struct rb_root *root = &dso->data.cache;
757 758
	struct rb_node *next = rb_first(root);

759
	pthread_mutex_lock(&dso->lock);
760 761 762 763 764 765 766 767
	while (next) {
		struct dso_cache *cache;

		cache = rb_entry(next, struct dso_cache, rb_node);
		next = rb_next(&cache->rb_node);
		rb_erase(&cache->rb_node, root);
		free(cache);
	}
768
	pthread_mutex_unlock(&dso->lock);
769 770
}

771
/*
 * Look up the cached chunk that covers @offset. Every chunk covers the
 * range [cache->offset, cache->offset + DSO__DATA_CACHE_SIZE).
 *
 * Returns the chunk, or NULL if that range is not cached.
 */
static struct dso_cache *dso_cache__find(struct dso *dso, u64 offset)
{
	const struct rb_node *node = dso->data.cache.rb_node;

	while (node != NULL) {
		struct dso_cache *entry = rb_entry(node, struct dso_cache, rb_node);
		u64 end = entry->offset + DSO__DATA_CACHE_SIZE;

		if (offset < entry->offset)
			node = node->rb_left;
		else if (offset >= end)
			node = node->rb_right;
		else
			return entry;
	}

	return NULL;
}

796 797
static struct dso_cache *
dso_cache__insert(struct dso *dso, struct dso_cache *new)
798
{
799
	struct rb_root *root = &dso->data.cache;
800 801 802 803 804
	struct rb_node **p = &root->rb_node;
	struct rb_node *parent = NULL;
	struct dso_cache *cache;
	u64 offset = new->offset;

805
	pthread_mutex_lock(&dso->lock);
806 807 808 809 810 811 812 813 814 815 816
	while (*p != NULL) {
		u64 end;

		parent = *p;
		cache = rb_entry(parent, struct dso_cache, rb_node);
		end = cache->offset + DSO__DATA_CACHE_SIZE;

		if (offset < cache->offset)
			p = &(*p)->rb_left;
		else if (offset >= end)
			p = &(*p)->rb_right;
817 818
		else
			goto out;
819 820 821 822
	}

	rb_link_node(&new->rb_node, parent, p);
	rb_insert_color(&new->rb_node, root);
823 824 825 826 827

	cache = NULL;
out:
	pthread_mutex_unlock(&dso->lock);
	return cache;
828 829 830 831 832 833 834 835 836 837 838 839 840
}

/*
 * Copy data out of a cached chunk.
 *
 * Copies at most @size bytes, starting at file offset @offset, limited to
 * what the chunk holds past that offset. Returns the number of bytes
 * copied.
 */
static ssize_t
dso_cache__memcpy(struct dso_cache *cache, u64 offset,
		  u8 *data, u64 size)
{
	u64 skip = offset - cache->offset;	/* position inside the chunk */
	u64 count = min(cache->size - skip, size);

	memcpy(data, cache->data + skip, count);
	return count;
}

841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865
/*
 * Read one DSO__DATA_CACHE_SIZE chunk of @dso's data file at @offset into
 * @data, (re)opening the file first if needed. Runs with
 * dso__data_open_lock held.
 *
 * Returns pread()'s result, or -errno (marking the DSO as being in error)
 * when the file cannot be opened.
 */
static ssize_t file_read(struct dso *dso, struct machine *machine,
			 u64 offset, char *data)
{
	ssize_t ret;

	pthread_mutex_lock(&dso__data_open_lock);

	/*
	 * dso->data.fd might be closed if other thread opened another
	 * file (dso) due to open file limit (RLIMIT_NOFILE).
	 */
	try_to_open_dso(dso, machine);

	if (dso->data.fd >= 0) {
		ret = pread(dso->data.fd, data, DSO__DATA_CACHE_SIZE, offset);
	} else {
		dso->data.status = DSO_DATA_STATUS_ERROR;
		ret = -errno;
	}

	pthread_mutex_unlock(&dso__data_open_lock);
	return ret;
}

866
static ssize_t
867 868
dso_cache__read(struct dso *dso, struct machine *machine,
		u64 offset, u8 *data, ssize_t size)
869
{
870
	u64 cache_offset = offset & DSO__DATA_CACHE_MASK;
871
	struct dso_cache *cache;
872
	struct dso_cache *old;
873 874
	ssize_t ret;

875 876 877
	cache = zalloc(sizeof(*cache) + DSO__DATA_CACHE_SIZE);
	if (!cache)
		return -ENOMEM;
878

879 880 881 882 883
	if (dso->binary_type == DSO_BINARY_TYPE__BPF_PROG_INFO)
		ret = bpf_read(dso, cache_offset, cache->data);
	else
		ret = file_read(dso, machine, cache_offset, cache->data);

884
	if (ret > 0) {
885 886
		cache->offset = cache_offset;
		cache->size   = ret;
887

888 889 890 891 892 893
		old = dso_cache__insert(dso, cache);
		if (old) {
			/* we lose the race */
			free(cache);
			cache = old;
		}
894 895

		ret = dso_cache__memcpy(cache, offset, data, size);
896
	}
897 898 899 900 901 902 903

	if (ret <= 0)
		free(cache);

	return ret;
}

904 905
/*
 * Serve a read from the cache when the chunk covering @offset is already
 * there, otherwise read the chunk in first.
 */
static ssize_t dso_cache_read(struct dso *dso, struct machine *machine,
			      u64 offset, u8 *data, ssize_t size)
{
	struct dso_cache *hit = dso_cache__find(dso, offset);

	if (hit == NULL)
		return dso_cache__read(dso, machine, offset, data, size);

	return dso_cache__memcpy(hit, offset, data, size);
}

916 917 918 919 920
/*
 * Reads and caches dso data DSO__DATA_CACHE_SIZE size chunks
 * in the rb_tree. Any read to already cached data is served
 * by cached data.
 */
921 922
static ssize_t cached_read(struct dso *dso, struct machine *machine,
			   u64 offset, u8 *data, ssize_t size)
923 924 925 926 927 928 929
{
	ssize_t r = 0;
	u8 *p = data;

	do {
		ssize_t ret;

930
		ret = dso_cache_read(dso, machine, offset, p, size);
931 932 933 934 935 936 937 938 939 940 941 942 943 944 945 946 947 948 949
		if (ret < 0)
			return ret;

		/* Reached EOF, return what we have. */
		if (!ret)
			break;

		BUG_ON(ret > size);

		r      += ret;
		p      += ret;
		offset += ret;
		size   -= ret;

	} while (size);

	return r;
}

950
static int file_size(struct dso *dso, struct machine *machine)
951
{
952
	int ret = 0;
953
	struct stat st;
954
	char sbuf[STRERR_BUFSIZE];
955

956 957 958 959 960 961
	pthread_mutex_lock(&dso__data_open_lock);

	/*
	 * dso->data.fd might be closed if other thread opened another
	 * file (dso) due to open file limit (RLIMIT_NOFILE).
	 */
962 963
	try_to_open_dso(dso, machine);

964
	if (dso->data.fd < 0) {
965 966 967
		ret = -errno;
		dso->data.status = DSO_DATA_STATUS_ERROR;
		goto out;
968 969
	}

970 971 972
	if (fstat(dso->data.fd, &st) < 0) {
		ret = -errno;
		pr_err("dso cache fstat failed: %s\n",
973
		       str_error_r(errno, sbuf, sizeof(sbuf)));
974 975 976 977 978 979 980 981
		dso->data.status = DSO_DATA_STATUS_ERROR;
		goto out;
	}
	dso->data.file_size = st.st_size;

out:
	pthread_mutex_unlock(&dso__data_open_lock);
	return ret;
982 983
}

984 985 986 987 988 989 990 991
int dso__data_file_size(struct dso *dso, struct machine *machine)
{
	if (dso->data.file_size)
		return 0;

	if (dso->data.status == DSO_DATA_STATUS_ERROR)
		return -1;

992 993 994
	if (dso->binary_type == DSO_BINARY_TYPE__BPF_PROG_INFO)
		return bpf_size(dso);

995 996 997
	return file_size(dso, machine);
}

A
Adrian Hunter 已提交
998 999 1000 1001 1002 1003 1004 1005 1006
/**
 * dso__data_size - Return dso data size
 * @dso: dso object
 * @machine: machine object
 *
 * Return: dso data size, or -1 when the size cannot be determined
 */
off_t dso__data_size(struct dso *dso, struct machine *machine)
{
	int err = dso__data_file_size(dso, machine);

	if (err != 0)
		return -1;

	/* For now just estimate dso data size is close to file size */
	return dso->data.file_size;
}

1014 1015
/*
 * Validate a read request against the DSO's data size and hand it over to
 * the cached reader.
 *
 * Returns -1 when the size cannot be determined, @offset lies past the end
 * of the data, or @offset + @size wraps around; otherwise the result of
 * cached_read().
 */
static ssize_t data_read_offset(struct dso *dso, struct machine *machine,
				u64 offset, u8 *data, ssize_t size)
{
	if (dso__data_file_size(dso, machine) != 0)
		return -1;

	/* Check the offset sanity. */
	if (offset > dso->data.file_size || offset + size < offset)
		return -1;

	return cached_read(dso, machine, offset, data, size);
}

1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040
/**
 * dso__data_read_offset - Read data from dso file offset
 * @dso: dso object
 * @machine: machine object
 * @offset: file offset
 * @data: buffer to store data
 * @size: size of the @data buffer
 *
 * External interface to read data from dso file offset. Open
 * dso data file and use cached_read to get the data.
 */
1041 1042 1043
ssize_t dso__data_read_offset(struct dso *dso, struct machine *machine,
			      u64 offset, u8 *data, ssize_t size)
{
1044
	if (dso->data.status == DSO_DATA_STATUS_ERROR)
1045 1046
		return -1;

1047
	return data_read_offset(dso, machine, offset, data, size);
1048 1049
}

1050 1051 1052 1053 1054 1055 1056 1057 1058 1059
/**
 * dso__data_read_addr - Read data from dso address
 * @dso: dso object
 * @machine: machine object
 * @add: virtual memory address
 * @data: buffer to store data
 * @size: size of the @data buffer
 *
 * External interface to read data from dso address.
 */
1060 1061 1062 1063 1064 1065 1066 1067 1068 1069 1070 1071 1072 1073
ssize_t dso__data_read_addr(struct dso *dso, struct map *map,
			    struct machine *machine, u64 addr,
			    u8 *data, ssize_t size)
{
	u64 offset = map->map_ip(map, addr);
	return dso__data_read_offset(dso, machine, offset, data, size);
}

/*
 * Create a new dso called @name and a map for it starting at address 0.
 * Returns the map, or NULL when the dso or the map cannot be created.
 */
struct map *dso__new_map(const char *name)
{
	struct dso *dso = dso__new(name);

	if (dso == NULL)
		return NULL;

	return map__new2(0, dso);
}

1079 1080
struct dso *machine__findnew_kernel(struct machine *machine, const char *name,
				    const char *short_name, int dso_type)
1081 1082 1083 1084
{
	/*
	 * The kernel dso could be created by build_id processing.
	 */
1085
	struct dso *dso = machine__findnew_dso(machine, name);
1086 1087 1088 1089 1090 1091

	/*
	 * We need to run this in all cases, since during the build_id
	 * processing we had no idea this was the kernel dso.
	 */
	if (dso != NULL) {
1092
		dso__set_short_name(dso, short_name, false);
1093 1094 1095 1096 1097 1098
		dso->kernel = dso_type;
	}

	return dso;
}

1099
void dso__set_long_name(struct dso *dso, const char *name, bool name_allocated)
1100
{
1101 1102
	struct rb_root *root = dso->root;

1103 1104
	if (name == NULL)
		return;
1105 1106

	if (dso->long_name_allocated)
1107
		free((char *)dso->long_name);
1108

1109 1110 1111
	if (root) {
		rb_erase(&dso->rb_node, root);
		/*
1112
		 * __dsos__findnew_link_by_longname() isn't guaranteed to add it
1113 1114 1115 1116 1117 1118
		 * back, so a clean removal is required here.
		 */
		RB_CLEAR_NODE(&dso->rb_node);
		dso->root = NULL;
	}

1119 1120 1121
	dso->long_name		 = name;
	dso->long_name_len	 = strlen(name);
	dso->long_name_allocated = name_allocated;
1122 1123

	if (root)
1124
		__dsos__findnew_link_by_longname(root, dso, NULL);
1125 1126
}

1127
void dso__set_short_name(struct dso *dso, const char *name, bool name_allocated)
1128 1129 1130
{
	if (name == NULL)
		return;
1131 1132 1133 1134 1135 1136 1137

	if (dso->short_name_allocated)
		free((char *)dso->short_name);

	dso->short_name		  = name;
	dso->short_name_len	  = strlen(name);
	dso->short_name_allocated = name_allocated;
1138 1139 1140 1141 1142 1143
}

int dso__name_len(const struct dso *dso)
{
	if (!dso)
		return strlen("[unknown]");
1144
	if (verbose > 0)
1145 1146 1147 1148 1149
		return dso->long_name_len;

	return dso->short_name_len;
}

1150
bool dso__loaded(const struct dso *dso)
1151
{
1152
	return dso->loaded;
1153 1154
}

1155
bool dso__sorted_by_name(const struct dso *dso)
1156
{
1157
	return dso->sorted_by_name;
1158 1159
}

1160
void dso__set_sorted_by_name(struct dso *dso)
1161
{
1162
	dso->sorted_by_name = true;
1163 1164 1165 1166 1167 1168 1169 1170
}

struct dso *dso__new(const char *name)
{
	struct dso *dso = calloc(1, sizeof(*dso) + strlen(name) + 1);

	if (dso != NULL) {
		strcpy(dso->name, name);
1171
		dso__set_long_name(dso, dso->name, false);
1172
		dso__set_short_name(dso, dso->name, false);
1173
		dso->symbols = dso->symbol_names = RB_ROOT_CACHED;
1174
		dso->data.cache = RB_ROOT;
1175 1176
		dso->inlined_nodes = RB_ROOT_CACHED;
		dso->srclines = RB_ROOT_CACHED;
1177
		dso->data.fd = -1;
1178
		dso->data.status = DSO_DATA_STATUS_UNKNOWN;
1179
		dso->symtab_type = DSO_BINARY_TYPE__NOT_FOUND;
1180
		dso->binary_type = DSO_BINARY_TYPE__NOT_FOUND;
1181
		dso->is_64_bit = (sizeof(void *) == 8);
1182
		dso->loaded = 0;
1183
		dso->rel = 0;
1184 1185
		dso->sorted_by_name = 0;
		dso->has_build_id = 0;
1186
		dso->has_srcline = 1;
1187
		dso->a2l_fails = 1;
1188 1189
		dso->kernel = DSO_TYPE_USER;
		dso->needs_swap = DSO_SWAP__UNSET;
1190
		dso->comp = COMP_ID__NONE;
1191
		RB_CLEAR_NODE(&dso->rb_node);
1192
		dso->root = NULL;
1193
		INIT_LIST_HEAD(&dso->node);
1194
		INIT_LIST_HEAD(&dso->data.open_entry);
1195
		pthread_mutex_init(&dso->lock, NULL);
1196
		refcount_set(&dso->refcnt, 1);
1197 1198 1199 1200 1201 1202 1203
	}

	return dso;
}

void dso__delete(struct dso *dso)
{
1204 1205 1206
	if (!RB_EMPTY_NODE(&dso->rb_node))
		pr_err("DSO %s is still in rbtree when being deleted!\n",
		       dso->long_name);
1207 1208 1209

	/* free inlines first, as they reference symbols */
	inlines__tree_delete(&dso->inlined_nodes);
1210
	srcline__tree_delete(&dso->srclines);
1211
	symbols__delete(&dso->symbols);
1212 1213

	if (dso->short_name_allocated) {
1214
		zfree((char **)&dso->short_name);
1215 1216 1217 1218
		dso->short_name_allocated = false;
	}

	if (dso->long_name_allocated) {
1219
		zfree((char **)&dso->long_name);
1220 1221 1222
		dso->long_name_allocated = false;
	}

1223
	dso__data_close(dso);
1224
	auxtrace_cache__free(dso->auxtrace_cache);
1225
	dso_cache__free(dso);
1226
	dso__free_a2l(dso);
1227
	zfree(&dso->symsrc_filename);
1228
	nsinfo__zput(dso->nsinfo);
1229
	pthread_mutex_destroy(&dso->lock);
1230 1231 1232
	free(dso);
}

1233 1234 1235
struct dso *dso__get(struct dso *dso)
{
	if (dso)
1236
		refcount_inc(&dso->refcnt);
1237 1238 1239 1240 1241
	return dso;
}

void dso__put(struct dso *dso)
{
1242
	if (dso && refcount_dec_and_test(&dso->refcnt))
1243 1244 1245
		dso__delete(dso);
}

1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291
/*
 * Copy a build id into @dso and mark the dso as having one.
 *
 * Exactly sizeof(dso->build_id) bytes are read from @build_id, so the caller
 * must supply a buffer at least that large.
 */
void dso__set_build_id(struct dso *dso, void *build_id)
{
	const size_t id_size = sizeof(dso->build_id);

	memcpy(dso->build_id, build_id, id_size);
	dso->has_build_id = 1;
}

/*
 * Compare the build id stored in @dso against @build_id.
 *
 * All sizeof(dso->build_id) bytes are compared; returns true when they are
 * identical. The 'has_build_id' flag is not consulted.
 */
bool dso__build_id_equal(const struct dso *dso, u8 *build_id)
{
	const size_t id_size = sizeof(dso->build_id);

	return !memcmp(dso->build_id, build_id, id_size);
}

/*
 * Try to fill in the build id of @dso from "<root_dir>/sys/kernel/notes",
 * where <root_dir> is machine->root_dir.
 *
 * Nothing is done when @machine is the default guest, or when the notes path
 * does not fit in PATH_MAX. 'has_build_id' is only set when
 * sysfs__read_build_id() returns 0; a failed read leaves it untouched.
 */
void dso__read_running_kernel_build_id(struct dso *dso, struct machine *machine)
{
	char path[PATH_MAX];
	int len;

	if (machine__is_default_guest(machine))
		return;

	/*
	 * Bound the write: root_dir is not length-checked here, and an
	 * unbounded sprintf() could overrun the stack buffer. A truncated
	 * path would name the wrong file, so give up instead of reading it.
	 */
	len = snprintf(path, sizeof(path), "%s/sys/kernel/notes",
		       machine->root_dir);
	if (len < 0 || (size_t)len >= sizeof(path))
		return;

	if (sysfs__read_build_id(path, dso->build_id,
				 sizeof(dso->build_id)) == 0)
		dso->has_build_id = true;
}

/*
 * Try to fill in the build id of a kernel module dso from
 * "<root_dir>/sys/module/<module>/notes/.note.gnu.build-id".
 *
 * 'has_build_id' is set only when sysfs__read_build_id() returns 0.
 * The function itself always returns 0, whether or not the read succeeded.
 */
int dso__kernel_module_get_build_id(struct dso *dso,
				    const char *root_dir)
{
	/*
	 * Kernel module short names are of the form "[module]" and only
	 * "module" is wanted: step over the leading '[' here ...
	 */
	const char *module = dso->short_name + 1;
	/* ... and print one character less to leave out the trailing ']'. */
	const int module_len = (int)strlen(module) - 1;
	char notes_path[PATH_MAX];
	int err;

	snprintf(notes_path, sizeof(notes_path),
		 "%s/sys/module/%.*s/notes/.note.gnu.build-id",
		 root_dir, module_len, module);

	err = sysfs__read_build_id(notes_path, dso->build_id,
				   sizeof(dso->build_id));
	if (err == 0)
		dso->has_build_id = true;

	return 0;
}

size_t dso__fprintf_buildid(struct dso *dso, FILE *fp)
{
1292
	char sbuild_id[SBUILD_ID_SIZE];
1293 1294 1295 1296 1297

	build_id__sprintf(dso->build_id, sizeof(dso->build_id), sbuild_id);
	return fprintf(fp, "%s", sbuild_id);
}

1298
size_t dso__fprintf(struct dso *dso, FILE *fp)
1299 1300 1301 1302 1303 1304
{
	struct rb_node *nd;
	size_t ret = fprintf(fp, "dso: %s (", dso->short_name);

	if (dso->short_name != dso->long_name)
		ret += fprintf(fp, "%s, ", dso->long_name);
1305
	ret += fprintf(fp, "%sloaded, ", dso__loaded(dso) ? "" : "NOT ");
1306 1307
	ret += dso__fprintf_buildid(dso, fp);
	ret += fprintf(fp, ")\n");
1308
	for (nd = rb_first_cached(&dso->symbols); nd; nd = rb_next(nd)) {
1309 1310 1311 1312 1313 1314
		struct symbol *pos = rb_entry(nd, struct symbol, rb_node);
		ret += symbol__fprintf(pos, fp);
	}

	return ret;
}
A
Adrian Hunter 已提交
1315 1316 1317 1318

enum dso_type dso__type(struct dso *dso, struct machine *machine)
{
	int fd;
1319
	enum dso_type type = DSO__TYPE_UNKNOWN;
A
Adrian Hunter 已提交
1320

1321 1322 1323 1324 1325
	fd = dso__data_get_fd(dso, machine);
	if (fd >= 0) {
		type = dso__type_fd(fd);
		dso__data_put_fd(dso);
	}
A
Adrian Hunter 已提交
1326

1327
	return type;
A
Adrian Hunter 已提交
1328
}
1329 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339 1340 1341 1342 1343 1344 1345 1346

/*
 * Format a message for dso->load_errno into @buf.
 *
 * @buflen must be non-zero (enforced with BUG_ON). Non-negative codes are
 * handed to str_error_r(). Negative codes inside
 * [__DSO_LOAD_ERRNO__START, __DSO_LOAD_ERRNO__END) are looked up in the local
 * message table.
 *
 * Returns 0 when a message was written, or -1 (leaving @buf untouched) for a
 * negative code outside that range.
 */
int dso__strerror_load(struct dso *dso, char *buf, size_t buflen)
{
	/*
	 * This must have the same ordering as the enum dso_load_errno.
	 */
	static const char *dso_load__error_str[] = {
		"Internal tools/perf/ library error",
		"Invalid ELF file",
		"Can not read build id",
		"Mismatching build id",
		"Decompression failure",
	};
	const int errnum = dso->load_errno;
	const char *msg;

	BUG_ON(buflen == 0);

	if (errnum < 0) {
		/* dso-specific code: it has to fall inside the table. */
		if (errnum < __DSO_LOAD_ERRNO__START ||
		    errnum >= __DSO_LOAD_ERRNO__END)
			return -1;

		msg = dso_load__error_str[errnum - __DSO_LOAD_ERRNO__START];
		scnprintf(buf, buflen, "%s", msg);
		return 0;
	}

	/*
	 * str_error_r() may return a pointer other than @buf; copy the
	 * message over in that case.
	 */
	msg = str_error_r(errnum, buf, buflen);
	if (msg != buf)
		scnprintf(buf, buflen, "%s", msg);

	return 0;
}