dso.c 30.4 KB
Newer Older
1
// SPDX-License-Identifier: GPL-2.0
2
#include <asm/bug.h>
3
#include <linux/kernel.h>
4
#include <linux/string.h>
5
#include <linux/zalloc.h>
6 7
#include <sys/time.h>
#include <sys/resource.h>
8 9 10
#include <sys/types.h>
#include <sys/stat.h>
#include <unistd.h>
11
#include <errno.h>
12
#include <fcntl.h>
13 14
#include <bpf/libbpf.h>
#include "bpf-event.h"
15
#include "compress.h"
16
#include "namespaces.h"
17
#include "path.h"
18
#include "map.h"
19
#include "symbol.h"
20
#include "srcline.h"
21
#include "dso.h"
22
#include "dsos.h"
23
#include "machine.h"
24
#include "auxtrace.h"
25
#include "util.h" /* O_CLOEXEC for older systems */
26
#include "debug.h"
27
#include "string2.h"
28
#include "vdso.h"
29

30 31 32 33 34 35 36
static const char * const debuglink_paths[] = {
	"%.0s%s",
	"%s/%s",
	"%s/.debug/%s",
	"/usr/lib/debug%s/%s"
};

37 38 39
char dso__symtab_origin(const struct dso *dso)
{
	static const char origin[] = {
40 41 42 43 44
		[DSO_BINARY_TYPE__KALLSYMS]			= 'k',
		[DSO_BINARY_TYPE__VMLINUX]			= 'v',
		[DSO_BINARY_TYPE__JAVA_JIT]			= 'j',
		[DSO_BINARY_TYPE__DEBUGLINK]			= 'l',
		[DSO_BINARY_TYPE__BUILD_ID_CACHE]		= 'B',
45
		[DSO_BINARY_TYPE__BUILD_ID_CACHE_DEBUGINFO]	= 'D',
46 47 48 49 50 51
		[DSO_BINARY_TYPE__FEDORA_DEBUGINFO]		= 'f',
		[DSO_BINARY_TYPE__UBUNTU_DEBUGINFO]		= 'u',
		[DSO_BINARY_TYPE__OPENEMBEDDED_DEBUGINFO]	= 'o',
		[DSO_BINARY_TYPE__BUILDID_DEBUGINFO]		= 'b',
		[DSO_BINARY_TYPE__SYSTEM_PATH_DSO]		= 'd',
		[DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE]		= 'K',
52
		[DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE_COMP]	= 'm',
53 54
		[DSO_BINARY_TYPE__GUEST_KALLSYMS]		= 'g',
		[DSO_BINARY_TYPE__GUEST_KMODULE]		= 'G',
55
		[DSO_BINARY_TYPE__GUEST_KMODULE_COMP]		= 'M',
56
		[DSO_BINARY_TYPE__GUEST_VMLINUX]		= 'V',
57 58 59 60 61 62 63
	};

	if (dso == NULL || dso->symtab_type == DSO_BINARY_TYPE__NOT_FOUND)
		return '!';
	return origin[dso->symtab_type];
}

64 65 66
int dso__read_binary_type_filename(const struct dso *dso,
				   enum dso_binary_type type,
				   char *root_dir, char *filename, size_t size)
67
{
68
	char build_id_hex[SBUILD_ID_SIZE];
69
	int ret = 0;
70
	size_t len;
71 72

	switch (type) {
73 74 75 76 77 78
	case DSO_BINARY_TYPE__DEBUGLINK:
	{
		const char *last_slash;
		char dso_dir[PATH_MAX];
		char symfile[PATH_MAX];
		unsigned int i;
79

80
		len = __symbol__join_symfs(filename, size, dso->long_name);
81 82 83
		last_slash = filename + len;
		while (last_slash != filename && *last_slash != '/')
			last_slash--;
84

85 86 87 88 89
		strncpy(dso_dir, filename, last_slash - filename);
		dso_dir[last_slash-filename] = '\0';

		if (!is_regular_file(filename)) {
			ret = -1;
90
			break;
91
		}
92

93 94 95 96 97 98 99 100 101 102 103 104 105
		ret = filename__read_debuglink(filename, symfile, PATH_MAX);
		if (ret)
			break;

		/* Check predefined locations where debug file might reside */
		ret = -1;
		for (i = 0; i < ARRAY_SIZE(debuglink_paths); i++) {
			snprintf(filename, size,
					debuglink_paths[i], dso_dir, symfile);
			if (is_regular_file(filename)) {
				ret = 0;
				break;
			}
106
		}
107

108
		break;
109
	}
110
	case DSO_BINARY_TYPE__BUILD_ID_CACHE:
111 112 113 114 115 116
		if (dso__build_id_filename(dso, filename, size, false) == NULL)
			ret = -1;
		break;

	case DSO_BINARY_TYPE__BUILD_ID_CACHE_DEBUGINFO:
		if (dso__build_id_filename(dso, filename, size, true) == NULL)
117 118 119 120
			ret = -1;
		break;

	case DSO_BINARY_TYPE__FEDORA_DEBUGINFO:
121 122
		len = __symbol__join_symfs(filename, size, "/usr/lib/debug");
		snprintf(filename + len, size - len, "%s.debug", dso->long_name);
123 124 125
		break;

	case DSO_BINARY_TYPE__UBUNTU_DEBUGINFO:
126 127
		len = __symbol__join_symfs(filename, size, "/usr/lib/debug");
		snprintf(filename + len, size - len, "%s", dso->long_name);
128 129
		break;

130 131
	case DSO_BINARY_TYPE__OPENEMBEDDED_DEBUGINFO:
	{
132
		const char *last_slash;
133 134 135 136 137 138
		size_t dir_size;

		last_slash = dso->long_name + dso->long_name_len;
		while (last_slash != dso->long_name && *last_slash != '/')
			last_slash--;

139
		len = __symbol__join_symfs(filename, size, "");
140 141 142 143 144
		dir_size = last_slash - dso->long_name + 2;
		if (dir_size > (size - len)) {
			ret = -1;
			break;
		}
145 146
		len += scnprintf(filename + len, dir_size, "%s",  dso->long_name);
		len += scnprintf(filename + len , size - len, ".debug%s",
147 148 149 150
								last_slash);
		break;
	}

151 152 153 154 155 156 157 158 159
	case DSO_BINARY_TYPE__BUILDID_DEBUGINFO:
		if (!dso->has_build_id) {
			ret = -1;
			break;
		}

		build_id__sprintf(dso->build_id,
				  sizeof(dso->build_id),
				  build_id_hex);
160 161 162
		len = __symbol__join_symfs(filename, size, "/usr/lib/debug/.build-id/");
		snprintf(filename + len, size - len, "%.2s/%s.debug",
			 build_id_hex, build_id_hex + 2);
163 164
		break;

165 166
	case DSO_BINARY_TYPE__VMLINUX:
	case DSO_BINARY_TYPE__GUEST_VMLINUX:
167
	case DSO_BINARY_TYPE__SYSTEM_PATH_DSO:
168
		__symbol__join_symfs(filename, size, dso->long_name);
169 170 171
		break;

	case DSO_BINARY_TYPE__GUEST_KMODULE:
172
	case DSO_BINARY_TYPE__GUEST_KMODULE_COMP:
173 174
		path__join3(filename, size, symbol_conf.symfs,
			    root_dir, dso->long_name);
175 176 177
		break;

	case DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE:
178
	case DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE_COMP:
179
		__symbol__join_symfs(filename, size, dso->long_name);
180 181
		break;

182 183
	case DSO_BINARY_TYPE__KCORE:
	case DSO_BINARY_TYPE__GUEST_KCORE:
184
		snprintf(filename, size, "%s", dso->long_name);
185 186
		break;

187 188 189 190
	default:
	case DSO_BINARY_TYPE__KALLSYMS:
	case DSO_BINARY_TYPE__GUEST_KALLSYMS:
	case DSO_BINARY_TYPE__JAVA_JIT:
191
	case DSO_BINARY_TYPE__BPF_PROG_INFO:
192 193 194 195 196 197 198 199
	case DSO_BINARY_TYPE__NOT_FOUND:
		ret = -1;
		break;
	}

	return ret;
}

200 201 202 203
/*
 * Compression ids are indexes into compressions[]; index 0 is reserved
 * for "no compression".
 */
enum {
	COMP_ID__NONE = 0,
};

204 205 206
static const struct {
	const char *fmt;
	int (*decompress)(const char *input, int output);
207
	bool (*is_compressed)(const char *input);
208
} compressions[] = {
209
	[COMP_ID__NONE] = { .fmt = NULL, },
210
#ifdef HAVE_ZLIB_SUPPORT
211
	{ "gz", gzip_decompress_to_file, gzip_is_compressed },
212 213
#endif
#ifdef HAVE_LZMA_SUPPORT
214
	{ "xz", lzma_decompress_to_file, lzma_is_compressed },
215
#endif
216
	{ NULL, NULL, NULL },
217 218
};

219
static int is_supported_compression(const char *ext)
220 221 222
{
	unsigned i;

223
	for (i = 1; compressions[i].fmt; i++) {
224
		if (!strcmp(ext, compressions[i].fmt))
225
			return i;
226
	}
227
	return COMP_ID__NONE;
228 229
}

230
bool is_kernel_module(const char *pathname, int cpumode)
231
{
232
	struct kmod_path m;
233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251
	int mode = cpumode & PERF_RECORD_MISC_CPUMODE_MASK;

	WARN_ONCE(mode != cpumode,
		  "Internal error: passing unmasked cpumode (%x) to is_kernel_module",
		  cpumode);

	switch (mode) {
	case PERF_RECORD_MISC_USER:
	case PERF_RECORD_MISC_HYPERVISOR:
	case PERF_RECORD_MISC_GUEST_USER:
		return false;
	/* Treat PERF_RECORD_MISC_CPUMODE_UNKNOWN as kernel */
	default:
		if (kmod_path__parse(&m, pathname)) {
			pr_err("Failed to check whether %s is a kernel module or not. Assume it is.",
					pathname);
			return true;
		}
	}
252

253
	return m.kmod;
254 255 256 257 258 259 260 261
}

/* True when @dso's symtab type is one of the compressed kernel module types. */
bool dso__needs_decompress(struct dso *dso)
{
	switch (dso->symtab_type) {
	case DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE_COMP:
	case DSO_BINARY_TYPE__GUEST_KMODULE_COMP:
		return true;
	default:
		return false;
	}
}

262 263
static int decompress_kmodule(struct dso *dso, const char *name,
			      char *pathname, size_t len)
264
{
265
	char tmpbuf[] = KMOD_DECOMP_NAME;
266 267 268 269 270
	int fd = -1;

	if (!dso__needs_decompress(dso))
		return -1;

271
	if (dso->comp == COMP_ID__NONE)
272 273
		return -1;

274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289
	/*
	 * We have proper compression id for DSO and yet the file
	 * behind the 'name' can still be plain uncompressed object.
	 *
	 * The reason is behind the logic we open the DSO object files,
	 * when we try all possible 'debug' objects until we find the
	 * data. So even if the DSO is represented by 'krava.xz' module,
	 * we can end up here opening ~/.debug/....23432432/debug' file
	 * which is not compressed.
	 *
	 * To keep this transparent, we detect this and return the file
	 * descriptor to the uncompressed file.
	 */
	if (!compressions[dso->comp].is_compressed(name))
		return open(name, O_RDONLY);

290 291 292
	fd = mkstemp(tmpbuf);
	if (fd < 0) {
		dso->load_errno = errno;
293
		return -1;
294 295
	}

296
	if (compressions[dso->comp].decompress(name, fd)) {
297 298 299 300 301
		dso->load_errno = DSO_LOAD_ERRNO__DECOMPRESSION_FAILURE;
		close(fd);
		fd = -1;
	}

302 303 304 305
	if (!pathname || (fd < 0))
		unlink(tmpbuf);

	if (pathname && (fd >= 0))
306
		strlcpy(pathname, tmpbuf, len);
307

308 309 310 311 312
	return fd;
}

/*
 * Decompress kernel module @name and return a file descriptor to the
 * result; no path is requested, so the temporary file is not kept.
 * Returns -1 on failure.
 */
int dso__decompress_kmodule_fd(struct dso *dso, const char *name)
{
	int fd = decompress_kmodule(dso, name, NULL, 0);

	return fd;
}

/*
 * Decompress kernel module @name and store the path of the decompressed
 * temporary file in @pathname (capacity @len).
 *
 * Returns 0 on success, -1 on failure.  The descriptor obtained from
 * decompress_kmodule() is closed only when it is valid, so a failure does
 * not issue close(-1) and overwrite errno with EBADF.
 */
int dso__decompress_kmodule_path(struct dso *dso, const char *name,
				 char *pathname, size_t len)
{
	int fd = decompress_kmodule(dso, name, pathname, len);

	if (fd < 0)
		return -1;

	close(fd);
	return 0;
}

325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341
/*
 * Parses kernel module specified in @path and updates
 * @m argument like:
 *
 *    @comp - true if @path contains supported compression suffix,
 *            false otherwise
 *    @kmod - true if @path contains '.ko' suffix in right position,
 *            false otherwise
 *    @name - if (@alloc_name && @kmod) is true, it contains strdup-ed base name
 *            of the kernel module without suffixes, otherwise strudup-ed
 *            base name of @path
 *    @ext  - if (@alloc_ext && @comp) is true, it contains strdup-ed string
 *            the compression suffix
 *
 * Returns 0 if there's no strdup error, -ENOMEM otherwise.
 */
int __kmod_path__parse(struct kmod_path *m, const char *path,
342
		       bool alloc_name)
343 344 345
{
	const char *name = strrchr(path, '/');
	const char *ext  = strrchr(path, '.');
346
	bool is_simple_name = false;
347 348 349 350

	memset(m, 0x0, sizeof(*m));
	name = name ? name + 1 : path;

351 352 353 354 355 356 357 358 359 360 361 362 363
	/*
	 * '.' is also a valid character for module name. For example:
	 * [aaa.bbb] is a valid module name. '[' should have higher
	 * priority than '.ko' suffix.
	 *
	 * The kernel names are from machine__mmap_name. Such
	 * name should belong to kernel itself, not kernel module.
	 */
	if (name[0] == '[') {
		is_simple_name = true;
		if ((strncmp(name, "[kernel.kallsyms]", 17) == 0) ||
		    (strncmp(name, "[guest.kernel.kallsyms", 22) == 0) ||
		    (strncmp(name, "[vdso]", 6) == 0) ||
364 365
		    (strncmp(name, "[vdso32]", 8) == 0) ||
		    (strncmp(name, "[vdsox32]", 9) == 0) ||
366 367 368 369 370 371 372
		    (strncmp(name, "[vsyscall]", 10) == 0)) {
			m->kmod = false;

		} else
			m->kmod = true;
	}

373
	/* No extension, just return name. */
374
	if ((ext == NULL) || is_simple_name) {
375 376 377 378 379 380 381
		if (alloc_name) {
			m->name = strdup(name);
			return m->name ? 0 : -ENOMEM;
		}
		return 0;
	}

382 383
	m->comp = is_supported_compression(ext + 1);
	if (m->comp > COMP_ID__NONE)
384 385 386 387 388 389 390 391 392 393 394 395 396 397 398
		ext -= 3;

	/* Check .ko extension only if there's enough name left. */
	if (ext > name)
		m->kmod = !strncmp(ext, ".ko", 3);

	if (alloc_name) {
		if (m->kmod) {
			if (asprintf(&m->name, "[%.*s]", (int) (ext - name), name) == -1)
				return -ENOMEM;
		} else {
			if (asprintf(&m->name, "%s", name) == -1)
				return -ENOMEM;
		}

399
		strreplace(m->name, '-', '_');
400 401 402 403 404
	}

	return 0;
}

405 406 407 408 409 410 411 412 413
void dso__set_module_info(struct dso *dso, struct kmod_path *m,
			  struct machine *machine)
{
	if (machine__is_host(machine))
		dso->symtab_type = DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE;
	else
		dso->symtab_type = DSO_BINARY_TYPE__GUEST_KMODULE;

	/* _KMODULE_COMP should be next to _KMODULE */
414
	if (m->kmod && m->comp) {
415
		dso->symtab_type++;
416 417
		dso->comp = m->comp;
	}
418 419 420 421

	dso__set_short_name(dso, strdup(m->name), true);
}

422
/*
 * Bookkeeping for DSOs whose data file descriptor is currently open.
 */
/* DSOs with an open data fd; new entries are appended at the tail */
static LIST_HEAD(dso__data_open);
/* number of entries on dso__data_open */
static long dso__data_open_cnt;
/* taken around opening/closing DSO data fds in this file */
static pthread_mutex_t dso__data_open_lock = PTHREAD_MUTEX_INITIALIZER;
428 429 430 431

static void dso__list_add(struct dso *dso)
{
	list_add_tail(&dso->data.open_entry, &dso__data_open);
432
	dso__data_open_cnt++;
433 434 435 436
}

static void dso__list_del(struct dso *dso)
{
437
	list_del_init(&dso->data.open_entry);
438 439 440
	WARN_ONCE(dso__data_open_cnt <= 0,
		  "DSO data fd counter out of bounds.");
	dso__data_open_cnt--;
441 442
}

443 444 445 446 447
static void close_first_dso(void);

static int do_open(char *name)
{
	int fd;
448
	char sbuf[STRERR_BUFSIZE];
449 450

	do {
451
		fd = open(name, O_RDONLY|O_CLOEXEC);
452 453 454
		if (fd >= 0)
			return fd;

455
		pr_debug("dso open failed: %s\n",
456
			 str_error_r(errno, sbuf, sizeof(sbuf)));
457 458 459 460 461 462 463 464 465
		if (!dso__data_open_cnt || errno != EMFILE)
			break;

		close_first_dso();
	} while (1);

	return -1;
}

466
static int __open_dso(struct dso *dso, struct machine *machine)
467
{
468
	int fd = -EINVAL;
469 470
	char *root_dir = (char *)"";
	char *name = malloc(PATH_MAX);
471
	bool decomp = false;
472 473 474 475 476 477 478

	if (!name)
		return -ENOMEM;

	if (machine)
		root_dir = machine->root_dir;

479
	if (dso__read_binary_type_filename(dso, dso->binary_type,
480 481
					    root_dir, name, PATH_MAX))
		goto out;
482

483 484
	if (!is_regular_file(name))
		goto out;
485

486 487 488 489 490
	if (dso__needs_decompress(dso)) {
		char newpath[KMOD_DECOMP_LEN];
		size_t len = sizeof(newpath);

		if (dso__decompress_kmodule_path(dso, name, newpath, len) < 0) {
491 492
			fd = -dso->load_errno;
			goto out;
493 494
		}

495
		decomp = true;
496 497 498
		strcpy(name, newpath);
	}

499
	fd = do_open(name);
500

501
	if (decomp)
502 503
		unlink(name);

504
out:
505 506 507 508
	free(name);
	return fd;
}

509 510
static void check_data_close(void);

511 512 513 514 515 516 517
/**
 * dso_close - Open DSO data file
 * @dso: dso object
 *
 * Open @dso's data file descriptor and updates
 * list/count of open DSO objects.
 */
518 519
static int open_dso(struct dso *dso, struct machine *machine)
{
520 521 522 523 524 525 526 527
	int fd;
	struct nscookie nsc;

	if (dso->binary_type != DSO_BINARY_TYPE__BUILD_ID_CACHE)
		nsinfo__mountns_enter(dso->nsinfo, &nsc);
	fd = __open_dso(dso, machine);
	if (dso->binary_type != DSO_BINARY_TYPE__BUILD_ID_CACHE)
		nsinfo__mountns_exit(&nsc);
528

529
	if (fd >= 0) {
530
		dso__list_add(dso);
531 532 533 534 535 536
		/*
		 * Check if we crossed the allowed number
		 * of opened DSOs and close one if needed.
		 */
		check_data_close();
	}
537 538 539 540 541

	return fd;
}

static void close_data_fd(struct dso *dso)
542 543 544 545
{
	if (dso->data.fd >= 0) {
		close(dso->data.fd);
		dso->data.fd = -1;
546
		dso->data.file_size = 0;
547
		dso__list_del(dso);
548 549 550
	}
}

551 552 553 554 555 556 557
/**
 * close_dso - Close DSO data file
 * @dso: dso object
 *
 * Close @dso's data file descriptor and updates
 * list/count of open DSO objects.
 */
static void close_dso(struct dso *dso)
{
	/* all the work is done by the fd helper */
	close_data_fd(dso);
}

563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589
/*
 * Close the data fd of the DSO at the head of the open list, i.e. the one
 * that was added first among those still open.
 */
static void close_first_dso(void)
{
	close_dso(list_first_entry(&dso__data_open, struct dso, data.open_entry));
}

/*
 * Compute how many DSO data fds may be kept open: half of the current
 * RLIMIT_NOFILE soft limit, RLIM_INFINITY if the limit is unlimited, or 1
 * when the limit cannot be queried.
 */
static rlim_t get_fd_limit(void)
{
	struct rlimit l;

	if (getrlimit(RLIMIT_NOFILE, &l) != 0) {
		pr_err("failed to get fd limit\n");
		return 1;
	}

	/* Allow half of the current open fd limit. */
	return l.rlim_cur == RLIM_INFINITY ? l.rlim_cur : l.rlim_cur / 2;
}

590 591 592 593 594 595 596 597
static rlim_t fd_limit;

/*
 * Used only by tests/dso-data.c to reset the environment
 * for tests. I dont expect we should change this during
 * standard runtime.
 */
void reset_fd_limit(void)
598
{
599 600
	fd_limit = 0;
}
601

602 603 604 605
static bool may_cache_fd(void)
{
	if (!fd_limit)
		fd_limit = get_fd_limit();
606

607
	if (fd_limit == RLIM_INFINITY)
608 609
		return true;

610
	return fd_limit > (rlim_t) dso__data_open_cnt;
611 612
}

613 614 615 616 617
/*
 * Close the oldest open DSO data fd when the number of open fds is no
 * longer below the allowed limit.  The limit is half of RLIMIT_NOFILE
 * (see get_fd_limit()).
 */
static void check_data_close(void)
{
	if (may_cache_fd())
		return;

	close_first_dso();
}

626 627 628 629 630 631
/**
 * dso__data_close - Close DSO data file
 * @dso: dso object
 *
 * External interface to close @dso's data file descriptor.
 */
632 633
void dso__data_close(struct dso *dso)
{
634
	pthread_mutex_lock(&dso__data_open_lock);
635
	close_dso(dso);
636
	pthread_mutex_unlock(&dso__data_open_lock);
637 638
}

639
static void try_to_open_dso(struct dso *dso, struct machine *machine)
640
{
641
	enum dso_binary_type binary_type_data[] = {
642 643 644 645 646 647
		DSO_BINARY_TYPE__BUILD_ID_CACHE,
		DSO_BINARY_TYPE__SYSTEM_PATH_DSO,
		DSO_BINARY_TYPE__NOT_FOUND,
	};
	int i = 0;

648
	if (dso->data.fd >= 0)
649
		return;
650 651 652

	if (dso->binary_type != DSO_BINARY_TYPE__NOT_FOUND) {
		dso->data.fd = open_dso(dso, machine);
653
		goto out;
654
	}
655 656

	do {
657
		dso->binary_type = binary_type_data[i++];
658

659 660 661
		dso->data.fd = open_dso(dso, machine);
		if (dso->data.fd >= 0)
			goto out;
662

663
	} while (dso->binary_type != DSO_BINARY_TYPE__NOT_FOUND);
664 665 666 667 668
out:
	if (dso->data.fd >= 0)
		dso->data.status = DSO_DATA_STATUS_OK;
	else
		dso->data.status = DSO_DATA_STATUS_ERROR;
669 670 671
}

/**
672
 * dso__data_get_fd - Get dso's data file descriptor
673 674 675 676
 * @dso: dso object
 * @machine: machine object
 *
 * External interface to find dso's file, open it and
677 678
 * returns file descriptor.  It should be paired with
 * dso__data_put_fd() if it returns non-negative value.
679
 */
680
int dso__data_get_fd(struct dso *dso, struct machine *machine)
681 682 683
{
	if (dso->data.status == DSO_DATA_STATUS_ERROR)
		return -1;
684

685 686 687
	if (pthread_mutex_lock(&dso__data_open_lock) < 0)
		return -1;

688
	try_to_open_dso(dso, machine);
689 690 691

	if (dso->data.fd < 0)
		pthread_mutex_unlock(&dso__data_open_lock);
692

693
	return dso->data.fd;
694 695
}

696 697 698 699 700
/*
 * Counterpart of a successful dso__data_get_fd(): releases
 * dso__data_open_lock, which that call left held.  @dso is unused.
 */
void dso__data_put_fd(struct dso *dso __maybe_unused)
{
	pthread_mutex_unlock(&dso__data_open_lock);
}

701 702 703 704 705 706 707 708 709 710 711 712
/*
 * Test-and-set of the @by bit in @dso's data.status_seen mask.
 *
 * Returns true if the bit was already set, false if this call set it.
 */
bool dso__data_status_seen(struct dso *dso, enum dso_data_status_seen by)
{
	u32 flag = 1 << by;
	bool already_seen = (dso->data.status_seen & flag) != 0;

	if (!already_seen)
		dso->data.status_seen |= flag;

	return already_seen;
}

713 714 715 716 717 718 719 720 721 722 723 724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739 740 741 742 743 744 745 746 747 748 749 750
/*
 * Copy up to DSO__DATA_CACHE_SIZE bytes of the JITed instructions of the
 * BPF program behind @dso, starting at @offset, into @data.
 *
 * Returns the number of bytes copied, or -1 when the program info cannot
 * be found (data.status is then set to ERROR) or @offset is not inside
 * the program.
 */
static ssize_t bpf_read(struct dso *dso, u64 offset, char *data)
{
	struct bpf_prog_info_node *node;
	ssize_t chunk = DSO__DATA_CACHE_SIZE;
	u64 prog_len;
	u8 *insns;

	node = perf_env__find_bpf_prog_info(dso->bpf_prog.env, dso->bpf_prog.id);
	if (!node || !node->info_linear) {
		dso->data.status = DSO_DATA_STATUS_ERROR;
		return -1;
	}

	prog_len = node->info_linear->info.jited_prog_len;
	insns = (u8 *)(uintptr_t)node->info_linear->info.jited_prog_insns;

	if (offset >= prog_len)
		return -1;

	/* never copy past the end of the program */
	chunk = (ssize_t)min(prog_len - offset, (u64)chunk);
	memcpy(data, insns + offset, chunk);

	return chunk;
}

/*
 * Store the JITed length of the BPF program behind @dso in
 * data.file_size.
 *
 * Returns 0 on success, -1 (with data.status set to ERROR) when the
 * program info cannot be found.
 */
static int bpf_size(struct dso *dso)
{
	struct bpf_prog_info_node *node =
		perf_env__find_bpf_prog_info(dso->bpf_prog.env, dso->bpf_prog.id);

	if (node && node->info_linear) {
		dso->data.file_size = node->info_linear->info.jited_prog_len;
		return 0;
	}

	dso->data.status = DSO_DATA_STATUS_ERROR;
	return -1;
}

751
static void
752
dso_cache__free(struct dso *dso)
753
{
754
	struct rb_root *root = &dso->data.cache;
755 756
	struct rb_node *next = rb_first(root);

757
	pthread_mutex_lock(&dso->lock);
758 759 760 761 762 763 764 765
	while (next) {
		struct dso_cache *cache;

		cache = rb_entry(next, struct dso_cache, rb_node);
		next = rb_next(&cache->rb_node);
		rb_erase(&cache->rb_node, root);
		free(cache);
	}
766
	pthread_mutex_unlock(&dso->lock);
767 768
}

769
/*
 * Look up the cached chunk whose DSO__DATA_CACHE_SIZE-sized window
 * contains @offset.  Returns NULL when no such chunk is cached.
 */
static struct dso_cache *dso_cache__find(struct dso *dso, u64 offset)
{
	const struct rb_node *node = dso->data.cache.rb_node;

	while (node != NULL) {
		struct dso_cache *entry = rb_entry(node, struct dso_cache, rb_node);

		if (offset < entry->offset)
			node = node->rb_left;
		else if (offset >= entry->offset + DSO__DATA_CACHE_SIZE)
			node = node->rb_right;
		else
			return entry;
	}

	return NULL;
}

794 795
static struct dso_cache *
dso_cache__insert(struct dso *dso, struct dso_cache *new)
796
{
797
	struct rb_root *root = &dso->data.cache;
798 799 800 801 802
	struct rb_node **p = &root->rb_node;
	struct rb_node *parent = NULL;
	struct dso_cache *cache;
	u64 offset = new->offset;

803
	pthread_mutex_lock(&dso->lock);
804 805 806 807 808 809 810 811 812 813 814
	while (*p != NULL) {
		u64 end;

		parent = *p;
		cache = rb_entry(parent, struct dso_cache, rb_node);
		end = cache->offset + DSO__DATA_CACHE_SIZE;

		if (offset < cache->offset)
			p = &(*p)->rb_left;
		else if (offset >= end)
			p = &(*p)->rb_right;
815 816
		else
			goto out;
817 818 819 820
	}

	rb_link_node(&new->rb_node, parent, p);
	rb_insert_color(&new->rb_node, root);
821 822 823 824 825

	cache = NULL;
out:
	pthread_mutex_unlock(&dso->lock);
	return cache;
826 827 828 829 830 831 832 833 834 835 836 837 838
}

/*
 * Copy data out of cached chunk @cache, starting at file offset @offset,
 * into @data.  At most @size bytes are copied, and never more than the
 * chunk holds past @offset.
 *
 * Returns the number of bytes copied; 0 when @offset lies at or beyond
 * the valid data of the chunk.
 */
static ssize_t
dso_cache__memcpy(struct dso_cache *cache, u64 offset,
		  u8 *data, u64 size)
{
	u64 cache_offset = offset - cache->offset;
	u64 cache_size;

	/*
	 * A chunk may hold fewer than DSO__DATA_CACHE_SIZE bytes (short
	 * read).  Without this check the unsigned subtraction below would
	 * wrap around and yield a huge copy length.
	 */
	if (cache_offset >= cache->size)
		return 0;

	cache_size = min(cache->size - cache_offset, size);

	memcpy(data, cache->data + cache_offset, cache_size);
	return cache_size;
}

839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863
/*
 * Read up to DSO__DATA_CACHE_SIZE bytes at @offset from @dso's data file
 * into @data, (re)opening the file first if needed.  Runs with
 * dso__data_open_lock held.
 *
 * Returns what pread() returned, or -errno (with data.status set to
 * ERROR) when the file could not be opened.
 */
static ssize_t file_read(struct dso *dso, struct machine *machine,
			 u64 offset, char *data)
{
	ssize_t ret;

	pthread_mutex_lock(&dso__data_open_lock);

	/*
	 * Another thread opening a different dso may have closed
	 * dso->data.fd to stay under the open file limit (RLIMIT_NOFILE).
	 */
	try_to_open_dso(dso, machine);

	if (dso->data.fd >= 0) {
		ret = pread(dso->data.fd, data, DSO__DATA_CACHE_SIZE, offset);
	} else {
		dso->data.status = DSO_DATA_STATUS_ERROR;
		ret = -errno;
	}

	pthread_mutex_unlock(&dso__data_open_lock);
	return ret;
}

864
static ssize_t
865 866
dso_cache__read(struct dso *dso, struct machine *machine,
		u64 offset, u8 *data, ssize_t size)
867
{
868
	u64 cache_offset = offset & DSO__DATA_CACHE_MASK;
869
	struct dso_cache *cache;
870
	struct dso_cache *old;
871 872
	ssize_t ret;

873 874 875
	cache = zalloc(sizeof(*cache) + DSO__DATA_CACHE_SIZE);
	if (!cache)
		return -ENOMEM;
876

877 878 879 880 881
	if (dso->binary_type == DSO_BINARY_TYPE__BPF_PROG_INFO)
		ret = bpf_read(dso, cache_offset, cache->data);
	else
		ret = file_read(dso, machine, cache_offset, cache->data);

882
	if (ret > 0) {
883 884
		cache->offset = cache_offset;
		cache->size   = ret;
885

886 887 888 889 890 891
		old = dso_cache__insert(dso, cache);
		if (old) {
			/* we lose the race */
			free(cache);
			cache = old;
		}
892 893

		ret = dso_cache__memcpy(cache, offset, data, size);
894
	}
895 896 897 898 899 900 901

	if (ret <= 0)
		free(cache);

	return ret;
}

902 903
/*
 * Serve a read at @offset from the cache when the chunk is already
 * there, otherwise read the chunk in and serve it from the fresh copy.
 */
static ssize_t dso_cache_read(struct dso *dso, struct machine *machine,
			      u64 offset, u8 *data, ssize_t size)
{
	struct dso_cache *hit = dso_cache__find(dso, offset);

	if (hit == NULL)
		return dso_cache__read(dso, machine, offset, data, size);

	return dso_cache__memcpy(hit, offset, data, size);
}

914 915 916 917 918
/*
 * Reads and caches dso data DSO__DATA_CACHE_SIZE size chunks
 * in the rb_tree. Any read to already cached data is served
 * by cached data.
 */
919 920
static ssize_t cached_read(struct dso *dso, struct machine *machine,
			   u64 offset, u8 *data, ssize_t size)
921 922 923 924 925 926 927
{
	ssize_t r = 0;
	u8 *p = data;

	do {
		ssize_t ret;

928
		ret = dso_cache_read(dso, machine, offset, p, size);
929 930 931 932 933 934 935 936 937 938 939 940 941 942 943 944 945 946 947
		if (ret < 0)
			return ret;

		/* Reached EOF, return what we have. */
		if (!ret)
			break;

		BUG_ON(ret > size);

		r      += ret;
		p      += ret;
		offset += ret;
		size   -= ret;

	} while (size);

	return r;
}

948
static int file_size(struct dso *dso, struct machine *machine)
949
{
950
	int ret = 0;
951
	struct stat st;
952
	char sbuf[STRERR_BUFSIZE];
953

954 955 956 957 958 959
	pthread_mutex_lock(&dso__data_open_lock);

	/*
	 * dso->data.fd might be closed if other thread opened another
	 * file (dso) due to open file limit (RLIMIT_NOFILE).
	 */
960 961
	try_to_open_dso(dso, machine);

962
	if (dso->data.fd < 0) {
963 964 965
		ret = -errno;
		dso->data.status = DSO_DATA_STATUS_ERROR;
		goto out;
966 967
	}

968 969 970
	if (fstat(dso->data.fd, &st) < 0) {
		ret = -errno;
		pr_err("dso cache fstat failed: %s\n",
971
		       str_error_r(errno, sbuf, sizeof(sbuf)));
972 973 974 975 976 977 978 979
		dso->data.status = DSO_DATA_STATUS_ERROR;
		goto out;
	}
	dso->data.file_size = st.st_size;

out:
	pthread_mutex_unlock(&dso__data_open_lock);
	return ret;
980 981
}

982 983 984 985 986 987 988 989
int dso__data_file_size(struct dso *dso, struct machine *machine)
{
	if (dso->data.file_size)
		return 0;

	if (dso->data.status == DSO_DATA_STATUS_ERROR)
		return -1;

990 991 992
	if (dso->binary_type == DSO_BINARY_TYPE__BPF_PROG_INFO)
		return bpf_size(dso);

993 994 995
	return file_size(dso, machine);
}

A
Adrian Hunter 已提交
996 997 998 999 1000 1001 1002 1003 1004
/**
 * dso__data_size - Return dso data size
 * @dso: dso object
 * @machine: machine object
 *
 * Return: dso data size, or -1 when it cannot be determined
 */
off_t dso__data_size(struct dso *dso, struct machine *machine)
{
	int err = dso__data_file_size(dso, machine);

	/* For now just estimate dso data size is close to file size */
	return err ? -1 : dso->data.file_size;
}

1012 1013
/*
 * Validate a read request of @size bytes at @offset against @dso's data
 * size and, if it is sane, serve it through the chunk cache.
 *
 * Returns the result of cached_read(), or -1 when the size is unknown,
 * @offset is beyond the data, or @offset + @size wraps around.
 */
static ssize_t data_read_offset(struct dso *dso, struct machine *machine,
				u64 offset, u8 *data, ssize_t size)
{
	if (dso__data_file_size(dso, machine))
		return -1;

	/* Check the offset sanity. */
	if (offset > dso->data.file_size || offset + size < offset)
		return -1;

	return cached_read(dso, machine, offset, data, size);
}

1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038
/**
 * dso__data_read_offset - Read data from dso file offset
 * @dso: dso object
 * @machine: machine object
 * @offset: file offset
 * @data: buffer to store data
 * @size: size of the @data buffer
 *
 * External interface to read data from dso file offset. Open
 * dso data file and use cached_read to get the data.
 */
1039 1040 1041
ssize_t dso__data_read_offset(struct dso *dso, struct machine *machine,
			      u64 offset, u8 *data, ssize_t size)
{
1042
	if (dso->data.status == DSO_DATA_STATUS_ERROR)
1043 1044
		return -1;

1045
	return data_read_offset(dso, machine, offset, data, size);
1046 1047
}

1048 1049 1050 1051 1052 1053 1054 1055 1056 1057
/**
 * dso__data_read_addr - Read data from dso address
 * @dso: dso object
 * @machine: machine object
 * @add: virtual memory address
 * @data: buffer to store data
 * @size: size of the @data buffer
 *
 * External interface to read data from dso address.
 */
1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 1069 1070 1071
ssize_t dso__data_read_addr(struct dso *dso, struct map *map,
			    struct machine *machine, u64 addr,
			    u8 *data, ssize_t size)
{
	u64 offset = map->map_ip(map, addr);
	return dso__data_read_offset(dso, machine, offset, data, size);
}

/*
 * Create a new dso called @name and a map for it via map__new2(0, dso).
 * Returns the map, or NULL when the dso (or the map) cannot be created.
 */
struct map *dso__new_map(const char *name)
{
	struct dso *dso = dso__new(name);

	if (dso == NULL)
		return NULL;

	return map__new2(0, dso);
}

1077 1078
struct dso *machine__findnew_kernel(struct machine *machine, const char *name,
				    const char *short_name, int dso_type)
1079 1080 1081 1082
{
	/*
	 * The kernel dso could be created by build_id processing.
	 */
1083
	struct dso *dso = machine__findnew_dso(machine, name);
1084 1085 1086 1087 1088 1089

	/*
	 * We need to run this in all cases, since during the build_id
	 * processing we had no idea this was the kernel dso.
	 */
	if (dso != NULL) {
1090
		dso__set_short_name(dso, short_name, false);
1091 1092 1093 1094 1095 1096
		dso->kernel = dso_type;
	}

	return dso;
}

1097
void dso__set_long_name(struct dso *dso, const char *name, bool name_allocated)
1098
{
1099 1100
	struct rb_root *root = dso->root;

1101 1102
	if (name == NULL)
		return;
1103 1104

	if (dso->long_name_allocated)
1105
		free((char *)dso->long_name);
1106

1107 1108 1109
	if (root) {
		rb_erase(&dso->rb_node, root);
		/*
1110
		 * __dsos__findnew_link_by_longname() isn't guaranteed to add it
1111 1112 1113 1114 1115 1116
		 * back, so a clean removal is required here.
		 */
		RB_CLEAR_NODE(&dso->rb_node);
		dso->root = NULL;
	}

1117 1118 1119
	dso->long_name		 = name;
	dso->long_name_len	 = strlen(name);
	dso->long_name_allocated = name_allocated;
1120 1121

	if (root)
1122
		__dsos__findnew_link_by_longname(root, dso, NULL);
1123 1124
}

1125
void dso__set_short_name(struct dso *dso, const char *name, bool name_allocated)
1126 1127 1128
{
	if (name == NULL)
		return;
1129 1130 1131 1132 1133 1134 1135

	if (dso->short_name_allocated)
		free((char *)dso->short_name);

	dso->short_name		  = name;
	dso->short_name_len	  = strlen(name);
	dso->short_name_allocated = name_allocated;
1136 1137 1138 1139 1140 1141
}

int dso__name_len(const struct dso *dso)
{
	if (!dso)
		return strlen("[unknown]");
1142
	if (verbose > 0)
1143 1144 1145 1146 1147
		return dso->long_name_len;

	return dso->short_name_len;
}

1148
bool dso__loaded(const struct dso *dso)
1149
{
1150
	return dso->loaded;
1151 1152
}

1153
bool dso__sorted_by_name(const struct dso *dso)
1154
{
1155
	return dso->sorted_by_name;
1156 1157
}

1158
void dso__set_sorted_by_name(struct dso *dso)
1159
{
1160
	dso->sorted_by_name = true;
1161 1162 1163 1164 1165 1166 1167 1168
}

struct dso *dso__new(const char *name)
{
	struct dso *dso = calloc(1, sizeof(*dso) + strlen(name) + 1);

	if (dso != NULL) {
		strcpy(dso->name, name);
1169
		dso__set_long_name(dso, dso->name, false);
1170
		dso__set_short_name(dso, dso->name, false);
1171
		dso->symbols = dso->symbol_names = RB_ROOT_CACHED;
1172
		dso->data.cache = RB_ROOT;
1173 1174
		dso->inlined_nodes = RB_ROOT_CACHED;
		dso->srclines = RB_ROOT_CACHED;
1175
		dso->data.fd = -1;
1176
		dso->data.status = DSO_DATA_STATUS_UNKNOWN;
1177
		dso->symtab_type = DSO_BINARY_TYPE__NOT_FOUND;
1178
		dso->binary_type = DSO_BINARY_TYPE__NOT_FOUND;
1179
		dso->is_64_bit = (sizeof(void *) == 8);
1180
		dso->loaded = 0;
1181
		dso->rel = 0;
1182 1183
		dso->sorted_by_name = 0;
		dso->has_build_id = 0;
1184
		dso->has_srcline = 1;
1185
		dso->a2l_fails = 1;
1186 1187
		dso->kernel = DSO_TYPE_USER;
		dso->needs_swap = DSO_SWAP__UNSET;
1188
		dso->comp = COMP_ID__NONE;
1189
		RB_CLEAR_NODE(&dso->rb_node);
1190
		dso->root = NULL;
1191
		INIT_LIST_HEAD(&dso->node);
1192
		INIT_LIST_HEAD(&dso->data.open_entry);
1193
		pthread_mutex_init(&dso->lock, NULL);
1194
		refcount_set(&dso->refcnt, 1);
1195 1196 1197 1198 1199 1200 1201
	}

	return dso;
}

void dso__delete(struct dso *dso)
{
1202 1203 1204
	if (!RB_EMPTY_NODE(&dso->rb_node))
		pr_err("DSO %s is still in rbtree when being deleted!\n",
		       dso->long_name);
1205 1206 1207

	/* free inlines first, as they reference symbols */
	inlines__tree_delete(&dso->inlined_nodes);
1208
	srcline__tree_delete(&dso->srclines);
1209
	symbols__delete(&dso->symbols);
1210 1211

	if (dso->short_name_allocated) {
1212
		zfree((char **)&dso->short_name);
1213 1214 1215 1216
		dso->short_name_allocated = false;
	}

	if (dso->long_name_allocated) {
1217
		zfree((char **)&dso->long_name);
1218 1219 1220
		dso->long_name_allocated = false;
	}

1221
	dso__data_close(dso);
1222
	auxtrace_cache__free(dso->auxtrace_cache);
1223
	dso_cache__free(dso);
1224
	dso__free_a2l(dso);
1225
	zfree(&dso->symsrc_filename);
1226
	nsinfo__zput(dso->nsinfo);
1227
	pthread_mutex_destroy(&dso->lock);
1228 1229 1230
	free(dso);
}

1231 1232 1233
struct dso *dso__get(struct dso *dso)
{
	if (dso)
1234
		refcount_inc(&dso->refcnt);
1235 1236 1237 1238 1239
	return dso;
}

void dso__put(struct dso *dso)
{
1240
	if (dso && refcount_dec_and_test(&dso->refcnt))
1241 1242 1243
		dso__delete(dso);
}

1244 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289
/*
 * Copy a build id into @dso and mark the dso as having one.
 *
 * Exactly sizeof(dso->build_id) bytes are read from @build_id, so the
 * caller's buffer must be at least that large.
 */
void dso__set_build_id(struct dso *dso, void *build_id)
{
	const size_t nbytes = sizeof(dso->build_id);

	memcpy(dso->build_id, build_id, nbytes);
	dso->has_build_id = 1;
}

/*
 * Byte-wise comparison of @dso's stored build id against @build_id.
 *
 * sizeof(dso->build_id) bytes are compared; the 'has_build_id' flag is not
 * consulted. Returns true when all bytes match.
 */
bool dso__build_id_equal(const struct dso *dso, u8 *build_id)
{
	const size_t nbytes = sizeof(dso->build_id);

	return !memcmp(dso->build_id, build_id, nbytes);
}

/*
 * Try to fill @dso's build id from "<root_dir>/sys/kernel/notes" of
 * @machine.
 *
 * Nothing is done when @machine is the default guest. 'has_build_id' is
 * set only if sysfs__read_build_id() returns 0; on any failure the dso is
 * left without that flag being raised here.
 */
void dso__read_running_kernel_build_id(struct dso *dso, struct machine *machine)
{
	char path[PATH_MAX];
	int len;

	if (machine__is_default_guest(machine))
		return;

	/*
	 * root_dir has no length guarantee visible here, so bound the write
	 * and refuse to use a truncated path rather than overflow the buffer.
	 */
	len = snprintf(path, sizeof(path), "%s/sys/kernel/notes",
		       machine->root_dir);
	if (len < 0 || (size_t)len >= sizeof(path))
		return;

	if (sysfs__read_build_id(path, dso->build_id,
				 sizeof(dso->build_id)) == 0)
		dso->has_build_id = true;
}

/*
 * Try to fill @dso's build id from
 * "<root_dir>/sys/module/<module>/notes/.note.gnu.build-id".
 *
 * 'has_build_id' is set only if sysfs__read_build_id() returns 0.
 * Always returns 0, whether or not a build id was read.
 */
int dso__kernel_module_get_build_id(struct dso *dso,
				    const char *root_dir)
{
	char filename[PATH_MAX];
	/*
	 * kernel module short names are of the form "[module]" and
	 * we need just "module" here.
	 */
	size_t short_len = strlen(dso->short_name);
	int len;

	/*
	 * Stepping past the opening bracket is only valid when there is at
	 * least one character; anything shorter than "[]" has no module name.
	 */
	if (short_len < 2)
		return 0;

	len = snprintf(filename, sizeof(filename),
		       "%s/sys/module/%.*s/notes/.note.gnu.build-id",
		       root_dir, (int)(short_len - 2), dso->short_name + 1);
	/* A truncated path cannot name the intended file, so do not read it. */
	if (len < 0 || (size_t)len >= sizeof(filename))
		return 0;

	if (sysfs__read_build_id(filename, dso->build_id,
				 sizeof(dso->build_id)) == 0)
		dso->has_build_id = true;

	return 0;
}

size_t dso__fprintf_buildid(struct dso *dso, FILE *fp)
{
1290
	char sbuild_id[SBUILD_ID_SIZE];
1291 1292 1293 1294 1295

	build_id__sprintf(dso->build_id, sizeof(dso->build_id), sbuild_id);
	return fprintf(fp, "%s", sbuild_id);
}

1296
size_t dso__fprintf(struct dso *dso, FILE *fp)
1297 1298 1299 1300 1301 1302
{
	struct rb_node *nd;
	size_t ret = fprintf(fp, "dso: %s (", dso->short_name);

	if (dso->short_name != dso->long_name)
		ret += fprintf(fp, "%s, ", dso->long_name);
1303
	ret += fprintf(fp, "%sloaded, ", dso__loaded(dso) ? "" : "NOT ");
1304 1305
	ret += dso__fprintf_buildid(dso, fp);
	ret += fprintf(fp, ")\n");
1306
	for (nd = rb_first_cached(&dso->symbols); nd; nd = rb_next(nd)) {
1307 1308 1309 1310 1311 1312
		struct symbol *pos = rb_entry(nd, struct symbol, rb_node);
		ret += symbol__fprintf(pos, fp);
	}

	return ret;
}
A
Adrian Hunter 已提交
1313 1314 1315 1316

enum dso_type dso__type(struct dso *dso, struct machine *machine)
{
	int fd;
1317
	enum dso_type type = DSO__TYPE_UNKNOWN;
A
Adrian Hunter 已提交
1318

1319 1320 1321 1322 1323
	fd = dso__data_get_fd(dso, machine);
	if (fd >= 0) {
		type = dso__type_fd(fd);
		dso__data_put_fd(dso);
	}
A
Adrian Hunter 已提交
1324

1325
	return type;
A
Adrian Hunter 已提交
1326
}
1327 1328 1329 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339 1340 1341 1342 1343 1344

/*
 * Render @dso's load error (dso->load_errno) as text into @buf.
 *
 * Non-negative values are passed to str_error_r(). Values inside
 * [__DSO_LOAD_ERRNO__START, __DSO_LOAD_ERRNO__END) are looked up in a
 * local message table. @buflen must be non-zero (enforced with BUG_ON).
 *
 * Returns 0 when @buf was filled, -1 when the error number is in neither
 * range (in which case @buf is not written).
 */
int dso__strerror_load(struct dso *dso, char *buf, size_t buflen)
{
	/*
	 * This must have a same ordering as the enum dso_load_errno.
	 */
	static const char *dso_load__error_str[] = {
	"Internal tools/perf/ library error",
	"Invalid ELF file",
	"Can not read build id",
	"Mismatching build id",
	"Decompression failure",
	};
	int errnum = dso->load_errno;

	BUG_ON(buflen == 0);

	if (errnum >= 0) {
		const char *msg = str_error_r(errnum, buf, buflen);

		/* str_error_r() may hand back a string that is not in @buf. */
		if (msg != buf)
			scnprintf(buf, buflen, "%s", msg);

		return 0;
	}

	if (errnum < __DSO_LOAD_ERRNO__START || errnum >= __DSO_LOAD_ERRNO__END)
		return -1;

	scnprintf(buf, buflen, "%s",
		  dso_load__error_str[errnum - __DSO_LOAD_ERRNO__START]);
	return 0;
}