dso.c 31.8 KB
Newer Older
1
#include <asm/bug.h>
2
#include <linux/kernel.h>
3 4
#include <sys/time.h>
#include <sys/resource.h>
5 6
#include "symbol.h"
#include "dso.h"
7
#include "machine.h"
8
#include "auxtrace.h"
9 10
#include "util.h"
#include "debug.h"
11
#include "string2.h"
12
#include "vdso.h"
13

14 15 16 17 18 19 20
static const char * const debuglink_paths[] = {
	"%.0s%s",
	"%s/%s",
	"%s/.debug/%s",
	"/usr/lib/debug%s/%s"
};

21 22 23
char dso__symtab_origin(const struct dso *dso)
{
	static const char origin[] = {
24 25 26 27 28 29 30 31 32 33 34
		[DSO_BINARY_TYPE__KALLSYMS]			= 'k',
		[DSO_BINARY_TYPE__VMLINUX]			= 'v',
		[DSO_BINARY_TYPE__JAVA_JIT]			= 'j',
		[DSO_BINARY_TYPE__DEBUGLINK]			= 'l',
		[DSO_BINARY_TYPE__BUILD_ID_CACHE]		= 'B',
		[DSO_BINARY_TYPE__FEDORA_DEBUGINFO]		= 'f',
		[DSO_BINARY_TYPE__UBUNTU_DEBUGINFO]		= 'u',
		[DSO_BINARY_TYPE__OPENEMBEDDED_DEBUGINFO]	= 'o',
		[DSO_BINARY_TYPE__BUILDID_DEBUGINFO]		= 'b',
		[DSO_BINARY_TYPE__SYSTEM_PATH_DSO]		= 'd',
		[DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE]		= 'K',
35
		[DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE_COMP]	= 'm',
36 37
		[DSO_BINARY_TYPE__GUEST_KALLSYMS]		= 'g',
		[DSO_BINARY_TYPE__GUEST_KMODULE]		= 'G',
38
		[DSO_BINARY_TYPE__GUEST_KMODULE_COMP]		= 'M',
39
		[DSO_BINARY_TYPE__GUEST_VMLINUX]		= 'V',
40 41 42 43 44 45 46
	};

	if (dso == NULL || dso->symtab_type == DSO_BINARY_TYPE__NOT_FOUND)
		return '!';
	return origin[dso->symtab_type];
}

47 48 49
int dso__read_binary_type_filename(const struct dso *dso,
				   enum dso_binary_type type,
				   char *root_dir, char *filename, size_t size)
50
{
51
	char build_id_hex[SBUILD_ID_SIZE];
52
	int ret = 0;
53
	size_t len;
54 55

	switch (type) {
56 57 58 59 60 61
	case DSO_BINARY_TYPE__DEBUGLINK:
	{
		const char *last_slash;
		char dso_dir[PATH_MAX];
		char symfile[PATH_MAX];
		unsigned int i;
62

63
		len = __symbol__join_symfs(filename, size, dso->long_name);
64 65 66
		last_slash = filename + len;
		while (last_slash != filename && *last_slash != '/')
			last_slash--;
67

68 69 70 71 72
		strncpy(dso_dir, filename, last_slash - filename);
		dso_dir[last_slash-filename] = '\0';

		if (!is_regular_file(filename)) {
			ret = -1;
73
			break;
74
		}
75

76 77 78 79 80 81 82 83 84 85 86 87 88
		ret = filename__read_debuglink(filename, symfile, PATH_MAX);
		if (ret)
			break;

		/* Check predefined locations where debug file might reside */
		ret = -1;
		for (i = 0; i < ARRAY_SIZE(debuglink_paths); i++) {
			snprintf(filename, size,
					debuglink_paths[i], dso_dir, symfile);
			if (is_regular_file(filename)) {
				ret = 0;
				break;
			}
89
		}
90

91
		break;
92
	}
93
	case DSO_BINARY_TYPE__BUILD_ID_CACHE:
94
		if (dso__build_id_filename(dso, filename, size) == NULL)
95 96 97 98
			ret = -1;
		break;

	case DSO_BINARY_TYPE__FEDORA_DEBUGINFO:
99 100
		len = __symbol__join_symfs(filename, size, "/usr/lib/debug");
		snprintf(filename + len, size - len, "%s.debug", dso->long_name);
101 102 103
		break;

	case DSO_BINARY_TYPE__UBUNTU_DEBUGINFO:
104 105
		len = __symbol__join_symfs(filename, size, "/usr/lib/debug");
		snprintf(filename + len, size - len, "%s", dso->long_name);
106 107
		break;

108 109
	case DSO_BINARY_TYPE__OPENEMBEDDED_DEBUGINFO:
	{
110
		const char *last_slash;
111 112 113 114 115 116
		size_t dir_size;

		last_slash = dso->long_name + dso->long_name_len;
		while (last_slash != dso->long_name && *last_slash != '/')
			last_slash--;

117
		len = __symbol__join_symfs(filename, size, "");
118 119 120 121 122
		dir_size = last_slash - dso->long_name + 2;
		if (dir_size > (size - len)) {
			ret = -1;
			break;
		}
123 124
		len += scnprintf(filename + len, dir_size, "%s",  dso->long_name);
		len += scnprintf(filename + len , size - len, ".debug%s",
125 126 127 128
								last_slash);
		break;
	}

129 130 131 132 133 134 135 136 137
	case DSO_BINARY_TYPE__BUILDID_DEBUGINFO:
		if (!dso->has_build_id) {
			ret = -1;
			break;
		}

		build_id__sprintf(dso->build_id,
				  sizeof(dso->build_id),
				  build_id_hex);
138 139 140
		len = __symbol__join_symfs(filename, size, "/usr/lib/debug/.build-id/");
		snprintf(filename + len, size - len, "%.2s/%s.debug",
			 build_id_hex, build_id_hex + 2);
141 142
		break;

143 144
	case DSO_BINARY_TYPE__VMLINUX:
	case DSO_BINARY_TYPE__GUEST_VMLINUX:
145
	case DSO_BINARY_TYPE__SYSTEM_PATH_DSO:
146
		__symbol__join_symfs(filename, size, dso->long_name);
147 148 149
		break;

	case DSO_BINARY_TYPE__GUEST_KMODULE:
150
	case DSO_BINARY_TYPE__GUEST_KMODULE_COMP:
151 152
		path__join3(filename, size, symbol_conf.symfs,
			    root_dir, dso->long_name);
153 154 155
		break;

	case DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE:
156
	case DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE_COMP:
157
		__symbol__join_symfs(filename, size, dso->long_name);
158 159
		break;

160 161
	case DSO_BINARY_TYPE__KCORE:
	case DSO_BINARY_TYPE__GUEST_KCORE:
162
		snprintf(filename, size, "%s", dso->long_name);
163 164
		break;

165 166 167 168 169 170 171 172 173 174 175 176
	default:
	case DSO_BINARY_TYPE__KALLSYMS:
	case DSO_BINARY_TYPE__GUEST_KALLSYMS:
	case DSO_BINARY_TYPE__JAVA_JIT:
	case DSO_BINARY_TYPE__NOT_FOUND:
		ret = -1;
		break;
	}

	return ret;
}

177 178 179 180
static const struct {
	const char *fmt;
	int (*decompress)(const char *input, int output);
} compressions[] = {
181 182
#ifdef HAVE_ZLIB_SUPPORT
	{ "gz", gzip_decompress_to_file },
183 184 185
#endif
#ifdef HAVE_LZMA_SUPPORT
	{ "xz", lzma_decompress_to_file },
186 187
#endif
	{ NULL, NULL },
188 189 190 191 192 193 194 195 196 197 198 199 200
};

bool is_supported_compression(const char *ext)
{
	unsigned i;

	for (i = 0; compressions[i].fmt; i++) {
		if (!strcmp(ext, compressions[i].fmt))
			return true;
	}
	return false;
}

201
bool is_kernel_module(const char *pathname, int cpumode)
202
{
203
	struct kmod_path m;
204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222
	int mode = cpumode & PERF_RECORD_MISC_CPUMODE_MASK;

	WARN_ONCE(mode != cpumode,
		  "Internal error: passing unmasked cpumode (%x) to is_kernel_module",
		  cpumode);

	switch (mode) {
	case PERF_RECORD_MISC_USER:
	case PERF_RECORD_MISC_HYPERVISOR:
	case PERF_RECORD_MISC_GUEST_USER:
		return false;
	/* Treat PERF_RECORD_MISC_CPUMODE_UNKNOWN as kernel */
	default:
		if (kmod_path__parse(&m, pathname)) {
			pr_err("Failed to check whether %s is a kernel module or not. Assume it is.",
					pathname);
			return true;
		}
	}
223

224
	return m.kmod;
225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244
}

bool decompress_to_file(const char *ext, const char *filename, int output_fd)
{
	unsigned i;

	for (i = 0; compressions[i].fmt; i++) {
		if (!strcmp(ext, compressions[i].fmt))
			return !compressions[i].decompress(filename,
							   output_fd);
	}
	return false;
}

bool dso__needs_decompress(struct dso *dso)
{
	return dso->symtab_type == DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE_COMP ||
		dso->symtab_type == DSO_BINARY_TYPE__GUEST_KMODULE_COMP;
}

245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265
/*
 * Parses kernel module specified in @path and updates
 * @m argument like:
 *
 *    @comp - true if @path contains supported compression suffix,
 *            false otherwise
 *    @kmod - true if @path contains '.ko' suffix in right position,
 *            false otherwise
 *    @name - if (@alloc_name && @kmod) is true, it contains strdup-ed base name
 *            of the kernel module without suffixes, otherwise strudup-ed
 *            base name of @path
 *    @ext  - if (@alloc_ext && @comp) is true, it contains strdup-ed string
 *            the compression suffix
 *
 * Returns 0 if there's no strdup error, -ENOMEM otherwise.
 */
int __kmod_path__parse(struct kmod_path *m, const char *path,
		       bool alloc_name, bool alloc_ext)
{
	const char *name = strrchr(path, '/');
	const char *ext  = strrchr(path, '.');
266
	bool is_simple_name = false;
267 268 269 270

	memset(m, 0x0, sizeof(*m));
	name = name ? name + 1 : path;

271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290
	/*
	 * '.' is also a valid character for module name. For example:
	 * [aaa.bbb] is a valid module name. '[' should have higher
	 * priority than '.ko' suffix.
	 *
	 * The kernel names are from machine__mmap_name. Such
	 * name should belong to kernel itself, not kernel module.
	 */
	if (name[0] == '[') {
		is_simple_name = true;
		if ((strncmp(name, "[kernel.kallsyms]", 17) == 0) ||
		    (strncmp(name, "[guest.kernel.kallsyms", 22) == 0) ||
		    (strncmp(name, "[vdso]", 6) == 0) ||
		    (strncmp(name, "[vsyscall]", 10) == 0)) {
			m->kmod = false;

		} else
			m->kmod = true;
	}

291
	/* No extension, just return name. */
292
	if ((ext == NULL) || is_simple_name) {
293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331
		if (alloc_name) {
			m->name = strdup(name);
			return m->name ? 0 : -ENOMEM;
		}
		return 0;
	}

	if (is_supported_compression(ext + 1)) {
		m->comp = true;
		ext -= 3;
	}

	/* Check .ko extension only if there's enough name left. */
	if (ext > name)
		m->kmod = !strncmp(ext, ".ko", 3);

	if (alloc_name) {
		if (m->kmod) {
			if (asprintf(&m->name, "[%.*s]", (int) (ext - name), name) == -1)
				return -ENOMEM;
		} else {
			if (asprintf(&m->name, "%s", name) == -1)
				return -ENOMEM;
		}

		strxfrchar(m->name, '-', '_');
	}

	if (alloc_ext && m->comp) {
		m->ext = strdup(ext + 4);
		if (!m->ext) {
			free((void *) m->name);
			return -ENOMEM;
		}
	}

	return 0;
}

332
/*
333
 * Global list of open DSOs and the counter.
334 335
 */
static LIST_HEAD(dso__data_open);
336
static long dso__data_open_cnt;
337
static pthread_mutex_t dso__data_open_lock = PTHREAD_MUTEX_INITIALIZER;
338 339 340 341

static void dso__list_add(struct dso *dso)
{
	list_add_tail(&dso->data.open_entry, &dso__data_open);
342
	dso__data_open_cnt++;
343 344 345 346 347
}

static void dso__list_del(struct dso *dso)
{
	list_del(&dso->data.open_entry);
348 349 350
	WARN_ONCE(dso__data_open_cnt <= 0,
		  "DSO data fd counter out of bounds.");
	dso__data_open_cnt--;
351 352
}

353 354 355 356 357
static void close_first_dso(void);

static int do_open(char *name)
{
	int fd;
358
	char sbuf[STRERR_BUFSIZE];
359 360 361 362 363 364

	do {
		fd = open(name, O_RDONLY);
		if (fd >= 0)
			return fd;

365
		pr_debug("dso open failed: %s\n",
366
			 str_error_r(errno, sbuf, sizeof(sbuf)));
367 368 369 370 371 372 373 374 375
		if (!dso__data_open_cnt || errno != EMFILE)
			break;

		close_first_dso();
	} while (1);

	return -1;
}

376
static int __open_dso(struct dso *dso, struct machine *machine)
377 378
{
	int fd;
379 380
	char *root_dir = (char *)"";
	char *name = malloc(PATH_MAX);
381 382 383 384 385 386 387

	if (!name)
		return -ENOMEM;

	if (machine)
		root_dir = machine->root_dir;

388
	if (dso__read_binary_type_filename(dso, dso->binary_type,
389
					    root_dir, name, PATH_MAX)) {
390 391 392 393
		free(name);
		return -EINVAL;
	}

394 395 396
	if (!is_regular_file(name))
		return -EINVAL;

397
	fd = do_open(name);
398 399 400 401
	free(name);
	return fd;
}

402 403
static void check_data_close(void);

404 405 406 407 408 409 410
/**
 * dso_close - Open DSO data file
 * @dso: dso object
 *
 * Open @dso's data file descriptor and updates
 * list/count of open DSO objects.
 */
411 412 413 414
static int open_dso(struct dso *dso, struct machine *machine)
{
	int fd = __open_dso(dso, machine);

415
	if (fd >= 0) {
416
		dso__list_add(dso);
417 418 419 420 421 422
		/*
		 * Check if we crossed the allowed number
		 * of opened DSOs and close one if needed.
		 */
		check_data_close();
	}
423 424 425 426 427

	return fd;
}

static void close_data_fd(struct dso *dso)
428 429 430 431
{
	if (dso->data.fd >= 0) {
		close(dso->data.fd);
		dso->data.fd = -1;
432
		dso->data.file_size = 0;
433
		dso__list_del(dso);
434 435 436
	}
}

437 438 439 440 441 442 443
/**
 * dso_close - Close DSO data file
 * @dso: dso object
 *
 * Close @dso's data file descriptor and updates
 * list/count of open DSO objects.
 */
444 445 446 447 448
static void close_dso(struct dso *dso)
{
	close_data_fd(dso);
}

449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475
static void close_first_dso(void)
{
	struct dso *dso;

	dso = list_first_entry(&dso__data_open, struct dso, data.open_entry);
	close_dso(dso);
}

static rlim_t get_fd_limit(void)
{
	struct rlimit l;
	rlim_t limit = 0;

	/* Allow half of the current open fd limit. */
	if (getrlimit(RLIMIT_NOFILE, &l) == 0) {
		if (l.rlim_cur == RLIM_INFINITY)
			limit = l.rlim_cur;
		else
			limit = l.rlim_cur / 2;
	} else {
		pr_err("failed to get fd limit\n");
		limit = 1;
	}

	return limit;
}

476 477 478 479 480 481 482 483
static rlim_t fd_limit;

/*
 * Used only by tests/dso-data.c to reset the environment
 * for tests. I dont expect we should change this during
 * standard runtime.
 */
void reset_fd_limit(void)
484
{
485 486
	fd_limit = 0;
}
487

488 489 490 491
static bool may_cache_fd(void)
{
	if (!fd_limit)
		fd_limit = get_fd_limit();
492

493
	if (fd_limit == RLIM_INFINITY)
494 495
		return true;

496
	return fd_limit > (rlim_t) dso__data_open_cnt;
497 498
}

499 500 501 502 503
/*
 * Check and close LRU dso if we crossed allowed limit
 * for opened dso file descriptors. The limit is half
 * of the RLIMIT_NOFILE files opened.
*/
504 505 506 507 508 509 510 511
static void check_data_close(void)
{
	bool cache_fd = may_cache_fd();

	if (!cache_fd)
		close_first_dso();
}

512 513 514 515 516 517
/**
 * dso__data_close - Close DSO data file
 * @dso: dso object
 *
 * External interface to close @dso's data file descriptor.
 */
518 519
void dso__data_close(struct dso *dso)
{
520
	pthread_mutex_lock(&dso__data_open_lock);
521
	close_dso(dso);
522
	pthread_mutex_unlock(&dso__data_open_lock);
523 524
}

525
static void try_to_open_dso(struct dso *dso, struct machine *machine)
526
{
527
	enum dso_binary_type binary_type_data[] = {
528 529 530 531 532 533
		DSO_BINARY_TYPE__BUILD_ID_CACHE,
		DSO_BINARY_TYPE__SYSTEM_PATH_DSO,
		DSO_BINARY_TYPE__NOT_FOUND,
	};
	int i = 0;

534
	if (dso->data.fd >= 0)
535
		return;
536 537 538

	if (dso->binary_type != DSO_BINARY_TYPE__NOT_FOUND) {
		dso->data.fd = open_dso(dso, machine);
539
		goto out;
540
	}
541 542

	do {
543
		dso->binary_type = binary_type_data[i++];
544

545 546 547
		dso->data.fd = open_dso(dso, machine);
		if (dso->data.fd >= 0)
			goto out;
548

549
	} while (dso->binary_type != DSO_BINARY_TYPE__NOT_FOUND);
550 551 552 553 554
out:
	if (dso->data.fd >= 0)
		dso->data.status = DSO_DATA_STATUS_OK;
	else
		dso->data.status = DSO_DATA_STATUS_ERROR;
555 556 557
}

/**
558
 * dso__data_get_fd - Get dso's data file descriptor
559 560 561 562
 * @dso: dso object
 * @machine: machine object
 *
 * External interface to find dso's file, open it and
563 564
 * returns file descriptor.  It should be paired with
 * dso__data_put_fd() if it returns non-negative value.
565
 */
566
int dso__data_get_fd(struct dso *dso, struct machine *machine)
567 568 569
{
	if (dso->data.status == DSO_DATA_STATUS_ERROR)
		return -1;
570

571 572 573
	if (pthread_mutex_lock(&dso__data_open_lock) < 0)
		return -1;

574
	try_to_open_dso(dso, machine);
575 576 577

	if (dso->data.fd < 0)
		pthread_mutex_unlock(&dso__data_open_lock);
578

579
	return dso->data.fd;
580 581
}

582 583 584 585 586
void dso__data_put_fd(struct dso *dso __maybe_unused)
{
	pthread_mutex_unlock(&dso__data_open_lock);
}

587 588 589 590 591 592 593 594 595 596 597 598
bool dso__data_status_seen(struct dso *dso, enum dso_data_status_seen by)
{
	u32 flag = 1 << by;

	if (dso->data.status_seen & flag)
		return true;

	dso->data.status_seen |= flag;

	return false;
}

599
static void
600
dso_cache__free(struct dso *dso)
601
{
602
	struct rb_root *root = &dso->data.cache;
603 604
	struct rb_node *next = rb_first(root);

605
	pthread_mutex_lock(&dso->lock);
606 607 608 609 610 611 612 613
	while (next) {
		struct dso_cache *cache;

		cache = rb_entry(next, struct dso_cache, rb_node);
		next = rb_next(&cache->rb_node);
		rb_erase(&cache->rb_node, root);
		free(cache);
	}
614
	pthread_mutex_unlock(&dso->lock);
615 616
}

617
static struct dso_cache *dso_cache__find(struct dso *dso, u64 offset)
618
{
619
	const struct rb_root *root = &dso->data.cache;
620 621
	struct rb_node * const *p = &root->rb_node;
	const struct rb_node *parent = NULL;
622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637
	struct dso_cache *cache;

	while (*p != NULL) {
		u64 end;

		parent = *p;
		cache = rb_entry(parent, struct dso_cache, rb_node);
		end = cache->offset + DSO__DATA_CACHE_SIZE;

		if (offset < cache->offset)
			p = &(*p)->rb_left;
		else if (offset >= end)
			p = &(*p)->rb_right;
		else
			return cache;
	}
638

639 640 641
	return NULL;
}

642 643
static struct dso_cache *
dso_cache__insert(struct dso *dso, struct dso_cache *new)
644
{
645
	struct rb_root *root = &dso->data.cache;
646 647 648 649 650
	struct rb_node **p = &root->rb_node;
	struct rb_node *parent = NULL;
	struct dso_cache *cache;
	u64 offset = new->offset;

651
	pthread_mutex_lock(&dso->lock);
652 653 654 655 656 657 658 659 660 661 662
	while (*p != NULL) {
		u64 end;

		parent = *p;
		cache = rb_entry(parent, struct dso_cache, rb_node);
		end = cache->offset + DSO__DATA_CACHE_SIZE;

		if (offset < cache->offset)
			p = &(*p)->rb_left;
		else if (offset >= end)
			p = &(*p)->rb_right;
663 664
		else
			goto out;
665 666 667 668
	}

	rb_link_node(&new->rb_node, parent, p);
	rb_insert_color(&new->rb_node, root);
669 670 671 672 673

	cache = NULL;
out:
	pthread_mutex_unlock(&dso->lock);
	return cache;
674 675 676 677 678 679 680 681 682 683 684 685 686 687
}

static ssize_t
dso_cache__memcpy(struct dso_cache *cache, u64 offset,
		  u8 *data, u64 size)
{
	u64 cache_offset = offset - cache->offset;
	u64 cache_size   = min(cache->size - cache_offset, size);

	memcpy(data, cache->data + cache_offset, cache_size);
	return cache_size;
}

static ssize_t
688 689
dso_cache__read(struct dso *dso, struct machine *machine,
		u64 offset, u8 *data, ssize_t size)
690 691
{
	struct dso_cache *cache;
692
	struct dso_cache *old;
693 694 695 696 697 698 699
	ssize_t ret;

	do {
		u64 cache_offset;

		cache = zalloc(sizeof(*cache) + DSO__DATA_CACHE_SIZE);
		if (!cache)
700 701 702 703 704 705 706 707
			return -ENOMEM;

		pthread_mutex_lock(&dso__data_open_lock);

		/*
		 * dso->data.fd might be closed if other thread opened another
		 * file (dso) due to open file limit (RLIMIT_NOFILE).
		 */
708 709
		try_to_open_dso(dso, machine);

710
		if (dso->data.fd < 0) {
711 712 713
			ret = -errno;
			dso->data.status = DSO_DATA_STATUS_ERROR;
			break;
714
		}
715 716 717

		cache_offset = offset & DSO__DATA_CACHE_MASK;

718
		ret = pread(dso->data.fd, cache->data, DSO__DATA_CACHE_SIZE, cache_offset);
719 720 721 722 723
		if (ret <= 0)
			break;

		cache->offset = cache_offset;
		cache->size   = ret;
724 725 726 727 728
	} while (0);

	pthread_mutex_unlock(&dso__data_open_lock);

	if (ret > 0) {
729 730 731 732 733 734
		old = dso_cache__insert(dso, cache);
		if (old) {
			/* we lose the race */
			free(cache);
			cache = old;
		}
735 736

		ret = dso_cache__memcpy(cache, offset, data, size);
737
	}
738 739 740 741 742 743 744

	if (ret <= 0)
		free(cache);

	return ret;
}

745 746
static ssize_t dso_cache_read(struct dso *dso, struct machine *machine,
			      u64 offset, u8 *data, ssize_t size)
747 748 749
{
	struct dso_cache *cache;

750
	cache = dso_cache__find(dso, offset);
751 752 753
	if (cache)
		return dso_cache__memcpy(cache, offset, data, size);
	else
754
		return dso_cache__read(dso, machine, offset, data, size);
755 756
}

757 758 759 760 761
/*
 * Reads and caches dso data DSO__DATA_CACHE_SIZE size chunks
 * in the rb_tree. Any read to already cached data is served
 * by cached data.
 */
762 763
static ssize_t cached_read(struct dso *dso, struct machine *machine,
			   u64 offset, u8 *data, ssize_t size)
764 765 766 767 768 769 770
{
	ssize_t r = 0;
	u8 *p = data;

	do {
		ssize_t ret;

771
		ret = dso_cache_read(dso, machine, offset, p, size);
772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790
		if (ret < 0)
			return ret;

		/* Reached EOF, return what we have. */
		if (!ret)
			break;

		BUG_ON(ret > size);

		r      += ret;
		p      += ret;
		offset += ret;
		size   -= ret;

	} while (size);

	return r;
}

791
static int data_file_size(struct dso *dso, struct machine *machine)
792
{
793
	int ret = 0;
794
	struct stat st;
795
	char sbuf[STRERR_BUFSIZE];
796

797 798 799
	if (dso->data.file_size)
		return 0;

800 801 802
	if (dso->data.status == DSO_DATA_STATUS_ERROR)
		return -1;

803 804 805 806 807 808
	pthread_mutex_lock(&dso__data_open_lock);

	/*
	 * dso->data.fd might be closed if other thread opened another
	 * file (dso) due to open file limit (RLIMIT_NOFILE).
	 */
809 810
	try_to_open_dso(dso, machine);

811
	if (dso->data.fd < 0) {
812 813 814
		ret = -errno;
		dso->data.status = DSO_DATA_STATUS_ERROR;
		goto out;
815 816
	}

817 818 819
	if (fstat(dso->data.fd, &st) < 0) {
		ret = -errno;
		pr_err("dso cache fstat failed: %s\n",
820
		       str_error_r(errno, sbuf, sizeof(sbuf)));
821 822 823 824 825 826 827 828
		dso->data.status = DSO_DATA_STATUS_ERROR;
		goto out;
	}
	dso->data.file_size = st.st_size;

out:
	pthread_mutex_unlock(&dso__data_open_lock);
	return ret;
829 830
}

A
Adrian Hunter 已提交
831 832 833 834 835 836 837 838 839
/**
 * dso__data_size - Return dso data size
 * @dso: dso object
 * @machine: machine object
 *
 * Return: dso data size
 */
off_t dso__data_size(struct dso *dso, struct machine *machine)
{
840
	if (data_file_size(dso, machine))
A
Adrian Hunter 已提交
841 842 843 844 845 846
		return -1;

	/* For now just estimate dso data size is close to file size */
	return dso->data.file_size;
}

847 848
static ssize_t data_read_offset(struct dso *dso, struct machine *machine,
				u64 offset, u8 *data, ssize_t size)
849
{
850
	if (data_file_size(dso, machine))
851 852 853 854 855 856 857 858 859
		return -1;

	/* Check the offset sanity. */
	if (offset > dso->data.file_size)
		return -1;

	if (offset + size < offset)
		return -1;

860
	return cached_read(dso, machine, offset, data, size);
861 862
}

863 864 865 866 867 868 869 870 871 872 873
/**
 * dso__data_read_offset - Read data from dso file offset
 * @dso: dso object
 * @machine: machine object
 * @offset: file offset
 * @data: buffer to store data
 * @size: size of the @data buffer
 *
 * External interface to read data from dso file offset. Open
 * dso data file and use cached_read to get the data.
 */
874 875 876
ssize_t dso__data_read_offset(struct dso *dso, struct machine *machine,
			      u64 offset, u8 *data, ssize_t size)
{
877
	if (dso->data.status == DSO_DATA_STATUS_ERROR)
878 879
		return -1;

880
	return data_read_offset(dso, machine, offset, data, size);
881 882
}

883 884 885 886 887 888 889 890 891 892
/**
 * dso__data_read_addr - Read data from dso address
 * @dso: dso object
 * @machine: machine object
 * @add: virtual memory address
 * @data: buffer to store data
 * @size: size of the @data buffer
 *
 * External interface to read data from dso address.
 */
893 894 895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910 911
ssize_t dso__data_read_addr(struct dso *dso, struct map *map,
			    struct machine *machine, u64 addr,
			    u8 *data, ssize_t size)
{
	u64 offset = map->map_ip(map, addr);
	return dso__data_read_offset(dso, machine, offset, data, size);
}

struct map *dso__new_map(const char *name)
{
	struct map *map = NULL;
	struct dso *dso = dso__new(name);

	if (dso)
		map = map__new2(0, dso, MAP__FUNCTION);

	return map;
}

912 913
struct dso *machine__findnew_kernel(struct machine *machine, const char *name,
				    const char *short_name, int dso_type)
914 915 916 917
{
	/*
	 * The kernel dso could be created by build_id processing.
	 */
918
	struct dso *dso = machine__findnew_dso(machine, name);
919 920 921 922 923 924

	/*
	 * We need to run this in all cases, since during the build_id
	 * processing we had no idea this was the kernel dso.
	 */
	if (dso != NULL) {
925
		dso__set_short_name(dso, short_name, false);
926 927 928 929 930 931
		dso->kernel = dso_type;
	}

	return dso;
}

932 933 934 935 936
/*
 * Find a matching entry and/or link current entry to RB tree.
 * Either one of the dso or name parameter must be non-NULL or the
 * function will not work.
 */
937 938
static struct dso *__dso__findlink_by_longname(struct rb_root *root,
					       struct dso *dso, const char *name)
939 940 941 942 943 944 945 946 947 948 949 950 951 952 953 954 955
{
	struct rb_node **p = &root->rb_node;
	struct rb_node  *parent = NULL;

	if (!name)
		name = dso->long_name;
	/*
	 * Find node with the matching name
	 */
	while (*p) {
		struct dso *this = rb_entry(*p, struct dso, rb_node);
		int rc = strcmp(name, this->long_name);

		parent = *p;
		if (rc == 0) {
			/*
			 * In case the new DSO is a duplicate of an existing
956
			 * one, print a one-time warning & put the new entry
957 958 959 960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975 976 977 978 979 980
			 * at the end of the list of duplicates.
			 */
			if (!dso || (dso == this))
				return this;	/* Find matching dso */
			/*
			 * The core kernel DSOs may have duplicated long name.
			 * In this case, the short name should be different.
			 * Comparing the short names to differentiate the DSOs.
			 */
			rc = strcmp(dso->short_name, this->short_name);
			if (rc == 0) {
				pr_err("Duplicated dso name: %s\n", name);
				return NULL;
			}
		}
		if (rc < 0)
			p = &parent->rb_left;
		else
			p = &parent->rb_right;
	}
	if (dso) {
		/* Add new node and rebalance tree */
		rb_link_node(&dso->rb_node, parent, p);
		rb_insert_color(&dso->rb_node, root);
981
		dso->root = root;
982 983 984 985
	}
	return NULL;
}

986 987
static inline struct dso *__dso__find_by_longname(struct rb_root *root,
						  const char *name)
988
{
989
	return __dso__findlink_by_longname(root, NULL, name);
990 991
}

992
void dso__set_long_name(struct dso *dso, const char *name, bool name_allocated)
993
{
994 995
	struct rb_root *root = dso->root;

996 997
	if (name == NULL)
		return;
998 999

	if (dso->long_name_allocated)
1000
		free((char *)dso->long_name);
1001

1002 1003 1004 1005 1006 1007 1008 1009 1010 1011
	if (root) {
		rb_erase(&dso->rb_node, root);
		/*
		 * __dso__findlink_by_longname() isn't guaranteed to add it
		 * back, so a clean removal is required here.
		 */
		RB_CLEAR_NODE(&dso->rb_node);
		dso->root = NULL;
	}

1012 1013 1014
	dso->long_name		 = name;
	dso->long_name_len	 = strlen(name);
	dso->long_name_allocated = name_allocated;
1015 1016 1017

	if (root)
		__dso__findlink_by_longname(root, dso, NULL);
1018 1019
}

1020
void dso__set_short_name(struct dso *dso, const char *name, bool name_allocated)
1021 1022 1023
{
	if (name == NULL)
		return;
1024 1025 1026 1027 1028 1029 1030

	if (dso->short_name_allocated)
		free((char *)dso->short_name);

	dso->short_name		  = name;
	dso->short_name_len	  = strlen(name);
	dso->short_name_allocated = name_allocated;
1031 1032 1033 1034
}

static void dso__set_basename(struct dso *dso)
{
1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 1052 1053 1054 1055 1056
       /*
        * basename() may modify path buffer, so we must pass
        * a copy.
        */
       char *base, *lname = strdup(dso->long_name);

       if (!lname)
               return;

       /*
        * basename() may return a pointer to internal
        * storage which is reused in subsequent calls
        * so copy the result.
        */
       base = strdup(basename(lname));

       free(lname);

       if (!base)
               return;

       dso__set_short_name(dso, base, true);
1057 1058 1059 1060 1061 1062
}

int dso__name_len(const struct dso *dso)
{
	if (!dso)
		return strlen("[unknown]");
1063
	if (verbose > 0)
1064 1065 1066 1067 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090
		return dso->long_name_len;

	return dso->short_name_len;
}

bool dso__loaded(const struct dso *dso, enum map_type type)
{
	return dso->loaded & (1 << type);
}

bool dso__sorted_by_name(const struct dso *dso, enum map_type type)
{
	return dso->sorted_by_name & (1 << type);
}

void dso__set_sorted_by_name(struct dso *dso, enum map_type type)
{
	dso->sorted_by_name |= (1 << type);
}

struct dso *dso__new(const char *name)
{
	struct dso *dso = calloc(1, sizeof(*dso) + strlen(name) + 1);

	if (dso != NULL) {
		int i;
		strcpy(dso->name, name);
1091
		dso__set_long_name(dso, dso->name, false);
1092
		dso__set_short_name(dso, dso->name, false);
1093 1094
		for (i = 0; i < MAP__NR_TYPES; ++i)
			dso->symbols[i] = dso->symbol_names[i] = RB_ROOT;
1095
		dso->data.cache = RB_ROOT;
1096
		dso->data.fd = -1;
1097
		dso->data.status = DSO_DATA_STATUS_UNKNOWN;
1098
		dso->symtab_type = DSO_BINARY_TYPE__NOT_FOUND;
1099
		dso->binary_type = DSO_BINARY_TYPE__NOT_FOUND;
1100
		dso->is_64_bit = (sizeof(void *) == 8);
1101
		dso->loaded = 0;
1102
		dso->rel = 0;
1103 1104
		dso->sorted_by_name = 0;
		dso->has_build_id = 0;
1105
		dso->has_srcline = 1;
1106
		dso->a2l_fails = 1;
1107 1108
		dso->kernel = DSO_TYPE_USER;
		dso->needs_swap = DSO_SWAP__UNSET;
1109
		RB_CLEAR_NODE(&dso->rb_node);
1110
		dso->root = NULL;
1111
		INIT_LIST_HEAD(&dso->node);
1112
		INIT_LIST_HEAD(&dso->data.open_entry);
1113
		pthread_mutex_init(&dso->lock, NULL);
1114
		refcount_set(&dso->refcnt, 1);
1115 1116 1117 1118 1119 1120 1121 1122
	}

	return dso;
}

void dso__delete(struct dso *dso)
{
	int i;
1123 1124 1125 1126

	if (!RB_EMPTY_NODE(&dso->rb_node))
		pr_err("DSO %s is still in rbtree when being deleted!\n",
		       dso->long_name);
1127 1128
	for (i = 0; i < MAP__NR_TYPES; ++i)
		symbols__delete(&dso->symbols[i]);
1129 1130

	if (dso->short_name_allocated) {
1131
		zfree((char **)&dso->short_name);
1132 1133 1134 1135
		dso->short_name_allocated = false;
	}

	if (dso->long_name_allocated) {
1136
		zfree((char **)&dso->long_name);
1137 1138 1139
		dso->long_name_allocated = false;
	}

1140
	dso__data_close(dso);
1141
	auxtrace_cache__free(dso->auxtrace_cache);
1142
	dso_cache__free(dso);
1143
	dso__free_a2l(dso);
1144
	zfree(&dso->symsrc_filename);
1145
	pthread_mutex_destroy(&dso->lock);
1146 1147 1148
	free(dso);
}

1149 1150 1151
struct dso *dso__get(struct dso *dso)
{
	if (dso)
1152
		refcount_inc(&dso->refcnt);
1153 1154 1155 1156 1157
	return dso;
}

void dso__put(struct dso *dso)
{
1158
	if (dso && refcount_dec_and_test(&dso->refcnt))
1159 1160 1161
		dso__delete(dso);
}

1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194 1195 1196 1197 1198 1199 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211
void dso__set_build_id(struct dso *dso, void *build_id)
{
	memcpy(dso->build_id, build_id, sizeof(dso->build_id));
	dso->has_build_id = 1;
}

bool dso__build_id_equal(const struct dso *dso, u8 *build_id)
{
	return memcmp(dso->build_id, build_id, sizeof(dso->build_id)) == 0;
}

void dso__read_running_kernel_build_id(struct dso *dso, struct machine *machine)
{
	char path[PATH_MAX];

	if (machine__is_default_guest(machine))
		return;
	sprintf(path, "%s/sys/kernel/notes", machine->root_dir);
	if (sysfs__read_build_id(path, dso->build_id,
				 sizeof(dso->build_id)) == 0)
		dso->has_build_id = true;
}

int dso__kernel_module_get_build_id(struct dso *dso,
				    const char *root_dir)
{
	char filename[PATH_MAX];
	/*
	 * kernel module short names are of the form "[module]" and
	 * we need just "module" here.
	 */
	const char *name = dso->short_name + 1;

	snprintf(filename, sizeof(filename),
		 "%s/sys/module/%.*s/notes/.note.gnu.build-id",
		 root_dir, (int)strlen(name) - 1, name);

	if (sysfs__read_build_id(filename, dso->build_id,
				 sizeof(dso->build_id)) == 0)
		dso->has_build_id = true;

	return 0;
}

bool __dsos__read_build_ids(struct list_head *head, bool with_hits)
{
	bool have_build_id = false;
	struct dso *pos;

	list_for_each_entry(pos, head, node) {
1212
		if (with_hits && !pos->hit && !dso__is_vdso(pos))
1213 1214 1215 1216 1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227
			continue;
		if (pos->has_build_id) {
			have_build_id = true;
			continue;
		}
		if (filename__read_build_id(pos->long_name, pos->build_id,
					    sizeof(pos->build_id)) > 0) {
			have_build_id	  = true;
			pos->has_build_id = true;
		}
	}

	return have_build_id;
}

1228
void __dsos__add(struct dsos *dsos, struct dso *dso)
1229
{
1230
	list_add_tail(&dso->node, &dsos->head);
1231
	__dso__findlink_by_longname(&dsos->root, dso, NULL);
1232 1233 1234 1235 1236 1237 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252
	/*
	 * It is now in the linked list, grab a reference, then garbage collect
	 * this when needing memory, by looking at LRU dso instances in the
	 * list with atomic_read(&dso->refcnt) == 1, i.e. no references
	 * anywhere besides the one for the list, do, under a lock for the
	 * list: remove it from the list, then a dso__put(), that probably will
	 * be the last and will then call dso__delete(), end of life.
	 *
	 * That, or at the end of the 'struct machine' lifetime, when all
	 * 'struct dso' instances will be removed from the list, in
	 * dsos__exit(), if they have no other reference from some other data
	 * structure.
	 *
	 * E.g.: after processing a 'perf.data' file and storing references
	 * to objects instantiated while processing events, we will have
	 * references to the 'thread', 'map', 'dso' structs all from 'struct
	 * hist_entry' instances, but we may not need anything not referenced,
	 * so we might as well call machines__exit()/machines__delete() and
	 * garbage collect it.
	 */
	dso__get(dso);
1253 1254 1255 1256 1257 1258 1259
}

void dsos__add(struct dsos *dsos, struct dso *dso)
{
	pthread_rwlock_wrlock(&dsos->lock);
	__dsos__add(dsos, dso);
	pthread_rwlock_unlock(&dsos->lock);
1260 1261
}

1262
struct dso *__dsos__find(struct dsos *dsos, const char *name, bool cmp_short)
1263 1264 1265
{
	struct dso *pos;

1266
	if (cmp_short) {
1267
		list_for_each_entry(pos, &dsos->head, node)
1268 1269 1270 1271
			if (strcmp(pos->short_name, name) == 0)
				return pos;
		return NULL;
	}
1272
	return __dso__find_by_longname(&dsos->root, name);
1273 1274
}

1275 1276 1277 1278 1279 1280 1281 1282 1283 1284
struct dso *dsos__find(struct dsos *dsos, const char *name, bool cmp_short)
{
	struct dso *dso;
	pthread_rwlock_rdlock(&dsos->lock);
	dso = __dsos__find(dsos, name, cmp_short);
	pthread_rwlock_unlock(&dsos->lock);
	return dso;
}

struct dso *__dsos__addnew(struct dsos *dsos, const char *name)
1285
{
1286
	struct dso *dso = dso__new(name);
1287

1288
	if (dso != NULL) {
1289
		__dsos__add(dsos, dso);
1290
		dso__set_basename(dso);
1291 1292
		/* Put dso here because __dsos_add already got it */
		dso__put(dso);
1293 1294 1295 1296
	}
	return dso;
}

1297 1298
struct dso *__dsos__findnew(struct dsos *dsos, const char *name)
{
1299 1300 1301 1302
	struct dso *dso = __dsos__find(dsos, name, false);

	return dso ? dso : __dsos__addnew(dsos, name);
}
1303

1304 1305 1306 1307
struct dso *dsos__findnew(struct dsos *dsos, const char *name)
{
	struct dso *dso;
	pthread_rwlock_wrlock(&dsos->lock);
1308
	dso = dso__get(__dsos__findnew(dsos, name));
1309 1310
	pthread_rwlock_unlock(&dsos->lock);
	return dso;
1311 1312
}

1313
size_t __dsos__fprintf_buildid(struct list_head *head, FILE *fp,
1314
			       bool (skip)(struct dso *dso, int parm), int parm)
1315 1316 1317 1318 1319
{
	struct dso *pos;
	size_t ret = 0;

	list_for_each_entry(pos, head, node) {
1320
		if (skip && skip(pos, parm))
1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339 1340 1341 1342 1343
			continue;
		ret += dso__fprintf_buildid(pos, fp);
		ret += fprintf(fp, " %s\n", pos->long_name);
	}
	return ret;
}

size_t __dsos__fprintf(struct list_head *head, FILE *fp)
{
	struct dso *pos;
	size_t ret = 0;

	list_for_each_entry(pos, head, node) {
		int i;
		for (i = 0; i < MAP__NR_TYPES; ++i)
			ret += dso__fprintf(pos, i, fp);
	}

	return ret;
}

size_t dso__fprintf_buildid(struct dso *dso, FILE *fp)
{
1344
	char sbuild_id[SBUILD_ID_SIZE];
1345 1346 1347 1348 1349 1350 1351 1352 1353 1354 1355 1356 1357

	build_id__sprintf(dso->build_id, sizeof(dso->build_id), sbuild_id);
	return fprintf(fp, "%s", sbuild_id);
}

size_t dso__fprintf(struct dso *dso, enum map_type type, FILE *fp)
{
	struct rb_node *nd;
	size_t ret = fprintf(fp, "dso: %s (", dso->short_name);

	if (dso->short_name != dso->long_name)
		ret += fprintf(fp, "%s, ", dso->long_name);
	ret += fprintf(fp, "%s, %sloaded, ", map_type__name[type],
1358
		       dso__loaded(dso, type) ? "" : "NOT ");
1359 1360 1361 1362 1363 1364 1365 1366 1367
	ret += dso__fprintf_buildid(dso, fp);
	ret += fprintf(fp, ")\n");
	for (nd = rb_first(&dso->symbols[type]); nd; nd = rb_next(nd)) {
		struct symbol *pos = rb_entry(nd, struct symbol, rb_node);
		ret += symbol__fprintf(pos, fp);
	}

	return ret;
}
A
Adrian Hunter 已提交
1368 1369 1370 1371

enum dso_type dso__type(struct dso *dso, struct machine *machine)
{
	int fd;
1372
	enum dso_type type = DSO__TYPE_UNKNOWN;
A
Adrian Hunter 已提交
1373

1374 1375 1376 1377 1378
	fd = dso__data_get_fd(dso, machine);
	if (fd >= 0) {
		type = dso__type_fd(fd);
		dso__data_put_fd(dso);
	}
A
Adrian Hunter 已提交
1379

1380
	return type;
A
Adrian Hunter 已提交
1381
}
1382 1383 1384 1385 1386 1387 1388 1389 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399

int dso__strerror_load(struct dso *dso, char *buf, size_t buflen)
{
	int idx, errnum = dso->load_errno;
	/*
	 * This must have a same ordering as the enum dso_load_errno.
	 */
	static const char *dso_load__error_str[] = {
	"Internal tools/perf/ library error",
	"Invalid ELF file",
	"Can not read build id",
	"Mismatching build id",
	"Decompression failure",
	};

	BUG_ON(buflen == 0);

	if (errnum >= 0) {
1400
		const char *err = str_error_r(errnum, buf, buflen);
1401 1402 1403 1404 1405 1406 1407 1408 1409 1410 1411 1412 1413 1414

		if (err != buf)
			scnprintf(buf, buflen, "%s", err);

		return 0;
	}

	if (errnum <  __DSO_LOAD_ERRNO__START || errnum >= __DSO_LOAD_ERRNO__END)
		return -1;

	idx = errnum - __DSO_LOAD_ERRNO__START;
	scnprintf(buf, buflen, "%s", dso_load__error_str[idx]);
	return 0;
}