ds.c 10.8 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113
/*
 * Debug Store support
 *
 * This provides a low-level interface to the hardware's Debug Store
 * feature that is used for last branch recording (LBR) and
 * precise-event based sampling (PEBS).
 *
 * Different architectures use a different DS layout/pointer size.
 * The below functions therefore work on a void*.
 *
 *
 * Since there is no user for PEBS, yet, only LBR (or branch
 * trace store, BTS) is supported.
 *
 *
 * Copyright (C) 2007 Intel Corporation.
 * Markus Metzger <markus.t.metzger@intel.com>, Dec 2007
 */

#include <asm/ds.h>

#include <linux/errno.h>
#include <linux/string.h>
#include <linux/slab.h>


/*
 * Debug Store (DS) save area configuration (see Intel64 and IA32
 * Architectures Software Developer's Manual, section 18.5)
 *
 * The DS configuration consists of the following fields; different
 * architetures vary in the size of those fields.
 * - double-word aligned base linear address of the BTS buffer
 * - write pointer into the BTS buffer
 * - end linear address of the BTS buffer (one byte beyond the end of
 *   the buffer)
 * - interrupt pointer into BTS buffer
 *   (interrupt occurs when write pointer passes interrupt pointer)
 * - double-word aligned base linear address of the PEBS buffer
 * - write pointer into the PEBS buffer
 * - end linear address of the PEBS buffer (one byte beyond the end of
 *   the buffer)
 * - interrupt pointer into PEBS buffer
 *   (interrupt occurs when write pointer passes interrupt pointer)
 * - value to which counter is reset following counter overflow
 *
 * On later architectures, the last branch recording hardware uses
 * 64bit pointers even in 32bit mode.
 *
 *
 * Branch Trace Store (BTS) records store information about control
 * flow changes. They at least provide the following information:
 * - source linear address
 * - destination linear address
 *
 * Netburst supported a predicated bit that had been dropped in later
 * architectures. We do not suppor it.
 *
 *
 * In order to abstract from the actual DS and BTS layout, we describe
 * the access to the relevant fields.
 * Thanks to Andi Kleen for proposing this design.
 *
 * The implementation, however, is not as general as it might seem. In
 * order to stay somewhat simple and efficient, we assume an
 * underlying unsigned type (mostly a pointer type) and we expect the
 * field to be at least as big as that type.
 */

/*
 * A special from_ip address to indicate that the BTS record is an
 * info record that needs to be interpreted or skipped.
 */
#define BTS_ESCAPE_ADDRESS (-1)

/*
 * A field access descriptor
 */
struct access_desc {
	unsigned char offset;
	unsigned char size;
};

/*
 * The configuration for a particular DS/BTS hardware implementation.
 */
struct ds_configuration {
	/* the DS configuration */
	unsigned char  sizeof_ds;
	struct access_desc bts_buffer_base;
	struct access_desc bts_index;
	struct access_desc bts_absolute_maximum;
	struct access_desc bts_interrupt_threshold;
	/* the BTS configuration */
	unsigned char  sizeof_bts;
	struct access_desc from_ip;
	struct access_desc to_ip;
	/* BTS variants used to store additional information like
	   timestamps */
	struct access_desc info_type;
	struct access_desc info_data;
	unsigned long debugctl_mask;
};

/*
 * The global configuration used by the below accessor functions
 */
static struct ds_configuration ds_cfg;

/*
 * Accessor functions for some DS and BTS fields using the above
 * global ptrace_bts_cfg.
 */
114
static inline unsigned long get_bts_buffer_base(char *base)
115
{
116
	return *(unsigned long *)(base + ds_cfg.bts_buffer_base.offset);
117
}
118
static inline void set_bts_buffer_base(char *base, unsigned long value)
119
{
120
	(*(unsigned long *)(base + ds_cfg.bts_buffer_base.offset)) = value;
121
}
122
static inline unsigned long get_bts_index(char *base)
123
{
124
	return *(unsigned long *)(base + ds_cfg.bts_index.offset);
125
}
126
static inline void set_bts_index(char *base, unsigned long value)
127
{
128
	(*(unsigned long *)(base + ds_cfg.bts_index.offset)) = value;
129
}
130
static inline unsigned long get_bts_absolute_maximum(char *base)
131
{
132
	return *(unsigned long *)(base + ds_cfg.bts_absolute_maximum.offset);
133
}
134
static inline void set_bts_absolute_maximum(char *base, unsigned long value)
135
{
136
	(*(unsigned long *)(base + ds_cfg.bts_absolute_maximum.offset)) = value;
137
}
138
static inline unsigned long get_bts_interrupt_threshold(char *base)
139
{
140
	return *(unsigned long *)(base + ds_cfg.bts_interrupt_threshold.offset);
141
}
142
static inline void set_bts_interrupt_threshold(char *base, unsigned long value)
143
{
144
	(*(unsigned long *)(base + ds_cfg.bts_interrupt_threshold.offset)) = value;
145
}
146
static inline unsigned long get_from_ip(char *base)
147
{
148
	return *(unsigned long *)(base + ds_cfg.from_ip.offset);
149
}
150
static inline void set_from_ip(char *base, unsigned long value)
151
{
152
	(*(unsigned long *)(base + ds_cfg.from_ip.offset)) = value;
153
}
154
static inline unsigned long get_to_ip(char *base)
155
{
156
	return *(unsigned long *)(base + ds_cfg.to_ip.offset);
157
}
158
static inline void set_to_ip(char *base, unsigned long value)
159
{
160
	(*(unsigned long *)(base + ds_cfg.to_ip.offset)) = value;
161 162 163 164 165 166 167 168 169
}
static inline unsigned char get_info_type(char *base)
{
	return *(unsigned char *)(base + ds_cfg.info_type.offset);
}
static inline void set_info_type(char *base, unsigned char value)
{
	(*(unsigned char *)(base + ds_cfg.info_type.offset)) = value;
}
170
static inline unsigned long get_info_data(char *base)
171
{
172
	return *(unsigned long *)(base + ds_cfg.info_data.offset);
173
}
174
static inline void set_info_data(char *base, unsigned long value)
175
{
176
	(*(unsigned long *)(base + ds_cfg.info_data.offset)) = value;
177 178 179
}


M
Markus Metzger 已提交
180
int ds_allocate(void **dsp, size_t bts_size_in_bytes)
181
{
M
Markus Metzger 已提交
182
	size_t bts_size_in_records;
183
	unsigned long bts;
M
Markus Metzger 已提交
184
	void *ds;
185 186 187 188

	if (!ds_cfg.sizeof_ds || !ds_cfg.sizeof_bts)
		return -EOPNOTSUPP;

M
Markus Metzger 已提交
189
	if (bts_size_in_bytes < 0)
190 191
		return -EINVAL;

M
Markus Metzger 已提交
192 193
	bts_size_in_records =
		bts_size_in_bytes / ds_cfg.sizeof_bts;
194 195 196 197 198 199
	bts_size_in_bytes =
		bts_size_in_records * ds_cfg.sizeof_bts;

	if (bts_size_in_bytes <= 0)
		return -EINVAL;

200
	bts = (unsigned long)kzalloc(bts_size_in_bytes, GFP_KERNEL);
201 202 203 204 205 206 207

	if (!bts)
		return -ENOMEM;

	ds = kzalloc(ds_cfg.sizeof_ds, GFP_KERNEL);

	if (!ds) {
208
		kfree((void *)bts);
209 210 211 212 213 214 215 216 217 218 219 220 221 222
		return -ENOMEM;
	}

	set_bts_buffer_base(ds, bts);
	set_bts_index(ds, bts);
	set_bts_absolute_maximum(ds, bts + bts_size_in_bytes);
	set_bts_interrupt_threshold(ds, bts + bts_size_in_bytes + 1);

	*dsp = ds;
	return 0;
}

int ds_free(void **dsp)
{
223
	if (*dsp) {
224
		kfree((void *)get_bts_buffer_base(*dsp));
225 226 227
		kfree(*dsp);
		*dsp = NULL;
	}
228 229 230 231 232
	return 0;
}

int ds_get_bts_size(void *ds)
{
233
	int size_in_bytes;
234 235 236 237

	if (!ds_cfg.sizeof_ds || !ds_cfg.sizeof_bts)
		return -EOPNOTSUPP;

M
Markus Metzger 已提交
238 239 240
	if (!ds)
		return 0;

241 242 243
	size_in_bytes =
		get_bts_absolute_maximum(ds) -
		get_bts_buffer_base(ds);
M
Markus Metzger 已提交
244 245 246 247 248
	return size_in_bytes;
}

int ds_get_bts_end(void *ds)
{
249
	int size_in_bytes = ds_get_bts_size(ds);
M
Markus Metzger 已提交
250 251 252

	if (size_in_bytes <= 0)
		return size_in_bytes;
253 254 255 256 257 258

	return size_in_bytes / ds_cfg.sizeof_bts;
}

int ds_get_bts_index(void *ds)
{
259
	int index_offset_in_bytes;
260 261 262 263 264 265 266 267 268 269 270

	if (!ds_cfg.sizeof_ds || !ds_cfg.sizeof_bts)
		return -EOPNOTSUPP;

	index_offset_in_bytes =
		get_bts_index(ds) -
		get_bts_buffer_base(ds);

	return index_offset_in_bytes / ds_cfg.sizeof_bts;
}

M
Markus Metzger 已提交
271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290
int ds_set_overflow(void *ds, int method)
{
	switch (method) {
	case DS_O_SIGNAL:
		return -EOPNOTSUPP;
	case DS_O_WRAP:
		return 0;
	default:
		return -EINVAL;
	}
}

int ds_get_overflow(void *ds)
{
	return DS_O_WRAP;
}

int ds_clear(void *ds)
{
	int bts_size = ds_get_bts_size(ds);
291
	unsigned long bts_base;
M
Markus Metzger 已提交
292 293 294 295 296

	if (bts_size <= 0)
		return bts_size;

	bts_base = get_bts_buffer_base(ds);
297
	memset((void *)bts_base, 0, bts_size);
M
Markus Metzger 已提交
298 299 300 301 302

	set_bts_index(ds, bts_base);
	return 0;
}

303
int ds_read_bts(void *ds, int index, struct bts_struct *out)
304 305 306 307 308 309 310 311 312 313 314 315
{
	void *bts;

	if (!ds_cfg.sizeof_ds || !ds_cfg.sizeof_bts)
		return -EOPNOTSUPP;

	if (index < 0)
		return -EINVAL;

	if (index >= ds_get_bts_size(ds))
		return -EINVAL;

316
	bts = (void *)(get_bts_buffer_base(ds) + (index * ds_cfg.sizeof_bts));
317 318 319

	memset(out, 0, sizeof(*out));
	if (get_from_ip(bts) == BTS_ESCAPE_ADDRESS) {
320 321
		out->qualifier       = get_info_type(bts);
		out->variant.jiffies = get_info_data(bts);
322 323 324 325 326 327
	} else {
		out->qualifier = BTS_BRANCH;
		out->variant.lbr.from_ip = get_from_ip(bts);
		out->variant.lbr.to_ip   = get_to_ip(bts);
	}

328
	return sizeof(*out);;
329 330 331 332
}

int ds_write_bts(void *ds, const struct bts_struct *in)
{
333
	unsigned long bts;
334 335 336 337 338 339 340 341 342

	if (!ds_cfg.sizeof_ds || !ds_cfg.sizeof_bts)
		return -EOPNOTSUPP;

	if (ds_get_bts_size(ds) <= 0)
		return -ENXIO;

	bts = get_bts_index(ds);

343
	memset((void *)bts, 0, ds_cfg.sizeof_bts);
344 345 346 347 348
	switch (in->qualifier) {
	case BTS_INVALID:
		break;

	case BTS_BRANCH:
349 350
		set_from_ip((void *)bts, in->variant.lbr.from_ip);
		set_to_ip((void *)bts, in->variant.lbr.to_ip);
351 352 353 354
		break;

	case BTS_TASK_ARRIVES:
	case BTS_TASK_DEPARTS:
355 356 357
		set_from_ip((void *)bts, BTS_ESCAPE_ADDRESS);
		set_info_type((void *)bts, in->qualifier);
		set_info_data((void *)bts, in->variant.jiffies);
358 359 360 361 362 363
		break;

	default:
		return -EINVAL;
	}

364
	bts = bts + ds_cfg.sizeof_bts;
365 366 367 368
	if (bts >= get_bts_absolute_maximum(ds))
		bts = get_bts_buffer_base(ds);
	set_bts_index(ds, bts);

369
	return ds_cfg.sizeof_bts;
370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387
}

unsigned long ds_debugctl_mask(void)
{
	return ds_cfg.debugctl_mask;
}

#ifdef __i386__
static const struct ds_configuration ds_cfg_netburst = {
	.sizeof_ds = 9 * 4,
	.bts_buffer_base = { 0, 4 },
	.bts_index = { 4, 4 },
	.bts_absolute_maximum = { 8, 4 },
	.bts_interrupt_threshold = { 12, 4 },
	.sizeof_bts = 3 * 4,
	.from_ip = { 0, 4 },
	.to_ip = { 4, 4 },
	.info_type = { 4, 1 },
388
	.info_data = { 8, 4 },
389 390 391 392 393 394 395 396 397 398 399 400 401
	.debugctl_mask = (1<<2)|(1<<3)
};

static const struct ds_configuration ds_cfg_pentium_m = {
	.sizeof_ds = 9 * 4,
	.bts_buffer_base = { 0, 4 },
	.bts_index = { 4, 4 },
	.bts_absolute_maximum = { 8, 4 },
	.bts_interrupt_threshold = { 12, 4 },
	.sizeof_bts = 3 * 4,
	.from_ip = { 0, 4 },
	.to_ip = { 4, 4 },
	.info_type = { 4, 1 },
402
	.info_data = { 8, 4 },
403 404 405 406 407 408 409 410 411 412 413 414 415 416
	.debugctl_mask = (1<<6)|(1<<7)
};
#endif /* _i386_ */

static const struct ds_configuration ds_cfg_core2 = {
	.sizeof_ds = 9 * 8,
	.bts_buffer_base = { 0, 8 },
	.bts_index = { 8, 8 },
	.bts_absolute_maximum = { 16, 8 },
	.bts_interrupt_threshold = { 24, 8 },
	.sizeof_bts = 3 * 8,
	.from_ip = { 0, 8 },
	.to_ip = { 8, 8 },
	.info_type = { 8, 1 },
417
	.info_data = { 16, 8 },
418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464
	.debugctl_mask = (1<<6)|(1<<7)|(1<<9)
};

static inline void
ds_configure(const struct ds_configuration *cfg)
{
	ds_cfg = *cfg;
}

void __cpuinit ds_init_intel(struct cpuinfo_x86 *c)
{
	switch (c->x86) {
	case 0x6:
		switch (c->x86_model) {
#ifdef __i386__
		case 0xD:
		case 0xE: /* Pentium M */
			ds_configure(&ds_cfg_pentium_m);
			break;
#endif /* _i386_ */
		case 0xF: /* Core2 */
			ds_configure(&ds_cfg_core2);
			break;
		default:
			/* sorry, don't know about them */
			break;
		}
		break;
	case 0xF:
		switch (c->x86_model) {
#ifdef __i386__
		case 0x0:
		case 0x1:
		case 0x2: /* Netburst */
			ds_configure(&ds_cfg_netburst);
			break;
#endif /* _i386_ */
		default:
			/* sorry, don't know about them */
			break;
		}
		break;
	default:
		/* sorry, don't know about them */
		break;
	}
}