desc.h 12.4 KB
Newer Older
H
H. Peter Anvin 已提交
1 2
#ifndef _ASM_X86_DESC_H
#define _ASM_X86_DESC_H
3 4 5

#include <asm/desc_defs.h>
#include <asm/ldt.h>
6
#include <asm/mmu.h>
I
Ingo Molnar 已提交
7

8
#include <linux/smp.h>
9
#include <linux/percpu.h>
10

I
Ingo Molnar 已提交
11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29
static inline void fill_ldt(struct desc_struct *desc, const struct user_desc *info)
{
	desc->limit0		= info->limit & 0x0ffff;

	desc->base0		= (info->base_addr & 0x0000ffff);
	desc->base1		= (info->base_addr & 0x00ff0000) >> 16;

	desc->type		= (info->read_exec_only ^ 1) << 1;
	desc->type	       |= info->contents << 2;

	desc->s			= 1;
	desc->dpl		= 0x3;
	desc->p			= info->seg_not_present ^ 1;
	desc->limit		= (info->limit & 0xf0000) >> 16;
	desc->avl		= info->useable;
	desc->d			= info->seg_32bit;
	desc->g			= info->limit_in_pages;

	desc->base2		= (info->base_addr & 0xff000000) >> 24;
30
	/*
31 32
	 * Don't allow setting of the lm bit. It would confuse
	 * user_64bit_mode and would get overridden by sysret anyway.
33
	 */
I
Ingo Molnar 已提交
34
	desc->l			= 0;
35 36
}

37 38
extern struct desc_ptr idt_descr;
extern gate_desc idt_table[];
39 40
extern struct desc_ptr debug_idt_descr;
extern gate_desc debug_idt_table[];
41

42 43 44
struct gdt_page {
	struct desc_struct gdt[GDT_ENTRIES];
} __attribute__((aligned(PAGE_SIZE)));
I
Ingo Molnar 已提交
45

46
DECLARE_PER_CPU_PAGE_ALIGNED(struct gdt_page, gdt_page);
47 48 49 50 51 52

static inline struct desc_struct *get_cpu_gdt_table(unsigned int cpu)
{
	return per_cpu(gdt_page, cpu).gdt;
}

53
#ifdef CONFIG_X86_64
54 55 56 57

static inline void pack_gate(gate_desc *gate, unsigned type, unsigned long func,
			     unsigned dpl, unsigned ist, unsigned seg)
{
I
Ingo Molnar 已提交
58 59 60 61 62 63 64 65 66 67
	gate->offset_low	= PTR_LOW(func);
	gate->segment		= __KERNEL_CS;
	gate->ist		= ist;
	gate->p			= 1;
	gate->dpl		= dpl;
	gate->zero0		= 0;
	gate->zero1		= 0;
	gate->type		= type;
	gate->offset_middle	= PTR_MIDDLE(func);
	gate->offset_high	= PTR_HIGH(func);
68 69
}

70
#else
71
static inline void pack_gate(gate_desc *gate, unsigned char type,
72 73
			     unsigned long base, unsigned dpl, unsigned flags,
			     unsigned short seg)
74 75
{
	gate->a = (seg << 16) | (base & 0xffff);
I
Ingo Molnar 已提交
76
	gate->b = (base & 0xffff0000) | (((0x80 | type | (dpl << 5)) & 0xff) << 8);
77 78
}

79 80
#endif

81 82 83
static inline int desc_empty(const void *ptr)
{
	const u32 *desc = ptr;
I
Ingo Molnar 已提交
84

85 86 87
	return !(desc[0] | desc[1]);
}

88 89 90
#ifdef CONFIG_PARAVIRT
#include <asm/paravirt.h>
#else
I
Ingo Molnar 已提交
91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106
#define load_TR_desc()				native_load_tr_desc()
#define load_gdt(dtr)				native_load_gdt(dtr)
#define load_idt(dtr)				native_load_idt(dtr)
#define load_tr(tr)				asm volatile("ltr %0"::"m" (tr))
#define load_ldt(ldt)				asm volatile("lldt %0"::"m" (ldt))

#define store_gdt(dtr)				native_store_gdt(dtr)
#define store_idt(dtr)				native_store_idt(dtr)
#define store_tr(tr)				(tr = native_store_tr())

#define load_TLS(t, cpu)			native_load_tls(t, cpu)
#define set_ldt					native_set_ldt

#define write_ldt_entry(dt, entry, desc)	native_write_ldt_entry(dt, entry, desc)
#define write_gdt_entry(dt, entry, desc, type)	native_write_gdt_entry(dt, entry, desc, type)
#define write_idt_entry(dt, entry, g)		native_write_idt_entry(dt, entry, g)
107 108 109 110 111 112 113 114 115

static inline void paravirt_alloc_ldt(struct desc_struct *ldt, unsigned entries)
{
}

static inline void paravirt_free_ldt(struct desc_struct *ldt, unsigned entries)
{
}
#endif	/* CONFIG_PARAVIRT */
116

117 118
#define store_ldt(ldt) asm("sldt %0" : "=m"(ldt))

I
Ingo Molnar 已提交
119
static inline void native_write_idt_entry(gate_desc *idt, int entry, const gate_desc *gate)
120 121 122 123
{
	memcpy(&idt[entry], gate, sizeof(*gate));
}

I
Ingo Molnar 已提交
124
static inline void native_write_ldt_entry(struct desc_struct *ldt, int entry, const void *desc)
125 126 127 128
{
	memcpy(&ldt[entry], desc, 8);
}

I
Ingo Molnar 已提交
129 130
static inline void
native_write_gdt_entry(struct desc_struct *gdt, int entry, const void *desc, int type)
131 132
{
	unsigned int size;
I
Ingo Molnar 已提交
133

134
	switch (type) {
I
Ingo Molnar 已提交
135 136 137
	case DESC_TSS:	size = sizeof(tss_desc);	break;
	case DESC_LDT:	size = sizeof(ldt_desc);	break;
	default:	size = sizeof(*gdt);		break;
138
	}
I
Ingo Molnar 已提交
139

140 141 142 143 144 145 146 147 148
	memcpy(&gdt[entry], desc, size);
}

static inline void pack_descriptor(struct desc_struct *desc, unsigned long base,
				   unsigned long limit, unsigned char type,
				   unsigned char flags)
{
	desc->a = ((base & 0xffff) << 16) | (limit & 0xffff);
	desc->b = (base & 0xff000000) | ((base & 0xff0000) >> 16) |
149 150
		(limit & 0x000f0000) | ((type & 0xff) << 8) |
		((flags & 0xf) << 20);
151 152 153 154
	desc->p = 1;
}


I
Ingo Molnar 已提交
155
static inline void set_tssldt_descriptor(void *d, unsigned long addr, unsigned type, unsigned size)
156 157
{
#ifdef CONFIG_X86_64
158
	struct ldttss_desc64 *desc = d;
I
Ingo Molnar 已提交
159

160
	memset(desc, 0, sizeof(*desc));
I
Ingo Molnar 已提交
161 162 163 164 165 166 167 168 169

	desc->limit0		= size & 0xFFFF;
	desc->base0		= PTR_LOW(addr);
	desc->base1		= PTR_MIDDLE(addr) & 0xFF;
	desc->type		= type;
	desc->p			= 1;
	desc->limit1		= (size >> 16) & 0xF;
	desc->base2		= (PTR_MIDDLE(addr) >> 8) & 0xFF;
	desc->base3		= PTR_HIGH(addr);
170
#else
171
	pack_descriptor((struct desc_struct *)d, addr, size, 0x80 | type, 0);
172 173 174 175 176 177 178 179 180 181 182 183 184 185 186
#endif
}

static inline void __set_tss_desc(unsigned cpu, unsigned int entry, void *addr)
{
	struct desc_struct *d = get_cpu_gdt_table(cpu);
	tss_desc tss;

	/*
	 * sizeof(unsigned long) coming from an extra "long" at the end
	 * of the iobitmap. See tss_struct definition in processor.h
	 *
	 * -1? seg base+limit should be pointing to the address of the
	 * last valid byte
	 */
187
	set_tssldt_descriptor(&tss, (unsigned long)addr, DESC_TSS,
188 189
			      IO_BITMAP_OFFSET + IO_BITMAP_BYTES +
			      sizeof(unsigned long) - 1);
190 191 192 193 194
	write_gdt_entry(d, entry, &tss, DESC_TSS);
}

#define set_tss_desc(cpu, addr) __set_tss_desc(cpu, GDT_ENTRY_TSS, addr)

195 196 197
static inline void native_set_ldt(const void *addr, unsigned int entries)
{
	if (likely(entries == 0))
198
		asm volatile("lldt %w0"::"q" (0));
199 200 201 202
	else {
		unsigned cpu = smp_processor_id();
		ldt_desc ldt;

M
Michael Karcher 已提交
203 204
		set_tssldt_descriptor(&ldt, (unsigned long)addr, DESC_LDT,
				      entries * LDT_ENTRY_SIZE - 1);
205 206
		write_gdt_entry(get_cpu_gdt_table(cpu), GDT_ENTRY_LDT,
				&ldt, DESC_LDT);
207
		asm volatile("lldt %w0"::"q" (GDT_ENTRY_LDT*8));
208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238
	}
}

static inline void native_load_tr_desc(void)
{
	asm volatile("ltr %w0"::"q" (GDT_ENTRY_TSS*8));
}

static inline void native_load_gdt(const struct desc_ptr *dtr)
{
	asm volatile("lgdt %0"::"m" (*dtr));
}

static inline void native_load_idt(const struct desc_ptr *dtr)
{
	asm volatile("lidt %0"::"m" (*dtr));
}

static inline void native_store_gdt(struct desc_ptr *dtr)
{
	asm volatile("sgdt %0":"=m" (*dtr));
}

static inline void native_store_idt(struct desc_ptr *dtr)
{
	asm volatile("sidt %0":"=m" (*dtr));
}

static inline unsigned long native_store_tr(void)
{
	unsigned long tr;
I
Ingo Molnar 已提交
239

240
	asm volatile("str %0":"=r" (tr));
I
Ingo Molnar 已提交
241

242 243 244 245 246 247
	return tr;
}

static inline void native_load_tls(struct thread_struct *t, unsigned int cpu)
{
	struct desc_struct *gdt = get_cpu_gdt_table(cpu);
I
Ingo Molnar 已提交
248
	unsigned int i;
249 250 251 252 253

	for (i = 0; i < GDT_ENTRY_TLS_ENTRIES; i++)
		gdt[GDT_ENTRY_TLS_MIN + i] = t->tls_array[i];
}

254 255 256 257 258 259 260 261 262
#define _LDT_empty(info)				\
	((info)->base_addr		== 0	&&	\
	 (info)->limit			== 0	&&	\
	 (info)->contents		== 0	&&	\
	 (info)->read_exec_only		== 1	&&	\
	 (info)->seg_32bit		== 0	&&	\
	 (info)->limit_in_pages		== 0	&&	\
	 (info)->seg_not_present	== 1	&&	\
	 (info)->useable		== 0)
263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289

#ifdef CONFIG_X86_64
#define LDT_empty(info) (_LDT_empty(info) && ((info)->lm == 0))
#else
#define LDT_empty(info) (_LDT_empty(info))
#endif

static inline void clear_LDT(void)
{
	set_ldt(NULL, 0);
}

/*
 * load one particular LDT into the current CPU
 */
static inline void load_LDT_nolock(mm_context_t *pc)
{
	set_ldt(pc->ldt, pc->size);
}

static inline void load_LDT(mm_context_t *pc)
{
	preempt_disable();
	load_LDT_nolock(pc);
	preempt_enable();
}

290
static inline unsigned long get_desc_base(const struct desc_struct *desc)
291
{
292
	return (unsigned)(desc->base0 | ((desc->base1) << 16) | ((desc->base2) << 24));
293
}
294

295 296 297 298 299 300 301
static inline void set_desc_base(struct desc_struct *desc, unsigned long base)
{
	desc->base0 = base & 0xffff;
	desc->base1 = (base >> 16) & 0xff;
	desc->base2 = (base >> 24) & 0xff;
}

302 303 304 305 306
static inline unsigned long get_desc_limit(const struct desc_struct *desc)
{
	return desc->limit0 | (desc->limit << 16);
}

307 308 309 310 311 312
static inline void set_desc_limit(struct desc_struct *desc, unsigned long limit)
{
	desc->limit0 = limit & 0xffff;
	desc->limit = (limit >> 16) & 0xf;
}

313 314 315 316 317 318
#ifdef CONFIG_X86_64
static inline void set_nmi_gate(int gate, void *addr)
{
	gate_desc s;

	pack_gate(&s, GATE_INTERRUPT, (unsigned long)addr, 0, 0, __KERNEL_CS);
319
	write_idt_entry(debug_idt_table, gate, &s);
320 321 322
}
#endif

323 324 325 326 327 328 329 330 331 332 333 334 335
#ifdef CONFIG_TRACING
extern struct desc_ptr trace_idt_descr;
extern gate_desc trace_idt_table[];
static inline void write_trace_idt_entry(int entry, const gate_desc *gate)
{
	write_idt_entry(trace_idt_table, entry, gate);
}
#else
static inline void write_trace_idt_entry(int entry, const gate_desc *gate)
{
}
#endif

336
static inline void _set_gate(int gate, unsigned type, void *addr,
337
			     unsigned dpl, unsigned ist, unsigned seg)
338 339
{
	gate_desc s;
I
Ingo Molnar 已提交
340

341 342 343 344 345 346
	pack_gate(&s, type, (unsigned long)addr, dpl, ist, seg);
	/*
	 * does not need to be atomic because it is only done once at
	 * setup time
	 */
	write_idt_entry(idt_table, gate, &s);
347
	write_trace_idt_entry(gate, &s);
348 349 350 351 352 353 354 355 356 357 358 359 360 361
}

/*
 * This needs to use 'idt_table' rather than 'idt', and
 * thus use the _nonmapped_ version of the IDT, as the
 * Pentium F0 0F bugfix can have resulted in the mapped
 * IDT being write-protected.
 */
static inline void set_intr_gate(unsigned int n, void *addr)
{
	BUG_ON((unsigned)n > 0xFF);
	_set_gate(n, GATE_INTERRUPT, addr, 0, 0, __KERNEL_CS);
}

362
extern int first_system_vector;
363 364
/* used_vectors is BITMAP for irq is not managed by percpu vector_irq */
extern unsigned long used_vectors[];
365 366 367

static inline void alloc_system_vector(int vector)
{
368 369
	if (!test_bit(vector, used_vectors)) {
		set_bit(vector, used_vectors);
370 371
		if (first_system_vector > vector)
			first_system_vector = vector;
I
Ingo Molnar 已提交
372
	} else {
373
		BUG();
I
Ingo Molnar 已提交
374
	}
375 376
}

377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398
#ifdef CONFIG_TRACING
static inline void trace_set_intr_gate(unsigned int gate, void *addr)
{
	gate_desc s;

	pack_gate(&s, GATE_INTERRUPT, (unsigned long)addr, 0, 0, __KERNEL_CS);
	write_idt_entry(trace_idt_table, gate, &s);
}

static inline void __trace_alloc_intr_gate(unsigned int n, void *addr)
{
	trace_set_intr_gate(n, addr);
}
#else
static inline void trace_set_intr_gate(unsigned int gate, void *addr)
{
}

#define __trace_alloc_intr_gate(n, addr)
#endif

static inline void __alloc_intr_gate(unsigned int n, void *addr)
399 400 401 402
{
	set_intr_gate(n, addr);
}

403 404 405 406 407 408 409
#define alloc_intr_gate(n, addr)				\
	do {							\
		alloc_system_vector(n);				\
		__alloc_intr_gate(n, addr);			\
		__trace_alloc_intr_gate(n, trace_##addr);	\
	} while (0)

410 411 412 413 414 415 416 417 418
/*
 * This routine sets up an interrupt gate at directory privilege level 3.
 */
static inline void set_system_intr_gate(unsigned int n, void *addr)
{
	BUG_ON((unsigned)n > 0xFF);
	_set_gate(n, GATE_INTERRUPT, addr, 0x3, 0, __KERNEL_CS);
}

419
static inline void set_system_trap_gate(unsigned int n, void *addr)
420 421
{
	BUG_ON((unsigned)n > 0xFF);
422
	_set_gate(n, GATE_TRAP, addr, 0x3, 0, __KERNEL_CS);
423 424
}

425
static inline void set_trap_gate(unsigned int n, void *addr)
426 427
{
	BUG_ON((unsigned)n > 0xFF);
428
	_set_gate(n, GATE_TRAP, addr, 0, 0, __KERNEL_CS);
429 430 431 432 433 434 435 436 437 438 439 440 441 442
}

static inline void set_task_gate(unsigned int n, unsigned int gdt_entry)
{
	BUG_ON((unsigned)n > 0xFF);
	_set_gate(n, GATE_TASK, (void *)0, 0, 0, (gdt_entry<<3));
}

static inline void set_intr_gate_ist(int n, void *addr, unsigned ist)
{
	BUG_ON((unsigned)n > 0xFF);
	_set_gate(n, GATE_INTERRUPT, addr, 0, ist, __KERNEL_CS);
}

443
static inline void set_system_intr_gate_ist(int n, void *addr, unsigned ist)
444 445 446 447
{
	BUG_ON((unsigned)n > 0xFF);
	_set_gate(n, GATE_INTERRUPT, addr, 0x3, ist, __KERNEL_CS);
}
448

449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473
#ifdef CONFIG_X86_64
DECLARE_PER_CPU(u32, debug_idt_ctr);
static inline bool is_debug_idt_enabled(void)
{
	if (this_cpu_read(debug_idt_ctr))
		return true;

	return false;
}

static inline void load_debug_idt(void)
{
	load_idt((const struct desc_ptr *)&debug_idt_descr);
}
#else
static inline bool is_debug_idt_enabled(void)
{
	return false;
}

static inline void load_debug_idt(void)
{
}
#endif

474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498
#ifdef CONFIG_TRACING
extern atomic_t trace_idt_ctr;
static inline bool is_trace_idt_enabled(void)
{
	if (atomic_read(&trace_idt_ctr))
		return true;

	return false;
}

static inline void load_trace_idt(void)
{
	load_idt((const struct desc_ptr *)&trace_idt_descr);
}
#else
static inline bool is_trace_idt_enabled(void)
{
	return false;
}

static inline void load_trace_idt(void)
{
}
#endif

499
/*
500
 * The load_current_idt() must be called with interrupts disabled
501
 * to avoid races. That way the IDT will always be set back to the expected
502 503 504
 * descriptor. It's also called when a CPU is being initialized, and
 * that doesn't need to disable interrupts, as nothing should be
 * bothering the CPU then.
505 506 507 508 509
 */
static inline void load_current_idt(void)
{
	if (is_debug_idt_enabled())
		load_debug_idt();
510 511
	else if (is_trace_idt_enabled())
		load_trace_idt();
512 513 514
	else
		load_idt((const struct desc_ptr *)&idt_descr);
}
H
H. Peter Anvin 已提交
515
#endif /* _ASM_X86_DESC_H */