thread_info.h 9.1 KB
Newer Older
C
Christoph Lameter 已提交
1 2 3 4 5 6
/* thread_info.h: low-level thread information
 *
 * Copyright (C) 2002  David Howells (dhowells@redhat.com)
 * - Incorporating suggestions made by Linus Torvalds and Dave Miller
 */

H
H. Peter Anvin 已提交
7 8
#ifndef _ASM_X86_THREAD_INFO_H
#define _ASM_X86_THREAD_INFO_H
C
Christoph Lameter 已提交
9 10 11

#include <linux/compiler.h>
#include <asm/page.h>
12
#include <asm/percpu.h>
13 14
#include <asm/types.h>

15 16 17 18 19 20 21 22 23 24 25 26 27 28 29
/*
 * TOP_OF_KERNEL_STACK_PADDING is a number of unused bytes that we
 * reserve at the top of the kernel stack.  We do it because of a nasty
 * 32-bit corner case.  On x86_32, the hardware stack frame is
 * variable-length.  Except for vm86 mode, struct pt_regs assumes a
 * maximum-length frame.  If we enter from CPL 0, the top 8 bytes of
 * pt_regs don't actually exist.  Ordinarily this doesn't matter, but it
 * does in at least one case:
 *
 * If we take an NMI early enough in SYSENTER, then we can end up with
 * pt_regs that extends above sp0.  On the way out, in the espfix code,
 * we can read the saved SS value, but that value will be above sp0.
 * Without this offset, that can result in a page fault.  (We are
 * careful that, in this case, the value we read doesn't matter.)
 *
 * In vm86 mode, the hardware frame is much longer still, so add 16
 * bytes to make room for the real-mode segments.
 *
 * x86_64 has a fixed-length stack frame.
 *
 * Resulting values:
 *   CONFIG_X86_32 with CONFIG_VM86     -> 16
 *   CONFIG_X86_32 without CONFIG_VM86  ->  8
 *   otherwise                          ->  0
 */
#ifdef CONFIG_X86_32
# ifdef CONFIG_VM86
#  define TOP_OF_KERNEL_STACK_PADDING 16
# else
#  define TOP_OF_KERNEL_STACK_PADDING 8
# endif
#else
# define TOP_OF_KERNEL_STACK_PADDING 0
#endif

C
Christoph Lameter 已提交
45 46 47 48 49 50
/*
 * low level task data that entry.S needs immediate access to
 * - this struct should fit entirely inside of one cache line
 * - this struct shares the supervisor stack pages
 */
#ifndef __ASSEMBLY__
51
struct task_struct;
52
#include <asm/cpufeature.h>
A
Arun Sharma 已提交
53
#include <linux/atomic.h>
C
Christoph Lameter 已提交
54 55 56

struct thread_info {
	struct task_struct	*task;		/* main task structure */
57
	__u32			flags;		/* low level flags */
58
	__u32			status;		/* thread synchronous flags */
C
Christoph Lameter 已提交
59
	__u32			cpu;		/* current CPU */
60
	mm_segment_t		addr_limit;
61 62
	unsigned int		sig_on_uaccess_error:1;
	unsigned int		uaccess_err:1;	/* uaccess failed */
C
Christoph Lameter 已提交
63
};
64 65 66 67 68 69 70 71 72 73 74 75

/*
 * Brace initializer for a struct thread_info whose ->task points at
 * "tsk" (an lvalue, not a pointer).  flags and cpu start at zero and
 * addr_limit at KERNEL_DS; members not named here are zero-initialized
 * by the usual C rules.
 */
#define INIT_THREAD_INFO(tsk)		\
{					\
	.task       = &(tsk),		\
	.flags      = 0,		\
	.cpu        = 0,		\
	.addr_limit = KERNEL_DS,	\
}

/* Shorthands for two members of init_thread_union (declared elsewhere). */
#define init_thread_info	(init_thread_union.thread_info)
#define init_stack		(init_thread_union.stack)

C
Christoph Lameter 已提交
76 77 78 79 80 81
#else /* !__ASSEMBLY__ */

#include <asm/asm-offsets.h>

#endif

82 83 84 85 86 87 88 89 90
/*
 * thread information flags
 * - these are process state flags that various assembly files
 *   may need to access
 * - pending work-to-be-done flags are in LSW
 * - other flags in MSW
 * Warning: layout of LSW is hardcoded in entry.S
 */
/*
 * Bit numbers within thread_info->flags.  Bits 0-15 form the low word
 * whose layout is hardcoded in entry.S; the numbering has gaps and the
 * values must not be renumbered.
 */
#define TIF_SYSCALL_TRACE	0	/* syscall trace active */
#define TIF_NOTIFY_RESUME	1	/* callback before returning to user */
#define TIF_SIGPENDING		2	/* signal pending */
#define TIF_NEED_RESCHED	3	/* rescheduling necessary */
#define TIF_SINGLESTEP		4	/* reenable singlestep on user return */
#define TIF_SYSCALL_EMU		6	/* syscall emulation active */
#define TIF_SYSCALL_AUDIT	7	/* syscall auditing active */
#define TIF_SECCOMP		8	/* secure computing */
#define TIF_USER_RETURN_NOTIFY	11	/* notify kernel of userspace return */
#define TIF_UPROBE		12	/* breakpointed or singlestepping */
#define TIF_NOTSC		16	/* TSC is not accessible in userland */
#define TIF_IA32		17	/* IA32 compatibility process */
#define TIF_FORK		18	/* ret_from_fork */
#define TIF_NOHZ		19	/* in adaptive nohz mode */
#define TIF_MEMDIE		20	/* is terminating due to OOM killer */
#define TIF_POLLING_NRFLAG	21	/* idle is polling for TIF_NEED_RESCHED */
#define TIF_IO_BITMAP		22	/* uses I/O bitmap */
#define TIF_FORCED_TF		24	/* true if TF in eflags artificially */
#define TIF_BLOCKSTEP		25	/* set when we want DEBUGCTLMSR_BTF */
#define TIF_LAZY_MMU_UPDATES	27	/* task is updating the mmu lazily */
#define TIF_SYSCALL_TRACEPOINT	28	/* syscall tracepoint instrumentation */
#define TIF_ADDR32		29	/* 32-bit address space on 64 bits */
#define TIF_X32			30	/* 32-bit native x86-64 binary */

/*
 * Single-bit masks, one per bit number above.  TIF_MEMDIE has no mask
 * form in this header.
 */
#define _TIF_SYSCALL_TRACE	(1 << TIF_SYSCALL_TRACE)
#define _TIF_NOTIFY_RESUME	(1 << TIF_NOTIFY_RESUME)
#define _TIF_SIGPENDING		(1 << TIF_SIGPENDING)
#define _TIF_SINGLESTEP		(1 << TIF_SINGLESTEP)
#define _TIF_NEED_RESCHED	(1 << TIF_NEED_RESCHED)
#define _TIF_SYSCALL_EMU	(1 << TIF_SYSCALL_EMU)
#define _TIF_SYSCALL_AUDIT	(1 << TIF_SYSCALL_AUDIT)
#define _TIF_SECCOMP		(1 << TIF_SECCOMP)
#define _TIF_USER_RETURN_NOTIFY	(1 << TIF_USER_RETURN_NOTIFY)
#define _TIF_UPROBE		(1 << TIF_UPROBE)
#define _TIF_NOTSC		(1 << TIF_NOTSC)
#define _TIF_IA32		(1 << TIF_IA32)
#define _TIF_FORK		(1 << TIF_FORK)
#define _TIF_NOHZ		(1 << TIF_NOHZ)
#define _TIF_POLLING_NRFLAG	(1 << TIF_POLLING_NRFLAG)
#define _TIF_IO_BITMAP		(1 << TIF_IO_BITMAP)
#define _TIF_FORCED_TF		(1 << TIF_FORCED_TF)
#define _TIF_BLOCKSTEP		(1 << TIF_BLOCKSTEP)
#define _TIF_LAZY_MMU_UPDATES	(1 << TIF_LAZY_MMU_UPDATES)
#define _TIF_SYSCALL_TRACEPOINT	(1 << TIF_SYSCALL_TRACEPOINT)
#define _TIF_ADDR32		(1 << TIF_ADDR32)
#define _TIF_X32		(1 << TIF_X32)

/* work to do in syscall_trace_enter() */
#define _TIF_WORK_SYSCALL_ENTRY	\
	(_TIF_SYSCALL_TRACE | _TIF_SYSCALL_EMU | _TIF_SYSCALL_AUDIT |	\
	 _TIF_SECCOMP | _TIF_SINGLESTEP | _TIF_SYSCALL_TRACEPOINT |	\
	 _TIF_NOHZ)

/*
 * work to do on any return to user space: every bit of the low 16
 * except _TIF_SECCOMP, plus the two high bits named below
 */
#define _TIF_ALLWORK_MASK						\
	((0x0000FFFF & ~_TIF_SECCOMP) | _TIF_SYSCALL_TRACEPOINT |	\
	_TIF_NOHZ)

/* flags to check in __switch_to() */
#define _TIF_WORK_CTXSW							\
	(_TIF_IO_BITMAP|_TIF_NOTSC|_TIF_BLOCKSTEP)

/* the outgoing-task variant additionally includes _TIF_USER_RETURN_NOTIFY */
#define _TIF_WORK_CTXSW_PREV (_TIF_WORK_CTXSW|_TIF_USER_RETURN_NOTIFY)
#define _TIF_WORK_CTXSW_NEXT (_TIF_WORK_CTXSW)
154

155
/*
 * One eighth of THREAD_SIZE.
 * NOTE(review): presumably the low-stack warning threshold -- confirm
 * against the users of this macro.
 */
#define STACK_WARN		(THREAD_SIZE / 8)
156

C
Christoph Lameter 已提交
157 158 159 160 161 162 163
/*
 * macros/functions for gaining access to the thread information structure
 *
 * preempt_count needs to be 1 initially, until the scheduler is functional.
 */
#ifndef __ASSEMBLY__

164
static inline struct thread_info *current_thread_info(void)
C
Christoph Lameter 已提交
165
{
166
	return (struct thread_info *)(current_top_of_stack() - THREAD_SIZE);
C
Christoph Lameter 已提交
167 168
}

169 170 171 172 173 174 175 176 177 178 179
/*
 * Copy the hardware stack pointer into a C value: %rsp when built with
 * CONFIG_X86_64, %esp otherwise.  The asm has no inputs and is not
 * marked volatile.
 */
static inline unsigned long current_stack_pointer(void)
{
	unsigned long stack_ptr;

#ifndef CONFIG_X86_64
	asm("mov %%esp,%0" : "=g" (stack_ptr));
#else
	asm("mov %%rsp,%0" : "=g" (stack_ptr));
#endif

	return stack_ptr;
}

C
Christoph Lameter 已提交
180 181
#else /* !__ASSEMBLY__ */

182 183 184 185
/*
 * Assembly-only, 64-bit only: cpu_current_top_of_stack is spelled as
 * the address cpu_tss + TSS_sp0.  GET_THREAD_INFO() reads the top of
 * stack through this name.
 * NOTE(review): 32-bit builds must get this symbol from elsewhere --
 * confirm where it is defined.
 */
#ifdef CONFIG_X86_64
# define cpu_current_top_of_stack (cpu_tss + TSS_sp0)
#endif

186
/*
 * Load thread_info address into "reg".
 *
 * Emits two instructions: move the per-CPU cpu_current_top_of_stack
 * value into "reg", then subtract THREAD_SIZE from it.  "reg" is both
 * the scratch and the result register.
 */
#define GET_THREAD_INFO(reg) \
	_ASM_MOV PER_CPU_VAR(cpu_current_top_of_stack),reg ; \
	_ASM_SUB $(THREAD_SIZE),reg ;
C
Christoph Lameter 已提交
190

191
/*
 * ASM operand which evaluates to a 'thread_info' address of
 * the current task, if it is known that "reg" is exactly "off"
 * bytes below the top of the stack currently.
 *
 * ( The kernel stack's size is known at build time, it is usually
 *   2 or 4 pages, and the bottom of the kernel stack contains
 *   the thread_info structure. So to access the thread_info very
 *   quickly from assembly code we can calculate down from the
 *   top of the kernel stack to the bottom, using constant,
 *   build-time calculations only. )
 *
 * For example, to fetch the current thread_info->flags value into %eax
 * on x86-64 defconfig kernels, in syscall entry code where RSP is
 * currently at exactly SIZEOF_PTREGS bytes away from the top of the
 * stack:
 *
 *      mov ASM_THREAD_INFO(TI_flags, %rsp, SIZEOF_PTREGS), %eax
 *
 * will translate to:
 *
 *      8b 84 24 b8 c0 ff ff      mov    -0x3f48(%rsp), %eax
 *
 * which is below the current RSP by almost 16K.
 *
 * The expansion is a displacement(base) memory operand:
 * displacement = field + off - THREAD_SIZE, base = reg.
 */
#define ASM_THREAD_INFO(field, reg, off) ((field)+(off)-THREAD_SIZE)(reg)
217

C
Christoph Lameter 已提交
218 219 220 221 222 223 224 225 226
#endif

/*
 * Thread-synchronous status.
 *
 * This is different from the flags in that nobody else
 * ever touches our thread-synchronous status, so we don't
 * have to worry about atomic accesses.
 */
227
#define TS_COMPAT		0x0002	/* 32bit syscall active (64BIT)*/
I
Ingo Molnar 已提交
228
#define TS_RESTORE_SIGMASK	0x0008	/* restore signal mask in do_signal() */
C
Christoph Lameter 已提交
229

I
Ingo Molnar 已提交
230 231 232 233 234 235
#ifndef __ASSEMBLY__
#define HAVE_SET_RESTORE_SIGMASK	1
static inline void set_restore_sigmask(void)
{
	struct thread_info *ti = current_thread_info();
	ti->status |= TS_RESTORE_SIGMASK;
236
	WARN_ON(!test_bit(TIF_SIGPENDING, (unsigned long *)&ti->flags));
I
Ingo Molnar 已提交
237
}
238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253
static inline void clear_restore_sigmask(void)
{
	current_thread_info()->status &= ~TS_RESTORE_SIGMASK;
}
static inline bool test_restore_sigmask(void)
{
	return current_thread_info()->status & TS_RESTORE_SIGMASK;
}
/*
 * Clear TS_RESTORE_SIGMASK for the current thread and return whether
 * it had been set.  The status word is only written when the bit was
 * actually set.
 */
static inline bool test_and_clear_restore_sigmask(void)
{
	struct thread_info *self = current_thread_info();
	bool was_set = (self->status & TS_RESTORE_SIGMASK) != 0;

	if (was_set)
		self->status &= ~TS_RESTORE_SIGMASK;
	return was_set;
}
254 255 256 257 258 259 260 261 262 263 264 265

/*
 * Tell whether the current task counts as an ia32 task:
 *  - always true when built with CONFIG_X86_32;
 *  - with CONFIG_IA32_EMULATION, true while TS_COMPAT is set in the
 *    current thread's status word;
 *  - false in every other configuration.
 */
static inline bool is_ia32_task(void)
{
#if defined(CONFIG_X86_32)
	return true;
#elif defined(CONFIG_IA32_EMULATION)
	return (current_thread_info()->status & TS_COMPAT) != 0;
#else
	return false;
#endif
}
266 267 268 269 270 271 272 273 274 275

/*
 * Force syscall return via IRET by making it look as if there was
 * some work pending. IRET is our most capable (but slowest) syscall
 * return path, which is able to restore modified SS, CS and certain
 * EFLAGS values that other (fast) syscall return instructions
 * are not able to restore properly.
 *
 * Takes no arguments; it simply sets TIF_NOTIFY_RESUME through
 * set_thread_flag(), which is the "pending work" referred to above.
 */
#define force_iret() set_thread_flag(TIF_NOTIFY_RESUME)

I
Ingo Molnar 已提交
276 277
#endif	/* !__ASSEMBLY__ */

278 279 280
#ifndef __ASSEMBLY__
/*
 * Architecture hooks declared here and defined elsewhere.
 * NOTE(review): judging by the names these cover task_struct cache
 * setup, duplication and release -- confirm against the definitions.
 */
extern void arch_task_cache_init(void);
extern int arch_dup_task_struct(struct task_struct *dst, struct task_struct *src);
extern void arch_release_task_struct(struct task_struct *tsk);
282
#endif
H
H. Peter Anvin 已提交
283
#endif /* _ASM_X86_THREAD_INFO_H */