/*
 *  linux/arch/arm/vfp/vfphw.S
 *
 *  Copyright (C) 2004 ARM Limited.
 *  Written by Deep Blue Solutions Limited.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 *
 * This code is called from the kernel's undefined instruction trap.
 * r9 holds the return address for successful handling.
 * lr holds the return address for unrecognised instructions.
 * r10 points at the start of the private FP workspace in the thread structure
 * sp points to a struct pt_regs (as defined in include/asm/proc/ptrace.h)
 */
#include <linux/init.h>
#include <linux/linkage.h>
#include <asm/thread_info.h>
#include <asm/vfpmacros.h>
#include <linux/kern_levels.h>
#include <asm/assembler.h>
#include <asm/asm-offsets.h>

	/*
	 * DBGSTR str
	 *
	 * Debug aid: passes the string "VFP: <str>" (prefixed with the
	 * KERN_DEBUG level marker and terminated by a newline and a NUL
	 * byte) to printk.  Expands to nothing unless DEBUG is defined.
	 *
	 * r0-r3, ip and lr are stacked around the call and restored
	 * afterwards.  The condition flags are not saved, so code must not
	 * rely on them across this macro.
	 *
	 * The string is emitted into .rodata; the section stack entry
	 * created by .pushsection is released with the matching
	 * .popsection.
	 */
	.macro	DBGSTR, str
#ifdef DEBUG
	stmfd	sp!, {r0-r3, ip, lr}
	ldr	r0, =1f
	bl	printk
	ldmfd	sp!, {r0-r3, ip, lr}

	.pushsection .rodata, "a"
1:	.ascii	KERN_DEBUG "VFP: \str\n"
	.byte	0
	.popsection
#endif
	.endm

	/*
	 * DBGSTR1 str, arg
	 *
	 * Debug aid: like DBGSTR, but passes one extra printk argument.
	 * The format string is "VFP: <str>" and arg is copied into r1
	 * with a plain mov, so it must be a valid mov operand.
	 * Expands to nothing unless DEBUG is defined.
	 *
	 * r0-r3, ip and lr are stacked before arg is read and restored
	 * after the call.  The condition flags are not saved, so code must
	 * not rely on them across this macro.
	 */
	.macro  DBGSTR1, str, arg
#ifdef DEBUG
	stmfd	sp!, {r0-r3, ip, lr}
	mov	r1, \arg
	ldr	r0, =1f
	bl	printk
	ldmfd	sp!, {r0-r3, ip, lr}

	.pushsection .rodata, "a"
1:	.ascii	KERN_DEBUG "VFP: \str\n"
	.byte	0
	.popsection
#endif
	.endm

	/*
	 * DBGSTR3 str, arg1, arg2, arg3
	 *
	 * Debug aid: like DBGSTR, but passes three extra printk arguments
	 * in r1, r2 and r3.  Expands to nothing unless DEBUG is defined.
	 *
	 * The arguments are moved in the order arg3, arg2, arg1.  An
	 * argument is therefore read after the earlier moves have already
	 * overwritten their targets: arg2 must not be r3, and arg1 must
	 * not be r2 or r3.
	 *
	 * r0-r3, ip and lr are stacked before the arguments are read and
	 * restored after the call.  The condition flags are not saved.
	 */
	.macro  DBGSTR3, str, arg1, arg2, arg3
#ifdef DEBUG
	stmfd	sp!, {r0-r3, ip, lr}
	mov	r3, \arg3
	mov	r2, \arg2
	mov	r1, \arg1
	ldr	r0, =1f
	bl	printk
	ldmfd	sp!, {r0-r3, ip, lr}

	.pushsection .rodata, "a"
1:	.ascii	KERN_DEBUG "VFP: \str\n"
	.byte	0
	.popsection
#endif
	.endm


@ VFP hardware support entry point.
@
@  r0  = instruction opcode (32-bit ARM or two 16-bit Thumb)
@  r2  = PC value to resume execution after successful emulation
@  r9  = normal "successful" return address
@  r10 = vfp_state union
@  r11 = CPU number
@  lr  = unrecognised instruction return address
@  IRQs enabled.
@
@ Outcomes:
@  - The saved PSR is not in USR_MODE: branch to vfp_kmode_exception.
@  - FPEXC.EN is clear: make the hardware hold the state that r10 points
@    at (saving the previous owner on UP, reloading where needed).  Then
@    either hand a pending exception to VFP_bounce, or rewind the saved
@    PC by 4 and return through r9 so the instruction is retried.
@  - FPEXC.EN is set: hand over to VFP_bounce if FPEXC.EX, FPEXC.DEX or
@    FPSCR.IXE is set, otherwise return through lr.
@
@ r1, r3-r6, r8 and ip are used as scratch.  The two plain return paths
@ also overwrite r4, r10 and r11 when CONFIG_PREEMPT_COUNT is set.
ENTRY(vfp_support_entry)
	DBGSTR3	"instr %08x pc %08x state %p", r0, r2, r10

	ldr	r3, [sp, #S_PSR]	@ Neither lazy restore nor FP exceptions
	and	r3, r3, #MODE_MASK	@ are supported in kernel mode
	teq	r3, #USR_MODE
	bne	vfp_kmode_exception	@ Returns through lr

	VFPFMRX	r1, FPEXC		@ Is the VFP enabled?
	DBGSTR1	"fpexc %08x", r1
	tst	r1, #FPEXC_EN
	bne	look_for_VFP_exceptions	@ VFP is already enabled

	DBGSTR1 "enable %x", r10
	ldr	r3, vfp_current_hw_state_address
	orr	r1, r1, #FPEXC_EN	@ user FPEXC has the enable bit set
	ldr	r4, [r3, r11, lsl #2]	@ vfp_current_hw_state pointer
	bic	r5, r1, #FPEXC_EX	@ make sure exceptions are disabled
	cmp	r4, r10			@ this thread owns the hw context?
#ifndef CONFIG_SMP
	@ For UP, checking that this thread owns the hw context is
	@ sufficient to determine that the hardware state is valid.
	beq	vfp_hw_state_valid

	@ On UP, we lazily save the VFP context.  As a different
	@ thread wants ownership of the VFP hardware, save the old
	@ state if there was a previous (valid) owner.

	VFPFMXR	FPEXC, r5		@ enable VFP, disable any pending
					@ exceptions, so we can get at the
					@ rest of it

	DBGSTR1	"save old state %p", r4
	cmp	r4, #0			@ if the vfp_current_hw_state is NULL
	beq	vfp_reload_hw		@ then the hw state needs reloading
	VFPFSTMIA r4, r5		@ save the working registers
	VFPFMRX	r5, FPSCR		@ current status
#ifndef CONFIG_CPU_FEROCEON
	tst	r1, #FPEXC_EX		@ is there additional state to save?
	beq	1f
	VFPFMRX	r6, FPINST		@ FPINST (only if FPEXC.EX is set)
	tst	r1, #FPEXC_FP2V		@ is there an FPINST2 to read?
	beq	1f
	VFPFMRX	r8, FPINST2		@ FPINST2 if needed (and present)
1:
#endif
	@ All four words are stored unconditionally; r6 and r8 hold
	@ meaningful values only when they were read above.
	stmia	r4, {r1, r5, r6, r8}	@ save FPEXC, FPSCR, FPINST, FPINST2
vfp_reload_hw:

#else
	@ For SMP, if this thread does not own the hw context, then we
	@ need to reload it.  No need to save the old state as on SMP,
	@ we always save the state when we switch away from a thread.
	bne	vfp_reload_hw

	@ This thread has ownership of the current hardware context.
	@ However, it may have been migrated to another CPU, in which
	@ case the saved state is newer than the hardware context.
	@ Check this by looking at the CPU number which the state was
	@ last loaded onto.
	ldr	ip, [r10, #VFP_CPU]
	teq	ip, r11
	beq	vfp_hw_state_valid

vfp_reload_hw:
	@ We are loading the state of this thread into the VFP hardware.
	@ Update the CPU number which contains the most up to date VFP
	@ context.
	str	r11, [r10, #VFP_CPU]

	VFPFMXR	FPEXC, r5		@ enable VFP, disable any pending
					@ exceptions, so we can get at the
					@ rest of it
#endif

	DBGSTR1	"load state %p", r10
	str	r10, [r3, r11, lsl #2]	@ update the vfp_current_hw_state pointer
					@ Load the saved state back into the VFP
	VFPFLDMIA r10, r5		@ reload the working registers while
					@ FPEXC is in a safe state
	ldmia	r10, {r1, r5, r6, r8}	@ load FPEXC, FPSCR, FPINST, FPINST2
#ifndef CONFIG_CPU_FEROCEON
	tst	r1, #FPEXC_EX		@ is there additional state to restore?
	beq	1f
	VFPFMXR	FPINST, r6		@ restore FPINST (only if FPEXC.EX is set)
	tst	r1, #FPEXC_FP2V		@ is there an FPINST2 to write?
	beq	1f
	VFPFMXR	FPINST2, r8		@ FPINST2 if needed (and present)
1:
#endif
	VFPFMXR	FPSCR, r5		@ restore status

@ The context stored in the VFP hardware is up to date with this thread
@ Here r1 holds the FPEXC value of this thread, with FPEXC_EN set.
vfp_hw_state_valid:
	tst	r1, #FPEXC_EX
	bne	process_exception	@ might as well handle the pending
					@ exception before retrying branch
					@ out before setting an FPEXC that
					@ stops us reading stuff
	VFPFMXR	FPEXC, r1		@ Restore FPEXC last
	sub	r2, r2, #4		@ Retry current instruction - if Thumb
	str	r2, [sp, #S_PC]		@ mode it's two 16-bit instructions,
					@ else it's one 32-bit instruction, so
					@ always subtract 4 from the following
					@ instruction address.
#ifdef CONFIG_PREEMPT_COUNT
	@ Drop one preempt count level before returning.
	@ NOTE(review): the matching increment is not in this file,
	@ presumably it is taken by the caller - confirm.
	get_thread_info	r10
	ldr	r4, [r10, #TI_PREEMPT]	@ get preempt count
	sub	r11, r4, #1		@ decrement it
	str	r11, [r10, #TI_PREEMPT]
#endif
	mov	pc, r9			@ we think we have handled things


look_for_VFP_exceptions:
	@ Check for synchronous or asynchronous exception
	tst	r1, #FPEXC_EX | FPEXC_DEX
	bne	process_exception
	@ On some implementations of the VFP subarch 1, setting FPSCR.IXE
	@ causes all the CDP instructions to be bounced synchronously without
	@ setting the FPEXC.EX bit
	VFPFMRX	r5, FPSCR
	tst	r5, #FPSCR_IXE
	bne	process_exception

	@ Fall into hand on to next handler - appropriate coproc instr
	@ not recognised by VFP

	DBGSTR	"not VFP"
#ifdef CONFIG_PREEMPT_COUNT
	@ Same preempt count decrement as on the retry path above.
	get_thread_info	r10
	ldr	r4, [r10, #TI_PREEMPT]	@ get preempt count
	sub	r11, r4, #1		@ decrement it
	str	r11, [r10, #TI_PREEMPT]
#endif
	mov	pc, lr

process_exception:
	DBGSTR	"bounce"
	mov	r2, sp			@ nothing stacked - regdump is at TOS
	mov	lr, r9			@ setup for a return to the user code.

	@ Now call the C code to package up the bounce to the support code
	@   r0 holds the trigger instruction
	@   r1 holds the FPEXC value
	@   r2 pointer to register dump
	b	VFP_bounce		@ we have handled this - the support
					@ code will raise an exception if
					@ required. If not, the user code will
					@ retry the faulted instruction
ENDPROC(vfp_support_entry)

ENTRY(vfp_save_state)
	@ Save the current VFP state
	@ r0 - save location
	@ r1 - FPEXC
	@
	@ r2, r3 and r12 are used as scratch.  The FPEXC word that gets
	@ stored is the value passed in r1; it is not read from the
	@ hardware here.  Four words are always stored by the final stmia:
	@ when FPEXC_EX (or FPEXC_FP2V) is clear in r1, the FPINST and/or
	@ FPINST2 slots receive whatever r3 and r12 held on entry.
	@ NOTE(review): the stmia presumably lands after the working
	@ registers because VFPFSTMIA advances r0 - the macro is not
	@ visible here, confirm in asm/vfpmacros.h.
	DBGSTR1	"save VFP state %p", r0
	VFPFSTMIA r0, r2		@ save the working registers
	VFPFMRX	r2, FPSCR		@ current status
	tst	r1, #FPEXC_EX		@ is there additional state to save?
	beq	1f
	VFPFMRX	r3, FPINST		@ FPINST (only if FPEXC.EX is set)
	tst	r1, #FPEXC_FP2V		@ is there an FPINST2 to read?
	beq	1f
	VFPFMRX	r12, FPINST2		@ FPINST2 if needed (and present)
1:
	stmia	r0, {r1, r2, r3, r12}	@ save FPEXC, FPSCR, FPINST, FPINST2
	mov	pc, lr
ENDPROC(vfp_save_state)

	@ Literal holding the address of vfp_current_hw_state.  It is
	@ loaded by name in vfp_support_entry, which then indexes the
	@ table with the CPU number scaled by 4 (one word per CPU).
	.align
vfp_current_hw_state_address:
	.word	vfp_current_hw_state

	/*
	 * tbl_branch base, tmp, shift
	 *
	 * Computed jump into the table of fixed-size entries that
	 * immediately follows the macro (local label 1).  The target is
	 * table start + (base << shift).
	 *
	 *   base  - register holding the entry index
	 *   tmp   - scratch register, written only in Thumb-2 kernels
	 *   shift - immediate shift amount, log2 of the entry size
	 *
	 * ARM build: reading pc as an operand yields the address of the
	 * add plus 8, which is the address just past the padding
	 * "mov r0, r0", i.e. the table start.
	 * Thumb-2 build: the table address is formed explicitly with adr.
	 *
	 * No range check is made on the index.
	 */
	.macro	tbl_branch, base, tmp, shift
#ifdef CONFIG_THUMB2_KERNEL
	adr	\tmp, 1f
	add	\tmp, \tmp, \base, lsl \shift
	mov	pc, \tmp
#else
	add	pc, pc, \base, lsl \shift
	mov	r0, r0
#endif
1:
	.endm

ENTRY(vfp_get_float)
	@ Read one single-precision VFP register.
	@  r0 - register index on entry, register contents on return
	@  r3 - scratch for tbl_branch (written only in Thumb-2 kernels)
	@
	@ The table has two 8-byte entries per .irp iteration, 32 in all;
	@ .org pads every entry to the 8 bytes implied by the lsl #3
	@ dispatch.  The index is not range checked here.
	tbl_branch r0, r3, #3
	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
1:	mrc	p10, 0, r0, c\dr, c0, 0	@ fmrs	r0, s(2*dr)
	mov	pc, lr
	.org	1b + 8
1:	mrc	p10, 0, r0, c\dr, c0, 4	@ fmrs	r0, s(2*dr+1)
	mov	pc, lr
	.org	1b + 8
	.endr
ENDPROC(vfp_get_float)

ENTRY(vfp_put_float)
	@ Write one single-precision VFP register.
	@  r0 - value to write
	@  r1 - register index
	@  r3 - scratch for tbl_branch (written only in Thumb-2 kernels)
	@
	@ The table has two 8-byte entries per .irp iteration, 32 in all;
	@ .org pads every entry to the 8 bytes implied by the lsl #3
	@ dispatch.  The index is not range checked here.
	tbl_branch r1, r3, #3
	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
1:	mcr	p10, 0, r0, c\dr, c0, 0	@ fmsr	r0, s(2*dr)
	mov	pc, lr
	.org	1b + 8
1:	mcr	p10, 0, r0, c\dr, c0, 4	@ fmsr	r0, s(2*dr+1)
	mov	pc, lr
	.org	1b + 8
	.endr
ENDPROC(vfp_put_float)

ENTRY(vfp_get_double)
	@ Read one double-precision VFP register.
	@  r0 - register index on entry
	@  r0, r1 - the two words of the register on return
	@  r3 - scratch for tbl_branch (written only in Thumb-2 kernels)
	@
	@ Entries are 8 bytes each (padded with .org) to match the lsl #3
	@ dispatch: d0 - d15 always, d16 - d31 as well when CONFIG_VFPv3 is
	@ set.  The index just past the last table entry reaches the code
	@ after the table and reads as zero.  Larger indexes are not
	@ checked.
	tbl_branch r0, r3, #3
	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
1:	fmrrd	r0, r1, d\dr
	mov	pc, lr
	.org	1b + 8
	.endr
#ifdef CONFIG_VFPv3
	@ d16 - d31 registers
	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
1:	mrrc	p11, 3, r0, r1, c\dr	@ fmrrd	r0, r1, d(16+dr)
	mov	pc, lr
	.org	1b + 8
	.endr
#endif

	@ virtual register 16 (or 32 if VFPv3) for compare with zero
	mov	r0, #0
	mov	r1, #0
	mov	pc, lr
ENDPROC(vfp_get_double)

ENTRY(vfp_put_double)
	@ Write one double-precision VFP register.
	@  r0, r1 - the two words to write
	@  r2 - register index
	@  r3 - scratch for tbl_branch (written only in Thumb-2 kernels)
	@
	@ Entries are 8 bytes each (padded with .org) to match the lsl #3
	@ dispatch: d0 - d15 always, d16 - d31 as well when CONFIG_VFPv3 is
	@ set.
	@ NOTE(review): unlike vfp_get_double there is no entry after the
	@ table, so an index past the last register would run off the end
	@ of this function.  Callers presumably never pass one - confirm.
	tbl_branch r2, r3, #3
	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
1:	fmdrr	d\dr, r0, r1
	mov	pc, lr
	.org	1b + 8
	.endr
#ifdef CONFIG_VFPv3
	@ d16 - d31 registers
	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
1:	mcrr	p11, 3, r0, r1, c\dr	@ fmdrr	d(16+dr), r0, r1
	mov	pc, lr
	.org	1b + 8
	.endr
#endif
ENDPROC(vfp_put_double)