/*
 *  linux/arch/arm/vfp/vfphw.S
 *
 *  Copyright (C) 2004 ARM Limited.
 *  Written by Deep Blue Solutions Limited.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 *
 * This code is called from the kernel's undefined instruction trap.
 * r9 holds the return address for successful handling.
 * lr holds the return address for unrecognised instructions.
 * r10 points at the start of the private FP workspace in the thread structure
 * sp points to a struct pt_regs (as defined in include/asm/proc/ptrace.h)
 */
#include <asm/thread_info.h>
#include <asm/vfpmacros.h>
#include <linux/kern_levels.h>
#include "../kernel/entry-header.S"

	@ DBGSTR str
	@
	@ Debug aid.  When DEBUG is defined this expands to a printk call
	@ that emits "VFP: <str>" followed by a newline; otherwise it
	@ expands to nothing.
	@
	@ r0-r3, ip and lr are stacked before the call and restored after
	@ it.  The condition flags are not saved.
	.macro	DBGSTR, str
#ifdef DEBUG
	stmfd	sp!, {r0-r3, ip, lr}
	ldr	r0, =1f			@ r0 = address of the format string
	bl	printk
	ldmfd	sp!, {r0-r3, ip, lr}

	.pushsection .rodata, "a"	@ the string lives in read-only data
1:	.ascii	KERN_DEBUG "VFP: \str\n"
	.byte	0			@ explicit NUL, .ascii appends none
	.popsection			@ pairs with the .pushsection above
#endif
	.endm

	@ DBGSTR1 str, arg
	@
	@ Debug aid taking one printk argument.  When DEBUG is defined this
	@ prints "VFP: <str>" with arg supplied as the first format
	@ argument (passed in r1); otherwise it expands to nothing.
	@
	@ r0-r3, ip and lr are stacked before the call and restored after
	@ it.  The condition flags are not saved.
	.macro	DBGSTR1, str, arg
#ifdef DEBUG
	stmfd	sp!, {r0-r3, ip, lr}
	mov	r1, \arg
	ldr	r0, =1f			@ r0 = address of the format string
	bl	printk
	ldmfd	sp!, {r0-r3, ip, lr}

	.pushsection .rodata, "a"	@ the string lives in read-only data
1:	.ascii	KERN_DEBUG "VFP: \str\n"
	.byte	0			@ explicit NUL, .ascii appends none
	.popsection			@ pairs with the .pushsection above
#endif
	.endm

	@ DBGSTR3 str, arg1, arg2, arg3
	@
	@ Debug aid taking three printk arguments.  When DEBUG is defined
	@ this prints "VFP: <str>" with arg1-arg3 passed in r1-r3;
	@ otherwise it expands to nothing.
	@
	@ The argument registers are filled in the order r3, r2, r1, so
	@ arg2 must not be r3 and arg1 must not be r2 or r3, or the value
	@ will already have been overwritten when it is read.
	@
	@ r0-r3, ip and lr are stacked before the call and restored after
	@ it.  The condition flags are not saved.
	.macro	DBGSTR3, str, arg1, arg2, arg3
#ifdef DEBUG
	stmfd	sp!, {r0-r3, ip, lr}
	mov	r3, \arg3
	mov	r2, \arg2
	mov	r1, \arg1
	ldr	r0, =1f			@ r0 = address of the format string
	bl	printk
	ldmfd	sp!, {r0-r3, ip, lr}

	.pushsection .rodata, "a"	@ the string lives in read-only data
1:	.ascii	KERN_DEBUG "VFP: \str\n"
	.byte	0			@ explicit NUL, .ascii appends none
	.popsection			@ pairs with the .pushsection above
#endif
	.endm


@ VFP hardware support entry point.
@
@ On entry:
@  r0  = instruction opcode (32-bit ARM or two 16-bit Thumb)
@  r2  = PC value to resume execution after successful emulation
@  r9  = normal "successful" return address
@  r10 = vfp_state union
@  r11 = CPU number
@  lr  = unrecognised instruction return address
@  IRQs enabled.
@
@ Ways out of this routine:
@  - branch to vfp_kmode_exception when the saved PSR is not user mode
@  - return through r9 once the hardware holds the state of this
@    thread and the saved PC has been wound back by 4 to retry
@  - return through lr when the VFP is already enabled and no
@    exception condition is found
@  - branch to VFP_bounce with r0 = instruction, r1 = FPEXC, r2 = sp
@    and lr = r9 when an exception has to be handed to the C code
@
@ When the preempt count is configured in, the two direct returns
@ decrement the count held in thread_info first.
@ NOTE(review): presumably this balances an increment made by the
@ caller before branching here - confirm against the entry code.
@
@ r1, r3-r6, r8 and ip are used as scratch; r10 and r11 are
@ overwritten on the direct return paths when the preempt count is
@ being maintained.
ENTRY(vfp_support_entry)
	DBGSTR3	"instr %08x pc %08x state %p", r0, r2, r10

	ldr	r3, [sp, #S_PSR]	@ Neither lazy restore nor FP exceptions
	and	r3, r3, #MODE_MASK	@ are supported in kernel mode
	teq	r3, #USR_MODE
	bne	vfp_kmode_exception	@ Returns through lr

	VFPFMRX	r1, FPEXC		@ Is the VFP enabled?
	DBGSTR1	"fpexc %08x", r1
	tst	r1, #FPEXC_EN
	bne	look_for_VFP_exceptions	@ VFP is already enabled

	DBGSTR1	"enable %x", r10
	ldr	r3, vfp_current_hw_state_address
	orr	r1, r1, #FPEXC_EN	@ user FPEXC has the enable bit set
	ldr	r4, [r3, r11, lsl #2]	@ vfp_current_hw_state pointer
	bic	r5, r1, #FPEXC_EX	@ make sure exceptions are disabled
	cmp	r4, r10			@ this thread owns the hw context?
#ifndef CONFIG_SMP
	@ For UP, checking that this thread owns the hw context is
	@ sufficient to determine that the hardware state is valid.
	beq	vfp_hw_state_valid

	@ On UP, we lazily save the VFP context.  As a different
	@ thread wants ownership of the VFP hardware, save the old
	@ state if there was a previous (valid) owner.

	VFPFMXR	FPEXC, r5		@ enable VFP, disable any pending
					@ exceptions, so we can get at the
					@ rest of it

	DBGSTR1	"save old state %p", r4
	cmp	r4, #0			@ if the vfp_current_hw_state is NULL
	beq	vfp_reload_hw		@ then the hw state needs reloading
	VFPFSTMIA r4, r5		@ save the working registers
	VFPFMRX	r5, FPSCR		@ current status
#ifndef CONFIG_CPU_FEROCEON
	tst	r1, #FPEXC_EX		@ is there additional state to save?
	beq	1f
	VFPFMRX	r6, FPINST		@ FPINST (only if FPEXC.EX is set)
	tst	r1, #FPEXC_FP2V		@ is there an FPINST2 to read?
	beq	1f
	VFPFMRX	r8, FPINST2		@ FPINST2 if needed (and present)
1:
#endif
	@ All four words are always stored; r6 and r8 hold whatever they
	@ contained before when the reads above were skipped.
	stmia	r4, {r1, r5, r6, r8}	@ save FPEXC, FPSCR, FPINST, FPINST2
vfp_reload_hw:

#else
	@ For SMP, if this thread does not own the hw context, then we
	@ need to reload it.  No need to save the old state as on SMP,
	@ we always save the state when we switch away from a thread.
	bne	vfp_reload_hw

	@ This thread has ownership of the current hardware context.
	@ However, it may have been migrated to another CPU, in which
	@ case the saved state is newer than the hardware context.
	@ Check this by looking at the CPU number which the state was
	@ last loaded onto.
	ldr	ip, [r10, #VFP_CPU]
	teq	ip, r11
	beq	vfp_hw_state_valid

vfp_reload_hw:
	@ We're loading this threads state into the VFP hardware. Update
	@ the CPU number which contains the most up to date VFP context.
	str	r11, [r10, #VFP_CPU]

	VFPFMXR	FPEXC, r5		@ enable VFP, disable any pending
					@ exceptions, so we can get at the
					@ rest of it
#endif

	DBGSTR1	"load state %p", r10
	str	r10, [r3, r11, lsl #2]	@ update the vfp_current_hw_state pointer
					@ Load the saved state back into the VFP
	VFPFLDMIA r10, r5		@ reload the working registers while
					@ FPEXC is in a safe state
	ldmia	r10, {r1, r5, r6, r8}	@ load FPEXC, FPSCR, FPINST, FPINST2
#ifndef CONFIG_CPU_FEROCEON
	tst	r1, #FPEXC_EX		@ is there additional state to restore?
	beq	1f
	VFPFMXR	FPINST, r6		@ restore FPINST (only if FPEXC.EX is set)
	tst	r1, #FPEXC_FP2V		@ is there an FPINST2 to write?
	beq	1f
	VFPFMXR	FPINST2, r8		@ FPINST2 if needed (and present)
1:
#endif
	VFPFMXR	FPSCR, r5		@ restore status

@ The context stored in the VFP hardware is up to date with this thread
vfp_hw_state_valid:
	tst	r1, #FPEXC_EX
	bne	process_exception	@ might as well handle the pending
					@ exception before retrying branch
					@ out before setting an FPEXC that
					@ stops us reading stuff
	VFPFMXR	FPEXC, r1		@ Restore FPEXC last
	sub	r2, r2, #4		@ Retry current instruction - if Thumb
	str	r2, [sp, #S_PC]		@ mode it's two 16-bit instructions,
					@ else it's one 32-bit instruction, so
					@ always subtract 4 from the following
					@ instruction address.
#ifdef CONFIG_PREEMPT_COUNT
	get_thread_info	r10
	ldr	r4, [r10, #TI_PREEMPT]	@ get preempt count
	sub	r11, r4, #1		@ decrement it
	str	r11, [r10, #TI_PREEMPT]
#endif
	mov	pc, r9			@ we think we have handled things


look_for_VFP_exceptions:
	@ Check for synchronous or asynchronous exception
	tst	r1, #FPEXC_EX | FPEXC_DEX
	bne	process_exception
	@ On some implementations of the VFP subarch 1, setting FPSCR.IXE
	@ causes all the CDP instructions to be bounced synchronously without
	@ setting the FPEXC.EX bit
	VFPFMRX	r5, FPSCR
	tst	r5, #FPSCR_IXE
	bne	process_exception

	@ Fall into hand on to next handler - appropriate coproc instr
	@ not recognised by VFP

	DBGSTR	"not VFP"
#ifdef CONFIG_PREEMPT_COUNT
	get_thread_info	r10
	ldr	r4, [r10, #TI_PREEMPT]	@ get preempt count
	sub	r11, r4, #1		@ decrement it
	str	r11, [r10, #TI_PREEMPT]
#endif
	mov	pc, lr

process_exception:
	DBGSTR	"bounce"
	mov	r2, sp			@ nothing stacked - regdump is at TOS
	mov	lr, r9			@ setup for a return to the user code.

	@ Now call the C code to package up the bounce to the support code
	@   r0 holds the trigger instruction
	@   r1 holds the FPEXC value
	@   r2 pointer to register dump
	b	VFP_bounce		@ we have handled this - the support
					@ code will raise an exception if
					@ required. If not, the user code will
					@ retry the faulted instruction
ENDPROC(vfp_support_entry)

@ vfp_save_state - store the current VFP state to memory.
@
@  r0 = save location
@  r1 = FPEXC value describing the state being saved
@
@ The working registers are written first through VFPFSTMIA, then the
@ four control words FPEXC, FPSCR, FPINST and FPINST2 are stored with
@ a single stmia.  FPINST is only read when FPEXC.EX is set in r1 and
@ FPINST2 only when FPEXC.FP2V is set as well; the stmia still writes
@ all four words, so the last two slots receive the incoming r3 and
@ r12 when those reads are skipped.
@ NOTE(review): presumably VFPFSTMIA advances r0 past the register
@ bank so the control words land after it - confirm in vfpmacros.h.
@
@ Clobbers r2, and r3/r12 when the extra registers are read.
@ Returns through lr.
ENTRY(vfp_save_state)
	@ Save the current VFP state
	@ r0 - save location
	@ r1 - FPEXC
	DBGSTR1	"save VFP state %p", r0
	VFPFSTMIA r0, r2		@ save the working registers
	VFPFMRX	r2, FPSCR		@ current status
	tst	r1, #FPEXC_EX		@ is there additional state to save?
	beq	1f
	VFPFMRX	r3, FPINST		@ FPINST (only if FPEXC.EX is set)
	tst	r1, #FPEXC_FP2V		@ is there an FPINST2 to read?
	beq	1f
	VFPFMRX	r12, FPINST2		@ FPINST2 if needed (and present)
1:
	stmia	r0, {r1, r2, r3, r12}	@ save FPEXC, FPSCR, FPINST, FPINST2
	mov	pc, lr
ENDPROC(vfp_save_state)

	@ Literal word holding the address of vfp_current_hw_state.
	@ vfp_support_entry loads it with a plain label-relative ldr and
	@ then indexes the table it points to by CPU number.
	.align
vfp_current_hw_state_address:
	.word	vfp_current_hw_state

	@ tbl_branch base, tmp, shift
	@
	@ Computed branch into the table of fixed-size entries that
	@ immediately follows the macro expansion.  The target is
	@ (address just after the expansion) + (base << shift).
	@
	@  base  = register holding the entry index
	@  tmp   = scratch register, only written in the Thumb-2 build
	@  shift = log2 of the entry size, written as an immediate
	.macro	tbl_branch, base, tmp, shift
#ifdef CONFIG_THUMB2_KERNEL
	adr	\tmp, 1f		@ address of the first table entry
	add	\tmp, \tmp, \base, lsl \shift
	mov	pc, \tmp
#else
	@ In ARM state pc reads as this instruction + 8, which is the
	@ address just past the filler below, i.e. table entry 0.
	add	pc, pc, \base, lsl \shift
	mov	r0, r0			@ filler occupying the skipped slot
#endif
1:
	.endm

@ vfp_get_float - read one single-precision VFP register.
@
@  r0 = register index on entry, register contents on return
@  r3 = scratch (used by tbl_branch in the Thumb-2 build)
@
@ Dispatches through a table of 32 entries, two per .irp iteration.
@ Every entry is padded to 8 bytes with .org so that it matches the
@ index << 3 scaling requested from tbl_branch.  Returns through lr.
ENTRY(vfp_get_float)
	tbl_branch r0, r3, #3
	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
1:	mrc	p10, 0, r0, c\dr, c0, 0	@ fmrs	r0, s(2*dr)
	mov	pc, lr
	.org	1b + 8			@ pad the entry to 8 bytes
1:	mrc	p10, 0, r0, c\dr, c0, 4	@ fmrs	r0, s(2*dr + 1)
	mov	pc, lr
	.org	1b + 8			@ pad the entry to 8 bytes
	.endr
ENDPROC(vfp_get_float)

@ vfp_put_float - write one single-precision VFP register.
@
@  r0 = value to write
@  r1 = register index
@  r3 = scratch (used by tbl_branch in the Thumb-2 build)
@
@ Dispatches through a table of 32 entries, two per .irp iteration.
@ Every entry is padded to 8 bytes with .org so that it matches the
@ index << 3 scaling requested from tbl_branch.  Returns through lr.
ENTRY(vfp_put_float)
	tbl_branch r1, r3, #3
	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
1:	mcr	p10, 0, r0, c\dr, c0, 0	@ fmsr	s(2*dr), r0
	mov	pc, lr
	.org	1b + 8			@ pad the entry to 8 bytes
1:	mcr	p10, 0, r0, c\dr, c0, 4	@ fmsr	s(2*dr + 1), r0
	mov	pc, lr
	.org	1b + 8			@ pad the entry to 8 bytes
	.endr
ENDPROC(vfp_put_float)

@ vfp_get_double - read one double-precision VFP register.
@
@  r0 = register index on entry
@  r3 = scratch (used by tbl_branch in the Thumb-2 build)
@  Returns the two halves of the register in r0 and r1.
@
@ Dispatches through a table of 8-byte entries: 16 entries for
@ d0-d15, followed by 16 more for d16-d31 when VFPv3 support is
@ configured.  The index one past the last real register falls
@ through to the tail, which returns zero in both r0 and r1.
@ Returns through lr.
ENTRY(vfp_get_double)
	tbl_branch r0, r3, #3
	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
1:	fmrrd	r0, r1, d\dr
	mov	pc, lr
	.org	1b + 8			@ pad the entry to 8 bytes
	.endr
#ifdef CONFIG_VFPv3
	@ d16 - d31 registers
	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
1:	mrrc	p11, 3, r0, r1, c\dr	@ fmrrd	r0, r1, d(16 + dr)
	mov	pc, lr
	.org	1b + 8			@ pad the entry to 8 bytes
	.endr
#endif

	@ virtual register 16 (or 32 if VFPv3) for compare with zero
	mov	r0, #0
	mov	r1, #0
	mov	pc, lr
ENDPROC(vfp_get_double)

@ vfp_put_double - write one double-precision VFP register.
@
@  r0, r1 = the two halves of the value to write
@  r2     = register index
@  r3     = scratch (used by tbl_branch in the Thumb-2 build)
@
@ Dispatches through a table of 8-byte entries: 16 entries for
@ d0-d15, followed by 16 more for d16-d31 when VFPv3 support is
@ configured.  There is no entry after the table, so the index must
@ name a real register.  Returns through lr.
ENTRY(vfp_put_double)
	tbl_branch r2, r3, #3
	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
1:	fmdrr	d\dr, r0, r1
	mov	pc, lr
	.org	1b + 8			@ pad the entry to 8 bytes
	.endr
#ifdef CONFIG_VFPv3
	@ d16 - d31 registers
	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
1:	mcrr	p11, 3, r0, r1, c\dr	@ fmdrr	d(16 + dr), r0, r1
	mov	pc, lr
	.org	1b + 8			@ pad the entry to 8 bytes
	.endr
#endif
ENDPROC(vfp_put_double)