324 lines
		
	
	
		
			8.7 KiB
		
	
	
	
		
			ArmAsm
		
	
	
	
	
	
			
		
		
	
	
			324 lines
		
	
	
		
			8.7 KiB
		
	
	
	
		
			ArmAsm
		
	
	
	
	
	
| /*
 | |
|  *  linux/arch/arm/vfp/vfphw.S
 | |
|  *
 | |
|  *  Copyright (C) 2004 ARM Limited.
 | |
|  *  Written by Deep Blue Solutions Limited.
 | |
|  *
 | |
|  * This program is free software; you can redistribute it and/or modify
 | |
|  * it under the terms of the GNU General Public License version 2 as
 | |
|  * published by the Free Software Foundation.
 | |
|  *
 | |
|  * This code is called from the kernel's undefined instruction trap.
 | |
|  * r9 holds the return address for successful handling.
 | |
|  * lr holds the return address for unrecognised instructions.
 | |
|  * r10 points at the start of the private FP workspace in the thread structure
 | |
|  * sp points to a struct pt_regs (as defined in include/asm/proc/ptrace.h)
 | |
|  */
 | |
| #include <linux/init.h>
 | |
| #include <linux/linkage.h>
 | |
| #include <asm/thread_info.h>
 | |
| #include <asm/vfpmacros.h>
 | |
| #include <linux/kern_levels.h>
 | |
| #include <asm/assembler.h>
 | |
| #include <asm/asm-offsets.h>
 | |
| 
 | |
| 	.macro	DBGSTR, str		@ DEBUG builds only: printk the fixed message VFP: <str>; expands to nothing otherwise
 | |
| #ifdef DEBUG
 | |
| 	stmfd	sp!, {r0-r3, ip, lr}	@ save r0-r3, ip, lr so the expansion leaves them unchanged
 | |
| 	ldr	r0, =1f			@ r0 = address of the format string at label 1 below
 | |
| 	bl	printk
 | |
| 	ldmfd	sp!, {r0-r3, ip, lr}	@ restore everything saved above
 | |
| 
 | |
| 	.pushsection .rodata, "a"	@ place the string in .rodata, not in the instruction stream
 | |
| 1:	.ascii	KERN_DEBUG "VFP: \str\n"
 | |
| 	.byte	0			@ explicit NUL terminator, since .ascii adds none
 | |
| 	.previous			@ switch back to the section that was active before
 | |
| #endif
 | |
| 	.endm
 | |
| 
 | |
| 	.macro  DBGSTR1, str, arg	@ DEBUG builds only: printk VFP: <str> with one register argument
 | |
| #ifdef DEBUG
 | |
| 	stmfd	sp!, {r0-r3, ip, lr}	@ save r0-r3, ip, lr so the expansion leaves them unchanged
 | |
| 	mov	r1, \arg		@ r1 = value for the format specifier in str (read before r0 is replaced)
 | |
| 	ldr	r0, =1f			@ r0 = address of the format string at label 1 below
 | |
| 	bl	printk
 | |
| 	ldmfd	sp!, {r0-r3, ip, lr}	@ restore everything saved above
 | |
| 
 | |
| 	.pushsection .rodata, "a"	@ place the string in .rodata, not in the instruction stream
 | |
| 1:	.ascii	KERN_DEBUG "VFP: \str\n"
 | |
| 	.byte	0			@ explicit NUL terminator, since .ascii adds none
 | |
| 	.previous			@ switch back to the section that was active before
 | |
| #endif
 | |
| 	.endm
 | |
| 
 | |
| 	.macro  DBGSTR3, str, arg1, arg2, arg3	@ DEBUG builds only: printk VFP: <str> with three register arguments
 | |
| #ifdef DEBUG
 | |
| 	stmfd	sp!, {r0-r3, ip, lr}	@ save r0-r3, ip, lr so the expansion leaves them unchanged
 | |
| 	mov	r3, \arg3		@ arguments are loaded in the order r3, r2, r1, so an arg2 held in r3,
 | |
| 	mov	r2, \arg2		@ or an arg1 held in r2 or r3, would be overwritten before it is read;
 | |
| 	mov	r1, \arg1		@ the one use in this file passes r0, r2, r10, which is safe
 | |
| 	ldr	r0, =1f			@ r0 = address of the format string at label 1 below
 | |
| 	bl	printk
 | |
| 	ldmfd	sp!, {r0-r3, ip, lr}	@ restore everything saved above
 | |
| 
 | |
| 	.pushsection .rodata, "a"	@ place the string in .rodata, not in the instruction stream
 | |
| 1:	.ascii	KERN_DEBUG "VFP: \str\n"
 | |
| 	.byte	0			@ explicit NUL terminator, since .ascii adds none
 | |
| 	.previous			@ switch back to the section that was active before
 | |
| #endif
 | |
| 	.endm
 | |
| 
 | |
| 
 | |
| @ VFP hardware support entry point.
 | |
| @ On entry:
 | |
| @  r0  = instruction opcode (32-bit ARM or two 16-bit Thumb)
 | |
| @  r2  = PC value to resume execution after successful emulation
 | |
| @  r9  = normal "successful" return address
 | |
| @  r10 = vfp_state union
 | |
| @  r11 = CPU number (used below to index vfp_current_hw_state)
 | |
| @  lr  = unrecognised instruction return address
 | |
| @  IRQs enabled.
 | |
| ENTRY(vfp_support_entry)	@ leaves via ret r9, ret lr, or a branch to VFP_bounce or vfp_kmode_exception
 | |
| 	DBGSTR3	"instr %08x pc %08x state %p", r0, r2, r10
 | |
| 
 | |
| 	ldr	r3, [sp, #S_PSR]	@ Neither lazy restore nor FP exceptions
 | |
| 	and	r3, r3, #MODE_MASK	@ are supported in kernel mode
 | |
| 	teq	r3, #USR_MODE
 | |
| 	bne	vfp_kmode_exception	@ Returns through lr
 | |
| 
 | |
| 	VFPFMRX	r1, FPEXC		@ Is the VFP enabled?
 | |
| 	DBGSTR1	"fpexc %08x", r1
 | |
| 	tst	r1, #FPEXC_EN
 | |
| 	bne	look_for_VFP_exceptions	@ VFP is already enabled
 | |
| 
 | |
| 	DBGSTR1 "enable %x", r10	@ NOTE(review): r10 is printed with %p by the other debug messages here
 | |
| 	ldr	r3, vfp_current_hw_state_address	@ r3 = address of vfp_current_hw_state (literal later in this file)
 | |
| 	orr	r1, r1, #FPEXC_EN	@ user FPEXC has the enable bit set
 | |
| 	ldr	r4, [r3, r11, lsl #2]	@ r4 = vfp_current_hw_state entry for CPU r11 (4-byte entries)
 | |
| 	bic	r5, r1, #FPEXC_EX	@ make sure exceptions are disabled
 | |
| 	cmp	r4, r10			@ this thread owns the hw context?
 | |
| #ifndef CONFIG_SMP
 | |
| 	@ For UP, checking that this thread owns the hw context is
 | |
| 	@ sufficient to determine that the hardware state is valid.
 | |
| 	beq	vfp_hw_state_valid
 | |
| 
 | |
| 	@ On UP, we lazily save the VFP context.  As a different
 | |
| 	@ thread wants ownership of the VFP hardware, save the old
 | |
| 	@ state if there was a previous (valid) owner.
 | |
| 
 | |
| 	VFPFMXR	FPEXC, r5		@ enable VFP, disable any pending
 | |
| 					@ exceptions, so we can get at the
 | |
| 					@ rest of it
 | |
| 
 | |
| 	DBGSTR1	"save old state %p", r4
 | |
| 	cmp	r4, #0			@ if the vfp_current_hw_state is NULL
 | |
| 	beq	vfp_reload_hw		@ then the hw state needs reloading
 | |
| 	VFPFSTMIA r4, r5		@ save the working registers (presumably advances r4 past them, r5 as scratch; confirm in asm/vfpmacros.h)
 | |
| 	VFPFMRX	r5, FPSCR		@ current status
 | |
| #ifndef CONFIG_CPU_FEROCEON
 | |
| 	tst	r1, #FPEXC_EX		@ is there additional state to save?
 | |
| 	beq	1f
 | |
| 	VFPFMRX	r6, FPINST		@ FPINST (only if FPEXC.EX is set)
 | |
| 	tst	r1, #FPEXC_FP2V		@ is there an FPINST2 to read?
 | |
| 	beq	1f
 | |
| 	VFPFMRX	r8, FPINST2		@ FPINST2 if needed (and present)
 | |
| 1:				@ r6/r8 keep their incoming values if the reads above were skipped
 | |
| #endif
 | |
| 	stmia	r4, {r1, r5, r6, r8}	@ save FPEXC, FPSCR, FPINST, FPINST2
 | |
| vfp_reload_hw:			@ UP variant of this label: FPEXC has already been written above
 | |
| 
 | |
| #else
 | |
| 	@ For SMP, if this thread does not own the hw context, then we
 | |
| 	@ need to reload it.  No need to save the old state as on SMP,
 | |
| 	@ we always save the state when we switch away from a thread.
 | |
| 	bne	vfp_reload_hw
 | |
| 
 | |
| 	@ This thread has ownership of the current hardware context.
 | |
| 	@ However, it may have been migrated to another CPU, in which
 | |
| 	@ case the saved state is newer than the hardware context.
 | |
| 	@ Check this by looking at the CPU number which the state was
 | |
| 	@ last loaded onto.
 | |
| 	ldr	ip, [r10, #VFP_CPU]	@ ip = CPU number recorded in this thread state
 | |
| 	teq	ip, r11			@ same as the CPU we are running on?
 | |
| 	beq	vfp_hw_state_valid	@ yes: the hardware copy is current, no reload
 | |
| 
 | |
| vfp_reload_hw:			@ SMP variant of this label
 | |
| 	@ We're loading this threads state into the VFP hardware. Update
 | |
| 	@ the CPU number which contains the most up to date VFP context.
 | |
| 	str	r11, [r10, #VFP_CPU]
 | |
| 
 | |
| 	VFPFMXR	FPEXC, r5		@ enable VFP, disable any pending
 | |
| 					@ exceptions, so we can get at the
 | |
| 					@ rest of it
 | |
| #endif
 | |
| 
 | |
| 	DBGSTR1	"load state %p", r10
 | |
| 	str	r10, [r3, r11, lsl #2]	@ update the vfp_current_hw_state pointer
 | |
| 					@ Load the saved state back into the VFP
 | |
| 	VFPFLDMIA r10, r5		@ reload the working registers while
 | |
| 					@ FPEXC is in a safe state
 | |
| 	ldmia	r10, {r1, r5, r6, r8}	@ load FPEXC, FPSCR, FPINST, FPINST2
 | |
| #ifndef CONFIG_CPU_FEROCEON
 | |
| 	tst	r1, #FPEXC_EX		@ is there additional state to restore?
 | |
| 	beq	1f
 | |
| 	VFPFMXR	FPINST, r6		@ restore FPINST (only if FPEXC.EX is set)
 | |
| 	tst	r1, #FPEXC_FP2V		@ is there an FPINST2 to write?
 | |
| 	beq	1f
 | |
| 	VFPFMXR	FPINST2, r8		@ FPINST2 if needed (and present)
 | |
| 1:
 | |
| #endif
 | |
| 	VFPFMXR	FPSCR, r5		@ restore status
 | |
| 
 | |
| @ The context stored in the VFP hardware is up to date with this thread
 | |
| vfp_hw_state_valid:
 | |
| 	tst	r1, #FPEXC_EX		@ does the FPEXC value in r1 have EX set?
 | |
| 	bne	process_exception	@ might as well handle the pending
 | |
| 					@ exception before retrying; branch
 | |
| 					@ out before setting an FPEXC that
 | |
| 					@ stops us reading stuff
 | |
| 	VFPFMXR	FPEXC, r1		@ Restore FPEXC last
 | |
| 	sub	r2, r2, #4		@ Retry current instruction - if Thumb
 | |
| 	str	r2, [sp, #S_PC]		@ mode it's two 16-bit instructions,
 | |
| 					@ else it's one 32-bit instruction, so
 | |
| 					@ always subtract 4 from the following
 | |
| 					@ instruction address.
 | |
| 	dec_preempt_count_ti r10, r4	@ macro from the included headers; presumably drops a preempt count taken by the caller, using r10/r4 as scratch (confirm)
 | |
| 	ret	r9			@ we think we have handled things
 | |
| 
 | |
| 
 | |
| look_for_VFP_exceptions:
 | |
| 	@ Check for synchronous or asynchronous exception
 | |
| 	tst	r1, #FPEXC_EX | FPEXC_DEX
 | |
| 	bne	process_exception
 | |
| 	@ On some implementations of the VFP subarch 1, setting FPSCR.IXE
 | |
| 	@ causes all the CDP instructions to be bounced synchronously without
 | |
| 	@ setting the FPEXC.EX bit
 | |
| 	VFPFMRX	r5, FPSCR
 | |
| 	tst	r5, #FPSCR_IXE
 | |
| 	bne	process_exception
 | |
| 
 | |
| 	tst	r5, #FPSCR_LENGTH_MASK	@ any FPSCR length bits set? (presumably short-vector mode; confirm)
 | |
| 	beq	skip			@ none set: not treated as a VFP bounce
 | |
| 	orr	r1, r1, #FPEXC_DEX	@ otherwise set DEX in the FPEXC value handed to VFP_bounce
 | |
| 	b	process_exception
 | |
| skip:
 | |
| 
 | |
| 	@ Fall into hand on to next handler - appropriate coproc instr
 | |
| 	@ not recognised by VFP
 | |
| 
 | |
| 	DBGSTR	"not VFP"
 | |
| 	dec_preempt_count_ti r10, r4	@ same macro as on the success path above
 | |
| 	ret	lr			@ lr = unrecognised instruction return address
 | |
| 
 | |
| process_exception:
 | |
| 	DBGSTR	"bounce"
 | |
| 	mov	r2, sp			@ nothing stacked - regdump is at TOS
 | |
| 	mov	lr, r9			@ setup for a return to the user code.
 | |
| 
 | |
| 	@ Now call the C code to package up the bounce to the support code
 | |
| 	@   r0 holds the trigger instruction
 | |
| 	@   r1 holds the FPEXC value
 | |
| 	@   r2 pointer to register dump
 | |
| 	b	VFP_bounce		@ we have handled this - the support
 | |
| 					@ code will raise an exception if
 | |
| 					@ required. If not, the user code will
 | |
| 					@ retry the faulted instruction
 | |
| ENDPROC(vfp_support_entry)
 | |
| 
 | |
| ENTRY(vfp_save_state)
 | |
| 	@ Save the current VFP state and return via lr; r2 is overwritten, r3 and r12 may be
 | |
| 	@ r0 - save location
 | |
| 	@ r1 - FPEXC value to record (tested for EX and FP2V, stored as the first control word)
 | |
| 	DBGSTR1	"save VFP state %p", r0
 | |
| 	VFPFSTMIA r0, r2		@ save the working registers (presumably advances r0 past them, r2 as scratch; confirm in asm/vfpmacros.h)
 | |
| 	VFPFMRX	r2, FPSCR		@ current status
 | |
| 	tst	r1, #FPEXC_EX		@ is there additional state to save?
 | |
| 	beq	1f
 | |
| 	VFPFMRX	r3, FPINST		@ FPINST (only if FPEXC.EX is set)
 | |
| 	tst	r1, #FPEXC_FP2V		@ is there an FPINST2 to read?
 | |
| 	beq	1f
 | |
| 	VFPFMRX	r12, FPINST2		@ FPINST2 if needed (and present)
 | |
| 1:				@ r3/r12 keep their incoming values if the reads above were skipped
 | |
| 	stmia	r0, {r1, r2, r3, r12}	@ save FPEXC, FPSCR, FPINST, FPINST2
 | |
| 	ret	lr
 | |
| ENDPROC(vfp_save_state)
 | |
| 
 | |
| 	.align				@ align the literal that follows
 | |
| vfp_current_hw_state_address:	@ literal loaded by label in vfp_support_entry
 | |
| 	.word	vfp_current_hw_state	@ address of vfp_current_hw_state (symbol not defined in this listing)
 | |
| 
 | |
| 	.macro	tbl_branch, base, tmp, shift	@ computed jump to (label 1 at the end of this macro) + (base << shift)
 | |
| #ifdef CONFIG_THUMB2_KERNEL
 | |
| 	adr	\tmp, 1f		@ tmp = address of label 1; tmp is only written in this variant
 | |
| 	add	\tmp, \tmp, \base, lsl \shift	@ tmp += base << shift
 | |
| 	ret	\tmp			@ jump to the computed address (ret is presumably a macro from the included headers)
 | |
| #else
 | |
| 	add	pc, pc, \base, lsl \shift	@ pc reads as this instruction + 8, which is label 1
 | |
| 	mov	r0, r0			@ no-op filler so that label 1 sits exactly 8 bytes after the add
 | |
| #endif
 | |
| 1:				@ the jump table is whatever the user of the macro places next
 | |
| 	.endm
 | |
| 
 | |
| ENTRY(vfp_get_float)		@ in: r0 = single-precision register index (table has 32 entries); out: r0 = contents of that register
 | |
| 	tbl_branch r0, r3, #3		@ jump to table entry r0; entries are 8 bytes, r3 is the scratch operand
 | |
| 	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15	@ two entries per dr: s(2*dr) then s(2*dr+1)
 | |
| 1:	mrc	p10, 0, r0, c\dr, c0, 0	@ fmrs	r0, s(2*dr)	(s0 when dr = 0)
 | |
| 	ret	lr
 | |
| 	.org	1b + 8			@ pad the entry to exactly 8 bytes, matching the #3 shift
 | |
| 1:	mrc	p10, 0, r0, c\dr, c0, 4	@ fmrs	r0, s(2*dr+1)	(s1 when dr = 0)
 | |
| 	ret	lr
 | |
| 	.org	1b + 8			@ pad the entry to exactly 8 bytes, matching the #3 shift
 | |
| 	.endr
 | |
| ENDPROC(vfp_get_float)
 | |
| 
 | |
| ENTRY(vfp_put_float)		@ in: r0 = value to write, r1 = single-precision register index (table has 32 entries)
 | |
| 	tbl_branch r1, r3, #3		@ jump to table entry r1; entries are 8 bytes, r3 is the scratch operand
 | |
| 	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15	@ two entries per dr: s(2*dr) then s(2*dr+1)
 | |
| 1:	mcr	p10, 0, r0, c\dr, c0, 0	@ fmsr	s(2*dr), r0	(s0 when dr = 0)
 | |
| 	ret	lr
 | |
| 	.org	1b + 8			@ pad the entry to exactly 8 bytes, matching the #3 shift
 | |
| 1:	mcr	p10, 0, r0, c\dr, c0, 4	@ fmsr	s(2*dr+1), r0	(s1 when dr = 0)
 | |
| 	ret	lr
 | |
| 	.org	1b + 8			@ pad the entry to exactly 8 bytes, matching the #3 shift
 | |
| 	.endr
 | |
| ENDPROC(vfp_put_float)
 | |
| 
 | |
| ENTRY(vfp_get_double)		@ in: r0 = double-precision register index; out: r0, r1 = the two words of that register
 | |
| 	tbl_branch r0, r3, #3		@ jump to table entry r0; entries are 8 bytes, r3 is the scratch operand
 | |
| 	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15	@ entries for d0 - d15
 | |
| 1:	fmrrd	r0, r1, d\dr
 | |
| 	ret	lr
 | |
| 	.org	1b + 8			@ pad the entry to exactly 8 bytes, matching the #3 shift
 | |
| 	.endr
 | |
| #ifdef CONFIG_VFPv3
 | |
| 	@ d16 - d31 registers
 | |
| 	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
 | |
| 1:	mrrc	p11, 3, r0, r1, c\dr	@ fmrrd	r0, r1, d(16 + dr), written as a raw coprocessor access
 | |
| 	ret	lr
 | |
| 	.org	1b + 8			@ pad the entry to exactly 8 bytes, matching the #3 shift
 | |
| 	.endr
 | |
| #endif
 | |
| 
 | |
| 	@ virtual register 16 (or 32 if VFPv3) for compare with zero
 | |
| 	mov	r0, #0			@ an index one past the last table entry lands here
 | |
| 	mov	r1, #0			@ and reads back as zero in both words
 | |
| 	ret	lr
 | |
| ENDPROC(vfp_get_double)
 | |
| 
 | |
| ENTRY(vfp_put_double)		@ in: r0, r1 = the two words to write, r2 = double-precision register index
 | |
| 	tbl_branch r2, r3, #3		@ jump to table entry r2; entries are 8 bytes, r3 is the scratch operand
 | |
| 	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15	@ entries for d0 - d15
 | |
| 1:	fmdrr	d\dr, r0, r1
 | |
| 	ret	lr
 | |
| 	.org	1b + 8			@ pad the entry to exactly 8 bytes, matching the #3 shift
 | |
| 	.endr
 | |
| #ifdef CONFIG_VFPv3
 | |
| 	@ d16 - d31 registers
 | |
| 	.irp	dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
 | |
| 1:	mcrr	p11, 3, r0, r1, c\dr	@ fmdrr	d(16 + dr), r0, r1, written as a raw coprocessor access
 | |
| 	ret	lr
 | |
| 	.org	1b + 8			@ NOTE(review): no code follows the table here, unlike vfp_get_double, so callers presumably never pass an index past the last entry
 | |
| 	.endr
 | |
| #endif
 | |
| ENDPROC(vfp_put_double)
 | 
