/*
    NetWinder Floating Point Emulator
    (c) Rebel.COM, 1998
    (c) 1998, 1999 Philip Blundell

    Direct questions, comments to Scott Bambrough <scottb@netwinder.org>

    This program is free software; you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation; either version 2 of the License, or
    (at your option) any later version.

    This program is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You should have received a copy of the GNU General Public License
    along with this program; if not, write to the Free Software
    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
*/

/* This is the kernel's entry point into the floating point emulator.
It is called from the kernel with code similar to this:

	sub	r4, r5, #4
	ldrt	r0, [r4]			@ r0  = instruction
	adrsvc	al, r9, ret_from_exception	@ r9  = normal FP return
	adrsvc	al, lr, fpundefinstr		@ lr  = undefined instr return

	get_current_task r10
	mov	r8, #1
	strb	r8, [r10, #TSK_USED_MATH]	@ set current->used_math
	add	r10, r10, #TSS_FPESAVE		@ r10 = workspace
	ldr	r4, .LC2
	ldr	pc, [r4]			@ Call FP emulator entry point

The kernel expects the emulator to return via one of two possible
points of return it passes to the emulator.  The emulator, if
successful in its emulation, jumps to ret_from_exception (passed in
r9) and the kernel takes care of returning control from the trap to
the user code.  If the emulator is unable to emulate the instruction,
it returns via fpundefinstr (passed in lr) and the kernel halts the
user program with a core dump.

On entry to the emulator r10 points to an area of private FP workspace
reserved in the thread structure for this process.  This is where the
emulator saves its registers across calls.  The first word of this area
is used as a flag to detect the first time a process uses floating point,
so that the emulator startup cost can be avoided for tasks that don't
want it.

This routine does three things:

1) It picks up the user registers.  The kernel has already created a
struct pt_regs on the stack and saved the user registers into it, so
the routine addresses them relative to sp.  See
/usr/include/asm/proc/ptrace.h for details.

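2) It calls EmulateAll to emulate a floating point instruction.
EmulateAll returns 1 if the emulation was successful, or 0 if not.
Before that, checkCondition is called with the opcode and the saved
PSR; an instruction whose condition fails is skipped, not emulated.
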
3) If an instruction has been emulated successfully, it looks ahead at
the next instruction.  If it is a floating point instruction, it
executes the instruction, without returning to user space.  In this
way it repeatedly looks ahead and executes floating point instructions
until it encounters a non floating point instruction, at which time it
returns via the normal FP return address passed in r9.

This is done to reduce the effect of the trap overhead on each
floating point instruction.  GCC attempts to group floating point
instructions to allow the emulator to spread the cost of the trap over
several floating point instructions.  */

#include <asm/asm-offsets.h>

@ nwfpe_enter - entry point of the floating point emulator.
@
@ Register use, as established by the code below:
@   On entry:
@	r0 = opcode of the trapped instruction
@	r9 = address to jump to once there is nothing more to emulate
@	lr = address to jump to if EmulateAll reports failure
@	sp = base of the saved user registers (indexed by S_PC / S_PSR)
@   Inside the loop:
@	r4 = copy of the entry lr (failure return)
@	r5 = user address of the next instruction to look at
@	r6 = opcode currently being handled
@	sl = copy of sp
@
@ r4-r6 and r9 are read again after the calls to checkCondition and
@ EmulateAll, so both callees must leave them intact.
	.globl	nwfpe_enter
nwfpe_enter:
	mov	r4, lr			@ save the failure-return address
	mov	sl, sp			@ we access the registers via 'sl'

	ldr	r5, [sp, #S_PC]		@ r5 = saved user PC
	mov	r6, r0			@ save the opcode

	@ Loop head: r0 = r6 = opcode to handle.
emulate:
	ldr	r1, [sp, #S_PSR]	@ fetch the PSR
	bl	checkCondition		@ checkCondition(opcode, psr)
	cmp	r0, #0			@ r0 = 0 ==> condition failed

	@ if condition code failed to match, skip emulation and
	@ go straight to the look-ahead
	beq	next

	mov	r0, r6			@ prepare for EmulateAll()
	bl	EmulateAll		@ emulate the instruction
	cmp	r0, #0			@ was emulation successful?
	moveq	pc, r4			@ no, return failure

	@ Look-ahead: fetch the following user instruction and keep
	@ going only if it is in the opcode space treated as FP.
next:
.Lx1:	ldrt	r6, [r5], #4		@ unprivileged load of the next
					@ instruction; post-increment r5

	and	r2, r6, #0x0F000000	@ isolate opcode bits 27:24
	teq	r2, #0x0C000000		@ 0xC, 0xD or 0xE ==> FP insn
	teqne	r2, #0x0D000000
	teqne	r2, #0x0E000000
	movne	pc, r9			@ return ok if not a fp insn

	@ Only commit the advanced PC once we know the instruction will
	@ be handled here; on the return above S_PC is left untouched.
	str	r5, [sp, #S_PC]		@ update PC copy in regs

	mov	r0, r6			@ r0 = opcode for checkCondition
	b	emulate			@ check condition and emulate

	@ The user-mode load at .Lx1 may fault.  The __ex_table entry
	@ below pairs .Lx1 with .Lfix as its fixup, and .Lfix returns
	@ through r9 exactly like the "not a fp insn" case.
	@ (Older wording of this note also mentioned a second load,
	@ .Lx2; no .Lx2 label is defined in this routine.)
	.pushsection .fixup,"ax"
	.align	2
.Lfix:	mov	pc, r9			@ let the user eat segfaults
	.popsection

	.pushsection __ex_table,"a"
	.align	3
	.long	.Lx1, .Lfix		@ (faulting insn, fixup) pair
	.popsection