| /* SPDX-License-Identifier: GPL-2.0-or-later */ |
| /* |
| NetWinder Floating Point Emulator |
| (c) Rebel.COM, 1998 |
| (c) 1998, 1999 Philip Blundell |
| |
| Direct questions, comments to Scott Bambrough <scottb@netwinder.org> |
| |
| */ |
| #include <linux/linkage.h> |
| #include <asm/assembler.h> |
| #include <asm/opcodes.h> |
| |
| /* This is the kernel's entry point into the floating point emulator. |
| It is called from the kernel with code similar to this: |
| |
| sub r4, r5, #4 |
| ldrt r0, [r4] @ r0 = instruction |
| adrsvc al, r9, ret_from_exception @ r9 = normal FP return |
| adrsvc al, lr, fpundefinstr @ lr = undefined instr return |
| |
| get_current_task r10 |
| mov r8, #1 |
| strb r8, [r10, #TSK_USED_MATH] @ set current->used_math |
| add r10, r10, #TSS_FPESAVE @ r10 = workspace |
| ldr r4, .LC2 |
| ldr pc, [r4] @ Call FP emulator entry point |
| |
| The kernel expects the emulator to return via one of two possible |
| points of return it passes to the emulator. The emulator, if |
| successful in its emulation, jumps to ret_from_exception (passed in |
| r9) and the kernel takes care of returning control from the trap to |
| the user code. If the emulator is unable to emulate the instruction, |
| it returns via _fpundefinstr (passed via lr) and the kernel halts the |
| user program with a core dump. |
| |
| On entry to the emulator r10 points to an area of private FP workspace |
| reserved in the thread structure for this process. This is where the |
| emulator saves its registers across calls. The first word of this area |
| is used as a flag to detect the first time a process uses floating point, |
| so that the emulator startup cost can be avoided for tasks that don't |
| want it. |
| |
| This routine does three things: |
| |
| 1) The kernel has created a struct pt_regs on the stack and saved the |
| user registers into it. See /usr/include/asm/proc/ptrace.h for details. |
| |
| 2) It calls EmulateAll to emulate a floating point instruction. |
| EmulateAll returns 1 if the emulation was successful, or 0 if not. |
| |
| 3) If an instruction has been emulated successfully, it looks ahead at |
| the next instruction. If it is a floating point instruction, it |
| executes the instruction, without returning to user space. In this |
| way it repeatedly looks ahead and executes floating point instructions |
| until it encounters a non floating point instruction, at which time it |
| returns via _fpreturn. |
| |
| This is done to reduce the effect of the trap overhead on each |
| floating point instructions. GCC attempts to group floating point |
| instructions to allow the emulator to spread the cost of the trap over |
| several floating point instructions. */ |
| |
| #include <asm/asm-offsets.h> |
| |
| .globl nwfpe_enter |
| nwfpe_enter: |
| mov r4, lr @ save the failure-return addresses |
| mov sl, sp @ we access the registers via 'sl' |
| |
| ldr r5, [sp, #S_PC] @ get contents of PC; |
| mov r6, r0 @ save the opcode |
| emulate: |
| ldr r1, [sp, #S_PSR] @ fetch the PSR |
| bl arm_check_condition @ check the condition |
| cmp r0, #ARM_OPCODE_CONDTEST_PASS @ condition passed? |
| |
| @ if condition code failed to match, next insn |
| bne next @ get the next instruction; |
| |
| mov r0, r6 @ prepare for EmulateAll() |
| bl EmulateAll @ emulate the instruction |
| cmp r0, #0 @ was emulation successful |
| reteq r4 @ no, return failure |
| |
| next: |
| uaccess_enable r3 |
| .Lx1: ldrt r6, [r5], #4 @ get the next instruction and |
| @ increment PC |
| uaccess_disable r3 |
| and r2, r6, #0x0F000000 @ test for FP insns |
| teq r2, #0x0C000000 |
| teqne r2, #0x0D000000 |
| teqne r2, #0x0E000000 |
| retne r9 @ return ok if not a fp insn |
| |
| str r5, [sp, #S_PC] @ update PC copy in regs |
| |
| mov r0, r6 @ save a copy |
| b emulate @ check condition and emulate |
| |
| @ We need to be prepared for the instructions at .Lx1 and .Lx2 |
| @ to fault. Emit the appropriate exception gunk to fix things up. |
| @ ??? For some reason, faults can happen at .Lx2 even with a |
| @ plain LDR instruction. Weird, but it seems harmless. |
| .pushsection .text.fixup,"ax" |
| .align 2 |
| .Lrep: str r4, [sp, #S_PC] @ retry current instruction |
| .Lfix: ret r9 @ let the user eat segfaults |
| .popsection |
| |
| .pushsection __ex_table,"a" |
| .align 3 |
| .long .Lx1, .Lfix |
| .popsection |
| |
| @ |
| @ Check whether the instruction is a co-processor instruction. |
| @ If yes, we need to call the relevant co-processor handler. |
| @ Only FPE instructions are dispatched here, everything else |
| @ is handled by undef hooks. |
| @ |
| @ Emulators may wish to make use of the following registers: |
| @ r4 = PC value to resume execution after successful emulation |
| @ r9 = normal "successful" return address |
| @ lr = unrecognised instruction return address |
| @ IRQs enabled, FIQs enabled. |
| @ |
| ENTRY(call_fpe) |
| mov r2, r4 |
| sub r4, r4, #4 @ ARM instruction at user PC - 4 |
| USERL( .Lrep, ldrt r0, [r4]) @ load opcode from user space |
| ARM_BE8(rev r0, r0) @ little endian instruction |
| |
| uaccess_disable ip |
| |
| get_thread_info r10 @ get current thread |
| tst r0, #0x08000000 @ only CDP/CPRT/LDC/STC have bit 27 |
| reteq lr |
| and r8, r0, #0x00000f00 @ mask out CP number |
| #ifdef CONFIG_IWMMXT |
| @ Test if we need to give access to iWMMXt coprocessors |
| ldr r5, [r10, #TI_FLAGS] |
| rsbs r7, r8, #(1 << 8) @ CP 0 or 1 only |
| movscs r7, r5, lsr #(TIF_USING_IWMMXT + 1) |
| movcs r0, sp @ pass struct pt_regs |
| bcs iwmmxt_task_enable |
| #endif |
| add pc, pc, r8, lsr #6 |
| nop |
| |
| ret lr @ CP#0 |
| b do_fpe @ CP#1 (FPE) |
| b do_fpe @ CP#2 (FPE) |
| ret lr @ CP#3 |
| ret lr @ CP#4 |
| ret lr @ CP#5 |
| ret lr @ CP#6 |
| ret lr @ CP#7 |
| ret lr @ CP#8 |
| ret lr @ CP#9 |
| ret lr @ CP#10 (VFP) |
| ret lr @ CP#11 (VFP) |
| ret lr @ CP#12 |
| ret lr @ CP#13 |
| ret lr @ CP#14 (Debug) |
| ret lr @ CP#15 (Control) |
| |
| do_fpe: |
| add r10, r10, #TI_FPSTATE @ r10 = workspace |
| ldr_va pc, fp_enter, tmp=r4 @ Call FP module USR entry point |
| |
| @ |
| @ The FP module is called with these registers set: |
| @ r0 = instruction |
| @ r2 = PC+4 |
| @ r9 = normal "successful" return address |
| @ r10 = FP workspace |
| @ lr = unrecognised FP instruction return address |
| @ |
| |
| .pushsection .data |
| .align 2 |
| ENTRY(fp_enter) |
| .word no_fp |
| .popsection |
| |
| no_fp: |
| ret lr |
| ENDPROC(no_fp) |