Thomas Gleixner | d2912cb | 2019-06-04 10:11:33 +0200 | [diff] [blame] | 1 | /* SPDX-License-Identifier: GPL-2.0-only */ |
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 2 | /* |
| 3 | * linux/arch/arm/lib/memmove.S |
| 4 | * |
| 5 | * Author: Nicolas Pitre |
| 6 | * Created: Sep 28, 2005 |
| 7 | * Copyright: (C) MontaVista Software Inc. |
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 8 | */ |
| 9 | |
| 10 | #include <linux/linkage.h> |
| 11 | #include <asm/assembler.h> |
Lin Yongting | 207a6cb | 2014-11-26 14:36:15 +0100 | [diff] [blame] | 12 | #include <asm/unwind.h> |
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 13 | |
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 14 | .text |
| 15 | |
| 16 | /* |
| 17 | * Prototype: void *memmove(void *dest, const void *src, size_t n); |
| 18 | * |
| 19 | * Note: |
| 20 | * |
| 21 | * If the memory regions don't overlap, we simply branch to memcpy which is |
| 22 | * normally a bit faster. Otherwise the copy is done going downwards. This |
| 23 | * is a transposition of the code from copy_template.S but with the copy |
| 24 | * occurring in the opposite direction. |
| 25 | */ |
| 26 | |
Linus Walleij | d6d51a9 | 2020-10-25 23:52:08 +0100 | [diff] [blame] | 27 | ENTRY(__memmove)
Fangrui Song | 735e8d9 | 2020-11-06 21:46:11 +0100 | [diff] [blame] | 28 | WEAK(memmove)
Lin Yongting | 207a6cb | 2014-11-26 14:36:15 +0100 | [diff] [blame] | 29 | UNWIND( .fnstart ) |
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 30 | |
/*
 * Register use, following the prototype comment above: r0 = dest,
 * r1 = src, r2 = n (NOTE(review): assumes the standard ARM argument
 * registers -- confirm).
 *
 * ip = dest - src.  When dest <= src (unsigned) the cmphi is skipped and
 * the LS condition already holds; otherwise LS holds when n <= dest - src.
 * In both cases the whole job is handed to __memcpy.  Only the case
 * dest > src with n > dest - src falls through to the downward copy.
 */
| 31 | subs ip, r0, r1
| 32 | cmphi r2, ip
Linus Walleij | d6d51a9 | 2020-10-25 23:52:08 +0100 | [diff] [blame] | 33 | bls __memcpy
Lin Yongting | 207a6cb | 2014-11-26 14:36:15 +0100 | [diff] [blame] | 34 | UNWIND( .fnend ) |
| 35 | |
| 36 | UNWIND( .fnstart ) |
/*
 * Push r0 (still the caller's dest), r4 and lr.  The exit path at label 8
 * pops the same set with pc in place of lr, so the function returns with
 * the r0 it was entered with.  fpreg is only part of the list when
 * UNWIND() expands its argument (macro defined outside this file).
 */
Ard Biesheuvel | ccb8160 | 2021-10-04 11:29:11 +0200 | [diff] [blame] | 37 | UNWIND( .save {r0, r4, fpreg, lr} ) |
| 38 | stmfd sp!, {r0, r4, UNWIND(fpreg,) lr} |
| 39 | UNWIND( .setfp fpreg, sp ) |
| 40 | UNWIND( mov fpreg, sp ) |
/*
 * Move both pointers to one past the end of their buffers; everything
 * below copies downwards using pre-decrement addressing.
 * r2 = n - 4: fewer than 4 bytes go straight to the byte tail at 8.
 * Otherwise check the low two bits of dest (-> 9 if set) and then of
 * src (-> 10 if set); ip carries those bits to the target label.
 */
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 41 | add r1, r1, r2
| 42 | add r0, r0, r2
| 43 | subs r2, r2, #4
| 44 | blt 8f
| 45 | ands ip, r0, #3
| 46 | PLD( pld [r1, #-4] ) |
| 47 | bne 9f
| 48 | ands ip, r1, #3
| 49 | bne 10f
| 50 | |
/*
 * 1: both pointers are word aligned.  r2 becomes (bytes remaining - 32).
 * r5, r6, r8 and r9 are saved here and restored at 7.  With fewer than
 * 32 bytes remaining, go to the word ladder at 5.
 */
| 51 | 1: subs r2, r2, #(28)
Ard Biesheuvel | ccb8160 | 2021-10-04 11:29:11 +0200 | [diff] [blame] | 52 | stmfd sp!, {r5, r6, r8, r9}
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 53 | blt 5f
| 54 | |
/*
 * CALGN() lines (macro defined outside this file; presumably only emitted
 * when aligning dest to 32 bytes is wanted -- TODO confirm):
 * ip = dest & 31.  If ip is zero, or ip >= r2, skip to 2.  Otherwise take
 * ip off r2 and jump to (label 6 + 32 - ip), i.e. part-way into the ldr
 * ladder, so that only the last ip / 4 loads (and later stores) run.
 * This assumes every ladder entry is 4 bytes, which the W() wrappers
 * presumably guarantee -- TODO confirm.
 */
Nicolas Pitre | 2239aff | 2008-03-31 12:38:31 -0400 | [diff] [blame] | 55 | CALGN( ands ip, r0, #31 ) |
Stefan Agner | e44fc38 | 2019-02-18 00:57:38 +0100 | [diff] [blame] | 56 | CALGN( sbcsne r4, ip, r2 ) @ C is always set here |
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 57 | CALGN( bcs 2f ) |
| 58 | CALGN( adr r4, 6f ) |
| 59 | CALGN( subs r2, r2, ip ) @ C is set here |
Nicolas Pitre | 4c4925c | 2008-06-11 12:40:13 -0400 | [diff] [blame] | 60 | CALGN( rsb ip, ip, #32 ) |
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 61 | CALGN( add pc, r4, ip ) |
| 62 | |
/*
 * PLD() lines are prefetch hints on the source (macro defined outside
 * this file).  They bias r2 by a further 96, so the loop at 3 stops
 * issuing pld before the data runs out; the "cmn r2, #96 / bge 4b" pair
 * then copies the remaining 32-byte blocks by re-entering at 4, which
 * skips the pld at 3.
 */
| 63 | PLD( pld [r1, #-4] ) |
| 64 | 2: PLD( subs r2, r2, #96 ) |
| 65 | PLD( pld [r1, #-32] ) |
| 66 | PLD( blt 4f ) |
| 67 | PLD( pld [r1, #-64] ) |
| 68 | PLD( pld [r1, #-96] ) |
| 69 | |
/*
 * Block loop: 32 bytes per iteration.  Eight words are loaded from just
 * below r1 and stored just below r0, both with writeback.  The bge tests
 * the flags of the subs; stmdb leaves them untouched.
 */
| 70 | 3: PLD( pld [r1, #-128] ) |
Ard Biesheuvel | ccb8160 | 2021-10-04 11:29:11 +0200 | [diff] [blame] | 71 | 4: ldmdb r1!, {r3, r4, r5, r6, r8, r9, ip, lr}
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 72 | subs r2, r2, #32
Ard Biesheuvel | ccb8160 | 2021-10-04 11:29:11 +0200 | [diff] [blame] | 73 | stmdb r0!, {r3, r4, r5, r6, r8, r9, ip, lr}
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 74 | bge 3b
| 75 | PLD( cmn r2, #96 ) |
| 76 | PLD( bge 4b ) |
| 77 | |
/*
 * 5: fewer than 32 bytes remain.  Every bias applied to r2 so far is a
 * multiple of 32, so r2 & 28 is the number of bytes still to be copied
 * as whole words (0..28).  If it is zero, branch to 7.  Otherwise jump
 * (32 - that count) bytes past label 6 so only the needed ldr entries
 * run; the "add pc, pc, ip" after the loads does the same for the str
 * entries.
 *
 * NOTE(review): both computed jumps depend on the pc read-ahead and on
 * the exact number and size of the instructions that follow them (the
 * "b 7f", nop and W(nop) are padding for this).  Do not insert, remove
 * or reorder instructions between here and label 7.
 */
| 78 | 5: ands ip, r2, #28
| 79 | rsb ip, ip, #32
| 80 | addne pc, pc, ip @ C is always clear here |
| 81 | b 7f
Catalin Marinas | fd522a8 | 2010-03-29 10:29:46 +0100 | [diff] [blame] | 82 | 6: W(nop) |
Catalin Marinas | 8b59278 | 2009-07-24 12:32:57 +0100 | [diff] [blame] | 83 | W(ldr) r3, [r1, #-4]! |
| 84 | W(ldr) r4, [r1, #-4]! |
| 85 | W(ldr) r5, [r1, #-4]! |
| 86 | W(ldr) r6, [r1, #-4]! |
Catalin Marinas | 8b59278 | 2009-07-24 12:32:57 +0100 | [diff] [blame] | 87 | W(ldr) r8, [r1, #-4]! |
Ard Biesheuvel | ccb8160 | 2021-10-04 11:29:11 +0200 | [diff] [blame] | 88 | W(ldr) r9, [r1, #-4]! |
Catalin Marinas | 8b59278 | 2009-07-24 12:32:57 +0100 | [diff] [blame] | 89 | W(ldr) lr, [r1, #-4]! |
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 90 | |
| 91 | add pc, pc, ip
| 92 | nop
Catalin Marinas | fd522a8 | 2010-03-29 10:29:46 +0100 | [diff] [blame] | 93 | W(nop) |
Catalin Marinas | 8b59278 | 2009-07-24 12:32:57 +0100 | [diff] [blame] | 94 | W(str) r3, [r0, #-4]! |
| 95 | W(str) r4, [r0, #-4]! |
| 96 | W(str) r5, [r0, #-4]! |
| 97 | W(str) r6, [r0, #-4]! |
Catalin Marinas | 8b59278 | 2009-07-24 12:32:57 +0100 | [diff] [blame] | 98 | W(str) r8, [r0, #-4]! |
Ard Biesheuvel | ccb8160 | 2021-10-04 11:29:11 +0200 | [diff] [blame] | 99 | W(str) r9, [r0, #-4]! |
Catalin Marinas | 8b59278 | 2009-07-24 12:32:57 +0100 | [diff] [blame] | 100 | W(str) lr, [r0, #-4]! |
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 101 | |
/*
 * Per the C-flag notes on the original lines: C is set when the ladder
 * was entered from the CALGN alignment path (go back to the block loop
 * at 2) and clear when it was entered from 5 (fall through to 7).
 */
| 102 | CALGN( bcs 2b ) |
| 103 | |
/* 7: restore the registers pushed at label 1. */
Ard Biesheuvel | ccb8160 | 2021-10-04 11:29:11 +0200 | [diff] [blame] | 104 | 7: ldmfd sp!, {r5, r6, r8, r9}
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 105 | |
/*
 * 8: byte tail (0-3 bytes).  The shift by 31 leaves bit 0 of r2 in the
 * result (NE when it was set) and bit 1 in the carry: NE copies one byte,
 * CS copies two.  The final ldmfd pops r0 and r4 (and fpreg under
 * UNWIND) and returns by loading the saved lr into pc.
 */
| 106 | 8: movs r2, r2, lsl #31
Stefan Agner | e44fc38 | 2019-02-18 00:57:38 +0100 | [diff] [blame] | 107 | ldrbne r3, [r1, #-1]!
| 108 | ldrbcs r4, [r1, #-1]!
| 109 | ldrbcs ip, [r1, #-1]
| 110 | strbne r3, [r0, #-1]!
| 111 | strbcs r4, [r0, #-1]!
| 112 | strbcs ip, [r0, #-1]
Ard Biesheuvel | ccb8160 | 2021-10-04 11:29:11 +0200 | [diff] [blame] | 113 | ldmfd sp!, {r0, r4, UNWIND(fpreg,) pc}
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 114 | |
/*
 * 9: dest is not word aligned; ip = dest & 3 (1..3).  Copy exactly ip
 * bytes (GT: ip == 3, GE: ip >= 2, unconditional: always one) so that r0
 * becomes word aligned, and take ip off r2.  If r2 goes negative, fewer
 * than 4 bytes remain: finish at 8.  If src is now word aligned too, go
 * to 1; otherwise fall through to 10 with ip = src & 3.
 */
| 115 | 9: cmp ip, #2
Stefan Agner | e44fc38 | 2019-02-18 00:57:38 +0100 | [diff] [blame] | 116 | ldrbgt r3, [r1, #-1]!
| 117 | ldrbge r4, [r1, #-1]!
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 118 | ldrb lr, [r1, #-1]!
Stefan Agner | e44fc38 | 2019-02-18 00:57:38 +0100 | [diff] [blame] | 119 | strbgt r3, [r0, #-1]!
| 120 | strbge r4, [r0, #-1]!
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 121 | subs r2, r2, ip
| 122 | strb lr, [r0, #-1]!
| 123 | blt 8b
| 124 | ands ip, r1, #3
| 125 | beq 1b
| 126 | |
/*
 * 10: dest is word aligned, src is not (ip = src & 3, 1..3).  Round r1
 * down to a word boundary and preload that word into r3.  ip selects one
 * of the three backward_copy_shift expansions that follow the macro
 * definition: 3 falls through (push=8, pull=24), 2 goes to 17
 * (push=16, pull=16), 1 goes to 18 (push=24, pull=8).
 */
| 127 | 10: bic r1, r1, #3
| 128 | cmp ip, #2
| 129 | ldr r3, [r1, #0]
| 130 | beq 17f
| 131 | blt 18f
| 132 | |
| 133 | |
| 134 | .macro backward_copy_shift push pull
/*
 * backward_copy_shift push, pull
 *
 * Downward copy for a word-aligned dest (r0) when src is \pull / 8 bytes
 * past a word boundary.  State on entry, as set up at label 10:
 *   r1 = src pointer rounded down to a word boundary
 *   r3 = the word loaded from that address
 *   r2 = bytes remaining - 4
 * Each stored word is assembled from two neighbouring source words:
 *   (higher word lspush \push) | (next lower word lspull \pull)
 * lspush / lspull are defined outside this file (presumably the
 * endian-dependent shift mnemonics -- TODO confirm).
 *
 * Labels 11-16 are numeric local labels, so every expansion of the macro
 * gets its own set.  The macro exits by branching back to label 8 (the
 * byte tail) in the enclosing function.
 */
| 135 | |
/* r2 = bytes remaining - 32; fewer than 32 bytes: word loop via 14. */
| 136 | subs r2, r2, #28
| 137 | blt 14f
| 138 | |
/*
 * CALGN() lines (macro defined outside this file): ip = dest & 31.  If ip
 * is non-zero and smaller than r2, take ip off r2 and copy those bytes
 * one word at a time at 15 first; the "cmp r2, #0 / bge 11b" after that
 * loop then enters the block loop.  Otherwise fall through to 11.
 */
Nicolas Pitre | 2239aff | 2008-03-31 12:38:31 -0400 | [diff] [blame] | 139 | CALGN( ands ip, r0, #31 ) |
Stefan Agner | e44fc38 | 2019-02-18 00:57:38 +0100 | [diff] [blame] | 140 | CALGN( sbcsne r4, ip, r2 ) @ C is always set here |
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 141 | CALGN( subcc r2, r2, ip ) |
| 142 | CALGN( bcc 15f ) |
| 143 | |
/* 11: save the extra registers used by the block loop (restored after it). */
Ard Biesheuvel | ccb8160 | 2021-10-04 11:29:11 +0200 | [diff] [blame] | 144 | 11: stmfd sp!, {r5, r6, r8 - r10}
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 145 | |
/*
 * PLD() lines are prefetch hints on the source (macro defined outside
 * this file); they bias r2 by a further 96, and "cmn r2, #96 / bge 13b"
 * below copies the remaining blocks by re-entering at 13, skipping the
 * pld at 12.
 */
| 146 | PLD( pld [r1, #-4] ) |
| 147 | PLD( subs r2, r2, #96 ) |
| 148 | PLD( pld [r1, #-32] ) |
| 149 | PLD( blt 13f ) |
| 150 | PLD( pld [r1, #-64] ) |
| 151 | PLD( pld [r1, #-96] ) |
| 152 | |
/*
 * Block loop: 32 bytes per iteration.  Eight source words are loaded by
 * two ldmdb of four (the lowest-numbered register receives the lowest
 * address).  Working from the highest word down, each output word is the
 * current word shifted by \push, ORed with the next lower word shifted by
 * \pull.  r3 is left unmodified as the lowest word loaded, so it feeds
 * the first merge of the next iteration (and of the loop at 15).
 * The bge tests the flags of the subs; nothing in between writes them.
 */
| 153 | 12: PLD( pld [r1, #-128] ) |
Ard Biesheuvel | ccb8160 | 2021-10-04 11:29:11 +0200 | [diff] [blame] | 154 | 13: ldmdb r1!, {r8, r9, r10, ip}
Victor Kamensky | d98b90e | 2014-02-25 08:41:09 +0100 | [diff] [blame] | 155 | mov lr, r3, lspush #\push
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 156 | subs r2, r2, #32
| 157 | ldmdb r1!, {r3, r4, r5, r6}
Victor Kamensky | d98b90e | 2014-02-25 08:41:09 +0100 | [diff] [blame] | 158 | orr lr, lr, ip, lspull #\pull
| 159 | mov ip, ip, lspush #\push
Ard Biesheuvel | ccb8160 | 2021-10-04 11:29:11 +0200 | [diff] [blame] | 160 | orr ip, ip, r10, lspull #\pull
| 161 | mov r10, r10, lspush #\push
| 162 | orr r10, r10, r9, lspull #\pull
Victor Kamensky | d98b90e | 2014-02-25 08:41:09 +0100 | [diff] [blame] | 163 | mov r9, r9, lspush #\push
| 164 | orr r9, r9, r8, lspull #\pull
| 165 | mov r8, r8, lspush #\push
Ard Biesheuvel | ccb8160 | 2021-10-04 11:29:11 +0200 | [diff] [blame] | 166 | orr r8, r8, r6, lspull #\pull
Victor Kamensky | d98b90e | 2014-02-25 08:41:09 +0100 | [diff] [blame] | 167 | mov r6, r6, lspush #\push
| 168 | orr r6, r6, r5, lspull #\pull
| 169 | mov r5, r5, lspush #\push
| 170 | orr r5, r5, r4, lspull #\pull
| 171 | mov r4, r4, lspush #\push
| 172 | orr r4, r4, r3, lspull #\pull
Ard Biesheuvel | ccb8160 | 2021-10-04 11:29:11 +0200 | [diff] [blame] | 173 | stmdb r0!, {r4 - r6, r8 - r10, ip, lr}
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 174 | bge 12b
| 175 | PLD( cmn r2, #96 ) |
| 176 | PLD( bge 13b ) |
| 177 | |
/* Block loop finished: restore the registers pushed at 11. */
Ard Biesheuvel | ccb8160 | 2021-10-04 11:29:11 +0200 | [diff] [blame] | 178 | ldmfd sp!, {r5, r6, r8 - r10}
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 179 | |
/*
 * 14: ip = number of bytes still to be copied as whole words (r2 & 28);
 * none left -> 16.
 */
| 180 | 14: ands ip, r2, #28
| 181 | beq 16f
| 182 | |
/*
 * 15: one word per iteration, using only r3, lr and ip: merge the carried
 * word in r3 with the next lower source word, store it, and count ip down
 * by 4 until it reaches zero.
 */
Victor Kamensky | d98b90e | 2014-02-25 08:41:09 +0100 | [diff] [blame] | 183 | 15: mov lr, r3, lspush #\push
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 184 | ldr r3, [r1, #-4]!
| 185 | subs ip, ip, #4
Victor Kamensky | d98b90e | 2014-02-25 08:41:09 +0100 | [diff] [blame] | 186 | orr lr, lr, r3, lspull #\pull
Nicolas Pitre | 7549423 | 2005-11-01 19:52:23 +0000 | [diff] [blame] | 187 | str lr, [r0, #-4]!
| 188 | bgt 15b
| 189 | CALGN( cmp r2, #0 ) |
| 190 | CALGN( bge 11b ) |
| 191 | |
/*
 * 16: r1 was rounded down by (src & 3) == \pull / 8 bytes at label 10;
 * add that back so r1 is a true byte pointer again, then let the byte
 * tail at 8 copy the last 0-3 bytes and return.
 */
| 192 | 16: add r1, r1, #(\pull / 8)
| 193 | b 8b
| 194 | |
| 195 | .endm
| 196 | |
| 197 | |
| 198 | backward_copy_shift push=8 pull=24
/*
 * Three expansions of backward_copy_shift, one per source misalignment.
 * Label 10 dispatches on src & 3: the expansion above (push=8, pull=24)
 * is reached by fall-through when it is 3, label 17 (push=16, pull=16)
 * when it is 2, and label 18 (push=24, pull=8) when it is 1.  In every
 * case pull / 8 equals src & 3.  Each expansion ends with "b 8b", so
 * control never falls from one expansion into the next.
 */
| 199 | |
| 200 | 17: backward_copy_shift push=16 pull=16
| 201 | |
| 202 | 18: backward_copy_shift push=24 pull=8
| 203 | |
Ard Biesheuvel | ccb8160 | 2021-10-04 11:29:11 +0200 | [diff] [blame] | 204 | UNWIND( .fnend ) |
Catalin Marinas | 93ed397 | 2008-08-28 11:22:32 +0100 | [diff] [blame] | 205 | ENDPROC(memmove)
Linus Walleij | d6d51a9 | 2020-10-25 23:52:08 +0100 | [diff] [blame] | 206 | ENDPROC(__memmove)