summary refs log tree commit diff
path: root/mpn/arm/addmul_1.S
diff options
context:
space:
mode:
Diffstat (limited to 'mpn/arm/addmul_1.S')
-rw-r--r-- mpn/arm/addmul_1.S 99
1 files changed, 45 insertions, 54 deletions
diff --git a/mpn/arm/addmul_1.S b/mpn/arm/addmul_1.S
index e9b878eaa..f4316df33 100644
--- a/mpn/arm/addmul_1.S
+++ b/mpn/arm/addmul_1.S
@@ -20,14 +20,14 @@
@ along with the GNU MP Library; see the file COPYING.LIB. If not, write to
@ the Free Software Foundation, Inc., 59 Temple Place - Suite 330, Boston,
@ MA 02111-1307, USA.
-
+
#define p r0
#define a r1
#define n r2
#define w r3
-#define sl r10 /* Do not use, reserved for PIC. */
-#define fp r11
+#define z r11 /* loaded with 0 at function entry; serves as the zero operand of the adc instructions */
+
#define ip r12
#define sp r13
#define lr r14
@@ -38,61 +38,52 @@
.global __gmpn_addmul_1
.type __gmpn_addmul_1,%function
__gmpn_addmul_1:
- stmfd sp!, { r7, r8, r9, lr }
- mov lr, #0
+ stmfd sp!, { r8-r11, lr } /* routine adds a[i]*w into p[i] for n 32-bit limbs; save r8-r11 and lr, popped again at return */
+ mov z, #0 /* z stays 0 for the whole routine; "adc rX, z, #0" then yields just the carry flag */
+ mov ip, #0 /* ip = carry limb passed from one limb to the next, initially 0 */
movs n, n, lsr #1
- bcc Lskip1
- ldmia a!, { lr }
- umull ip, lr, w, lr
- ldmia p, { r9 }
- adds r9, r9, ip
- adc lr, lr, #0
- stmia p!, { r9 }
-Lskip1:
+ bcc skip1 /* bit 0 of n (just shifted out into C) is clear: no single leftover limb */
+ ldr lr, [a], #4 /* lr = a[0], then a += 4 */
+ ldr r9, [p] /* r9 = p[0] */
+ umlal r9, ip, w, lr /* ip:r9 += w * lr (64-bit accumulate, ip is the high word) */
+ str r9, [p], #4 /* store the low word, then p += 4; the high word stays in ip as carry limb */
+skip1:
movs n, n, lsr #1
- bcc Lskip2
- mov r7, lr
+ bcc skip2 /* bit 1 of the original n is clear: no leftover pair of limbs */
+ ldmia p, { r9, r10 } /* r9, r10 = p[0], p[1]; p is not advanced here */
+ adds r8, ip, r9 /* r8 = carry limb + p[0], C set on wrap-around */
+ adc r9, z, #0 /* r9 = C, i.e. the high word of that sum */
ldmia a!, { ip, lr }
- umull r8, r9, w, ip
- umull ip, lr, w, lr
- adds r7, r7, r8
- adcs r8, r9, ip
- adc lr, lr, #0
- ldmia p, { r9, ip }
- adds r7, r7, r9
- adcs r8, r8, ip
- adc lr, lr, #0
- stmia p!, { r7, r8 }
-Lskip2:
+ umlal r8, r9, w, ip /* r9:r8 += w * first limb loaded from a; r8 is the finished low result limb */
+ adds r9, r9, r10 /* fold p[1] into the carried-over high word */
+ adc ip, z, #0 /* ip = C from that add */
+ umlal r9, ip, w, lr /* ip:r9 += w * second limb loaded from a; ip is the new carry limb */
+ stmia p!, { r8, r9 } /* store both result limbs, p += 8 */
+skip2:
teq n, #0
- beq Lreturn
- stmfd sp!, { r5, r6 }
-LLoop:
- mov r5, lr
- ldmia a!, { r8, r9, ip, lr }
- umull r6, r7, w, r8
- umull r8, r9, w, r9
+ beq return /* n has been shifted right twice, so it now counts 4-limb groups; none left */
+ stmfd sp!, { r4-r7 } /* the 4-limb loop additionally uses r4-r7 */
+addmul_loop:
+ ldmia p, { r5, r6, r7, r8 } /* r5..r8 = p[0..3]; p is not advanced here */
+ adds r4, ip, r5 /* r4 = carry limb + p[0] */
+ adc r5, z, #0 /* r5 = C from that add */
+ ldmia a!, { r9, r10, ip, lr } /* r9, r10, ip, lr = a[0..3], a += 16; the old carry in ip was already consumed above */
+ umlal r4, r5, w, r9 /* r5:r4 += w * a[0] */
adds r5, r5, r6
- adcs r6, r7, r8
- adc r7, r9, #0
- umull r8, r9, w, ip
- umull ip, lr, w, lr
+ adc r6, z, #0 /* r6 = C from adding p[1] into r5 */
+ umlal r5, r6, w, r10 /* r6:r5 += w * a[1] */
+ adds r6, r6, r7 /* fold p[2] into the carried-over high word */
+ adc r7, z, #0 /* r7 = C from that add */
+ umlal r6, r7, w, ip /* r7:r6 += w * a[2] */
adds r7, r7, r8
- adcs r8, r9, ip
- adc lr, lr, #0
- ldmia p!, { r9, ip }
- adds r5, r5, r9
- adcs r6, r6, ip
- ldmia p!, { r9, ip }
- adcs r7, r7, r9
- adcs r8, r8, ip
- adc lr, lr, #0
- stmdb p, { r5, r6, r7, r8 }
+ adc ip, z, #0 /* ip = C from adding p[3] into r7 */
+ umlal r7, ip, w, lr /* ip:r7 += w * a[3]; ip is the carry limb for the next iteration */
subs n, n, #1
- bne LLoop
- ldmfd sp!, { r5, r6 }
-Lreturn:
- mov r0, lr
- ldmfd sp!, { r7, r8, r9, pc }^
-Lend:
- .size __gmpn_addmul_1, Lend - __gmpn_addmul_1
+ stmia p!, { r4, r5, r6, r7 } /* store four result limbs, p += 16; stmia does not alter the flags set by subs */
+ bne addmul_loop /* repeat while the group count is non-zero */
+ ldmfd sp!, { r4-r7 } /* restore the registers saved before the loop */
+return:
+ mov r0, ip /* r0 = final carry limb (r0 is the result register in the ARM procedure call standard) */
+ ldmfd sp!, { r8-r11, pc } /* restore r8-r11 and return by popping the saved lr into pc */
+end:
+ .size __gmpn_addmul_1, end - __gmpn_addmul_1