diff options
Diffstat (limited to 'mpn/arm/addmul_1.S')
-rw-r--r-- | mpn/arm/addmul_1.S | 99 |
1 files changed, 45 insertions, 54 deletions
diff --git a/mpn/arm/addmul_1.S b/mpn/arm/addmul_1.S index e9b878eaa..f4316df33 100644 --- a/mpn/arm/addmul_1.S +++ b/mpn/arm/addmul_1.S @@ -20,14 +20,14 @@ @ along with the GNU MP Library; see the file COPYING.LIB. If not, write to @ the Free Software Foundation, Inc., 59 Temple Place - Suite 330, Boston, @ MA 02111-1307, USA. - + #define p r0 #define a r1 #define n r2 #define w r3 -#define sl r10 /* Do not use, reserved for PIC. */ -#define fp r11 +#define z r11 + #define ip r12 #define sp r13 #define lr r14 @@ -38,61 +38,52 @@ .global __gmpn_addmul_1 .type __gmpn_addmul_1,%function __gmpn_addmul_1: - stmfd sp!, { r7, r8, r9, lr } - mov lr, #0 + stmfd sp!, { r8-r11, lr } + mov z, #0 + mov ip, #0 movs n, n, lsr #1 - bcc Lskip1 - ldmia a!, { lr } - umull ip, lr, w, lr - ldmia p, { r9 } - adds r9, r9, ip - adc lr, lr, #0 - stmia p!, { r9 } -Lskip1: + bcc skip1 + ldr lr, [a], #4 + ldr r9, [p] + umlal r9, ip, w, lr + str r9, [p], #4 +skip1: movs n, n, lsr #1 - bcc Lskip2 - mov r7, lr + bcc skip2 + ldmia p, { r9, r10 } + adds r8, ip, r9 + adc r9, z, #0 ldmia a!, { ip, lr } - umull r8, r9, w, ip - umull ip, lr, w, lr - adds r7, r7, r8 - adcs r8, r9, ip - adc lr, lr, #0 - ldmia p, { r9, ip } - adds r7, r7, r9 - adcs r8, r8, ip - adc lr, lr, #0 - stmia p!, { r7, r8 } -Lskip2: + umlal r8, r9, w, ip + adds r9, r9, r10 + adc ip, z, #0 + umlal r9, ip, w, lr + stmia p!, { r8, r9 } +skip2: teq n, #0 - beq Lreturn - stmfd sp!, { r5, r6 } -LLoop: - mov r5, lr - ldmia a!, { r8, r9, ip, lr } - umull r6, r7, w, r8 - umull r8, r9, w, r9 + beq return + stmfd sp!, { r4-r7 } +addmul_loop: + ldmia p, { r5, r6, r7, r8 } + adds r4, ip, r5 + adc r5, z, #0 + ldmia a!, { r9, r10, ip, lr } + umlal r4, r5, w, r9 adds r5, r5, r6 - adcs r6, r7, r8 - adc r7, r9, #0 - umull r8, r9, w, ip - umull ip, lr, w, lr + adc r6, z, #0 + umlal r5, r6, w, r10 + adds r6, r6, r7 + adc r7, z, #0 + umlal r6, r7, w, ip adds r7, r7, r8 - adcs r8, r9, ip - adc lr, lr, #0 - ldmia p!, { r9, ip } - adds r5, r5, r9 - adcs r6, r6, ip - ldmia p!, { r9, ip } - adcs r7, r7, r9 - adcs r8, r8, ip - adc lr, lr, #0 - stmdb p, { r5, r6, r7, r8 } + adc ip, z, #0 + umlal r7, ip, w, lr subs n, n, #1 - bne LLoop - ldmfd sp!, { r5, r6 } -Lreturn: - mov r0, lr - ldmfd sp!, { r7, r8, r9, pc }^ -Lend: - .size __gmpn_addmul_1, Lend - __gmpn_addmul_1 + stmia p!, { r4, r5, r6, r7 } + bne addmul_loop + ldmfd sp!, { r4-r7 } +return: + mov r0, ip + ldmfd sp!, { r8-r11, pc } +end: + .size __gmpn_addmul_1, end - __gmpn_addmul_1 |