dnl  path: root/gmp/mpn/alpha/sqr_diagonal.asm
dnl  blob: 2aa7f2e597bc873d972f01f37b2970fc0f45fc37
dnl  Alpha mpn_sqr_diagonal.

dnl  Copyright 2001, 2002 Free Software Foundation, Inc.

dnl  This file is part of the GNU MP Library.

dnl  The GNU MP Library is free software; you can redistribute it and/or modify
dnl  it under the terms of the GNU Lesser General Public License as published
dnl  by the Free Software Foundation; either version 3 of the License, or (at
dnl  your option) any later version.

dnl  The GNU MP Library is distributed in the hope that it will be useful, but
dnl  WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
dnl  or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
dnl  License for more details.

dnl  You should have received a copy of the GNU Lesser General Public License
dnl  along with the GNU MP Library.  If not, see http://www.gnu.org/licenses/.

include(`../config.m4')

C      cycles/limb
C EV4:     42
C EV5:     18
C EV6:      3.45

C  INPUT PARAMETERS
C  rp	r16
C  up	r17
C  n	r18


ASM_START()
C  mpn_sqr_diagonal: for each of the n limbs at up, store its full
C  two-limb square at rp, low half at rp[2i] and high half at rp[2i+1].
C
C  In:       r16 = rp, r17 = up, r18 = n
C  Scratch:  r2 = current source limb, r3 = low product, r4 = high product
C
C  The code is software pipelined: the square of limb i is held in r3/r4
C  and stored while the square of limb i+1 is being computed, so each store
C  of r3 or r4 must stay ahead of the multiply that overwrites that register.
C
C  NOTE(review): n = 0 is not special-cased; it would take the size == 1
C  path, reading one limb and writing two.  Presumably callers guarantee
C  n >= 1 -- confirm against the callers.
PROLOGUE(mpn_sqr_diagonal)
	ldq	r2,0(r17)	C r2 = up[0]
	lda	r18,-2(r18)	C size -= 2, so sign/zero of r18 tells 1, 2 or more
	mulq	r2,r2,r3	C r3 = prod_low of up[0]^2
	umulh	r2,r2,r4	C r4 = prod_high of up[0]^2
	blt	r18,$Lend1	C jump if size was == 1
	ldq	r2,8(r17)	C r2 = up[1]
	beq	r18,$Lend2	C jump if size was == 2

C  Loop invariant at $Loop: r3/r4 hold the not yet stored square of the
C  limb at 0(r17), r2 holds the limb at 8(r17), and r18 is the number of
C  iterations left (size - 2 on entry).
	ALIGN(8)
$Loop:	stq	r3,0(r16)	C store low half of the previous square
	mulq	r2,r2,r3	C r3 = prod_low of the current limb
	lda	r18,-1(r18)	C size--
	stq	r4,8(r16)	C store high half of the previous square
	umulh	r2,r2,r4	C r4 = prod_high of the current limb
	ldq	r2,16(r17)	C r2 = next limb, offset 16 as r17 is not yet advanced
	lda	r17,8(r17)	C up += 1 limb
	lda	r16,16(r16)	C rp += 2 limbs
	bne	r18,$Loop

C  Wind down: one square is pending in r3/r4 and the last limb is in r2.
$Lend2:	stq	r3,0(r16)	C store low half of the pending square
	mulq	r2,r2,r3	C r3 = prod_low of the last limb
	stq	r4,8(r16)	C store high half of the pending square
	umulh	r2,r2,r4	C r4 = prod_high of the last limb
	stq	r3,16(r16)	C store low half of the last square
	stq	r4,24(r16)	C store high half of the last square
	ret	r31,(r26),1	C return to the address in r26
C  size == 1: the only square is already in r3/r4.
$Lend1:	stq	r3,0(r16)	C rp[0] = prod_low
	stq	r4,8(r16)	C rp[1] = prod_high
	ret	r31,(r26),1	C return to the address in r26
EPILOGUE(mpn_sqr_diagonal)
ASM_END()