go to gmp 4.3.2baserock/pedroalvarez/gcc-5.3.0-gmp432

author: Pedro Alvarez <pedro.alvarez@codethink.co.uk> 2016-05-27 17:39:31 +0100
committer: Pedro Alvarez <pedro.alvarez@codethink.co.uk> 2016-05-27 17:53:32 +0100
commit: 26c75cf8267919f81a1759c9c965a52c660233f9 (patch)
tree: cf2a39cf56c2c8ac45760854413ab233e6263974 /gmp/mpn/arm/v7a/cora15/neon/copyd.asm
parent: 56892c1d217baea02092b51a09bbc924130ca84c (diff)
download: gcc-tarball-baserock/pedroalvarez/gcc-5.3.0-gmp432.tar.gz
1 files changed, 0 insertions, 110 deletions
diff --git a/gmp/mpn/arm/v7a/cora15/neon/copyd.asm b/gmp/mpn/arm/v7a/cora15/neon/copyd.asm
deleted file mode 100644
index 98fe535def..0000000000
--- a/gmp/mpn/arm/v7a/cora15/neon/copyd.asm
+++ /dev/null
@@ -1,110 +0,0 @@
-dnl  ARM Neon mpn_copyd optimised for A15.
-
-dnl  Copyright 2013 Free Software Foundation, Inc.
-
-dnl  This file is part of the GNU MP Library.
-dnl
-dnl  The GNU MP Library is free software; you can redistribute it and/or modify
-dnl  it under the terms of either:
-dnl
-dnl    * the GNU Lesser General Public License as published by the Free
-dnl      Software Foundation; either version 3 of the License, or (at your
-dnl      option) any later version.
-dnl
-dnl  or
-dnl
-dnl    * the GNU General Public License as published by the Free Software
-dnl      Foundation; either version 2 of the License, or (at your option) any
-dnl      later version.
-dnl
-dnl  or both in parallel, as here.
-dnl
-dnl  The GNU MP Library is distributed in the hope that it will be useful, but
-dnl  WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
-dnl  or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
-dnl  for more details.
-dnl
-dnl  You should have received copies of the GNU General Public License and the
-dnl  GNU Lesser General Public License along with the GNU MP Library.  If not,
-dnl  see https://www.gnu.org/licenses/.
-
-include(`../config.m4')
-
-C	     cycles/limb
-C StrongARM	 -
-C XScale	 -
-C Cortex-A7	 ?
-C Cortex-A8	 ?
-C Cortex-A9	 1.75		slower than core register code
-C Cortex-A15	 0.52
-
-define(`rp', `r0')
-define(`up', `r1')
-define(`n',  `r2')
-
-ASM_START()
-PROLOGUE(mpn_copyd)
-	add	rp, rp, n, lsl #2
-	add	up, up, n, lsl #2
-
-	cmp	n, #7
-	ble	L(bc)
-
-C Copy until rp is 128-bit aligned
-	tst	rp, #4
-	beq	L(al1)
-	sub	up, up, #4
-	vld1.32	{d22[0]}, [up]
-	sub	n, n, #1
-	sub	rp, rp, #4
-	vst1.32	{d22[0]}, [rp]
-L(al1):	tst	rp, #8
-	beq	L(al2)
-	sub	up, up, #8
-	vld1.32	{d22}, [up]
-	sub	n, n, #2
-	sub	rp, rp, #8
-	vst1.32	{d22}, [rp:64]
-L(al2):	sub	up, up, #16
-	vld1.32	{d26-d27}, [up]
-	subs	n, n, #12
-	sub	rp, rp, #16			C offset rp for loop
-	blt	L(end)
-
-	sub	up, up, #16			C offset up for loop
-	mov	r12, #-16
-
-	ALIGN(16)
-L(top):	vld1.32	{d22-d23}, [up], r12
-	vst1.32	{d26-d27}, [rp:128], r12
-	vld1.32	{d26-d27}, [up], r12
-	vst1.32	{d22-d23}, [rp:128], r12
-	subs	n, n, #8
-	bge	L(top)
-
-	add	up, up, #16			C undo up offset
-						C rp offset undoing folded
-L(end):	vst1.32	{d26-d27}, [rp:128]
-
-C Copy last 0-7 limbs.  Note that rp is aligned after loop, but not when we
-C arrive here via L(bc)
-L(bc):	tst	n, #4
-	beq	L(tl1)
-	sub	up, up, #16
-	vld1.32	{d22-d23}, [up]
-	sub	rp, rp, #16
-	vst1.32	{d22-d23}, [rp]
-L(tl1):	tst	n, #2
-	beq	L(tl2)
-	sub	up, up, #8
-	vld1.32	{d22}, [up]
-	sub	rp, rp, #8
-	vst1.32	{d22}, [rp]
-L(tl2):	tst	n, #1
-	beq	L(tl3)
-	sub	up, up, #4
-	vld1.32	{d22[0]}, [up]
-	sub	rp, rp, #4
-	vst1.32	{d22[0]}, [rp]
-L(tl3):	bx	lr
-EPILOGUE()
author	Pedro Alvarez <pedro.alvarez@codethink.co.uk>	2016-05-27 17:39:31 +0100
committer	Pedro Alvarez <pedro.alvarez@codethink.co.uk>	2016-05-27 17:53:32 +0100
commit	26c75cf8267919f81a1759c9c965a52c660233f9 (patch)
tree	cf2a39cf56c2c8ac45760854413ab233e6263974 /gmp/mpn/arm/v7a/cora15/neon/copyd.asm
parent	56892c1d217baea02092b51a09bbc924130ca84c (diff)
download	gcc-tarball-baserock/pedroalvarez/gcc-5.3.0-gmp432.tar.gz