[Gmp-commit] /var/hg/gmp: Update c/l tables.

mercurial at gmplib.org mercurial at gmplib.org
Thu Feb 16 21:55:31 UTC 2017


details:   /var/hg/gmp/rev/e8dc1d2d9cff
changeset: 17276:e8dc1d2d9cff
user:      Torbjorn Granlund <tg at gmplib.org>
date:      Thu Feb 16 22:55:29 2017 +0100
description:
Update cycles/limb (c/l) tables.

diffstat:

 mpn/arm64/bdiv_dbm1c.asm       |  5 +++--
 mpn/arm64/com.asm              |  5 +++--
 mpn/arm64/copyi.asm            |  5 +++--
 mpn/arm64/hamdist.asm          |  5 +++--
 mpn/arm64/logops_n.asm         |  8 +++++---
 mpn/arm64/mod_34lsub1.asm      |  7 ++++---
 mpn/arm64/popcount.asm         |  5 +++--
 mpn/arm64/sec_tabselect.asm    |  5 +++--
 mpn/arm64/sqr_diag_addlsh1.asm |  2 +-
 9 files changed, 28 insertions(+), 19 deletions(-)

diffs (144 lines):

diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/bdiv_dbm1c.asm
--- a/mpn/arm64/bdiv_dbm1c.asm	Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/bdiv_dbm1c.asm	Thu Feb 16 22:55:29 2017 +0100
@@ -31,8 +31,9 @@
 include(`../config.m4')
 
 C	     cycles/limb
-C Cortex-A53	 ?
-C Cortex-A57	 ?
+C Cortex-A53	 8
+C Cortex-A57	 7
+C X-Gene	 4.25
 
 define(`qp',	  `x0')
 define(`up',	  `x1')
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/com.asm
--- a/mpn/arm64/com.asm	Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/com.asm	Thu Feb 16 22:55:29 2017 +0100
@@ -31,8 +31,9 @@
 include(`../config.m4')
 
 C	     cycles/limb
-C Cortex-A53	 ?
-C Cortex-A57	 ?
+C Cortex-A53	 2.25
+C Cortex-A57	 1.25
+C X-Gene	 1.75
 
 changecom(blah)
 
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/copyi.asm
--- a/mpn/arm64/copyi.asm	Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/copyi.asm	Thu Feb 16 22:55:29 2017 +0100
@@ -31,8 +31,9 @@
 include(`../config.m4')
 
 C	     cycles/limb
-C Cortex-A53	 ?
-C Cortex-A57	 ?
+C Cortex-A53	 2
+C Cortex-A57	 1
+C X-Gene	 1.25
 
 changecom(blah)
 
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/hamdist.asm
--- a/mpn/arm64/hamdist.asm	Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/hamdist.asm	Thu Feb 16 22:55:29 2017 +0100
@@ -31,8 +31,9 @@
 include(`../config.m4')
 
 C	     cycles/limb
-C Cortex-A53	 ?
-C Cortex-A57	 ?
+C Cortex-A53	 4.5
+C Cortex-A57	 1.9
+C X-Gene	 4.36
 
 C TODO
 C  * Consider greater unrolling.
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/logops_n.asm
--- a/mpn/arm64/logops_n.asm	Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/logops_n.asm	Thu Feb 16 22:55:29 2017 +0100
@@ -32,9 +32,11 @@
 
 include(`../config.m4')
 
-C	     cycles/limb
-C Cortex-A53	 ?
-C Cortex-A57	 ?
+C	     cycles/limb     cycles/limb
+C	      nand,nior	      all other
+C Cortex-A53	3.5-4		3-3.5
+C Cortex-A57	 2.5		 2.0
+C X-Gene	 3.0		 2.5
 
 changecom(blah)
 
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/mod_34lsub1.asm
--- a/mpn/arm64/mod_34lsub1.asm	Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/mod_34lsub1.asm	Thu Feb 16 22:55:29 2017 +0100
@@ -31,8 +31,9 @@
 include(`../config.m4')
 
 C	     cycles/limb
-C Cortex-A53	 ?
-C Cortex-A57	 ?
+C Cortex-A53	 2
+C Cortex-A57	 1
+C X-Gene	 1.45
 
 define(`ap',	x0)
 define(`n',	x1)
@@ -42,7 +43,7 @@
 C mp_limb_t mpn_mod_34lsub1 (mp_srcptr up, mp_size_t n)
 
 C TODO
-C  * An alternative inner loop which could run at 0.722 c/l:
+C  * An alternative inner loop which could run at 0.722 c/l on A57:
 C	adds	x8, x8, x2
 C	adcs	x9, x9, x3
 C	ldp	x2, x3, [ap, #-32]
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/popcount.asm
--- a/mpn/arm64/popcount.asm	Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/popcount.asm	Thu Feb 16 22:55:29 2017 +0100
@@ -31,8 +31,9 @@
 include(`../config.m4')
 
 C	     cycles/limb
-C Cortex-A53	 ?
-C Cortex-A57	 ?
+C Cortex-A53	 2.5
+C Cortex-A57	 1.14
+C X-Gene	 3
 
 C TODO
 C  * Consider greater unrolling.
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/sec_tabselect.asm
--- a/mpn/arm64/sec_tabselect.asm	Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/sec_tabselect.asm	Thu Feb 16 22:55:29 2017 +0100
@@ -34,8 +34,9 @@
 
 
 C	     cycles/limb
-C Cortex-A53	 ?
-C Cortex-A57	 ?
+C Cortex-A53	 2.25
+C Cortex-A57	 1.33
+C X-Gene	 2
 
 C void
 C mpn_sec_tabselect (mp_ptr rp, mp_srcptr *tab,
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/sqr_diag_addlsh1.asm
--- a/mpn/arm64/sqr_diag_addlsh1.asm	Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/sqr_diag_addlsh1.asm	Thu Feb 16 22:55:29 2017 +0100
@@ -34,7 +34,7 @@
 
 C	     cycles/limb
 C Cortex-A53	 6.85
-C Cortex-A57	 ?
+C Cortex-A57	 3.5
 C X-Gene	 4.1
 
 define(`rp', `x0')


More information about the gmp-commit mailing list