[Gmp-commit] /var/hg/gmp: Update c/l tables.
mercurial at gmplib.org
mercurial at gmplib.org
Thu Feb 16 21:55:31 UTC 2017
details: /var/hg/gmp/rev/e8dc1d2d9cff
changeset: 17276:e8dc1d2d9cff
user: Torbjorn Granlund <tg at gmplib.org>
date: Thu Feb 16 22:55:29 2017 +0100
description:
Update c/l tables.
diffstat:
mpn/arm64/bdiv_dbm1c.asm | 5 +++--
mpn/arm64/com.asm | 5 +++--
mpn/arm64/copyi.asm | 5 +++--
mpn/arm64/hamdist.asm | 5 +++--
mpn/arm64/logops_n.asm | 8 +++++---
mpn/arm64/mod_34lsub1.asm | 7 ++++---
mpn/arm64/popcount.asm | 5 +++--
mpn/arm64/sec_tabselect.asm | 5 +++--
mpn/arm64/sqr_diag_addlsh1.asm | 2 +-
9 files changed, 28 insertions(+), 19 deletions(-)
diffs (144 lines):
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/bdiv_dbm1c.asm
--- a/mpn/arm64/bdiv_dbm1c.asm Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/bdiv_dbm1c.asm Thu Feb 16 22:55:29 2017 +0100
@@ -31,8 +31,9 @@
include(`../config.m4')
C cycles/limb
-C Cortex-A53 ?
-C Cortex-A57 ?
+C Cortex-A53 8
+C Cortex-A57 7
+C X-Gene 4.25
define(`qp', `x0')
define(`up', `x1')
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/com.asm
--- a/mpn/arm64/com.asm Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/com.asm Thu Feb 16 22:55:29 2017 +0100
@@ -31,8 +31,9 @@
include(`../config.m4')
C cycles/limb
-C Cortex-A53 ?
-C Cortex-A57 ?
+C Cortex-A53 2.25
+C Cortex-A57 1.25
+C X-Gene 1.75
changecom(blah)
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/copyi.asm
--- a/mpn/arm64/copyi.asm Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/copyi.asm Thu Feb 16 22:55:29 2017 +0100
@@ -31,8 +31,9 @@
include(`../config.m4')
C cycles/limb
-C Cortex-A53 ?
-C Cortex-A57 ?
+C Cortex-A53 2
+C Cortex-A57 1
+C X-Gene 1.25
changecom(blah)
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/hamdist.asm
--- a/mpn/arm64/hamdist.asm Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/hamdist.asm Thu Feb 16 22:55:29 2017 +0100
@@ -31,8 +31,9 @@
include(`../config.m4')
C cycles/limb
-C Cortex-A53 ?
-C Cortex-A57 ?
+C Cortex-A53 4.5
+C Cortex-A57 1.9
+C X-Gene 4.36
C TODO
C * Consider greater unrolling.
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/logops_n.asm
--- a/mpn/arm64/logops_n.asm Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/logops_n.asm Thu Feb 16 22:55:29 2017 +0100
@@ -32,9 +32,11 @@
include(`../config.m4')
-C cycles/limb
-C Cortex-A53 ?
-C Cortex-A57 ?
+C                    cycles/limb     cycles/limb
+C                     nand,nior       all other
+C Cortex-A53           3.5-4           3-3.5
+C Cortex-A57            2.5             2.0
+C X-Gene                3.0             2.5
changecom(blah)
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/mod_34lsub1.asm
--- a/mpn/arm64/mod_34lsub1.asm Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/mod_34lsub1.asm Thu Feb 16 22:55:29 2017 +0100
@@ -31,8 +31,9 @@
include(`../config.m4')
C cycles/limb
-C Cortex-A53 ?
-C Cortex-A57 ?
+C Cortex-A53 2
+C Cortex-A57 1
+C X-Gene 1.45
define(`ap', x0)
define(`n', x1)
@@ -42,7 +43,7 @@
C mp_limb_t mpn_mod_34lsub1 (mp_srcptr up, mp_size_t n)
C TODO
-C * An alternative inner loop which could run at 0.722 c/l:
+C * An alternative inner loop which could run at 0.722 c/l on A57:
C adds x8, x8, x2
C adcs x9, x9, x3
C ldp x2, x3, [ap, #-32]
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/popcount.asm
--- a/mpn/arm64/popcount.asm Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/popcount.asm Thu Feb 16 22:55:29 2017 +0100
@@ -31,8 +31,9 @@
include(`../config.m4')
C cycles/limb
-C Cortex-A53 ?
-C Cortex-A57 ?
+C Cortex-A53 2.5
+C Cortex-A57 1.14
+C X-Gene 3
C TODO
C * Consider greater unrolling.
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/sec_tabselect.asm
--- a/mpn/arm64/sec_tabselect.asm Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/sec_tabselect.asm Thu Feb 16 22:55:29 2017 +0100
@@ -34,8 +34,9 @@
C cycles/limb
-C Cortex-A53 ?
-C Cortex-A57 ?
+C Cortex-A53 2.25
+C Cortex-A57 1.33
+C X-Gene 2
C void
C mpn_sec_tabselect (mp_ptr rp, mp_srcptr *tab,
diff -r f1416254f510 -r e8dc1d2d9cff mpn/arm64/sqr_diag_addlsh1.asm
--- a/mpn/arm64/sqr_diag_addlsh1.asm Thu Feb 16 21:09:42 2017 +0100
+++ b/mpn/arm64/sqr_diag_addlsh1.asm Thu Feb 16 22:55:29 2017 +0100
@@ -34,7 +34,7 @@
C cycles/limb
C Cortex-A53 6.85
-C Cortex-A57 ?
+C Cortex-A57 3.5
C X-Gene 4.1
define(`rp', `x0')
More information about the gmp-commit mailing list