[Gmp-commit] /var/hg/gmp: 2 new changesets

mercurial at gmplib.org mercurial at gmplib.org
Wed Mar 12 19:57:12 UTC 2014


details:   /var/hg/gmp/rev/595d66a8d741
changeset: 16330:595d66a8d741
user:      Torbjorn Granlund <tege at gmplib.org>
date:      Wed Mar 12 20:56:56 2014 +0100
description:
Provide AMD bd2 gmp-mparam.h files.

details:   /var/hg/gmp/rev/3f9086cd12d3
changeset: 16331:3f9086cd12d3
user:      Torbjorn Granlund <tege at gmplib.org>
date:      Wed Mar 12 20:57:10 2014 +0100
description:
Tuneup.

diffstat:

 ChangeLog                            |    5 +
 mpn/alpha/ev5/gmp-mparam.h           |  152 ++++++++++++---------
 mpn/arm/v7a/cora15/gmp-mparam.h      |  149 ++++++++++++---------
 mpn/arm/v7a/cora9/gmp-mparam.h       |  157 +++++++++++++---------
 mpn/ia64/gmp-mparam.h                |  125 +++++++++++------
 mpn/powerpc32/gmp-mparam.h           |   62 ++++++--
 mpn/powerpc64/mode64/p4/gmp-mparam.h |  147 +++++++++++++--------
 mpn/s390_32/esame/gmp-mparam.h       |  223 ++++++++++++++++++++------------
 mpn/s390_64/z10/gmp-mparam.h         |  175 +++++++++++++++---------
 mpn/x86/bd2/gmp-mparam.h             |  192 ++++++++++++++++++++++++++++
 mpn/x86/bobcat/gmp-mparam.h          |  193 ++++++++++++++++-----------
 mpn/x86/k7/gmp-mparam.h              |  173 ++++++++++++++++--------
 mpn/x86/k8/gmp-mparam.h              |  192 ++++++++++++++++-----------
 mpn/x86/pentium4/sse2/gmp-mparam.h   |  167 +++++++++++++++---------
 mpn/x86_64/bd2/gmp-mparam.h          |  210 ++++++++++++++++++++++++++++++
 mpn/x86_64/bobcat/gmp-mparam.h       |  202 +++++++++++++++++------------
 mpn/x86_64/coreihwl/gmp-mparam.h     |  228 +++++++++++++++++---------------
 mpn/x86_64/coreinhm/gmp-mparam.h     |   65 ++++----
 mpn/x86_64/coreisbr/gmp-mparam.h     |  169 +++++++++++++++---------
 mpn/x86_64/k10/gmp-mparam.h          |  152 ++++++++++++++--------
 mpn/x86_64/k8/gmp-mparam.h           |  208 +++++++++++++++++++-----------
 mpn/x86_64/nano/gmp-mparam.h         |  181 +++++++++++++++++---------
 mpn/x86_64/pentium4/gmp-mparam.h     |  239 ++++++++++++++++++++--------------
 23 files changed, 2447 insertions(+), 1319 deletions(-)

diffs (truncated from 4982 to 300 lines):

diff -r 99f1e60b85ea -r 3f9086cd12d3 ChangeLog
--- a/ChangeLog	Tue Mar 11 22:55:18 2014 +0100
+++ b/ChangeLog	Wed Mar 12 20:57:10 2014 +0100
@@ -1,3 +1,8 @@
+2014-03-12  Torbjorn Granlund  <tege at gmplib.org>
+
+	* mpn/x86/bd2/gmp-mparam.h: New file.
+	* mpn/x86_64/bd2/gmp-mparam.h: New file.
+
 2014-03-06  Niels Möller  <nisse at lysator.liu.se>
 
 	* tests/mpz/t-pprime_p.c (check_composites): New function.
diff -r 99f1e60b85ea -r 3f9086cd12d3 mpn/alpha/ev5/gmp-mparam.h
--- a/mpn/alpha/ev5/gmp-mparam.h	Tue Mar 11 22:55:18 2014 +0100
+++ b/mpn/alpha/ev5/gmp-mparam.h	Wed Mar 12 20:57:10 2014 +0100
@@ -32,8 +32,8 @@
 #define GMP_LIMB_BITS 64
 #define GMP_LIMB_BYTES 8
 
-
 /* 600 MHz 21164A */
+/* Generated by tuneup.c, 2014-03-12, gcc 4.5 */
 
 #define DIVREM_1_NORM_THRESHOLD              0  /* preinv always */
 #define DIVREM_1_UNNORM_THRESHOLD            0  /* always */
@@ -41,10 +41,10 @@
 #define MOD_1_NORM_THRESHOLD                 0  /* always */
 #define MOD_1_UNNORM_THRESHOLD               0  /* always */
 #define MOD_1N_TO_MOD_1_1_THRESHOLD          3
-#define MOD_1U_TO_MOD_1_1_THRESHOLD          7
-#define MOD_1_1_TO_MOD_1_2_THRESHOLD        20
+#define MOD_1U_TO_MOD_1_1_THRESHOLD          6
+#define MOD_1_1_TO_MOD_1_2_THRESHOLD        22
 #define MOD_1_2_TO_MOD_1_4_THRESHOLD         0  /* never mpn_mod_1s_2p */
-#define PREINV_MOD_1_TO_MOD_1_THRESHOLD     14
+#define PREINV_MOD_1_TO_MOD_1_THRESHOLD     15
 #define USE_PREINV_DIVREM_1                  1  /* preinv always */
 #define DIV_QR_1N_PI1_METHOD                 1
 #define DIV_QR_1_NORM_THRESHOLD          MP_SIZE_T_MAX  /* never */
@@ -54,115 +54,133 @@
 #define BMOD_1_TO_MOD_1_THRESHOLD           80
 
 #define MUL_TOOM22_THRESHOLD                14
-#define MUL_TOOM33_THRESHOLD                66
+#define MUL_TOOM33_THRESHOLD                57
 #define MUL_TOOM44_THRESHOLD               118
 #define MUL_TOOM6H_THRESHOLD               157
-#define MUL_TOOM8H_THRESHOLD               236
+#define MUL_TOOM8H_THRESHOLD               212
 
 #define MUL_TOOM32_TO_TOOM43_THRESHOLD      73
 #define MUL_TOOM32_TO_TOOM53_THRESHOLD      77
 #define MUL_TOOM42_TO_TOOM53_THRESHOLD      81
 #define MUL_TOOM42_TO_TOOM63_THRESHOLD      56
-#define MUL_TOOM43_TO_TOOM54_THRESHOLD      64
+#define MUL_TOOM43_TO_TOOM54_THRESHOLD      66
 
 #define SQR_BASECASE_THRESHOLD               0  /* always */
 #define SQR_TOOM2_THRESHOLD                 24
 #define SQR_TOOM3_THRESHOLD                 74
-#define SQR_TOOM4_THRESHOLD                171
-#define SQR_TOOM6_THRESHOLD                  0  /* always */
+#define SQR_TOOM4_THRESHOLD                120
+#define SQR_TOOM6_THRESHOLD                166
 #define SQR_TOOM8_THRESHOLD                236
 
 #define MULMID_TOOM42_THRESHOLD             18
 
 #define MULMOD_BNM1_THRESHOLD               10
-#define SQRMOD_BNM1_THRESHOLD               12
+#define SQRMOD_BNM1_THRESHOLD               11
 
-#define MUL_FFT_MODF_THRESHOLD             284  /* k = 5 */
+#define MUL_FFT_MODF_THRESHOLD             276  /* k = 5 */
 #define MUL_FFT_TABLE3                                      \
-  { {    284, 5}, {     11, 6}, {      6, 5}, {     13, 6}, \
-    {     13, 7}, {      7, 6}, {     15, 7}, {      8, 6}, \
-    {     17, 7}, {     13, 8}, {      7, 7}, {     17, 8}, \
-    {      9, 7}, {     20, 8}, {     11, 7}, {     23, 8}, \
-    {     13, 9}, {      7, 8}, {     19, 9}, {     11, 8}, \
-    {     25,10}, {      7, 9}, {     15, 8}, {     33, 9}, \
-    {     19, 8}, {     39, 9}, {     23, 8}, {     47,10}, \
-    {     15, 9}, {     39,10}, {     23, 9}, {     47,11}, \
-    {     15,10}, {     31, 9}, {     67,10}, {     39, 9}, \
-    {     79,10}, {     47, 9}, {     95,10}, {     55, 9}, \
-    {    111, 8}, {    223, 9}, {    115,11}, {     31,10}, \
-    {     63, 8}, {    255, 7}, {    511,10}, {     71, 9}, \
-    {    143, 8}, {    287, 7}, {    575, 9}, {    159, 8}, \
-    {    319,11}, {     47,12}, {     31,11}, {     63, 9}, \
-    {    255, 8}, {    511,10}, {    143, 9}, {    287,11}, \
-    {     79,10}, {    159, 9}, {    319,10}, {    175, 9}, \
-    {    351, 8}, {    703,10}, {    191, 9}, {    383,10}, \
-    {    207, 9}, {    415,12}, {   4096,13}, {   8192,14}, \
-    {  16384,15}, {  32768,16}, {  65536,17}, { 131072,18}, \
-    { 262144,19}, { 524288,20}, {1048576,21}, {2097152,22}, \
-    {4194304,23}, {8388608,24} }
-#define MUL_FFT_TABLE3_SIZE 82
+  { {    276, 5}, {     11, 6}, {      6, 5}, {     13, 6}, \
+    {      7, 5}, {     15, 6}, {     13, 7}, {      7, 6}, \
+    {     15, 7}, {      8, 6}, {     17, 7}, {     13, 8}, \
+    {      7, 7}, {     17, 8}, {      9, 7}, {     20, 8}, \
+    {     11, 7}, {     23, 8}, {     13, 9}, {      7, 8}, \
+    {     19, 9}, {     11, 8}, {     25,10}, {      7, 9}, \
+    {     15, 8}, {     33, 9}, {     19, 8}, {     39, 9}, \
+    {     23, 8}, {     47,10}, {     15, 9}, {     39,10}, \
+    {     23, 9}, {     47,11}, {     15,10}, {     31, 9}, \
+    {     67,10}, {     39, 9}, {     79,10}, {     47, 9}, \
+    {     95,10}, {     55,11}, {     31,10}, {     63, 8}, \
+    {    255, 7}, {    511,10}, {     71, 9}, {    143, 8}, \
+    {    287, 7}, {    575, 9}, {    159, 8}, {    319,11}, \
+    {     47,12}, {     31,11}, {     63, 9}, {    255, 8}, \
+    {    511,10}, {    143, 9}, {    287,11}, {     79,10}, \
+    {    159, 9}, {    319,10}, {    175, 9}, {    351, 8}, \
+    {    703,10}, {    191, 9}, {    383,10}, {    207, 9}, \
+    {    415,12}, {     63,10}, {    255,11}, {    143,10}, \
+    {    287, 9}, {    575,11}, {    159,10}, {    319, 9}, \
+    {    639,11}, {    175,12}, {     95,11}, {    191,10}, \
+    {    383,11}, {    207,10}, {    415,11}, {    223,13}, \
+    {     63,11}, {    287,10}, {    575,12}, {    159,11}, \
+    {    319,10}, {    639,11}, {    351,12}, {    191,11}, \
+    {    415,12}, {    223,11}, {    479,12}, {    287,11}, \
+    {    575,12}, {    351,13}, {    191,12}, {    479,13}, \
+    {    255,12}, {    575,13}, {   8192,14}, {  16384,15}, \
+    {  32768,16}, {  65536,17}, { 131072,18}, { 262144,19}, \
+    { 524288,20}, {1048576,21}, {2097152,22}, {4194304,23}, \
+    {8388608,24} }
+#define MUL_FFT_TABLE3_SIZE 113
 #define MUL_FFT_THRESHOLD                 3200
 
 #define SQR_FFT_MODF_THRESHOLD             236  /* k = 5 */
 #define SQR_FFT_TABLE3                                      \
   { {    236, 5}, {     11, 6}, {      6, 5}, {     13, 6}, \
-    {     17, 7}, {      9, 6}, {     19, 7}, {     17, 8}, \
-    {      9, 7}, {     20, 8}, {     11, 7}, {     23, 8}, \
-    {     13, 9}, {      7, 8}, {     19, 9}, {     11, 8}, \
-    {     25,10}, {      7, 9}, {     15, 8}, {     33, 9}, \
-    {     19, 8}, {     39, 9}, {     23, 8}, {     47, 9}, \
-    {     27,10}, {     15, 9}, {     39,10}, {     23, 9}, \
-    {     47,11}, {     15,10}, {     31, 9}, {     63,10}, \
-    {     39, 9}, {     79,10}, {     47,11}, {     31,10}, \
-    {     63, 9}, {    127, 8}, {    255,10}, {     71, 9}, \
-    {    143, 8}, {    287,10}, {     79,11}, {     47,12}, \
-    {     31,11}, {     63,10}, {    127, 9}, {    255, 8}, \
-    {    511,10}, {    143, 9}, {    287,11}, {     79,10}, \
-    {    159, 9}, {    319, 8}, {    639,10}, {    175, 9}, \
-    {    351,11}, {     95,10}, {    191, 9}, {    383,10}, \
-    {    207, 9}, {    415,11}, {    111,10}, {    223,12}, \
-    {   4096,13}, {   8192,14}, {  16384,15}, {  32768,16}, \
+    {      7, 5}, {     15, 6}, {     17, 7}, {      9, 6}, \
+    {     19, 7}, {     17, 8}, {      9, 7}, {     20, 8}, \
+    {     11, 7}, {     23, 8}, {     13, 9}, {      7, 8}, \
+    {     19, 9}, {     11, 8}, {     25,10}, {      7, 9}, \
+    {     15, 8}, {     33, 9}, {     19, 8}, {     39, 9}, \
+    {     23, 8}, {     47, 9}, {     27,10}, {     15, 9}, \
+    {     39,10}, {     23, 9}, {     47,11}, {     15,10}, \
+    {     31, 9}, {     67,10}, {     39, 9}, {     79,10}, \
+    {     47,11}, {     31,10}, {     63, 9}, {    127, 8}, \
+    {    255,10}, {     71, 9}, {    143, 8}, {    287,10}, \
+    {     79,11}, {     47,12}, {     31,11}, {     63,10}, \
+    {    127, 9}, {    255, 8}, {    511,10}, {    143, 9}, \
+    {    287,11}, {     79,10}, {    159, 9}, {    319, 8}, \
+    {    639,10}, {    175, 9}, {    351,11}, {     95,10}, \
+    {    191, 9}, {    383,10}, {    207, 9}, {    415,11}, \
+    {    111,10}, {    223,12}, {     63,11}, {    127,10}, \
+    {    255,11}, {    143,10}, {    287, 9}, {    575,11}, \
+    {    159,10}, {    319,11}, {    175,10}, {    351,12}, \
+    {     95,11}, {    191,10}, {    383,11}, {    207,10}, \
+    {    415,11}, {    223,13}, {     63,12}, {    127,11}, \
+    {    287,10}, {    575,12}, {    159,11}, {    319,10}, \
+    {    639,11}, {    351,12}, {    191,11}, {    415,12}, \
+    {    223,11}, {    447,13}, {    127,12}, {    287,11}, \
+    {    575,12}, {    319,11}, {    639,12}, {    351,13}, \
+    {    191,12}, {    479,14}, {    127,13}, {    255,12}, \
+    {    575,13}, {   8192,14}, {  16384,15}, {  32768,16}, \
     {  65536,17}, { 131072,18}, { 262144,19}, { 524288,20}, \
     {1048576,21}, {2097152,22}, {4194304,23}, {8388608,24} }
-#define SQR_FFT_TABLE3_SIZE 76
+#define SQR_FFT_TABLE3_SIZE 116
 #define SQR_FFT_THRESHOLD                 2240
 
 #define MULLO_BASECASE_THRESHOLD             0  /* always */
 #define MULLO_DC_THRESHOLD                  45
 #define MULLO_MUL_N_THRESHOLD             6253
 
-#define DC_DIV_QR_THRESHOLD                 51
-#define DC_DIVAPPR_Q_THRESHOLD             164
+#define DC_DIV_QR_THRESHOLD                 48
+#define DC_DIVAPPR_Q_THRESHOLD             167
 #define DC_BDIV_QR_THRESHOLD                47
 #define DC_BDIV_Q_THRESHOLD                108
 
 #define INV_MULMOD_BNM1_THRESHOLD           26
-#define INV_NEWTON_THRESHOLD               179
+#define INV_NEWTON_THRESHOLD               187
 #define INV_APPR_THRESHOLD                 173
 
-#define BINV_NEWTON_THRESHOLD              195
+#define BINV_NEWTON_THRESHOLD              190
 #define REDC_1_TO_REDC_N_THRESHOLD          51
 
-#define MU_DIV_QR_THRESHOLD                979
-#define MU_DIVAPPR_Q_THRESHOLD            1057
+#define MU_DIV_QR_THRESHOLD                998
+#define MU_DIVAPPR_Q_THRESHOLD            1078
 #define MUPI_DIV_QR_THRESHOLD               90
-#define MU_BDIV_QR_THRESHOLD               807
-#define MU_BDIV_Q_THRESHOLD                960
+#define MU_BDIV_QR_THRESHOLD               872
+#define MU_BDIV_Q_THRESHOLD                942
 
-#define POWM_SEC_TABLE  1,10,78,452,1167
+#define POWM_SEC_TABLE  3,16,90,473,1167
 
 #define MATRIX22_STRASSEN_THRESHOLD         11
-#define HGCD_THRESHOLD                      95
-#define HGCD_APPR_THRESHOLD                103
-#define HGCD_REDUCE_THRESHOLD             1615
-#define GCD_DC_THRESHOLD                   303
-#define GCDEXT_DC_THRESHOLD                201
+#define HGCD_THRESHOLD                      98
+#define HGCD_APPR_THRESHOLD                104
+#define HGCD_REDUCE_THRESHOLD             1494
+#define GCD_DC_THRESHOLD                   268
+#define GCDEXT_DC_THRESHOLD                189
 #define JACOBI_BASE_METHOD                   3
 
-#define GET_STR_DC_THRESHOLD                13
+#define GET_STR_DC_THRESHOLD                15
 #define GET_STR_PRECOMPUTE_THRESHOLD        28
-#define SET_STR_DC_THRESHOLD               422
-#define SET_STR_PRECOMPUTE_THRESHOLD      1438
+#define SET_STR_DC_THRESHOLD               426
+#define SET_STR_PRECOMPUTE_THRESHOLD      1264
 
 #define FAC_DSC_THRESHOLD                 1404
 #define FAC_ODD_THRESHOLD                    0  /* always */
diff -r 99f1e60b85ea -r 3f9086cd12d3 mpn/arm/v7a/cora15/gmp-mparam.h
--- a/mpn/arm/v7a/cora15/gmp-mparam.h	Tue Mar 11 22:55:18 2014 +0100
+++ b/mpn/arm/v7a/cora15/gmp-mparam.h	Wed Mar 12 20:57:10 2014 +0100
@@ -33,6 +33,7 @@
 #define GMP_LIMB_BYTES 4
 
 /* 1700MHz Cortex-A15 with Neon (in spite of file position) */
+/* Generated by tuneup.c, 2014-03-12, gcc 4.6 */
 
 #define MOD_1_NORM_THRESHOLD                 0  /* always */
 #define MOD_1_UNNORM_THRESHOLD               0  /* always */
@@ -44,27 +45,27 @@
 #define USE_PREINV_DIVREM_1                  1  /* native */
 #define DIV_QR_1N_PI1_METHOD                 1
 #define DIV_QR_1_NORM_THRESHOLD          MP_SIZE_T_MAX  /* never */
-#define DIV_QR_1_UNNORM_THRESHOLD            1
+#define DIV_QR_1_UNNORM_THRESHOLD        MP_SIZE_T_MAX  /* never */
 #define DIV_QR_2_PI2_THRESHOLD           MP_SIZE_T_MAX  /* never */
 #define DIVEXACT_1_THRESHOLD                 0  /* always (native) */
-#define BMOD_1_TO_MOD_1_THRESHOLD           12
+#define BMOD_1_TO_MOD_1_THRESHOLD           15
 
-#define MUL_TOOM22_THRESHOLD                28
-#define MUL_TOOM33_THRESHOLD               110
-#define MUL_TOOM44_THRESHOLD               178
-#define MUL_TOOM6H_THRESHOLD               442
-#define MUL_TOOM8H_THRESHOLD               597
+#define MUL_TOOM22_THRESHOLD                23
+#define MUL_TOOM33_THRESHOLD                90
+#define MUL_TOOM44_THRESHOLD               262
+#define MUL_TOOM6H_THRESHOLD               351
+#define MUL_TOOM8H_THRESHOLD               557
 
-#define MUL_TOOM32_TO_TOOM43_THRESHOLD     113
-#define MUL_TOOM32_TO_TOOM53_THRESHOLD     130
-#define MUL_TOOM42_TO_TOOM53_THRESHOLD     110
-#define MUL_TOOM42_TO_TOOM63_THRESHOLD     121
-#define MUL_TOOM43_TO_TOOM54_THRESHOLD     160
+#define MUL_TOOM32_TO_TOOM43_THRESHOLD      90
+#define MUL_TOOM32_TO_TOOM53_THRESHOLD     160
+#define MUL_TOOM42_TO_TOOM53_THRESHOLD      89
+#define MUL_TOOM42_TO_TOOM63_THRESHOLD     169
+#define MUL_TOOM43_TO_TOOM54_THRESHOLD     130
 
 #define SQR_BASECASE_THRESHOLD               0  /* always (native) */
-#define SQR_TOOM2_THRESHOLD                 42
+#define SQR_TOOM2_THRESHOLD                 43
 #define SQR_TOOM3_THRESHOLD                138
-#define SQR_TOOM4_THRESHOLD                232
+#define SQR_TOOM4_THRESHOLD                363
 #define SQR_TOOM6_THRESHOLD                517
 #define SQR_TOOM8_THRESHOLD                725
 
@@ -73,28 +74,40 @@
 #define MULMOD_BNM1_THRESHOLD               17
 #define SQRMOD_BNM1_THRESHOLD               23
 
-#define MUL_FFT_MODF_THRESHOLD             555  /* k = 5 */
+#define MUL_FFT_MODF_THRESHOLD             525  /* k = 5 */
 #define MUL_FFT_TABLE3                                      \
-  { {    555, 5}, {     25, 6}, {     27, 7}, {     15, 6}, \
-    {     31, 7}, {     19, 6}, {     39, 7}, {     25, 6}, \
-    {     51, 7}, {     27, 8}, {     15, 7}, {     33, 8}, \
-    {     19, 7}, {     41, 8}, {     23, 7}, {     51, 8}, \


More information about the gmp-commit mailing list