[Gmp-commit] /home/hgfiles/gmp: Retune.

mercurial at gmplib.org mercurial at gmplib.org
Thu Feb 4 07:24:36 CET 2010


details:   /home/hgfiles/gmp/rev/5eb53153e12a
changeset: 13412:5eb53153e12a
user:      Torbjorn Granlund <tege at gmplib.org>
date:      Thu Feb 04 07:08:43 2010 +0100
description:
Retune.

diffstat:

 mpn/alpha/ev5/gmp-mparam.h           |    6 +-
 mpn/powerpc64/mode64/p4/gmp-mparam.h |  242 +++++++++++++++++-----------------
 mpn/x86/pentium4/sse2/gmp-mparam.h   |    2 +-
 3 files changed, 128 insertions(+), 122 deletions(-)

diffs (truncated from 313 to 300 lines):

diff -r 5c7b3ee5d37e -r 5eb53153e12a mpn/alpha/ev5/gmp-mparam.h
--- a/mpn/alpha/ev5/gmp-mparam.h	Wed Feb 03 08:05:13 2010 +0100
+++ b/mpn/alpha/ev5/gmp-mparam.h	Thu Feb 04 07:08:43 2010 +0100
@@ -97,7 +97,7 @@
     { 524288,20}, {1048576,21}, {2097152,22}, {4194304,23}, \
     {8388608,24} }
 #define MUL_FFT_TABLE3_SIZE 141
-#define MUL_FFT_THRESHOLD                 4480
+#define MUL_FFT_THRESHOLD                 3008
 
 #define SQR_FFT_MODF_THRESHOLD             220  /* k = 5 */
 #define SQR_FFT_TABLE3                                      \
@@ -136,11 +136,11 @@
     { 131072,18}, { 262144,19}, { 524288,20}, {1048576,21}, \
     {2097152,22}, {4194304,23}, {8388608,24} }
 #define SQR_FFT_TABLE3_SIZE 135
-#define SQR_FFT_THRESHOLD                 3712
+#define SQR_FFT_THRESHOLD                 2240
 
 #define MULLO_BASECASE_THRESHOLD             0  /* always */
 #define MULLO_DC_THRESHOLD                  55
-#define MULLO_MUL_N_THRESHOLD             7916
+#define MULLO_MUL_N_THRESHOLD             5558
 
 #define DC_DIV_QR_THRESHOLD                 55
 #define DC_DIVAPPR_Q_THRESHOLD             192
diff -r 5c7b3ee5d37e -r 5eb53153e12a mpn/powerpc64/mode64/p4/gmp-mparam.h
--- a/mpn/powerpc64/mode64/p4/gmp-mparam.h	Wed Feb 03 08:05:13 2010 +0100
+++ b/mpn/powerpc64/mode64/p4/gmp-mparam.h	Thu Feb 04 07:08:43 2010 +0100
@@ -50,147 +50,153 @@
 #define SQR_TOOM6_THRESHOLD                206
 #define SQR_TOOM8_THRESHOLD                309
 
-#define MULMOD_BNM1_THRESHOLD               12
-#define SQRMOD_BNM1_THRESHOLD               14
+#define MULMOD_BNM1_THRESHOLD               11
+#define SQRMOD_BNM1_THRESHOLD                9
 
-#define MUL_FFT_MODF_THRESHOLD             654  /* k = 5 */
+#define MUL_FFT_MODF_THRESHOLD             380  /* k = 5 */
 #define MUL_FFT_TABLE3                                      \
-  { {    654, 5}, {     21, 6}, {     11, 5}, {     23, 6}, \
-    {     13, 5}, {     27, 6}, {     21, 7}, {     11, 6}, \
-    {     23, 7}, {     12, 6}, {     25, 7}, {     13, 6}, \
-    {     27, 7}, {     21, 8}, {     11, 7}, {     25, 8}, \
-    {     13, 7}, {     27, 8}, {     15, 7}, {     31, 8}, \
-    {     21, 9}, {     11, 8}, {     27, 9}, {     15, 8}, \
-    {     35, 9}, {     19, 8}, {     39, 9}, {     23, 8}, \
+  { {    380, 5}, {     17, 6}, {      9, 5}, {     19, 6}, \
+    {     10, 5}, {     21, 6}, {     11, 5}, {     23, 6}, \
+    {     23, 7}, {     12, 6}, {     25, 7}, {     25, 8}, \
+    {     13, 7}, {     30, 6}, {     61, 7}, {     32, 8}, \
+    {     17, 7}, {     35, 8}, {     29, 9}, {     15, 8}, \
+    {     35, 9}, {     19, 8}, {     41, 9}, {     23, 8}, \
     {     47, 9}, {     27,10}, {     15, 9}, {     39,10}, \
     {     23, 9}, {     55,11}, {     15,10}, {     31, 9}, \
     {     71,10}, {     39, 9}, {     83,10}, {     47, 9}, \
-    {     95,10}, {     55,11}, {     31,10}, {     63, 9}, \
+    {     99,10}, {     55,11}, {     31,10}, {     63, 9}, \
     {    127,10}, {     79,11}, {     47,10}, {    103,12}, \
-    {     31,11}, {     63,10}, {    135, 8}, {    543,11}, \
-    {     79,10}, {    159, 8}, {    639,10}, {    167, 9}, \
-    {    335,11}, {     95, 9}, {    383, 8}, {    767,10}, \
-    {    199, 9}, {    415,11}, {    111,12}, {     63,11}, \
-    {    127, 9}, {    511, 8}, {   1023, 9}, {    543,11}, \
-    {    143, 9}, {    575, 8}, {   1151, 9}, {    607,11}, \
-    {    159, 9}, {    639,10}, {    351,12}, {     95,10}, \
-    {    383, 9}, {    767,10}, {    415, 9}, {    831,13}, \
-    {     63,12}, {    127,10}, {    511, 9}, {   1023,10}, \
-    {    543, 9}, {   1087, 8}, {   2175,10}, {    575, 9}, \
-    {   1151,10}, {    607, 9}, {   1215,12}, {    159,10}, \
-    {    639,11}, {    335,10}, {    671,11}, {    351,10}, \
-    {    703, 9}, {   1407,11}, {    383,10}, {    767,11}, \
-    {    415,10}, {    831, 9}, {   1663,11}, {    447,10}, \
-    {    895,13}, {    127,11}, {    511,10}, {   1023,11}, \
-    {    543,10}, {   1087, 9}, {   2175,11}, {    575,10}, \
-    {   1151,11}, {    607,10}, {   1215, 9}, {   2431,11}, \
-    {    639,10}, {   1279,11}, {    671,12}, {    351,11}, \
-    {    703,10}, {   1407,12}, {    383,11}, {    767,12}, \
-    {    415,11}, {    831,10}, {   1663,12}, {    447,11}, \
-    {    895,12}, {    479,11}, {    959,14}, {    127,12}, \
-    {    511,11}, {   1023,12}, {    543,11}, {   1087,10}, \
-    {   2175,12}, {    575,11}, {   1151,12}, {    607,11}, \
-    {   1215,10}, {   2431,12}, {    639,11}, {   1279,12}, \
-    {    671,11}, {   1343,12}, {    703,11}, {   1407,12}, \
-    {    735,13}, {    383,12}, {    767,11}, {   1535,12}, \
-    {    799,11}, {   1599,12}, {    831,11}, {   1663,13}, \
-    {    447,12}, {    959,11}, {   1919,13}, {    511,12}, \
-    {   1087,11}, {   2175,13}, {    575,12}, {   1215,11}, \
-    {   2431,13}, {    639,12}, {   1343,11}, {   2687,13}, \
-    {    703,12}, {   1407,14}, {    383,13}, {    767,12}, \
-    {   1599,13}, {    831,12}, {   1663,13}, {    895,12}, \
-    {   1791,13}, {    959,12}, {   1919,11}, {   3839,14}, \
+    {     31,11}, {     63,10}, {    127, 9}, {    255,10}, \
+    {    135, 9}, {    271,11}, {     79,10}, {    159, 9}, \
+    {    319,10}, {    167,11}, {     95,10}, {    191, 9}, \
+    {    383, 8}, {    767,10}, {    207,11}, {    111,12}, \
+    {     63,11}, {    127,10}, {    255, 9}, {    511,10}, \
+    {    271,11}, {    143,10}, {    287, 9}, {    575,10}, \
+    {    303, 9}, {    607,11}, {    159,10}, {    319, 9}, \
+    {    639,10}, {    335, 9}, {    671,12}, {     95,11}, \
+    {    191,10}, {    383, 9}, {    767,11}, {    207,10}, \
+    {    415, 9}, {    831,13}, {     63,12}, {    127,11}, \
+    {    255,10}, {    511,11}, {    271,10}, {    543, 9}, \
+    {   1087,11}, {    287,10}, {    575,11}, {    303,10}, \
+    {    607,12}, {    159,11}, {    319,10}, {    639,11}, \
+    {    335,10}, {    671,11}, {    351,10}, {    703,11}, \
+    {    367,12}, {    191,11}, {    383,10}, {    767,11}, \
+    {    415,10}, {    831,12}, {    223,11}, {    447,10}, \
+    {    895,13}, {    127,12}, {    255,11}, {    511,10}, \
+    {   1023,11}, {    543,10}, {   1087,12}, {    287,11}, \
+    {    575,10}, {   1151,11}, {    607,10}, {   1215,12}, \
+    {    319,11}, {    639,10}, {   1279,11}, {    671,12}, \
+    {    351,11}, {    703,10}, {   1407,13}, {    191,12}, \
+    {    383,11}, {    767,12}, {    415,11}, {    831,10}, \
+    {   1663,12}, {    447,11}, {    895,12}, {    479,14}, \
+    {    127,13}, {    255,12}, {    511,11}, {   1023,12}, \
+    {    543,11}, {   1087,10}, {   2175,12}, {    575,11}, \
+    {   1151,12}, {    607,11}, {   1215,13}, {    319,12}, \
+    {    639,11}, {   1279,12}, {    671,11}, {   1343,10}, \
+    {   2687,12}, {    703,11}, {   1407,12}, {    735,13}, \
+    {    383,12}, {    767,11}, {   1535,12}, {    799,11}, \
+    {   1599,12}, {    831,11}, {   1663,13}, {    447,12}, \
+    {    959,14}, {    255,13}, {    511,12}, {   1087,11}, \
+    {   2175,13}, {    575,12}, {   1215,11}, {   2431,13}, \
+    {    639,12}, {   1343,11}, {   2687,13}, {    703,12}, \
+    {   1407,14}, {    383,13}, {    767,12}, {   1599,13}, \
+    {    831,12}, {   1663,13}, {    959,15}, {    255,14}, \
     {    511,13}, {   1087,12}, {   2175,13}, {   1215,12}, \
     {   2431,14}, {    639,13}, {   1343,12}, {   2687,13}, \
     {   1471,12}, {   2943,14}, {    767,13}, {   1599,12}, \
-    {   3199,13}, {   1663,14}, {    895,13}, {   8192,14}, \
-    {  16384,15}, {  32768,16}, {  65536,17}, { 131072,18}, \
-    { 262144,19}, { 524288,20}, {1048576,21}, {2097152,22}, \
-    {4194304,23}, {8388608,24} }
-#define MUL_FFT_TABLE3_SIZE 206
-#define MUL_FFT_THRESHOLD                 9472
+    {   3199,13}, {   1663,14}, {    895,13}, {   1855,15}, \
+    {  32768,16}, {  65536,17}, { 131072,18}, { 262144,19}, \
+    { 524288,20}, {1048576,21}, {2097152,22}, {4194304,23}, \
+    {8388608,24} }
+#define MUL_FFT_TABLE3_SIZE 209
+#define MUL_FFT_THRESHOLD                 7296
 
-#define SQR_FFT_MODF_THRESHOLD             618  /* k = 6 */
+#define SQR_FFT_MODF_THRESHOLD             308  /* k = 5 */
 #define SQR_FFT_TABLE3                                      \
-  { {    618, 6}, {     21, 7}, {     11, 6}, {     23, 7}, \
-    {     21, 8}, {     11, 7}, {     25, 8}, {     13, 7}, \
-    {     27, 8}, {     15, 7}, {     31, 8}, {     21, 9}, \
-    {     11, 8}, {     27, 9}, {     15, 8}, {     33, 9}, \
-    {     19, 8}, {     39, 9}, {     23, 8}, {     47, 9}, \
-    {     27,10}, {     15, 9}, {     39,10}, {     23, 9}, \
-    {     51,11}, {     15,10}, {     31, 9}, {     67,10}, \
-    {     39, 9}, {     79,10}, {     47, 9}, {     95,10}, \
-    {     55,11}, {     31,10}, {     79,11}, {     47,10}, \
-    {     95, 8}, {    383,12}, {     31,11}, {     63,10}, \
-    {    127, 8}, {    511,10}, {    135, 8}, {    543,11}, \
-    {     79, 9}, {    319, 8}, {    639, 9}, {    351,11}, \
-    {     95, 9}, {    383, 8}, {    767, 9}, {    415,12}, \
-    {     63,11}, {    127, 9}, {    511, 8}, {   1023, 9}, \
-    {    543, 8}, {   1087,11}, {    143, 9}, {    575, 8}, \
-    {   1151, 9}, {    607,10}, {    319, 9}, {    639,10}, \
-    {    351,12}, {     95,10}, {    383, 9}, {    767,10}, \
-    {    415, 9}, {    831,13}, {     63,12}, {    127,10}, \
-    {    511, 9}, {   1023,10}, {    543, 9}, {   1087, 8}, \
-    {   2175,10}, {    575, 9}, {   1151,10}, {    607,11}, \
-    {    319,10}, {    639,11}, {    351,10}, {    703, 9}, \
-    {   1407,11}, {    383,10}, {    767,11}, {    415,10}, \
-    {    831, 9}, {   1663,11}, {    447,10}, {    895,11}, \
-    {    479,10}, {    959,13}, {    127,11}, {    511,10}, \
-    {   1023,11}, {    543,10}, {   1087, 9}, {   2175,11}, \
-    {    575,10}, {   1151,11}, {    607,12}, {    319,11}, \
-    {    639,12}, {    351,11}, {    703,10}, {   1407,12}, \
-    {    383,11}, {    767,12}, {    415,11}, {    831,10}, \
-    {   1663,12}, {    447,11}, {    895,12}, {    479,11}, \
-    {    959,10}, {   1919,14}, {    127,12}, {    511,11}, \
-    {   1023,12}, {    543,11}, {   1087,10}, {   2175,12}, \
-    {    575,11}, {   1151,12}, {    607,13}, {    319,12}, \
-    {    639,11}, {   1279,12}, {    671,11}, {   1343,12}, \
-    {    703,11}, {   1407,13}, {    383,12}, {    767,11}, \
-    {   1535,12}, {    831,11}, {   1663,13}, {    447,12}, \
-    {    959,11}, {   1919,10}, {   3839,13}, {    511,12}, \
-    {   1087,11}, {   2175,13}, {    575,12}, {   1215,11}, \
-    {   2431,13}, {    639,12}, {   1343,13}, {    703,12}, \
-    {   1407,14}, {    383,13}, {    767,12}, {   1535,13}, \
-    {    831,12}, {   1663,13}, {    895,12}, {   1791,13}, \
-    {    959,12}, {   1919,11}, {   3839,14}, {    511,13}, \
-    {   1087,12}, {   2175,13}, {   1215,12}, {   2431,14}, \
-    {    639,13}, {   1343,12}, {   2687,13}, {   1407,12}, \
-    {   2815,13}, {   1471,14}, {    767,13}, {   1663,14}, \
-    {    895,13}, {   8192,14}, {  16384,15}, {  32768,16}, \
-    {  65536,17}, { 131072,18}, { 262144,19}, { 524288,20}, \
-    {1048576,21}, {2097152,22}, {4194304,23}, {8388608,24} }
-#define SQR_FFT_TABLE3_SIZE 188
-#define SQR_FFT_THRESHOLD                 7040
+  { {    308, 5}, {     17, 6}, {      9, 5}, {     19, 6}, \
+    {     19, 7}, {     10, 6}, {     21, 7}, {     11, 6}, \
+    {     23, 7}, {     21, 8}, {     11, 7}, {     24, 8}, \
+    {     13, 7}, {     29, 8}, {     15, 7}, {     31, 8}, \
+    {     21, 9}, {     11, 8}, {     27, 9}, {     15, 8}, \
+    {     33, 9}, {     19, 8}, {     39, 9}, {     23, 8}, \
+    {     47, 9}, {     27,10}, {     15, 9}, {     39,10}, \
+    {     23, 9}, {     51,11}, {     15,10}, {     31, 9}, \
+    {     67,10}, {     39, 9}, {     83,10}, {     47, 9}, \
+    {     95,10}, {     55,11}, {     31,10}, {     79,11}, \
+    {     47,10}, {     95, 9}, {    191, 8}, {    383,12}, \
+    {     31,11}, {     63,10}, {    127, 9}, {    255, 8}, \
+    {    511,10}, {    135, 9}, {    271,11}, {     79,10}, \
+    {    159, 9}, {    319,10}, {    175, 9}, {    351,11}, \
+    {     95,10}, {    191, 9}, {    383,10}, {    207, 9}, \
+    {    415,11}, {    111,12}, {     63,11}, {    127,10}, \
+    {    255, 9}, {    511, 8}, {   1023,10}, {    271, 9}, \
+    {    543,10}, {    287, 9}, {    575, 8}, {   1151,10}, \
+    {    303,11}, {    159,10}, {    319, 9}, {    639,11}, \
+    {    175,10}, {    351,12}, {     95,11}, {    191,10}, \
+    {    383, 9}, {    767,11}, {    207,10}, {    415, 9}, \
+    {    831,11}, {    223,13}, {     63,12}, {    127,11}, \
+    {    255,10}, {    511, 9}, {   1023,11}, {    271,10}, \
+    {    543,11}, {    287,10}, {    575, 9}, {   1151,11}, \
+    {    303,12}, {    159,11}, {    319,10}, {    639,11}, \
+    {    351,10}, {    703,12}, {    191,11}, {    383,10}, \
+    {    767,11}, {    415,10}, {    831,12}, {    223,11}, \
+    {    447,10}, {    895,11}, {    479,10}, {    959,13}, \
+    {    127,12}, {    255,11}, {    511,10}, {   1023,11}, \
+    {    543,12}, {    287,11}, {    575,10}, {   1151,11}, \
+    {    607,12}, {    319,11}, {    639,10}, {   1279,12}, \
+    {    351,11}, {    703,13}, {    191,12}, {    383,11}, \
+    {    767,12}, {    415,11}, {    831,10}, {   1663,12}, \
+    {    447,11}, {    895,12}, {    479,11}, {    959,14}, \
+    {    127,13}, {    255,12}, {    511,11}, {   1023,12}, \
+    {    543,11}, {   1087,10}, {   2175,12}, {    575,11}, \
+    {   1151,12}, {    607,13}, {    319,12}, {    639,11}, \
+    {   1279,12}, {    671,11}, {   1343,12}, {    703,11}, \
+    {   1407,13}, {    383,12}, {    767,11}, {   1535,12}, \
+    {    831,11}, {   1663,13}, {    447,12}, {    959,11}, \
+    {   1919,14}, {    255,13}, {    511,12}, {   1087,11}, \
+    {   2175,13}, {    575,12}, {   1215,11}, {   2431,13}, \
+    {    639,12}, {   1343,13}, {    703,12}, {   1407,14}, \
+    {    383,13}, {    767,12}, {   1535,13}, {    831,12}, \
+    {   1663,13}, {    959,12}, {   1919,15}, {    255,14}, \
+    {    511,13}, {   1087,12}, {   2175,13}, {   1215,12}, \
+    {   2431,14}, {    639,13}, {   1343,12}, {   2687,13}, \
+    {   1407,12}, {   2815,13}, {   1471,14}, {    767,13}, \
+    {   1535,12}, {   3071,13}, {   1663,14}, {    895,13}, \
+    {   1791,12}, {   3839,15}, {  32768,16}, {  65536,17}, \
+    { 131072,18}, { 262144,19}, { 524288,20}, {1048576,21}, \
+    {2097152,22}, {4194304,23}, {8388608,24} }
+#define SQR_FFT_TABLE3_SIZE 207
+#define SQR_FFT_THRESHOLD                 2752
 
 #define MULLO_BASECASE_THRESHOLD             5
 #define MULLO_DC_THRESHOLD                  34
-#define MULLO_MUL_N_THRESHOLD            18629
+#define MULLO_MUL_N_THRESHOLD            14281
 
 #define DC_DIV_QR_THRESHOLD                 30
 #define DC_DIVAPPR_Q_THRESHOLD             103
 #define DC_BDIV_QR_THRESHOLD                48
 #define DC_BDIV_Q_THRESHOLD                120
 
-#define INV_MULMOD_BNM1_THRESHOLD          107
-#define INV_NEWTON_THRESHOLD               170
-#define INV_APPR_THRESHOLD                 117
+#define INV_MULMOD_BNM1_THRESHOLD           30
+#define INV_NEWTON_THRESHOLD               129
+#define INV_APPR_THRESHOLD                 109
 
-#define BINV_NEWTON_THRESHOLD              206
-#define REDC_1_TO_REDC_N_THRESHOLD          56
+#define BINV_NEWTON_THRESHOLD              204
+#define REDC_1_TO_REDC_N_THRESHOLD          55
 
-#define MU_DIV_QR_THRESHOLD               1470
-#define MU_DIVAPPR_Q_THRESHOLD            1334
-#define MUPI_DIV_QR_THRESHOLD               57
-#define MU_BDIV_QR_THRESHOLD              1099
-#define MU_BDIV_Q_THRESHOLD               1308
+#define MU_DIV_QR_THRESHOLD                998
+#define MU_DIVAPPR_Q_THRESHOLD            1017
+#define MUPI_DIV_QR_THRESHOLD               61
+#define MU_BDIV_QR_THRESHOLD               889
+#define MU_BDIV_Q_THRESHOLD               1078
 
-#define MATRIX22_STRASSEN_THRESHOLD         17
-#define HGCD_THRESHOLD                      86
-#define GCD_DC_THRESHOLD                   233
-#define GCDEXT_DC_THRESHOLD                221
+#define MATRIX22_STRASSEN_THRESHOLD          9
+#define HGCD_THRESHOLD                      96
+#define GCD_DC_THRESHOLD                   229
+#define GCDEXT_DC_THRESHOLD                225
 #define JACOBI_BASE_METHOD                   1
 
 #define GET_STR_DC_THRESHOLD                11
-#define GET_STR_PRECOMPUTE_THRESHOLD        24
-#define SET_STR_DC_THRESHOLD               795
-#define SET_STR_PRECOMPUTE_THRESHOLD      1790
+#define GET_STR_PRECOMPUTE_THRESHOLD        23
+#define SET_STR_DC_THRESHOLD               650


More information about the gmp-commit mailing list