[Gmp-commit] /var/hg/gmp: mpz/bin_uiui.c: Safer (NAIL ready?) MAXFACS, remove...

Wed May 9 08:31:43 CEST 2012

details:   /var/hg/gmp/rev/8d68a25e59bc
changeset: 14957:8d68a25e59bc
user:      Marco Bodrato <bodrato at mail.dm.unipi.it>
date:      Wed May 09 08:31:40 2012 +0200
description:
mpz/bin_uiui.c: Safer (NAIL ready?) MAXFACS, removed unneeded shifts.

diffstat:

 ChangeLog      |   3 +++
 mpz/bin_uiui.c |  28 +++++++++++++---------------
 2 files changed, 16 insertions(+), 15 deletions(-)

diffs (85 lines):

diff -r bf40df76fb25 -r 8d68a25e59bc ChangeLog

--- a/ChangeLog	Wed May 09 07:59:28 2012 +0200
+++ b/ChangeLog	Wed May 09 08:31:40 2012 +0200
@@ -4,6 +4,9 @@
 
 	* mpn/generic/sqrtrem.c (invsqrttab): Reduce size removing common byte.
 
+	* mpz/bin_uiui.c (mul2, mul3, mul4, mul8): Remove unneeded shifts.
+	(MAXFACS): Redefine, using the shared (safer) log_n_max.
+
 2012-05-08  Torbjorn Granlund  <tege at gmplib.org>
 
 	* mpn/minithres/gmp-mparam.h (REDC_1_TO_REDC_N_THRESHOLD): Up to 9, for
diff -r bf40df76fb25 -r 8d68a25e59bc mpz/bin_uiui.c
--- a/mpz/bin_uiui.c	Wed May 09 07:59:28 2012 +0200
+++ b/mpz/bin_uiui.c	Wed May 09 08:31:40 2012 +0200
@@ -83,7 +83,10 @@
 static mp_limb_t
 mul2 (mp_limb_t m)
 {
-  mp_limb_t m01 = (m + 0) * (m + 1) >> 1;
+  /* THINK: (m + 0) * (m + 1) >> 1 does overflow if (m + 0) * (m + 1)
+     does.  The shift does not give any advantage. We should shift
+     _before_ multiplying: (m | 1) * ((m + 1) >> 1) ... */
+  mp_limb_t m01 = (m + 0) * (m + 1);
   return m01;
 }
 
@@ -100,7 +103,7 @@
 {
   mp_limb_t m01 = (m + 0) * (m + 1) >> 1;
   mp_limb_t m23 = (m + 2) * (m + 3) >> 1;
-  return m01 * m23 >> 1;
+  return m01 * m23;
 }
 
 static mp_limb_t
@@ -108,7 +111,7 @@
 {
   mp_limb_t m012 = (m + 0) * (m + 1) * (m + 2) >> 1;
   mp_limb_t m34 = (m + 3) * (m + 4) >> 1;
-  return m012 * m34 >> 1;
+  return m012 * m34;
 }
 
 static mp_limb_t
@@ -140,7 +143,7 @@
   mp_limb_t m67 = (m + 6) * (m + 7);
   mp_limb_t m0123 = m01 * m23 >> 3;
   mp_limb_t m4567 = m45 * m67 >> 3;
-  return m0123 * m4567 >> 1;
+  return m0123 * m4567;
 }
 
 typedef mp_limb_t (* mulfunc_t) (mp_limb_t);
@@ -149,23 +152,18 @@
 #define M (numberof(mulfunc)-1)
 
 /* Number of factors-of-2 removed by the corresponding mulN functon.  */
-static const unsigned char tcnttab[] = {0,0,1,1,3,3,4,4,7};
+static const unsigned char tcnttab[] = {0,0,0,1,2,2,4,4,6};
 
-/* Rough computation of how many factors we can multiply together without
-   spilling a limb.  */
-#if 0
-/* This variant is inaccurate and relies on an expensive division.  */
+#if 1
+/* This variant is inaccurate but share the code with other functions.  */
 #define MAXFACS(max,l)							\
   do {									\
-    int __cnt, __logb;							\
-    count_leading_zeros (__cnt, (mp_limb_t) (l));			\
-    __logb = GMP_LIMB_BITS - __cnt;					\
-    (max) = (GMP_NUMB_BITS + 1) / __logb; /* FIXME: remove division */	\
+    (max) = log_n_max (l);						\
   } while (0)
 #else
 
-/* This variant is exact but uses a loop.  It takes the 2 removal of mulN into
- account.  */
+/* This variant is exact(?) but uses a loop.  It takes the 2 removal
+ of mulN into account.  */
 static const unsigned long ftab[] =
 #if GMP_NUMB_BITS == 64
   /* 1 to 8 factors per iteration */