fix for mpfr_zeta overflow on 32-bit computers

git-svn-id: svn://scm.gforge.inria.fr/svn/mpfr/trunk@11306 280ebfd0-de03-0410-8827-d642c229c3f4
author: zimmerma <zimmerma@280ebfd0-de03-0410-8827-d642c229c3f4> 2017-02-12 08:06:55 +0000
committer: zimmerma <zimmerma@280ebfd0-de03-0410-8827-d642c229c3f4> 2017-02-12 08:06:55 +0000
commit: 47a310a9f4645afdff1e31ad814fb5843bdb2145 (patch)
tree: e749fd965b9c55419799a38396854f49152e67a0 /src/zeta.c
parent: afb28793807f6e98333096bb2ee3a4deb81720c8 (diff)
download: mpfr-47a310a9f4645afdff1e31ad814fb5843bdb2145.tar.gz
1 files changed, 123 insertions, 7 deletions
diff --git a/src/zeta.c b/src/zeta.c
index 586d727f6..ee45ba6d1 100644
--- a/src/zeta.c
+++ b/src/zeta.c
@@ -336,6 +336,82 @@ compute_add (mpfr_srcptr s, mpfr_prec_t precz)
   return add;
 }
 
+/* return in z a lower bound (for rnd = RNDD) or upper bound (for rnd = RNDU)
+   of |zeta(s)|, using:
+   log(|zeta(s)|/2) = (s-1)*log(2*pi) + lngamma(1-s)
+   + log(abs(sin(Pi*s/2)) * zeta(1-s)).
+   Assumes s < 1/2 and s1 = 1-s exactly, thus s1 > 1/2.
+   y and p are temporary variables.
+   At input, p is pi rounded down.
+   The comments in the code are for rnd = RNDD. */
+static void
+mpfr_reflection_overflow (mpfr_t z, mpfr_t s1, const mpfr_t s, mpfr_t y,
+                          mpfr_t p, mpfr_rnd_t rnd)
+{
+  mpz_t sint;
+
+  /* since log(abs(sin(Pi*s/2)) <= 0, we want to round zeta(1-s) upward
+     and log(abs(sin(Pi*s/2)) toward -infinity */
+  mpz_init (sint);
+  mpfr_get_z (sint, s, MPFR_RNDD);
+  /* we first compute a lower bound of abs(sin(Pi*s/2)):
+     if -4k-2 < s < -4k, then -2k-1 < s/2 < -2k, thus sin(Pi*s/2) < 0
+     if -4k < s < -4k+2, then -2k < s < -2k+1, thus sin(Pi*s/2) > 0 */
+  if (mpz_tstbit (sint, 1) == 0) /* sint = {0,1} mod 4, thus -2k < s < -2k+1 */
+    {
+      if (mpz_tstbit (sint, 0) == 0) /* sin(Pi*x) is increasing: round down */
+        {
+          mpfr_mul (y, p, s, rnd);
+	  if (rnd == MPFR_RNDD)
+	    mpfr_nextabove (p);
+        }
+      else /* sin(Pi*x) is decreasing: round up */
+        {
+	  if (rnd == MPFR_RNDD)
+	    mpfr_nextabove (p);
+          mpfr_mul (y, p, s, rnd);
+        }
+    }
+  else /* -2k-1 < s/2 < -2k */
+    {
+      if (mpz_tstbit (sint, 1) == 0) /* sin(Pi*x) is decreasing: round down */
+        {
+          mpfr_mul (y, p, s, rnd);
+	  if (rnd == MPFR_RNDD)
+	    mpfr_nextabove (p); /* we will need p rounded above afterwards */
+        }
+      else /* sin(Pi*x) is increasing: round up */
+        {
+	  if (rnd == MPFR_RNDD)
+	    mpfr_nextabove (p);
+          mpfr_mul (y, p, s, MPFR_INVERT_RND(rnd));
+        }
+    }
+  mpfr_div_2ui (y, y, 1, rnd);
+  mpfr_sin (y, y, rnd);
+  mpz_clear (sint);
+  mpfr_abs (y, y, rnd);
+  /* now y <= |sin(Pi*s/2)| */
+  mpfr_zeta_pos (z, s1, rnd);   /* zeta(1-s)  */
+  mpfr_mul (z, z, y, rnd);
+  /* now z <= |sin(Pi*s/2)|*zeta(1-s) */
+  mpfr_log (z, z, rnd);
+  /* now z <= log(|sin(Pi*s/2)|*zeta(1-s)) */
+  mpfr_lngamma (y, s1, rnd);
+  mpfr_add (z, z, y, rnd);
+  /* z <= lngamma(1-s) + log(|sin(Pi*s/2)|*zeta(1-s)) */
+  /* since s-1 < 0, we want to round log(2*pi) upwards */
+  mpfr_mul_2ui (y, p, 1, MPFR_INVERT_RND(rnd));
+  mpfr_log (y, y, MPFR_INVERT_RND(rnd));
+  mpfr_mul (y, y, s1, MPFR_INVERT_RND(rnd));
+  mpfr_sub (z, z, y, rnd);
+  mpfr_exp (z, z, rnd);
+  if (rnd == MPFR_RNDD)
+    mpfr_nextbelow (p); /* restore original p */
+  /* multiply by 2 */
+  mpfr_mul_2ui (z, z, 1, rnd);
+}
+
 int
 mpfr_zeta (mpfr_t z, mpfr_srcptr s, mpfr_rnd_t rnd_mode)
 {
@@ -492,9 +568,11 @@ mpfr_zeta (mpfr_t z, mpfr_srcptr s, mpfr_rnd_t rnd_mode)
       for (;;)
         {
           mpfr_exp_t ey;
+	  mpfr_t z_up;
+
+          mpfr_const_pi (p, MPFR_RNDD); /* p is Pi */
 
           mpfr_sub (s1, __gmpfr_one, s, MPFR_RNDN); /* s1 = 1-s */
-          mpfr_zeta_pos (z_pre, s1, MPFR_RNDN);   /* zeta(1-s)  */
           mpfr_gamma (y, s1, MPFR_RNDN);          /* gamma(1-s) */
           if (MPFR_IS_INF (y)) /* zeta(s) < 0 for -4k-2 < s < -4k,
                                   zeta(s) > 0 for -4k < s < -4k+2 */
@@ -515,15 +593,52 @@ mpfr_zeta (mpfr_t z, mpfr_srcptr s, mpfr_rnd_t rnd_mode)
                  4. Correct the sign from the sign of sin(...).
                  5. Round then multiply by 2. Here, an overflow in either
                  operation means a real overflow. */
-              mpfr_div_2ui (s1, s, 2, MPFR_RNDN); /* s/4, exact */
-              mpfr_frac (s1, s1, MPFR_RNDN); /* exact, -1 < s1 < 0 */
-              overflow = (mpfr_cmp_si_2exp (s1, -1, -1) > 0) ? -1 : 1;
-              break;
+              mpfr_reflection_overflow (z_pre, s1, s, y, p, MPFR_RNDD);
+              /* z_pre is a the rounding of a lower bound of |zeta(s)|, thus
+		 if z_pre overflows, then |zeta(s)| overflows too. We assume
+		 here that if z_pre is the largest floating-point, there is
+		 overflow too. */
+	      mpfr_nextabove (z_pre);
+              if (MPFR_IS_INF (z_pre)) /* determine the sign of overflow */
+                {
+                  mpfr_div_2ui (s1, s, 2, MPFR_RNDN); /* s/4, exact */
+                  mpfr_frac (s1, s1, MPFR_RNDN); /* exact, -1 < s1 < 0 */
+                  overflow = (mpfr_cmp_si_2exp (s1, -1, -1) > 0) ? -1 : 1;
+                  break;
+                }
+	      else
+		{
+		  int ok = 0;
+		  mpfr_t z_down;
+		  mpfr_init2 (z_up, mpfr_get_prec (z_pre));
+		  mpfr_reflection_overflow (z_up, s1, s, y, p, MPFR_RNDU);
+		  /* if the lower approximation z_pre does not overflow, but
+		     z_up does, we need more precision */
+		  if (MPFR_IS_INF (z_up))
+		    goto next_loop;
+		  /* check if z_pre and z_up round to the same number */
+		  mpfr_init2 (z_down, precz);
+		  mpfr_set (z_down, z_pre, rnd_mode);
+		  mpfr_prec_round (z_up, precz, rnd_mode);
+		  ok = mpfr_cmp (z_down, z_up) == 0;
+		  mpfr_clear (z_up);
+		  mpfr_clear (z_down);				   
+		  if (ok)
+		    {
+		      /* get correct sign */
+		      mpfr_div_2ui (s1, s, 2, MPFR_RNDN); /* s/4, exact */
+		      mpfr_frac (s1, s1, MPFR_RNDN); /* exact, -1 < s1 < 0 */
+		      if (mpfr_cmp_si_2exp (s1, -1, -1) > 0)
+			mpfr_neg (z_pre, z_pre, rnd_mode);
+		      break;
+		    }
+		  else
+		    goto next_loop;
+		}
             }
+          mpfr_zeta_pos (z_pre, s1, MPFR_RNDN);   /* zeta(1-s)  */
           mpfr_mul (z_pre, z_pre, y, MPFR_RNDN);  /* gamma(1-s)*zeta(1-s) */
 
-          mpfr_const_pi (p, MPFR_RNDD); /* p is Pi */
-
           /* multiply z_pre by 2^s*Pi^(s-1) where p=Pi, s1=1-s */
           mpfr_mul_2ui (y, p, 1, MPFR_RNDN);      /* 2*Pi */
           mpfr_neg (s1, s1, MPFR_RNDN);           /* s-1 */
@@ -559,6 +674,7 @@ mpfr_zeta (mpfr_t z, mpfr_srcptr s, mpfr_rnd_t rnd_mode)
                                            rnd_mode)))
             break;
 
+	next_loop:
           MPFR_ZIV_NEXT (loop, prec1);
           MPFR_GROUP_REPREC_4 (group, prec1, z_pre, s1, y, p);
         }
author	zimmerma <zimmerma@280ebfd0-de03-0410-8827-d642c229c3f4>	2017-02-12 08:06:55 +0000
committer	zimmerma <zimmerma@280ebfd0-de03-0410-8827-d642c229c3f4>	2017-02-12 08:06:55 +0000
commit	47a310a9f4645afdff1e31ad814fb5843bdb2145 (patch)
tree	e749fd965b9c55419799a38396854f49152e67a0 /src/zeta.c
parent	afb28793807f6e98333096bb2ee3a4deb81720c8 (diff)
download	mpfr-47a310a9f4645afdff1e31ad814fb5843bdb2145.tar.gz