[src/cosu.c] Implemented range reduction for mpfr_cosu.

git-svn-id: https://scm.gforge.inria.fr/anonscm/svn/mpfr/trunk@14248 280ebfd0-de03-0410-8827-d642c229c3f4
author: vlefevre <vlefevre@280ebfd0-de03-0410-8827-d642c229c3f4> 2021-01-13 23:26:50 +0000
committer: vlefevre <vlefevre@280ebfd0-de03-0410-8827-d642c229c3f4> 2021-01-13 23:26:50 +0000
commit: 230dfe58bca096f56397bc142a9bb99d75e45df6 (patch)
tree: b030831aeb1a626081feeabab2a20fe3672d22c3 /src/cosu.c
parent: e6162a5aedc8a2fccee55b79a8c8ce9a71026afc (diff)
download: mpfr-230dfe58bca096f56397bc142a9bb99d75e45df6.tar.gz
1 files changed, 33 insertions, 12 deletions
diff --git a/src/cosu.c b/src/cosu.c
index a1140538e..30be5ff38 100644
--- a/src/cosu.c
+++ b/src/cosu.c
@@ -24,16 +24,14 @@ https://www.gnu.org/licenses/ or write to the Free Software Foundation, Inc.,
 #define MPFR_NEED_LONGLONG_H
 #include "mpfr-impl.h"
 
-/* FIXME[VL]: Implement the range reduction in this function.
-   That's the whole point of cosu compared to cos. */
-
 /* put in y the corrected-rounded value of cos(2*pi*x/u) */
 int
 mpfr_cosu (mpfr_ptr y, mpfr_srcptr x, unsigned long u, mpfr_rnd_t rnd_mode)
 {
+  mpfr_srcptr xp;
   mpfr_prec_t precy, prec;
   mpfr_exp_t expx, expt, err, log2u, erra, errb;
-  mpfr_t t;
+  mpfr_t t, xr;
   int inexact = 0, nloops = 0, underflow = 0;
   MPFR_ZIV_DECL (loop);
   MPFR_SAVE_EXPO_DECL (expo);
@@ -60,8 +58,27 @@ mpfr_cosu (mpfr_ptr y, mpfr_srcptr x, unsigned long u, mpfr_rnd_t rnd_mode)
 
   MPFR_SAVE_EXPO_MARK (expo);
 
+  if (mpfr_cmpabs_ui (x, u) < 1)
+    {
+      xp = x;
+    }
+  else
+    {
+      mpfr_exp_t e = MPFR_GET_PREC (x) - MPFR_GET_EXP (x);
+      int inex;
+
+      /* Let's compute xr = x mod u, with sign(xr) = sign(x) though
+         this doesn't matter. */
+      mpfr_init2 (xr, sizeof (unsigned long) * CHAR_BIT + (e < 0 ? 0 : e));
+      MPFR_DBGRES (inex = mpfr_fmod_ui (xr, x, u, MPFR_RNDN));  /* exact */
+      MPFR_ASSERTD (inex == 0);
+      xp = xr;
+    }
+
+  /* now |xp/u| < 1 */
+
   /* for x small, we have |cos(2*pi*x/u)-1| < 1/2*(2*pi*x/u)^2 < 2^5*(x/u)^2 */
-  expx = MPFR_GET_EXP (x);
+  expx = MPFR_GET_EXP (xp);
   log2u = u == 1 ? 0 : MPFR_INT_CEIL_LOG2 (u) - 1;
   /* u >= 2^log2u thus 1/u <= 2^(-log2u) */
   erra = -2 * expx;
@@ -83,9 +100,7 @@ mpfr_cosu (mpfr_ptr y, mpfr_srcptr x, unsigned long u, mpfr_rnd_t rnd_mode)
 
   precy = MPFR_GET_PREC (y);
   /* For x large, since argument reduction is expensive, we want to avoid
-     any failure in Ziv's strategy, thus we take into account expx too.
-     FIXME: this has to be modified when argument reduction is done
-     directly on x. */
+     any failure in Ziv's strategy, thus we take into account expx too. */
   prec = precy + MAX(expx,MPFR_INT_CEIL_LOG2 (precy)) + 8;
   MPFR_ASSERTD(prec >= 2);
   mpfr_init2 (t, prec);
@@ -94,12 +109,13 @@ mpfr_cosu (mpfr_ptr y, mpfr_srcptr x, unsigned long u, mpfr_rnd_t rnd_mode)
     {
       nloops ++;
       /* We first compute an approximation t of 2*pi*x/u, then call cos(t).
-         If t = 2*pi*x/u + s, then |cos(t) - cos(2*pi*x/u)| <= |s|. */
+         If t = 2*pi*x/u + s, then |cos(t) - cos(2*pi*x/u)| <= |s|.
+         In the error analysis below, xp stands for x. */
       mpfr_set_prec (t, prec);
       mpfr_const_pi (t, MPFR_RNDN); /* t = pi * (1 + theta1) where
                                        |theta1| <= 2^-prec */
       mpfr_mul_2ui (t, t, 1, MPFR_RNDN); /* t = 2*pi * (1 + theta1) */
-      mpfr_mul (t, t, x, MPFR_RNDN);     /* t = 2*pi*x * (1 + theta2)^2 where
+      mpfr_mul (t, t, xp, MPFR_RNDN);    /* t = 2*pi*x * (1 + theta2)^2 where
                                             |theta2| <= 2^-prec */
       mpfr_div_ui (t, t, u, MPFR_RNDN);  /* t = 2*pi*x/u * (1 + theta3)^3 where
                                             |theta3| <= 2^-prec */
@@ -137,7 +153,7 @@ mpfr_cosu (mpfr_ptr y, mpfr_srcptr x, unsigned long u, mpfr_rnd_t rnd_mode)
       if (nloops == 1)
         {
           /* detect case (a) */
-          inexact = mpfr_div_ui (t, x, u, MPFR_RNDZ);
+          inexact = mpfr_div_ui (t, xp, u, MPFR_RNDZ);
           mpfr_mul_2ui (t, t, 2, MPFR_RNDZ);
           if (inexact == 0 && mpfr_integer_p (t))
             {
@@ -161,7 +177,7 @@ mpfr_cosu (mpfr_ptr y, mpfr_srcptr x, unsigned long u, mpfr_rnd_t rnd_mode)
           /* detect case (b): this can only occur if u is divisible by 3 */
           if ((u % 3) == 0)
             {
-              inexact = mpfr_div_ui (t, x, u / 3, MPFR_RNDZ);
+              inexact = mpfr_div_ui (t, xp, u / 3, MPFR_RNDZ);
               /* t should be in {1/2,2/2,4/2,5/2} */
               mpfr_mul_2ui (t, t, 1, MPFR_RNDZ);
               /* t should be {1,2,4,5} mod 6:
@@ -201,6 +217,11 @@ mpfr_cosu (mpfr_ptr y, mpfr_srcptr x, unsigned long u, mpfr_rnd_t rnd_mode)
 
  end:
   mpfr_clear (t);
+  if (xp != x)
+    {
+      MPFR_ASSERTD (xp == xr);
+      mpfr_clear (xr);
+    }
   MPFR_SAVE_EXPO_FREE (expo);
   return underflow ? inexact : mpfr_check_range (y, inexact, rnd_mode);
 }
author	vlefevre <vlefevre@280ebfd0-de03-0410-8827-d642c229c3f4>	2021-01-13 23:26:50 +0000
committer	vlefevre <vlefevre@280ebfd0-de03-0410-8827-d642c229c3f4>	2021-01-13 23:26:50 +0000
commit	230dfe58bca096f56397bc142a9bb99d75e45df6 (patch)
tree	b030831aeb1a626081feeabab2a20fe3672d22c3 /src/cosu.c
parent	e6162a5aedc8a2fccee55b79a8c8ce9a71026afc (diff)
download	mpfr-230dfe58bca096f56397bc142a9bb99d75e45df6.tar.gz