/* mpfr/src/cos.c */

/* mpfr_cos -- cosine of a floating-point number

Copyright 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011, 2012, 2013 Free Software Foundation, Inc.
Contributed by the AriC and Caramel projects, INRIA.

This file is part of the GNU MPFR Library.

The GNU MPFR Library is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published by
the Free Software Foundation; either version 3 of the License, or (at your
option) any later version.

The GNU MPFR Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
License for more details.

You should have received a copy of the GNU Lesser General Public License
along with the GNU MPFR Library; see the file COPYING.LESSER.  If not, see
http://www.gnu.org/licenses/ or write to the Free Software Foundation, Inc.,
51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. */

78556Sobrien#define MPFR_NEED_LONGLONG_H
78556Sobrien#include "mpfr-impl.h"
78556Sobrien
78556Sobrienstatic int
78556Sobrienmpfr_cos_fast (mpfr_ptr y, mpfr_srcptr x, mpfr_rnd_t rnd_mode)
78556Sobrien{
78556Sobrien  int inex;
78556Sobrien
78556Sobrien  inex = mpfr_sincos_fast (NULL, y, x, rnd_mode);
78556Sobrien  inex = inex >> 2; /* 0: exact, 1: rounded up, 2: rounded down */
78556Sobrien  return (inex == 2) ? -1 : inex;
78556Sobrien}
78556Sobrien
78556Sobrien/* f <- 1 - r/2! + r^2/4! + ... + (-1)^l r^l/(2l)! + ...
78556Sobrien   Assumes |r| < 1/2, and f, r have the same precision.
78556Sobrien   Returns e such that the error on f is bounded by 2^e ulps.
78556Sobrien*/
78556Sobrienstatic int
78556Sobrienmpfr_cos2_aux (mpfr_ptr f, mpfr_srcptr r)
78556Sobrien{
78556Sobrien  mpz_t x, t, s;
78556Sobrien  mpfr_exp_t ex, l, m;
78556Sobrien  mpfr_prec_t p, q;
78556Sobrien  unsigned long i, maxi, imax;
78556Sobrien
78556Sobrien  MPFR_ASSERTD(mpfr_get_exp (r) <= -1);
78556Sobrien
78556Sobrien  /* compute minimal i such that i*(i+1) does not fit in an unsigned long,
78556Sobrien     assuming that there are no padding bits. */
78556Sobrien  maxi = 1UL << (CHAR_BIT * sizeof(unsigned long) / 2);
78556Sobrien  if (maxi * (maxi / 2) == 0) /* test checked at compile time */
78556Sobrien    {
78556Sobrien      /* can occur only when there are padding bits. */
78556Sobrien      /* maxi * (maxi-1) is representable iff maxi * (maxi / 2) != 0 */
78556Sobrien      do
78556Sobrien        maxi /= 2;
78556Sobrien      while (maxi * (maxi / 2) == 0);
78556Sobrien    }
78556Sobrien
78556Sobrien  mpz_init (x);
78556Sobrien  mpz_init (s);
78556Sobrien  mpz_init (t);
78556Sobrien  ex = mpfr_get_z_2exp (x, r); /* r = x*2^ex */
78556Sobrien
78556Sobrien  /* remove trailing zeroes */
78556Sobrien  l = mpz_scan1 (x, 0);
78556Sobrien  ex += l;
78556Sobrien  mpz_fdiv_q_2exp (x, x, l);
78556Sobrien
78556Sobrien  /* since |r| < 1, r = x*2^ex, and x is an integer, necessarily ex < 0 */
78556Sobrien
78556Sobrien  p = mpfr_get_prec (f); /* same than r */
78556Sobrien  /* bound for number of iterations */
78556Sobrien  imax = p / (-mpfr_get_exp (r));
78556Sobrien  imax += (imax == 0);
78556Sobrien  q = 2 * MPFR_INT_CEIL_LOG2(imax) + 4; /* bound for (3l)^2 */
78556Sobrien
78556Sobrien  mpz_set_ui (s, 1); /* initialize sum with 1 */
78556Sobrien  mpz_mul_2exp (s, s, p + q); /* scale all values by 2^(p+q) */
78556Sobrien  mpz_set (t, s); /* invariant: t is previous term */
78556Sobrien  for (i = 1; (m = mpz_sizeinbase (t, 2)) >= q; i += 2)
78556Sobrien    {
78556Sobrien      /* adjust precision of x to that of t */
78556Sobrien      l = mpz_sizeinbase (x, 2);
78556Sobrien      if (l > m)
78556Sobrien        {
78556Sobrien          l -= m;
78556Sobrien          mpz_fdiv_q_2exp (x, x, l);
78556Sobrien          ex += l;
78556Sobrien        }
78556Sobrien      /* multiply t by r */
78556Sobrien      mpz_mul (t, t, x);
78556Sobrien      mpz_fdiv_q_2exp (t, t, -ex);
78556Sobrien      /* divide t by i*(i+1) */
78556Sobrien      if (i < maxi)
78556Sobrien        mpz_fdiv_q_ui (t, t, i * (i + 1));
78556Sobrien      else
78556Sobrien        {
78556Sobrien          mpz_fdiv_q_ui (t, t, i);
78556Sobrien          mpz_fdiv_q_ui (t, t, i + 1);
78556Sobrien        }
78556Sobrien      /* if m is the (current) number of bits of t, we can consider that
78556Sobrien         all operations on t so far had precision >= m, so we can prove
78556Sobrien         by induction that the relative error on t is of the form
78556Sobrien         (1+u)^(3l)-1, where |u| <= 2^(-m), and l=(i+1)/2 is the # of loops.
78556Sobrien         Since |(1+x^2)^(1/x) - 1| <= 4x/3 for |x| <= 1/2,
78556Sobrien         for |u| <= 1/(3l)^2, the absolute error is bounded by
78556Sobrien         4/3*(3l)*2^(-m)*t <= 4*l since |t| < 2^m.
78556Sobrien         Therefore the error on s is bounded by 2*l*(l+1). */
78556Sobrien      /* add or subtract to s */
78556Sobrien      if (i % 4 == 1)
78556Sobrien        mpz_sub (s, s, t);
78556Sobrien      else
78556Sobrien        mpz_add (s, s, t);
78556Sobrien    }
78556Sobrien
78556Sobrien  mpfr_set_z (f, s, MPFR_RNDN);
78556Sobrien  mpfr_div_2ui (f, f, p + q, MPFR_RNDN);
78556Sobrien
78556Sobrien  mpz_clear (x);
78556Sobrien  mpz_clear (s);
78556Sobrien  mpz_clear (t);
146293Sobrien
146293Sobrien  l = (i - 1) / 2; /* number of iterations */
146293Sobrien  return 2 * MPFR_INT_CEIL_LOG2 (l + 1) + 1; /* bound is 2l(l+1) */
146293Sobrien}
146293Sobrien
146293Sobrienint
146293Sobrienmpfr_cos (mpfr_ptr y, mpfr_srcptr x, mpfr_rnd_t rnd_mode)
146293Sobrien{
146293Sobrien  mpfr_prec_t K0, K, precy, m, k, l;
146293Sobrien  int inexact, reduce = 0;
146293Sobrien  mpfr_t r, s, xr, c;
146293Sobrien  mpfr_exp_t exps, cancel = 0, expx;
146293Sobrien  MPFR_ZIV_DECL (loop);
146293Sobrien  MPFR_SAVE_EXPO_DECL (expo);
146293Sobrien  MPFR_GROUP_DECL (group);
146293Sobrien
146293Sobrien  MPFR_LOG_FUNC (
146293Sobrien    ("x[%Pu]=%*.Rg rnd=%d", mpfr_get_prec (x), mpfr_log_prec, x, rnd_mode),
78556Sobrien    ("y[%Pu]=%*.Rg inexact=%d", mpfr_get_prec (y), mpfr_log_prec, y,
78556Sobrien     inexact));
78556Sobrien
78556Sobrien  if (MPFR_UNLIKELY (MPFR_IS_SINGULAR (x)))
78556Sobrien    {
78556Sobrien      if (MPFR_IS_NAN (x) || MPFR_IS_INF (x))
78556Sobrien        {
78556Sobrien          MPFR_SET_NAN (y);
78556Sobrien          MPFR_RET_NAN;
78556Sobrien        }
78556Sobrien      else
78556Sobrien        {
78556Sobrien          MPFR_ASSERTD (MPFR_IS_ZERO (x));
78556Sobrien          return mpfr_set_ui (y, 1, rnd_mode);
78556Sobrien        }
78556Sobrien    }
78556Sobrien
78556Sobrien  MPFR_SAVE_EXPO_MARK (expo);
78556Sobrien
78556Sobrien  /* cos(x) = 1-x^2/2 + ..., so error < 2^(2*EXP(x)-1) */
78556Sobrien  expx = MPFR_GET_EXP (x);
78556Sobrien  MPFR_SMALL_INPUT_AFTER_SAVE_EXPO (y, __gmpfr_one, -2 * expx,
78556Sobrien                                    1, 0, rnd_mode, expo, {});
78556Sobrien
78556Sobrien  /* Compute initial precision */
78556Sobrien  precy = MPFR_PREC (y);
78556Sobrien
78556Sobrien  if (precy >= MPFR_SINCOS_THRESHOLD)
78556Sobrien    {
78556Sobrien      MPFR_SAVE_EXPO_FREE (expo);
78556Sobrien      return mpfr_cos_fast (y, x, rnd_mode);
78556Sobrien    }
78556Sobrien
78556Sobrien  K0 = __gmpfr_isqrt (precy / 3);
78556Sobrien  m = precy + 2 * MPFR_INT_CEIL_LOG2 (precy) + 2 * K0;
78556Sobrien
78556Sobrien  if (expx >= 3)
78556Sobrien    {
78556Sobrien      reduce = 1;
78556Sobrien      /* As expx + m - 1 will silently be converted into mpfr_prec_t
78556Sobrien         in the mpfr_init2 call, the assert below may be useful to
78556Sobrien         avoid undefined behavior. */
78556Sobrien      MPFR_ASSERTN (expx + m - 1 <= MPFR_PREC_MAX);
78556Sobrien      mpfr_init2 (c, expx + m - 1);
78556Sobrien      mpfr_init2 (xr, m);
78556Sobrien    }
78556Sobrien
78556Sobrien  MPFR_GROUP_INIT_2 (group, m, r, s);
78556Sobrien  MPFR_ZIV_INIT (loop, m);
78556Sobrien  for (;;)
78556Sobrien    {
78556Sobrien      /* If |x| >= 4, first reduce x cmod (2*Pi) into xr, using mpfr_remainder:
78556Sobrien         let e = EXP(x) >= 3, and m the target precision:
78556Sobrien         (1) c <- 2*Pi              [precision e+m-1, nearest]
78556Sobrien         (2) xr <- remainder (x, c) [precision m, nearest]
78556Sobrien         We have |c - 2*Pi| <= 1/2ulp(c) = 2^(3-e-m)
78556Sobrien                 |xr - x - k c| <= 1/2ulp(xr) <= 2^(1-m)
78556Sobrien                 |k| <= |x|/(2*Pi) <= 2^(e-2)
78556Sobrien         Thus |xr - x - 2kPi| <= |k| |c - 2Pi| + 2^(1-m) <= 2^(2-m).
78556Sobrien         It follows |cos(xr) - cos(x)| <= 2^(2-m). */
78556Sobrien      if (reduce)
78556Sobrien        {
78556Sobrien          mpfr_const_pi (c, MPFR_RNDN);
          mpfr_mul_2ui (c, c, 1, MPFR_RNDN); /* 2Pi */
          mpfr_remainder (xr, x, c, MPFR_RNDN);
          if (MPFR_IS_ZERO(xr))
            goto ziv_next;
          /* now |xr| <= 4, thus r <= 16 below */
          mpfr_mul (r, xr, xr, MPFR_RNDU); /* err <= 1 ulp */
        }
      else
        mpfr_mul (r, x, x, MPFR_RNDU); /* err <= 1 ulp */

      /* now |x| < 4 (or xr if reduce = 1), thus |r| <= 16 */

      /* we need |r| < 1/2 for mpfr_cos2_aux, i.e., EXP(r) - 2K <= -1 */
      K = K0 + 1 + MAX(0, MPFR_GET_EXP(r)) / 2;
      /* since K0 >= 0, if EXP(r) < 0, then K >= 1, thus EXP(r) - 2K <= -3;
         otherwise if EXP(r) >= 0, then K >= 1/2 + EXP(r)/2, thus
         EXP(r) - 2K <= -1 */

      MPFR_SET_EXP (r, MPFR_GET_EXP (r) - 2 * K); /* Can't overflow! */

      /* s <- 1 - r/2! + ... + (-1)^l r^l/(2l)! */
      l = mpfr_cos2_aux (s, r);
      /* l is the error bound in ulps on s */
      MPFR_SET_ONE (r);
      for (k = 0; k < K; k++)
        {
          mpfr_sqr (s, s, MPFR_RNDU);            /* err <= 2*olderr */
          MPFR_SET_EXP (s, MPFR_GET_EXP (s) + 1); /* Can't overflow */
          mpfr_sub (s, s, r, MPFR_RNDN);         /* err <= 4*olderr */
          if (MPFR_IS_ZERO(s))
            goto ziv_next;
          MPFR_ASSERTD (MPFR_GET_EXP (s) <= 1);
        }

      /* The absolute error on s is bounded by (2l+1/3)*2^(2K-m)
         2l+1/3 <= 2l+1.
         If |x| >= 4, we need to add 2^(2-m) for the argument reduction
         by 2Pi: if K = 0, this amounts to add 4 to 2l+1/3, i.e., to add
         2 to l; if K >= 1, this amounts to add 1 to 2*l+1/3. */
      l = 2 * l + 1;
      if (reduce)
        l += (K == 0) ? 4 : 1;
      k = MPFR_INT_CEIL_LOG2 (l) + 2*K;
      /* now the error is bounded by 2^(k-m) = 2^(EXP(s)-err) */

      exps = MPFR_GET_EXP (s);
      if (MPFR_LIKELY (MPFR_CAN_ROUND (s, exps + m - k, precy, rnd_mode)))
        break;

      if (MPFR_UNLIKELY (exps == 1))
        /* s = 1 or -1, and except x=0 which was already checked above,
           cos(x) cannot be 1 or -1, so we can round if the error is less
           than 2^(-precy) for directed rounding, or 2^(-precy-1) for rounding
           to nearest. */
        {
          if (m > k && (m - k >= precy + (rnd_mode == MPFR_RNDN)))
            {
              /* If round to nearest or away, result is s = 1 or -1,
                 otherwise it is round(nexttoward (s, 0)). However in order to
                 have the inexact flag correctly set below, we set |s| to
                 1 - 2^(-m) in all cases. */
              mpfr_nexttozero (s);
              break;
            }
        }

      if (exps < cancel)
        {
          m += cancel - exps;
          cancel = exps;
        }

    ziv_next:
      MPFR_ZIV_NEXT (loop, m);
      MPFR_GROUP_REPREC_2 (group, m, r, s);
      if (reduce)
        {
          mpfr_set_prec (xr, m);
          mpfr_set_prec (c, expx + m - 1);
        }
    }
  MPFR_ZIV_FREE (loop);
  inexact = mpfr_set (y, s, rnd_mode);
  MPFR_GROUP_CLEAR (group);
  if (reduce)
    {
      mpfr_clear (xr);
      mpfr_clear (c);
    }

  MPFR_SAVE_EXPO_FREE (expo);
  return mpfr_check_range (y, inexact, rnd_mode);
}