mpfr/src/cos.c

/* mpfr_cos -- cosine of a floating-point number

Copyright 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011, 2012, 2013 Free Software Foundation, Inc.
Contributed by the AriC and Caramel projects, INRIA.

This file is part of the GNU MPFR Library.

The GNU MPFR Library is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published by
the Free Software Foundation; either version 3 of the License, or (at your
option) any later version.

The GNU MPFR Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
License for more details.

You should have received a copy of the GNU Lesser General Public License
along with the GNU MPFR Library; see the file COPYING.LESSER.  If not, see
http://www.gnu.org/licenses/ or write to the Free Software Foundation, Inc.,
51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. */
4a238c70SJohn Marino
4a238c70SJohn Marino#define MPFR_NEED_LONGLONG_H
4a238c70SJohn Marino#include "mpfr-impl.h"
4a238c70SJohn Marino
4a238c70SJohn Marinostatic int
4a238c70SJohn Marinompfr_cos_fast (mpfr_ptr y, mpfr_srcptr x, mpfr_rnd_t rnd_mode)
4a238c70SJohn Marino{
4a238c70SJohn Marino  int inex;
4a238c70SJohn Marino
4a238c70SJohn Marino  inex = mpfr_sincos_fast (NULL, y, x, rnd_mode);
4a238c70SJohn Marino  inex = inex >> 2; /* 0: exact, 1: rounded up, 2: rounded down */
4a238c70SJohn Marino  return (inex == 2) ? -1 : inex;
4a238c70SJohn Marino}
4a238c70SJohn Marino
4a238c70SJohn Marino/* f <- 1 - r/2! + r^2/4! + ... + (-1)^l r^l/(2l)! + ...
4a238c70SJohn Marino   Assumes |r| < 1/2, and f, r have the same precision.
4a238c70SJohn Marino   Returns e such that the error on f is bounded by 2^e ulps.
4a238c70SJohn Marino*/
4a238c70SJohn Marinostatic int
4a238c70SJohn Marinompfr_cos2_aux (mpfr_ptr f, mpfr_srcptr r)
4a238c70SJohn Marino{
4a238c70SJohn Marino  mpz_t x, t, s;
4a238c70SJohn Marino  mpfr_exp_t ex, l, m;
4a238c70SJohn Marino  mpfr_prec_t p, q;
4a238c70SJohn Marino  unsigned long i, maxi, imax;
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_ASSERTD(mpfr_get_exp (r) <= -1);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* compute minimal i such that i*(i+1) does not fit in an unsigned long,
4a238c70SJohn Marino     assuming that there are no padding bits. */
4a238c70SJohn Marino  maxi = 1UL << (CHAR_BIT * sizeof(unsigned long) / 2);
4a238c70SJohn Marino  if (maxi * (maxi / 2) == 0) /* test checked at compile time */
4a238c70SJohn Marino    {
4a238c70SJohn Marino      /* can occur only when there are padding bits. */
4a238c70SJohn Marino      /* maxi * (maxi-1) is representable iff maxi * (maxi / 2) != 0 */
4a238c70SJohn Marino      do
4a238c70SJohn Marino        maxi /= 2;
4a238c70SJohn Marino      while (maxi * (maxi / 2) == 0);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  mpz_init (x);
4a238c70SJohn Marino  mpz_init (s);
4a238c70SJohn Marino  mpz_init (t);
4a238c70SJohn Marino  ex = mpfr_get_z_2exp (x, r); /* r = x*2^ex */
4a238c70SJohn Marino
4a238c70SJohn Marino  /* remove trailing zeroes */
4a238c70SJohn Marino  l = mpz_scan1 (x, 0);
4a238c70SJohn Marino  ex += l;
4a238c70SJohn Marino  mpz_fdiv_q_2exp (x, x, l);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* since |r| < 1, r = x*2^ex, and x is an integer, necessarily ex < 0 */
4a238c70SJohn Marino
4a238c70SJohn Marino  p = mpfr_get_prec (f); /* same than r */
4a238c70SJohn Marino  /* bound for number of iterations */
4a238c70SJohn Marino  imax = p / (-mpfr_get_exp (r));
4a238c70SJohn Marino  imax += (imax == 0);
4a238c70SJohn Marino  q = 2 * MPFR_INT_CEIL_LOG2(imax) + 4; /* bound for (3l)^2 */
4a238c70SJohn Marino
4a238c70SJohn Marino  mpz_set_ui (s, 1); /* initialize sum with 1 */
4a238c70SJohn Marino  mpz_mul_2exp (s, s, p + q); /* scale all values by 2^(p+q) */
4a238c70SJohn Marino  mpz_set (t, s); /* invariant: t is previous term */
4a238c70SJohn Marino  for (i = 1; (m = mpz_sizeinbase (t, 2)) >= q; i += 2)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      /* adjust precision of x to that of t */
4a238c70SJohn Marino      l = mpz_sizeinbase (x, 2);
4a238c70SJohn Marino      if (l > m)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          l -= m;
4a238c70SJohn Marino          mpz_fdiv_q_2exp (x, x, l);
4a238c70SJohn Marino          ex += l;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      /* multiply t by r */
4a238c70SJohn Marino      mpz_mul (t, t, x);
4a238c70SJohn Marino      mpz_fdiv_q_2exp (t, t, -ex);
4a238c70SJohn Marino      /* divide t by i*(i+1) */
4a238c70SJohn Marino      if (i < maxi)
4a238c70SJohn Marino        mpz_fdiv_q_ui (t, t, i * (i + 1));
4a238c70SJohn Marino      else
4a238c70SJohn Marino        {
4a238c70SJohn Marino          mpz_fdiv_q_ui (t, t, i);
4a238c70SJohn Marino          mpz_fdiv_q_ui (t, t, i + 1);
4a238c70SJohn Marino        }
4a238c70SJohn Marino      /* if m is the (current) number of bits of t, we can consider that
4a238c70SJohn Marino         all operations on t so far had precision >= m, so we can prove
4a238c70SJohn Marino         by induction that the relative error on t is of the form
4a238c70SJohn Marino         (1+u)^(3l)-1, where |u| <= 2^(-m), and l=(i+1)/2 is the # of loops.
4a238c70SJohn Marino         Since |(1+x^2)^(1/x) - 1| <= 4x/3 for |x| <= 1/2,
4a238c70SJohn Marino         for |u| <= 1/(3l)^2, the absolute error is bounded by
4a238c70SJohn Marino         4/3*(3l)*2^(-m)*t <= 4*l since |t| < 2^m.
4a238c70SJohn Marino         Therefore the error on s is bounded by 2*l*(l+1). */
4a238c70SJohn Marino      /* add or subtract to s */
4a238c70SJohn Marino      if (i % 4 == 1)
4a238c70SJohn Marino        mpz_sub (s, s, t);
4a238c70SJohn Marino      else
4a238c70SJohn Marino        mpz_add (s, s, t);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_set_z (f, s, MPFR_RNDN);
4a238c70SJohn Marino  mpfr_div_2ui (f, f, p + q, MPFR_RNDN);
4a238c70SJohn Marino
4a238c70SJohn Marino  mpz_clear (x);
4a238c70SJohn Marino  mpz_clear (s);
4a238c70SJohn Marino  mpz_clear (t);
4a238c70SJohn Marino
4a238c70SJohn Marino  l = (i - 1) / 2; /* number of iterations */
4a238c70SJohn Marino  return 2 * MPFR_INT_CEIL_LOG2 (l + 1) + 1; /* bound is 2l(l+1) */
4a238c70SJohn Marino}
4a238c70SJohn Marino
4a238c70SJohn Marinoint
4a238c70SJohn Marinompfr_cos (mpfr_ptr y, mpfr_srcptr x, mpfr_rnd_t rnd_mode)
4a238c70SJohn Marino{
4a238c70SJohn Marino  mpfr_prec_t K0, K, precy, m, k, l;
4a238c70SJohn Marino  int inexact, reduce = 0;
4a238c70SJohn Marino  mpfr_t r, s, xr, c;
4a238c70SJohn Marino  mpfr_exp_t exps, cancel = 0, expx;
4a238c70SJohn Marino  MPFR_ZIV_DECL (loop);
4a238c70SJohn Marino  MPFR_SAVE_EXPO_DECL (expo);
4a238c70SJohn Marino  MPFR_GROUP_DECL (group);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_LOG_FUNC (
4a238c70SJohn Marino    ("x[%Pu]=%*.Rg rnd=%d", mpfr_get_prec (x), mpfr_log_prec, x, rnd_mode),
4a238c70SJohn Marino    ("y[%Pu]=%*.Rg inexact=%d", mpfr_get_prec (y), mpfr_log_prec, y,
4a238c70SJohn Marino     inexact));
4a238c70SJohn Marino
4a238c70SJohn Marino  if (MPFR_UNLIKELY (MPFR_IS_SINGULAR (x)))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      if (MPFR_IS_NAN (x) || MPFR_IS_INF (x))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_SET_NAN (y);
4a238c70SJohn Marino          MPFR_RET_NAN;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_ASSERTD (MPFR_IS_ZERO (x));
4a238c70SJohn Marino          return mpfr_set_ui (y, 1, rnd_mode);
4a238c70SJohn Marino        }
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_SAVE_EXPO_MARK (expo);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* cos(x) = 1-x^2/2 + ..., so error < 2^(2*EXP(x)-1) */
4a238c70SJohn Marino  expx = MPFR_GET_EXP (x);
4a238c70SJohn Marino  MPFR_SMALL_INPUT_AFTER_SAVE_EXPO (y, __gmpfr_one, -2 * expx,
4a238c70SJohn Marino                                    1, 0, rnd_mode, expo, {});
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Compute initial precision */
4a238c70SJohn Marino  precy = MPFR_PREC (y);
4a238c70SJohn Marino
4a238c70SJohn Marino  if (precy >= MPFR_SINCOS_THRESHOLD)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino      return mpfr_cos_fast (y, x, rnd_mode);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  K0 = __gmpfr_isqrt (precy / 3);
4a238c70SJohn Marino  m = precy + 2 * MPFR_INT_CEIL_LOG2 (precy) + 2 * K0;
4a238c70SJohn Marino
4a238c70SJohn Marino  if (expx >= 3)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      reduce = 1;
4a238c70SJohn Marino      /* As expx + m - 1 will silently be converted into mpfr_prec_t
4a238c70SJohn Marino         in the mpfr_init2 call, the assert below may be useful to
4a238c70SJohn Marino         avoid undefined behavior. */
4a238c70SJohn Marino      MPFR_ASSERTN (expx + m - 1 <= MPFR_PREC_MAX);
4a238c70SJohn Marino      mpfr_init2 (c, expx + m - 1);
4a238c70SJohn Marino      mpfr_init2 (xr, m);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_GROUP_INIT_2 (group, m, r, s);
4a238c70SJohn Marino  MPFR_ZIV_INIT (loop, m);
4a238c70SJohn Marino  for (;;)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      /* If |x| >= 4, first reduce x cmod (2*Pi) into xr, using mpfr_remainder:
4a238c70SJohn Marino         let e = EXP(x) >= 3, and m the target precision:
4a238c70SJohn Marino         (1) c <- 2*Pi              [precision e+m-1, nearest]
4a238c70SJohn Marino         (2) xr <- remainder (x, c) [precision m, nearest]
4a238c70SJohn Marino         We have |c - 2*Pi| <= 1/2ulp(c) = 2^(3-e-m)
4a238c70SJohn Marino                 |xr - x - k c| <= 1/2ulp(xr) <= 2^(1-m)
4a238c70SJohn Marino                 |k| <= |x|/(2*Pi) <= 2^(e-2)
4a238c70SJohn Marino         Thus |xr - x - 2kPi| <= |k| |c - 2Pi| + 2^(1-m) <= 2^(2-m).
4a238c70SJohn Marino         It follows |cos(xr) - cos(x)| <= 2^(2-m). */
4a238c70SJohn Marino      if (reduce)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          mpfr_const_pi (c, MPFR_RNDN);
4a238c70SJohn Marino          mpfr_mul_2ui (c, c, 1, MPFR_RNDN); /* 2Pi */
4a238c70SJohn Marino          mpfr_remainder (xr, x, c, MPFR_RNDN);
4a238c70SJohn Marino          if (MPFR_IS_ZERO(xr))
4a238c70SJohn Marino            goto ziv_next;
4a238c70SJohn Marino          /* now |xr| <= 4, thus r <= 16 below */
4a238c70SJohn Marino          mpfr_mul (r, xr, xr, MPFR_RNDU); /* err <= 1 ulp */
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else
4a238c70SJohn Marino        mpfr_mul (r, x, x, MPFR_RNDU); /* err <= 1 ulp */
4a238c70SJohn Marino
4a238c70SJohn Marino      /* now |x| < 4 (or xr if reduce = 1), thus |r| <= 16 */
4a238c70SJohn Marino
4a238c70SJohn Marino      /* we need |r| < 1/2 for mpfr_cos2_aux, i.e., EXP(r) - 2K <= -1 */
4a238c70SJohn Marino      K = K0 + 1 + MAX(0, MPFR_GET_EXP(r)) / 2;
4a238c70SJohn Marino      /* since K0 >= 0, if EXP(r) < 0, then K >= 1, thus EXP(r) - 2K <= -3;
4a238c70SJohn Marino         otherwise if EXP(r) >= 0, then K >= 1/2 + EXP(r)/2, thus
4a238c70SJohn Marino         EXP(r) - 2K <= -1 */
4a238c70SJohn Marino
4a238c70SJohn Marino      MPFR_SET_EXP (r, MPFR_GET_EXP (r) - 2 * K); /* Can't overflow! */
4a238c70SJohn Marino
4a238c70SJohn Marino      /* s <- 1 - r/2! + ... + (-1)^l r^l/(2l)! */
4a238c70SJohn Marino      l = mpfr_cos2_aux (s, r);
4a238c70SJohn Marino      /* l is the error bound in ulps on s */
4a238c70SJohn Marino      MPFR_SET_ONE (r);
4a238c70SJohn Marino      for (k = 0; k < K; k++)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          mpfr_sqr (s, s, MPFR_RNDU);            /* err <= 2*olderr */
4a238c70SJohn Marino          MPFR_SET_EXP (s, MPFR_GET_EXP (s) + 1); /* Can't overflow */
4a238c70SJohn Marino          mpfr_sub (s, s, r, MPFR_RNDN);         /* err <= 4*olderr */
4a238c70SJohn Marino          if (MPFR_IS_ZERO(s))
4a238c70SJohn Marino            goto ziv_next;
4a238c70SJohn Marino          MPFR_ASSERTD (MPFR_GET_EXP (s) <= 1);
4a238c70SJohn Marino        }
4a238c70SJohn Marino
4a238c70SJohn Marino      /* The absolute error on s is bounded by (2l+1/3)*2^(2K-m)
4a238c70SJohn Marino         2l+1/3 <= 2l+1.
4a238c70SJohn Marino         If |x| >= 4, we need to add 2^(2-m) for the argument reduction
4a238c70SJohn Marino         by 2Pi: if K = 0, this amounts to add 4 to 2l+1/3, i.e., to add
4a238c70SJohn Marino         2 to l; if K >= 1, this amounts to add 1 to 2*l+1/3. */
4a238c70SJohn Marino      l = 2 * l + 1;
4a238c70SJohn Marino      if (reduce)
4a238c70SJohn Marino        l += (K == 0) ? 4 : 1;
4a238c70SJohn Marino      k = MPFR_INT_CEIL_LOG2 (l) + 2*K;
4a238c70SJohn Marino      /* now the error is bounded by 2^(k-m) = 2^(EXP(s)-err) */
4a238c70SJohn Marino
4a238c70SJohn Marino      exps = MPFR_GET_EXP (s);
4a238c70SJohn Marino      if (MPFR_LIKELY (MPFR_CAN_ROUND (s, exps + m - k, precy, rnd_mode)))
4a238c70SJohn Marino        break;
4a238c70SJohn Marino
4a238c70SJohn Marino      if (MPFR_UNLIKELY (exps == 1))
4a238c70SJohn Marino        /* s = 1 or -1, and except x=0 which was already checked above,
4a238c70SJohn Marino           cos(x) cannot be 1 or -1, so we can round if the error is less
4a238c70SJohn Marino           than 2^(-precy) for directed rounding, or 2^(-precy-1) for rounding
4a238c70SJohn Marino           to nearest. */
4a238c70SJohn Marino        {
4a238c70SJohn Marino          if (m > k && (m - k >= precy + (rnd_mode == MPFR_RNDN)))
4a238c70SJohn Marino            {
4a238c70SJohn Marino              /* If round to nearest or away, result is s = 1 or -1,
4a238c70SJohn Marino                 otherwise it is round(nexttoward (s, 0)). However in order to
4a238c70SJohn Marino                 have the inexact flag correctly set below, we set |s| to
4a238c70SJohn Marino                 1 - 2^(-m) in all cases. */
4a238c70SJohn Marino              mpfr_nexttozero (s);
4a238c70SJohn Marino              break;
4a238c70SJohn Marino            }
4a238c70SJohn Marino        }
4a238c70SJohn Marino
4a238c70SJohn Marino      if (exps < cancel)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          m += cancel - exps;
4a238c70SJohn Marino          cancel = exps;
4a238c70SJohn Marino        }
4a238c70SJohn Marino
4a238c70SJohn Marino    ziv_next:
4a238c70SJohn Marino      MPFR_ZIV_NEXT (loop, m);
4a238c70SJohn Marino      MPFR_GROUP_REPREC_2 (group, m, r, s);
4a238c70SJohn Marino      if (reduce)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          mpfr_set_prec (xr, m);
4a238c70SJohn Marino          mpfr_set_prec (c, expx + m - 1);
4a238c70SJohn Marino        }
4a238c70SJohn Marino    }
4a238c70SJohn Marino  MPFR_ZIV_FREE (loop);
4a238c70SJohn Marino  inexact = mpfr_set (y, s, rnd_mode);
4a238c70SJohn Marino  MPFR_GROUP_CLEAR (group);
4a238c70SJohn Marino  if (reduce)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      mpfr_clear (xr);
4a238c70SJohn Marino      mpfr_clear (c);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino  return mpfr_check_range (y, inexact, rnd_mode);
4a238c70SJohn Marino}