mpfr/src/erfc.c

/* mpfr_erfc -- The Complementary Error Function of a floating-point number

Copyright 2005, 2006, 2007, 2008, 2009, 2010, 2011, 2012, 2013 Free Software Foundation, Inc.
Contributed by the AriC and Caramel projects, INRIA.

This file is part of the GNU MPFR Library.

The GNU MPFR Library is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published by
the Free Software Foundation; either version 3 of the License, or (at your
option) any later version.

The GNU MPFR Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
License for more details.

You should have received a copy of the GNU Lesser General Public License
along with the GNU MPFR Library; see the file COPYING.LESSER.  If not, see
http://www.gnu.org/licenses/ or write to the Free Software Foundation, Inc.,
51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. */
4a238c70SJohn Marino
4a238c70SJohn Marino#define MPFR_NEED_LONGLONG_H
4a238c70SJohn Marino#include "mpfr-impl.h"
4a238c70SJohn Marino
/* erfc(x) = 1 - erf(x) */
4a238c70SJohn Marino
4a238c70SJohn Marino/* Put in y an approximation of erfc(x) for large x, using formulae 7.1.23 and
4a238c70SJohn Marino   7.1.24 from Abramowitz and Stegun.
4a238c70SJohn Marino   Returns e such that the error is bounded by 2^e ulp(y),
4a238c70SJohn Marino   or returns 0 in case of underflow.
4a238c70SJohn Marino*/
4a238c70SJohn Marinostatic mpfr_exp_t
4a238c70SJohn Marinompfr_erfc_asympt (mpfr_ptr y, mpfr_srcptr x)
4a238c70SJohn Marino{
4a238c70SJohn Marino  mpfr_t t, xx, err;
4a238c70SJohn Marino  unsigned long k;
4a238c70SJohn Marino  mpfr_prec_t prec = MPFR_PREC(y);
4a238c70SJohn Marino  mpfr_exp_t exp_err;
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_init2 (t, prec);
4a238c70SJohn Marino  mpfr_init2 (xx, prec);
4a238c70SJohn Marino  mpfr_init2 (err, 31);
4a238c70SJohn Marino  /* let u = 2^(1-p), and let us represent the error as (1+u)^err
4a238c70SJohn Marino     with a bound for err */
4a238c70SJohn Marino  mpfr_mul (xx, x, x, MPFR_RNDD); /* err <= 1 */
4a238c70SJohn Marino  mpfr_ui_div (xx, 1, xx, MPFR_RNDU); /* upper bound for 1/(2x^2), err <= 2 */
4a238c70SJohn Marino  mpfr_div_2ui (xx, xx, 1, MPFR_RNDU); /* exact */
4a238c70SJohn Marino  mpfr_set_ui (t, 1, MPFR_RNDN); /* current term, exact */
4a238c70SJohn Marino  mpfr_set (y, t, MPFR_RNDN);    /* current sum  */
4a238c70SJohn Marino  mpfr_set_ui (err, 0, MPFR_RNDN);
4a238c70SJohn Marino  for (k = 1; ; k++)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      mpfr_mul_ui (t, t, 2 * k - 1, MPFR_RNDU); /* err <= 4k-3 */
4a238c70SJohn Marino      mpfr_mul (t, t, xx, MPFR_RNDU);           /* err <= 4k */
4a238c70SJohn Marino      /* for -1 < x < 1, and |nx| < 1, we have |(1+x)^n| <= 1+7/4|nx|.
4a238c70SJohn Marino         Indeed, for x>=0: log((1+x)^n) = n*log(1+x) <= n*x. Let y=n*x < 1,
4a238c70SJohn Marino         then exp(y) <= 1+7/4*y.
4a238c70SJohn Marino         For x<=0, let x=-x, we can prove by induction that (1-x)^n >= 1-n*x.*/
4a238c70SJohn Marino      mpfr_mul_2si (err, err, MPFR_GET_EXP (y) - MPFR_GET_EXP (t), MPFR_RNDU);
4a238c70SJohn Marino      mpfr_add_ui (err, err, 14 * k, MPFR_RNDU); /* 2^(1-p) * t <= 2 ulp(t) */
4a238c70SJohn Marino      mpfr_div_2si (err, err, MPFR_GET_EXP (y) - MPFR_GET_EXP (t), MPFR_RNDU);
4a238c70SJohn Marino      if (MPFR_GET_EXP (t) + (mpfr_exp_t) prec <= MPFR_GET_EXP (y))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          /* the truncation error is bounded by |t| < ulp(y) */
4a238c70SJohn Marino          mpfr_add_ui (err, err, 1, MPFR_RNDU);
4a238c70SJohn Marino          break;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      if (k & 1)
4a238c70SJohn Marino        mpfr_sub (y, y, t, MPFR_RNDN);
4a238c70SJohn Marino      else
4a238c70SJohn Marino        mpfr_add (y, y, t, MPFR_RNDN);
4a238c70SJohn Marino    }
4a238c70SJohn Marino  /* the error on y is bounded by err*ulp(y) */
4a238c70SJohn Marino  mpfr_mul (t, x, x, MPFR_RNDU); /* rel. err <= 2^(1-p) */
4a238c70SJohn Marino  mpfr_div_2ui (err, err, 3, MPFR_RNDU);  /* err/8 */
4a238c70SJohn Marino  mpfr_add (err, err, t, MPFR_RNDU);      /* err/8 + xx */
4a238c70SJohn Marino  mpfr_mul_2ui (err, err, 3, MPFR_RNDU);  /* err + 8*xx */
4a238c70SJohn Marino  mpfr_exp (t, t, MPFR_RNDU); /* err <= 1/2*ulp(t) + err(x*x)*t
4a238c70SJohn Marino                                <= 1/2*ulp(t)+2*|x*x|*ulp(t)
4a238c70SJohn Marino                                <= (2*|x*x|+1/2)*ulp(t) */
4a238c70SJohn Marino  mpfr_mul (t, t, x, MPFR_RNDN); /* err <= 1/2*ulp(t) + (4*|x*x|+1)*ulp(t)
4a238c70SJohn Marino                                   <= (4*|x*x|+3/2)*ulp(t) */
4a238c70SJohn Marino  mpfr_const_pi (xx, MPFR_RNDZ); /* err <= ulp(Pi) */
4a238c70SJohn Marino  mpfr_sqrt (xx, xx, MPFR_RNDN); /* err <= 1/2*ulp(xx) + ulp(Pi)/2/sqrt(Pi)
4a238c70SJohn Marino                                   <= 3/2*ulp(xx) */
4a238c70SJohn Marino  mpfr_mul (t, t, xx, MPFR_RNDN); /* err <= (8 |xx| + 13/2) * ulp(t) */
4a238c70SJohn Marino  mpfr_div (y, y, t, MPFR_RNDN); /* the relative error on input y is bounded
4a238c70SJohn Marino                                   by (1+u)^err with u = 2^(1-p), that on
4a238c70SJohn Marino                                   t is bounded by (1+u)^(8 |xx| + 13/2),
4a238c70SJohn Marino                                   thus that on output y is bounded by
4a238c70SJohn Marino                                   8 |xx| + 7 + err. */
4a238c70SJohn Marino
4a238c70SJohn Marino  if (MPFR_IS_ZERO(y))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      /* If y is zero, most probably we have underflow. We check it directly
4a238c70SJohn Marino         using the fact that erfc(x) <= exp(-x^2)/sqrt(Pi)/x for x >= 0.
4a238c70SJohn Marino         We compute an upper approximation of exp(-x^2)/sqrt(Pi)/x.
4a238c70SJohn Marino      */
4a238c70SJohn Marino      mpfr_mul (t, x, x, MPFR_RNDD); /* t <= x^2 */
4a238c70SJohn Marino      mpfr_neg (t, t, MPFR_RNDU);    /* -x^2 <= t */
4a238c70SJohn Marino      mpfr_exp (t, t, MPFR_RNDU);    /* exp(-x^2) <= t */
4a238c70SJohn Marino      mpfr_const_pi (xx, MPFR_RNDD); /* xx <= sqrt(Pi), cached */
4a238c70SJohn Marino      mpfr_mul (xx, xx, x, MPFR_RNDD); /* xx <= sqrt(Pi)*x */
4a238c70SJohn Marino      mpfr_div (y, t, xx, MPFR_RNDN); /* if y is zero, this means that the upper
4a238c70SJohn Marino                                        approximation of exp(-x^2)/sqrt(Pi)/x
4a238c70SJohn Marino                                        is nearer from 0 than from 2^(-emin-1),
4a238c70SJohn Marino                                        thus we have underflow. */
4a238c70SJohn Marino      exp_err = 0;
4a238c70SJohn Marino    }
4a238c70SJohn Marino  else
4a238c70SJohn Marino    {
4a238c70SJohn Marino      mpfr_add_ui (err, err, 7, MPFR_RNDU);
4a238c70SJohn Marino      exp_err = MPFR_GET_EXP (err);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_clear (t);
4a238c70SJohn Marino  mpfr_clear (xx);
4a238c70SJohn Marino  mpfr_clear (err);
4a238c70SJohn Marino  return exp_err;
4a238c70SJohn Marino}
4a238c70SJohn Marino
4a238c70SJohn Marinoint
4a238c70SJohn Marinompfr_erfc (mpfr_ptr y, mpfr_srcptr x, mpfr_rnd_t rnd)
4a238c70SJohn Marino{
4a238c70SJohn Marino  int inex;
4a238c70SJohn Marino  mpfr_t tmp;
4a238c70SJohn Marino  mpfr_exp_t te, err;
4a238c70SJohn Marino  mpfr_prec_t prec;
4a238c70SJohn Marino  mpfr_exp_t emin = mpfr_get_emin ();
4a238c70SJohn Marino  MPFR_SAVE_EXPO_DECL (expo);
4a238c70SJohn Marino  MPFR_ZIV_DECL (loop);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_LOG_FUNC
4a238c70SJohn Marino    (("x[%Pu]=%.*Rg rnd=%d", mpfr_get_prec (x), mpfr_log_prec, x, rnd),
4a238c70SJohn Marino     ("y[%Pu]=%.*Rg inexact=%d", mpfr_get_prec (y), mpfr_log_prec, y, inex));
4a238c70SJohn Marino
4a238c70SJohn Marino  if (MPFR_UNLIKELY (MPFR_IS_SINGULAR (x)))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      if (MPFR_IS_NAN (x))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_SET_NAN (y);
4a238c70SJohn Marino          MPFR_RET_NAN;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      /* erfc(+inf) = 0+, erfc(-inf) = 2 erfc (0) = 1 */
4a238c70SJohn Marino      else if (MPFR_IS_INF (x))
4a238c70SJohn Marino        return mpfr_set_ui (y, MPFR_IS_POS (x) ? 0 : 2, rnd);
4a238c70SJohn Marino      else
4a238c70SJohn Marino        return mpfr_set_ui (y, 1, rnd);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  if (MPFR_SIGN (x) > 0)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      /* by default, emin = 1-2^30, thus the smallest representable
4a238c70SJohn Marino         number is 1/2*2^emin = 2^(-2^30):
4a238c70SJohn Marino         for x >= 27282, erfc(x) < 2^(-2^30-1), and
4a238c70SJohn Marino         for x >= 1787897414, erfc(x) < 2^(-2^62-1).
4a238c70SJohn Marino      */
4a238c70SJohn Marino      if ((emin >= -1073741823 && mpfr_cmp_ui (x, 27282) >= 0) ||
4a238c70SJohn Marino          mpfr_cmp_ui (x, 1787897414) >= 0)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          /* May be incorrect if MPFR_EMAX_MAX >= 2^62. */
4a238c70SJohn Marino          MPFR_ASSERTN ((MPFR_EMAX_MAX >> 31) >> 31 == 0);
4a238c70SJohn Marino          return mpfr_underflow (y, (rnd == MPFR_RNDN) ? MPFR_RNDZ : rnd, 1);
4a238c70SJohn Marino        }
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Init stuff */
4a238c70SJohn Marino  MPFR_SAVE_EXPO_MARK (expo);
4a238c70SJohn Marino
4a238c70SJohn Marino  if (MPFR_SIGN (x) < 0)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      mpfr_exp_t e = MPFR_EXP(x);
4a238c70SJohn Marino      /* For x < 0 going to -infinity, erfc(x) tends to 2 by below.
4a238c70SJohn Marino         More precisely, we have 2 + 1/sqrt(Pi)/x/exp(x^2) < erfc(x) < 2.
4a238c70SJohn Marino         Thus log2 |2 - erfc(x)| <= -log2|x| - x^2 / log(2).
4a238c70SJohn Marino         If |2 - erfc(x)| < 2^(-PREC(y)) then the result is either 2 or
4a238c70SJohn Marino         nextbelow(2).
4a238c70SJohn Marino         For x <= -27282, -log2|x| - x^2 / log(2) <= -2^30.
4a238c70SJohn Marino      */
4a238c70SJohn Marino      if ((MPFR_PREC(y) <= 7 && e >= 2) ||  /* x <= -2 */
4a238c70SJohn Marino          (MPFR_PREC(y) <= 25 && e >= 3) || /* x <= -4 */
4a238c70SJohn Marino          (MPFR_PREC(y) <= 120 && mpfr_cmp_si (x, -9) <= 0) ||
4a238c70SJohn Marino          mpfr_cmp_si (x, -27282) <= 0)
4a238c70SJohn Marino        {
4a238c70SJohn Marino        near_two:
4a238c70SJohn Marino          mpfr_set_ui (y, 2, MPFR_RNDN);
4a238c70SJohn Marino          mpfr_set_inexflag ();
4a238c70SJohn Marino          if (rnd == MPFR_RNDZ || rnd == MPFR_RNDD)
4a238c70SJohn Marino            {
4a238c70SJohn Marino              mpfr_nextbelow (y);
4a238c70SJohn Marino              inex = -1;
4a238c70SJohn Marino            }
4a238c70SJohn Marino          else
4a238c70SJohn Marino            inex = 1;
4a238c70SJohn Marino          goto end;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else if (e >= 3) /* more accurate test */
4a238c70SJohn Marino        {
4a238c70SJohn Marino          mpfr_t t, u;
4a238c70SJohn Marino          int near_2;
4a238c70SJohn Marino          mpfr_init2 (t, 32);
4a238c70SJohn Marino          mpfr_init2 (u, 32);
4a238c70SJohn Marino          /* the following is 1/log(2) rounded to zero on 32 bits */
4a238c70SJohn Marino          mpfr_set_str_binary (t, "1.0111000101010100011101100101001");
4a238c70SJohn Marino          mpfr_sqr (u, x, MPFR_RNDZ);
4a238c70SJohn Marino          mpfr_mul (t, t, u, MPFR_RNDZ); /* t <= x^2/log(2) */
4a238c70SJohn Marino          mpfr_neg (u, x, MPFR_RNDZ); /* 0 <= u <= |x| */
4a238c70SJohn Marino          mpfr_log2 (u, u, MPFR_RNDZ); /* u <= log2(|x|) */
4a238c70SJohn Marino          mpfr_add (t, t, u, MPFR_RNDZ); /* t <= log2|x| + x^2 / log(2) */
4a238c70SJohn Marino          /* Taking into account that mpfr_exp_t >= mpfr_prec_t */
4a238c70SJohn Marino          mpfr_set_exp_t (u, MPFR_PREC (y), MPFR_RNDU);
4a238c70SJohn Marino          near_2 = mpfr_cmp (t, u) >= 0;  /* 1 if PREC(y) <= u <= t <= ... */
4a238c70SJohn Marino          mpfr_clear (t);
4a238c70SJohn Marino          mpfr_clear (u);
4a238c70SJohn Marino          if (near_2)
4a238c70SJohn Marino            goto near_two;
4a238c70SJohn Marino        }
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  /* erfc(x) ~ 1, with error < 2^(EXP(x)+1) */
4a238c70SJohn Marino  MPFR_FAST_COMPUTE_IF_SMALL_INPUT (y, __gmpfr_one, - MPFR_GET_EXP (x) - 1,
4a238c70SJohn Marino                                    0, MPFR_SIGN(x) < 0,
4a238c70SJohn Marino                                    rnd, inex = _inexact; goto end);
4a238c70SJohn Marino
4a238c70SJohn Marino  prec = MPFR_PREC (y) + MPFR_INT_CEIL_LOG2 (MPFR_PREC (y)) + 3;
4a238c70SJohn Marino  if (MPFR_GET_EXP (x) > 0)
4a238c70SJohn Marino    prec += 2 * MPFR_GET_EXP(x);
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_init2 (tmp, prec);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_ZIV_INIT (loop, prec);            /* Initialize the ZivLoop controler */
4a238c70SJohn Marino  for (;;)                               /* Infinite loop */
4a238c70SJohn Marino    {
4a238c70SJohn Marino      /* use asymptotic formula only whenever x^2 >= p*log(2),
4a238c70SJohn Marino         otherwise it will not converge */
4a238c70SJohn Marino      if (MPFR_SIGN (x) > 0 &&
4a238c70SJohn Marino          2 * MPFR_GET_EXP (x) - 2 >= MPFR_INT_CEIL_LOG2 (prec))
4a238c70SJohn Marino        /* we have x^2 >= p in that case */
4a238c70SJohn Marino        {
4a238c70SJohn Marino          err = mpfr_erfc_asympt (tmp, x);
4a238c70SJohn Marino          if (err == 0) /* underflow case */
4a238c70SJohn Marino            {
4a238c70SJohn Marino              mpfr_clear (tmp);
4a238c70SJohn Marino              MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino              return mpfr_underflow (y, (rnd == MPFR_RNDN) ? MPFR_RNDZ : rnd, 1);
4a238c70SJohn Marino            }
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else
4a238c70SJohn Marino        {
4a238c70SJohn Marino          mpfr_erf (tmp, x, MPFR_RNDN);
4a238c70SJohn Marino          MPFR_ASSERTD (!MPFR_IS_SINGULAR (tmp)); /* FIXME: 0 only for x=0 ? */
4a238c70SJohn Marino          te = MPFR_GET_EXP (tmp);
4a238c70SJohn Marino          mpfr_ui_sub (tmp, 1, tmp, MPFR_RNDN);
4a238c70SJohn Marino          /* See error analysis in algorithms.tex for details */
4a238c70SJohn Marino          if (MPFR_IS_ZERO (tmp))
4a238c70SJohn Marino            {
4a238c70SJohn Marino              prec *= 2;
4a238c70SJohn Marino              err = prec; /* ensures MPFR_CAN_ROUND fails */
4a238c70SJohn Marino            }
4a238c70SJohn Marino          else
4a238c70SJohn Marino            err = MAX (te - MPFR_GET_EXP (tmp), 0) + 1;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      if (MPFR_LIKELY (MPFR_CAN_ROUND (tmp, prec - err, MPFR_PREC (y), rnd)))
4a238c70SJohn Marino        break;
4a238c70SJohn Marino      MPFR_ZIV_NEXT (loop, prec);        /* Increase used precision */
4a238c70SJohn Marino      mpfr_set_prec (tmp, prec);
4a238c70SJohn Marino    }
4a238c70SJohn Marino  MPFR_ZIV_FREE (loop);                  /* Free the ZivLoop Controler */
4a238c70SJohn Marino
4a238c70SJohn Marino  inex = mpfr_set (y, tmp, rnd);    /* Set y to the computed value */
4a238c70SJohn Marino  mpfr_clear (tmp);
4a238c70SJohn Marino
4a238c70SJohn Marino end:
4a238c70SJohn Marino  MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino  return mpfr_check_range (y, inex, rnd);
4a238c70SJohn Marino}