mpfr/src/gamma.c

/* mpfr_gamma -- gamma function

Copyright 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011, 2012, 2013 Free Software Foundation, Inc.
Contributed by the AriC and Caramel projects, INRIA.

This file is part of the GNU MPFR Library.

The GNU MPFR Library is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published by
the Free Software Foundation; either version 3 of the License, or (at your
option) any later version.

The GNU MPFR Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
License for more details.

You should have received a copy of the GNU Lesser General Public License
along with the GNU MPFR Library; see the file COPYING.LESSER.  If not, see
http://www.gnu.org/licenses/ or write to the Free Software Foundation, Inc.,
51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. */
4a238c70SJohn Marino
4a238c70SJohn Marino#define MPFR_NEED_LONGLONG_H
4a238c70SJohn Marino#include "mpfr-impl.h"
4a238c70SJohn Marino
4a238c70SJohn Marino#define IS_GAMMA
4a238c70SJohn Marino#include "lngamma.c"
4a238c70SJohn Marino#undef IS_GAMMA
4a238c70SJohn Marino
4a238c70SJohn Marino/* return a sufficient precision such that 2-x is exact, assuming x < 0 */
4a238c70SJohn Marinostatic mpfr_prec_t
4a238c70SJohn Marinompfr_gamma_2_minus_x_exact (mpfr_srcptr x)
4a238c70SJohn Marino{
4a238c70SJohn Marino  /* Since x < 0, 2-x = 2+y with y := -x.
4a238c70SJohn Marino     If y < 2, a precision w >= PREC(y) + EXP(2)-EXP(y) = PREC(y) + 2 - EXP(y)
4a238c70SJohn Marino     is enough, since no overlap occurs in 2+y, so no carry happens.
4a238c70SJohn Marino     If y >= 2, either ULP(y) <= 2, and we need w >= PREC(y)+1 since a
4a238c70SJohn Marino     carry can occur, or ULP(y) > 2, and we need w >= EXP(y)-1:
4a238c70SJohn Marino     (a) if EXP(y) <= 1, w = PREC(y) + 2 - EXP(y)
4a238c70SJohn Marino     (b) if EXP(y) > 1 and EXP(y)-PREC(y) <= 1, w = PREC(y) + 1
4a238c70SJohn Marino     (c) if EXP(y) > 1 and EXP(y)-PREC(y) > 1, w = EXP(y) - 1 */
4a238c70SJohn Marino  return (MPFR_GET_EXP(x) <= 1) ? MPFR_PREC(x) + 2 - MPFR_GET_EXP(x)
4a238c70SJohn Marino    : ((MPFR_GET_EXP(x) <= MPFR_PREC(x) + 1) ? MPFR_PREC(x) + 1
4a238c70SJohn Marino       : MPFR_GET_EXP(x) - 1);
4a238c70SJohn Marino}
4a238c70SJohn Marino
4a238c70SJohn Marino/* return a sufficient precision such that 1-x is exact, assuming x < 1 */
4a238c70SJohn Marinostatic mpfr_prec_t
4a238c70SJohn Marinompfr_gamma_1_minus_x_exact (mpfr_srcptr x)
4a238c70SJohn Marino{
4a238c70SJohn Marino  if (MPFR_IS_POS(x))
4a238c70SJohn Marino    return MPFR_PREC(x) - MPFR_GET_EXP(x);
4a238c70SJohn Marino  else if (MPFR_GET_EXP(x) <= 0)
4a238c70SJohn Marino    return MPFR_PREC(x) + 1 - MPFR_GET_EXP(x);
4a238c70SJohn Marino  else if (MPFR_PREC(x) >= MPFR_GET_EXP(x))
4a238c70SJohn Marino    return MPFR_PREC(x) + 1;
4a238c70SJohn Marino  else
4a238c70SJohn Marino    return MPFR_GET_EXP(x);
4a238c70SJohn Marino}
4a238c70SJohn Marino
4a238c70SJohn Marino/* returns a lower bound of the number of significant bits of n!
4a238c70SJohn Marino   (not counting the low zero bits).
4a238c70SJohn Marino   We know n! >= (n/e)^n*sqrt(2*Pi*n) for n >= 1, and the number of zero bits
4a238c70SJohn Marino   is floor(n/2) + floor(n/4) + floor(n/8) + ...
4a238c70SJohn Marino   This approximation is exact for n <= 500000, except for n = 219536, 235928,
4a238c70SJohn Marino   298981, 355854, 464848, 493725, 498992 where it returns a value 1 too small.
4a238c70SJohn Marino*/
4a238c70SJohn Marinostatic unsigned long
4a238c70SJohn Marinobits_fac (unsigned long n)
4a238c70SJohn Marino{
4a238c70SJohn Marino  mpfr_t x, y;
4a238c70SJohn Marino  unsigned long r, k;
4a238c70SJohn Marino  mpfr_init2 (x, 38);
4a238c70SJohn Marino  mpfr_init2 (y, 38);
4a238c70SJohn Marino  mpfr_set_ui (x, n, MPFR_RNDZ);
4a238c70SJohn Marino  mpfr_set_str_binary (y, "10.101101111110000101010001011000101001"); /* upper bound of e */
4a238c70SJohn Marino  mpfr_div (x, x, y, MPFR_RNDZ);
4a238c70SJohn Marino  mpfr_pow_ui (x, x, n, MPFR_RNDZ);
4a238c70SJohn Marino  mpfr_const_pi (y, MPFR_RNDZ);
4a238c70SJohn Marino  mpfr_mul_ui (y, y, 2 * n, MPFR_RNDZ);
4a238c70SJohn Marino  mpfr_sqrt (y, y, MPFR_RNDZ);
4a238c70SJohn Marino  mpfr_mul (x, x, y, MPFR_RNDZ);
4a238c70SJohn Marino  mpfr_log2 (x, x, MPFR_RNDZ);
4a238c70SJohn Marino  r = mpfr_get_ui (x, MPFR_RNDU);
4a238c70SJohn Marino  for (k = 2; k <= n; k *= 2)
4a238c70SJohn Marino    r -= n / k;
4a238c70SJohn Marino  mpfr_clear (x);
4a238c70SJohn Marino  mpfr_clear (y);
4a238c70SJohn Marino  return r;
4a238c70SJohn Marino}
4a238c70SJohn Marino
4a238c70SJohn Marino/* We use the reflection formula
4a238c70SJohn Marino  Gamma(1+t) Gamma(1-t) = - Pi t / sin(Pi (1 + t))
4a238c70SJohn Marino  in order to treat the case x <= 1,
4a238c70SJohn Marino  i.e. with x = 1-t, then Gamma(x) = -Pi*(1-x)/sin(Pi*(2-x))/GAMMA(2-x)
4a238c70SJohn Marino*/
4a238c70SJohn Marinoint
4a238c70SJohn Marinompfr_gamma (mpfr_ptr gamma, mpfr_srcptr x, mpfr_rnd_t rnd_mode)
4a238c70SJohn Marino{
4a238c70SJohn Marino  mpfr_t xp, GammaTrial, tmp, tmp2;
4a238c70SJohn Marino  mpz_t fact;
4a238c70SJohn Marino  mpfr_prec_t realprec;
*ab6d115fSJohn Marino  int compared, is_integer;
*ab6d115fSJohn Marino  int inex = 0;  /* 0 means: result gamma not set yet */
4a238c70SJohn Marino  MPFR_GROUP_DECL (group);
4a238c70SJohn Marino  MPFR_SAVE_EXPO_DECL (expo);
4a238c70SJohn Marino  MPFR_ZIV_DECL (loop);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_LOG_FUNC
4a238c70SJohn Marino    (("x[%Pu]=%.*Rg rnd=%d", mpfr_get_prec (x), mpfr_log_prec, x, rnd_mode),
4a238c70SJohn Marino     ("gamma[%Pu]=%.*Rg inexact=%d",
4a238c70SJohn Marino      mpfr_get_prec (gamma), mpfr_log_prec, gamma, inex));
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Trivial cases */
4a238c70SJohn Marino  if (MPFR_UNLIKELY (MPFR_IS_SINGULAR (x)))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      if (MPFR_IS_NAN (x))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_SET_NAN (gamma);
4a238c70SJohn Marino          MPFR_RET_NAN;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else if (MPFR_IS_INF (x))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          if (MPFR_IS_NEG (x))
4a238c70SJohn Marino            {
4a238c70SJohn Marino              MPFR_SET_NAN (gamma);
4a238c70SJohn Marino              MPFR_RET_NAN;
4a238c70SJohn Marino            }
4a238c70SJohn Marino          else
4a238c70SJohn Marino            {
4a238c70SJohn Marino              MPFR_SET_INF (gamma);
4a238c70SJohn Marino              MPFR_SET_POS (gamma);
4a238c70SJohn Marino              MPFR_RET (0);  /* exact */
4a238c70SJohn Marino            }
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else /* x is zero */
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_ASSERTD(MPFR_IS_ZERO(x));
4a238c70SJohn Marino          MPFR_SET_INF(gamma);
4a238c70SJohn Marino          MPFR_SET_SAME_SIGN(gamma, x);
4a238c70SJohn Marino          mpfr_set_divby0 ();
4a238c70SJohn Marino          MPFR_RET (0);  /* exact */
4a238c70SJohn Marino        }
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Check for tiny arguments, where gamma(x) ~ 1/x - euler + ....
4a238c70SJohn Marino     We know from "Bound on Runs of Zeros and Ones for Algebraic Functions",
4a238c70SJohn Marino     Proceedings of Arith15, T. Lang and J.-M. Muller, 2001, that the maximal
4a238c70SJohn Marino     number of consecutive zeroes or ones after the round bit is n-1 for an
4a238c70SJohn Marino     input of n bits. But we need a more precise lower bound. Assume x has
4a238c70SJohn Marino     n bits, and 1/x is near a floating-point number y of n+1 bits. We can
4a238c70SJohn Marino     write x = X*2^e, y = Y/2^f with X, Y integers of n and n+1 bits.
4a238c70SJohn Marino     Thus X*Y^2^(e-f) is near from 1, i.e., X*Y is near from 2^(f-e).
4a238c70SJohn Marino     Two cases can happen:
4a238c70SJohn Marino     (i) either X*Y is exactly 2^(f-e), but this can happen only if X and Y
4a238c70SJohn Marino         are themselves powers of two, i.e., x is a power of two;
4a238c70SJohn Marino     (ii) or X*Y is at distance at least one from 2^(f-e), thus
4a238c70SJohn Marino          |xy-1| >= 2^(e-f), or |y-1/x| >= 2^(e-f)/x = 2^(-f)/X >= 2^(-f-n).
4a238c70SJohn Marino          Since ufp(y) = 2^(n-f) [ufp = unit in first place], this means
4a238c70SJohn Marino          that the distance |y-1/x| >= 2^(-2n) ufp(y).
4a238c70SJohn Marino          Now assuming |gamma(x)-1/x| <= 1, which is true for x <= 1,
4a238c70SJohn Marino          if 2^(-2n) ufp(y) >= 2, the error is at most 2^(-2n-1) ufp(y),
4a238c70SJohn Marino          and round(1/x) with precision >= 2n+2 gives the correct result.
4a238c70SJohn Marino          If x < 2^E, then y > 2^(-E), thus ufp(y) > 2^(-E-1).
4a238c70SJohn Marino          A sufficient condition is thus EXP(x) + 2 <= -2 MAX(PREC(x),PREC(Y)).
4a238c70SJohn Marino  */
4a238c70SJohn Marino  if (MPFR_GET_EXP (x) + 2
4a238c70SJohn Marino      <= -2 * (mpfr_exp_t) MAX(MPFR_PREC(x), MPFR_PREC(gamma)))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      int sign = MPFR_SIGN (x); /* retrieve sign before possible override */
4a238c70SJohn Marino      int special;
4a238c70SJohn Marino      MPFR_BLOCK_DECL (flags);
4a238c70SJohn Marino
4a238c70SJohn Marino      MPFR_SAVE_EXPO_MARK (expo);
4a238c70SJohn Marino
4a238c70SJohn Marino      /* for overflow cases, see below; this needs to be done
4a238c70SJohn Marino         before x possibly gets overridden. */
4a238c70SJohn Marino      special =
4a238c70SJohn Marino        MPFR_GET_EXP (x) == 1 - MPFR_EMAX_MAX &&
4a238c70SJohn Marino        MPFR_IS_POS_SIGN (sign) &&
4a238c70SJohn Marino        MPFR_IS_LIKE_RNDD (rnd_mode, sign) &&
4a238c70SJohn Marino        mpfr_powerof2_raw (x);
4a238c70SJohn Marino
4a238c70SJohn Marino      MPFR_BLOCK (flags, inex = mpfr_ui_div (gamma, 1, x, rnd_mode));
4a238c70SJohn Marino      if (inex == 0) /* x is a power of two */
4a238c70SJohn Marino        {
4a238c70SJohn Marino          /* return RND(1/x - euler) = RND(+/- 2^k - eps) with eps > 0 */
4a238c70SJohn Marino          if (rnd_mode == MPFR_RNDN || MPFR_IS_LIKE_RNDU (rnd_mode, sign))
4a238c70SJohn Marino            inex = 1;
4a238c70SJohn Marino          else
4a238c70SJohn Marino            {
4a238c70SJohn Marino              mpfr_nextbelow (gamma);
4a238c70SJohn Marino              inex = -1;
4a238c70SJohn Marino            }
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else if (MPFR_UNLIKELY (MPFR_OVERFLOW (flags)))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          /* Overflow in the division 1/x. This is a real overflow, except
4a238c70SJohn Marino             in RNDZ or RNDD when 1/x = 2^emax, i.e. x = 2^(-emax): due to
4a238c70SJohn Marino             the "- euler", the rounded value in unbounded exponent range
4a238c70SJohn Marino             is 0.111...11 * 2^emax (not an overflow). */
4a238c70SJohn Marino          if (!special)
4a238c70SJohn Marino            MPFR_SAVE_EXPO_UPDATE_FLAGS (expo, flags);
4a238c70SJohn Marino        }
4a238c70SJohn Marino      MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino      /* Note: an overflow is possible with an infinite result;
4a238c70SJohn Marino         in this case, the overflow flag will automatically be
4a238c70SJohn Marino         restored by mpfr_check_range. */
4a238c70SJohn Marino      return mpfr_check_range (gamma, inex, rnd_mode);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  is_integer = mpfr_integer_p (x);
4a238c70SJohn Marino  /* gamma(x) for x a negative integer gives NaN */
4a238c70SJohn Marino  if (is_integer && MPFR_IS_NEG(x))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      MPFR_SET_NAN (gamma);
4a238c70SJohn Marino      MPFR_RET_NAN;
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  compared = mpfr_cmp_ui (x, 1);
4a238c70SJohn Marino  if (compared == 0)
4a238c70SJohn Marino    return mpfr_set_ui (gamma, 1, rnd_mode);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* if x is an integer that fits into an unsigned long, use mpfr_fac_ui
4a238c70SJohn Marino     if argument is not too large.
4a238c70SJohn Marino     If precision is p, fac_ui costs O(u*p), whereas gamma costs O(p*M(p)),
4a238c70SJohn Marino     so for u <= M(p), fac_ui should be faster.
4a238c70SJohn Marino     We approximate here M(p) by p*log(p)^2, which is not a bad guess.
4a238c70SJohn Marino     Warning: since the generic code does not handle exact cases,
4a238c70SJohn Marino     we want all cases where gamma(x) is exact to be treated here.
4a238c70SJohn Marino  */
4a238c70SJohn Marino  if (is_integer && mpfr_fits_ulong_p (x, MPFR_RNDN))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      unsigned long int u;
4a238c70SJohn Marino      mpfr_prec_t p = MPFR_PREC(gamma);
4a238c70SJohn Marino      u = mpfr_get_ui (x, MPFR_RNDN);
4a238c70SJohn Marino      if (u < 44787929UL && bits_fac (u - 1) <= p + (rnd_mode == MPFR_RNDN))
4a238c70SJohn Marino        /* bits_fac: lower bound on the number of bits of m,
4a238c70SJohn Marino           where gamma(x) = (u-1)! = m*2^e with m odd. */
4a238c70SJohn Marino        return mpfr_fac_ui (gamma, u - 1, rnd_mode);
4a238c70SJohn Marino      /* if bits_fac(...) > p (resp. p+1 for rounding to nearest),
4a238c70SJohn Marino         then gamma(x) cannot be exact in precision p (resp. p+1).
4a238c70SJohn Marino         FIXME: remove the test u < 44787929UL after changing bits_fac
4a238c70SJohn Marino         to return a mpz_t or mpfr_t. */
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_SAVE_EXPO_MARK (expo);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* check for overflow: according to (6.1.37) in Abramowitz & Stegun,
4a238c70SJohn Marino     gamma(x) >= exp(-x) * x^(x-1/2) * sqrt(2*Pi)
4a238c70SJohn Marino              >= 2 * (x/e)^x / x for x >= 1 */
4a238c70SJohn Marino  if (compared > 0)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      mpfr_t yp;
4a238c70SJohn Marino      mpfr_exp_t expxp;
4a238c70SJohn Marino      MPFR_BLOCK_DECL (flags);
4a238c70SJohn Marino
4a238c70SJohn Marino      /* 1/e rounded down to 53 bits */
4a238c70SJohn Marino#define EXPM1_STR "0.010111100010110101011000110110001011001110111100111"
4a238c70SJohn Marino      mpfr_init2 (xp, 53);
4a238c70SJohn Marino      mpfr_init2 (yp, 53);
4a238c70SJohn Marino      mpfr_set_str_binary (xp, EXPM1_STR);
4a238c70SJohn Marino      mpfr_mul (xp, x, xp, MPFR_RNDZ);
4a238c70SJohn Marino      mpfr_sub_ui (yp, x, 2, MPFR_RNDZ);
4a238c70SJohn Marino      mpfr_pow (xp, xp, yp, MPFR_RNDZ); /* (x/e)^(x-2) */
4a238c70SJohn Marino      mpfr_set_str_binary (yp, EXPM1_STR);
4a238c70SJohn Marino      mpfr_mul (xp, xp, yp, MPFR_RNDZ); /* x^(x-2) / e^(x-1) */
4a238c70SJohn Marino      mpfr_mul (xp, xp, yp, MPFR_RNDZ); /* x^(x-2) / e^x */
4a238c70SJohn Marino      mpfr_mul (xp, xp, x, MPFR_RNDZ); /* lower bound on x^(x-1) / e^x */
4a238c70SJohn Marino      MPFR_BLOCK (flags, mpfr_mul_2ui (xp, xp, 1, MPFR_RNDZ));
4a238c70SJohn Marino      expxp = MPFR_GET_EXP (xp);
4a238c70SJohn Marino      mpfr_clear (xp);
4a238c70SJohn Marino      mpfr_clear (yp);
4a238c70SJohn Marino      MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino      return MPFR_OVERFLOW (flags) || expxp > __gmpfr_emax ?
4a238c70SJohn Marino        mpfr_overflow (gamma, rnd_mode, 1) :
4a238c70SJohn Marino        mpfr_gamma_aux (gamma, x, rnd_mode);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  /* now compared < 0 */
4a238c70SJohn Marino
4a238c70SJohn Marino  /* check for underflow: for x < 1,
4a238c70SJohn Marino     gamma(x) = Pi*(x-1)/sin(Pi*(2-x))/gamma(2-x).
4a238c70SJohn Marino     Since gamma(2-x) >= 2 * ((2-x)/e)^(2-x) / (2-x), we have
4a238c70SJohn Marino     |gamma(x)| <= Pi*(1-x)*(2-x)/2/((2-x)/e)^(2-x) / |sin(Pi*(2-x))|
4a238c70SJohn Marino                <= 12 * ((2-x)/e)^x / |sin(Pi*(2-x))|.
4a238c70SJohn Marino     To avoid an underflow in ((2-x)/e)^x, we compute the logarithm.
4a238c70SJohn Marino  */
4a238c70SJohn Marino  if (MPFR_IS_NEG(x))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      int underflow = 0, sgn, ck;
4a238c70SJohn Marino      mpfr_prec_t w;
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_init2 (xp, 53);
4a238c70SJohn Marino      mpfr_init2 (tmp, 53);
4a238c70SJohn Marino      mpfr_init2 (tmp2, 53);
4a238c70SJohn Marino      /* we want an upper bound for x * [log(2-x)-1].
4a238c70SJohn Marino         since x < 0, we need a lower bound on log(2-x) */
4a238c70SJohn Marino      mpfr_ui_sub (xp, 2, x, MPFR_RNDD);
*ab6d115fSJohn Marino      mpfr_log (xp, xp, MPFR_RNDD);
4a238c70SJohn Marino      mpfr_sub_ui (xp, xp, 1, MPFR_RNDD);
4a238c70SJohn Marino      mpfr_mul (xp, xp, x, MPFR_RNDU);
4a238c70SJohn Marino
4a238c70SJohn Marino      /* we need an upper bound on 1/|sin(Pi*(2-x))|,
4a238c70SJohn Marino         thus a lower bound on |sin(Pi*(2-x))|.
4a238c70SJohn Marino         If 2-x is exact, then the error of Pi*(2-x) is (1+u)^2 with u = 2^(-p)
4a238c70SJohn Marino         thus the error on sin(Pi*(2-x)) is less than 1/2ulp + 3Pi(2-x)u,
4a238c70SJohn Marino         assuming u <= 1, thus <= u + 3Pi(2-x)u */
4a238c70SJohn Marino
4a238c70SJohn Marino      w = mpfr_gamma_2_minus_x_exact (x); /* 2-x is exact for prec >= w */
4a238c70SJohn Marino      w += 17; /* to get tmp2 small enough */
4a238c70SJohn Marino      mpfr_set_prec (tmp, w);
4a238c70SJohn Marino      mpfr_set_prec (tmp2, w);
4a238c70SJohn Marino      ck = mpfr_ui_sub (tmp, 2, x, MPFR_RNDN);
4a238c70SJohn Marino      MPFR_ASSERTD (ck == 0);  (void) ck; /* use ck to avoid a warning */
4a238c70SJohn Marino      mpfr_const_pi (tmp2, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_mul (tmp2, tmp2, tmp, MPFR_RNDN); /* Pi*(2-x) */
4a238c70SJohn Marino      mpfr_sin (tmp, tmp2, MPFR_RNDN); /* sin(Pi*(2-x)) */
4a238c70SJohn Marino      sgn = mpfr_sgn (tmp);
4a238c70SJohn Marino      mpfr_abs (tmp, tmp, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_mul_ui (tmp2, tmp2, 3, MPFR_RNDU); /* 3Pi(2-x) */
4a238c70SJohn Marino      mpfr_add_ui (tmp2, tmp2, 1, MPFR_RNDU); /* 3Pi(2-x)+1 */
4a238c70SJohn Marino      mpfr_div_2ui (tmp2, tmp2, mpfr_get_prec (tmp), MPFR_RNDU);
4a238c70SJohn Marino      /* if tmp2<|tmp|, we get a lower bound */
4a238c70SJohn Marino      if (mpfr_cmp (tmp2, tmp) < 0)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          mpfr_sub (tmp, tmp, tmp2, MPFR_RNDZ); /* low bnd on |sin(Pi*(2-x))| */
4a238c70SJohn Marino          mpfr_ui_div (tmp, 12, tmp, MPFR_RNDU); /* upper bound */
4a238c70SJohn Marino          mpfr_log2 (tmp, tmp, MPFR_RNDU);
4a238c70SJohn Marino          mpfr_add (xp, tmp, xp, MPFR_RNDU);
4a238c70SJohn Marino          /* The assert below checks that expo.saved_emin - 2 always
4a238c70SJohn Marino             fits in a long. FIXME if we want to allow mpfr_exp_t to
4a238c70SJohn Marino             be a long long, for instance. */
4a238c70SJohn Marino          MPFR_ASSERTN (MPFR_EMIN_MIN - 2 >= LONG_MIN);
4a238c70SJohn Marino          underflow = mpfr_cmp_si (xp, expo.saved_emin - 2) <= 0;
4a238c70SJohn Marino        }
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_clear (xp);
4a238c70SJohn Marino      mpfr_clear (tmp);
4a238c70SJohn Marino      mpfr_clear (tmp2);
4a238c70SJohn Marino      if (underflow) /* the sign is the opposite of that of sin(Pi*(2-x)) */
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino          return mpfr_underflow (gamma, (rnd_mode == MPFR_RNDN) ? MPFR_RNDZ : rnd_mode, -sgn);
4a238c70SJohn Marino        }
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  realprec = MPFR_PREC (gamma);
4a238c70SJohn Marino  /* we want both 1-x and 2-x to be exact */
4a238c70SJohn Marino  {
4a238c70SJohn Marino    mpfr_prec_t w;
4a238c70SJohn Marino    w = mpfr_gamma_1_minus_x_exact (x);
4a238c70SJohn Marino    if (realprec < w)
4a238c70SJohn Marino      realprec = w;
4a238c70SJohn Marino    w = mpfr_gamma_2_minus_x_exact (x);
4a238c70SJohn Marino    if (realprec < w)
4a238c70SJohn Marino      realprec = w;
4a238c70SJohn Marino  }
4a238c70SJohn Marino  realprec = realprec + MPFR_INT_CEIL_LOG2 (realprec) + 20;
4a238c70SJohn Marino  MPFR_ASSERTD(realprec >= 5);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_GROUP_INIT_4 (group, realprec + MPFR_INT_CEIL_LOG2 (realprec) + 20,
4a238c70SJohn Marino                     xp, tmp, tmp2, GammaTrial);
4a238c70SJohn Marino  mpz_init (fact);
4a238c70SJohn Marino  MPFR_ZIV_INIT (loop, realprec);
4a238c70SJohn Marino  for (;;)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      mpfr_exp_t err_g;
4a238c70SJohn Marino      int ck;
4a238c70SJohn Marino      MPFR_GROUP_REPREC_4 (group, realprec, xp, tmp, tmp2, GammaTrial);
4a238c70SJohn Marino
4a238c70SJohn Marino      /* reflection formula: gamma(x) = Pi*(x-1)/sin(Pi*(2-x))/gamma(2-x) */
4a238c70SJohn Marino
4a238c70SJohn Marino      ck = mpfr_ui_sub (xp, 2, x, MPFR_RNDN); /* 2-x, exact */
4a238c70SJohn Marino      MPFR_ASSERTD(ck == 0);  (void) ck; /* use ck to avoid a warning */
4a238c70SJohn Marino      mpfr_gamma (tmp, xp, MPFR_RNDN);   /* gamma(2-x), error (1+u) */
4a238c70SJohn Marino      mpfr_const_pi (tmp2, MPFR_RNDN);   /* Pi, error (1+u) */
4a238c70SJohn Marino      mpfr_mul (GammaTrial, tmp2, xp, MPFR_RNDN); /* Pi*(2-x), error (1+u)^2 */
4a238c70SJohn Marino      err_g = MPFR_GET_EXP(GammaTrial);
4a238c70SJohn Marino      mpfr_sin (GammaTrial, GammaTrial, MPFR_RNDN); /* sin(Pi*(2-x)) */
*ab6d115fSJohn Marino      /* If tmp is +Inf, we compute exp(lngamma(x)). */
*ab6d115fSJohn Marino      if (mpfr_inf_p (tmp))
*ab6d115fSJohn Marino        {
*ab6d115fSJohn Marino          inex = mpfr_explgamma (gamma, x, &expo, tmp, tmp2, rnd_mode);
*ab6d115fSJohn Marino          if (inex)
*ab6d115fSJohn Marino            goto end;
*ab6d115fSJohn Marino          else
*ab6d115fSJohn Marino            goto ziv_next;
*ab6d115fSJohn Marino        }
4a238c70SJohn Marino      err_g = err_g + 1 - MPFR_GET_EXP(GammaTrial);
4a238c70SJohn Marino      /* let g0 the true value of Pi*(2-x), g the computed value.
4a238c70SJohn Marino         We have g = g0 + h with |h| <= |(1+u^2)-1|*g.
4a238c70SJohn Marino         Thus sin(g) = sin(g0) + h' with |h'| <= |(1+u^2)-1|*g.
4a238c70SJohn Marino         The relative error is thus bounded by |(1+u^2)-1|*g/sin(g)
4a238c70SJohn Marino         <= |(1+u^2)-1|*2^err_g. <= 2.25*u*2^err_g for |u|<=1/4.
4a238c70SJohn Marino         With the rounding error, this gives (0.5 + 2.25*2^err_g)*u. */
4a238c70SJohn Marino      ck = mpfr_sub_ui (xp, x, 1, MPFR_RNDN); /* x-1, exact */
4a238c70SJohn Marino      MPFR_ASSERTD(ck == 0);  (void) ck; /* use ck to avoid a warning */
4a238c70SJohn Marino      mpfr_mul (xp, tmp2, xp, MPFR_RNDN); /* Pi*(x-1), error (1+u)^2 */
4a238c70SJohn Marino      mpfr_mul (GammaTrial, GammaTrial, tmp, MPFR_RNDN);
4a238c70SJohn Marino      /* [1 + (0.5 + 2.25*2^err_g)*u]*(1+u)^2 = 1 + (2.5 + 2.25*2^err_g)*u
4a238c70SJohn Marino         + (0.5 + 2.25*2^err_g)*u*(2u+u^2) + u^2.
4a238c70SJohn Marino         For err_g <= realprec-2, we have (0.5 + 2.25*2^err_g)*u <=
4a238c70SJohn Marino         0.5*u + 2.25/4 <= 0.6875 and u^2 <= u/4, thus
4a238c70SJohn Marino         (0.5 + 2.25*2^err_g)*u*(2u+u^2) + u^2 <= 0.6875*(2u+u/4) + u/4
4a238c70SJohn Marino         <= 1.8*u, thus the rel. error is bounded by (4.5 + 2.25*2^err_g)*u. */
4a238c70SJohn Marino      mpfr_div (GammaTrial, xp, GammaTrial, MPFR_RNDN);
4a238c70SJohn Marino      /* the error is of the form (1+u)^3/[1 + (4.5 + 2.25*2^err_g)*u].
4a238c70SJohn Marino         For realprec >= 5 and err_g <= realprec-2, [(4.5 + 2.25*2^err_g)*u]^2
4a238c70SJohn Marino         <= 0.71, and for |y|<=0.71, 1/(1-y) can be written 1+a*y with a<=4.
4a238c70SJohn Marino         (1+u)^3 * (1+4*(4.5 + 2.25*2^err_g)*u)
4a238c70SJohn Marino         = 1 + (21 + 9*2^err_g)*u + (57+27*2^err_g)*u^2 + (55+27*2^err_g)*u^3
4a238c70SJohn Marino             + (18+9*2^err_g)*u^4
4a238c70SJohn Marino         <= 1 + (21 + 9*2^err_g)*u + (57+27*2^err_g)*u^2 + (56+28*2^err_g)*u^3
4a238c70SJohn Marino         <= 1 + (21 + 9*2^err_g)*u + (59+28*2^err_g)*u^2
4a238c70SJohn Marino         <= 1 + (23 + 10*2^err_g)*u.
4a238c70SJohn Marino         The final error is thus bounded by (23 + 10*2^err_g) ulps,
4a238c70SJohn Marino         which is <= 2^6 for err_g<=2, and <= 2^(err_g+4) for err_g >= 2. */
4a238c70SJohn Marino      err_g = (err_g <= 2) ? 6 : err_g + 4;
4a238c70SJohn Marino
4a238c70SJohn Marino      if (MPFR_LIKELY (MPFR_CAN_ROUND (GammaTrial, realprec - err_g,
4a238c70SJohn Marino                                       MPFR_PREC(gamma), rnd_mode)))
4a238c70SJohn Marino        break;
*ab6d115fSJohn Marino
*ab6d115fSJohn Marino    ziv_next:
4a238c70SJohn Marino      MPFR_ZIV_NEXT (loop, realprec);
4a238c70SJohn Marino    }
*ab6d115fSJohn Marino
*ab6d115fSJohn Marino end:
4a238c70SJohn Marino  MPFR_ZIV_FREE (loop);
4a238c70SJohn Marino
*ab6d115fSJohn Marino  if (inex == 0)
4a238c70SJohn Marino    inex = mpfr_set (gamma, GammaTrial, rnd_mode);
4a238c70SJohn Marino  MPFR_GROUP_CLEAR (group);
4a238c70SJohn Marino  mpz_clear (fact);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino  return mpfr_check_range (gamma, inex, rnd_mode);
4a238c70SJohn Marino}