mpfr/src/lngamma.c

4a238c70SJohn Marino/* mpfr_lngamma -- lngamma function
4a238c70SJohn Marino
*ab6d115fSJohn MarinoCopyright 2005, 2006, 2007, 2008, 2009, 2010, 2011, 2012, 2013 Free Software Foundation, Inc.
*ab6d115fSJohn MarinoContributed by the AriC and Caramel projects, INRIA.
4a238c70SJohn Marino
4a238c70SJohn MarinoThis file is part of the GNU MPFR Library.
4a238c70SJohn Marino
4a238c70SJohn MarinoThe GNU MPFR Library is free software; you can redistribute it and/or modify
4a238c70SJohn Marinoit under the terms of the GNU Lesser General Public License as published by
4a238c70SJohn Marinothe Free Software Foundation; either version 3 of the License, or (at your
4a238c70SJohn Marinooption) any later version.
4a238c70SJohn Marino
4a238c70SJohn MarinoThe GNU MPFR Library is distributed in the hope that it will be useful, but
4a238c70SJohn MarinoWITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
4a238c70SJohn Marinoor FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
4a238c70SJohn MarinoLicense for more details.
4a238c70SJohn Marino
4a238c70SJohn MarinoYou should have received a copy of the GNU Lesser General Public License
4a238c70SJohn Marinoalong with the GNU MPFR Library; see the file COPYING.LESSER.  If not, see
4a238c70SJohn Marinohttp://www.gnu.org/licenses/ or write to the Free Software Foundation, Inc.,
4a238c70SJohn Marino51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. */
4a238c70SJohn Marino
4a238c70SJohn Marino#define MPFR_NEED_LONGLONG_H
4a238c70SJohn Marino#include "mpfr-impl.h"
4a238c70SJohn Marino
4a238c70SJohn Marino/* given a precision p, return alpha, such that the argument reduction
4a238c70SJohn Marino   will use k = alpha*p*log(2).
4a238c70SJohn Marino
4a238c70SJohn Marino   Warning: we should always have alpha >= log(2)/(2Pi) ~ 0.11,
4a238c70SJohn Marino   and the smallest value of alpha multiplied by the smallest working
4a238c70SJohn Marino   precision should be >= 4.
4a238c70SJohn Marino*/
4a238c70SJohn Marinostatic void
4a238c70SJohn Marinompfr_gamma_alpha (mpfr_t s, mpfr_prec_t p)
4a238c70SJohn Marino{
4a238c70SJohn Marino  if (p <= 100)
4a238c70SJohn Marino    mpfr_set_ui_2exp (s, 614, -10, MPFR_RNDN); /* about 0.6 */
4a238c70SJohn Marino  else if (p <= 500)
4a238c70SJohn Marino    mpfr_set_ui_2exp (s, 819, -10, MPFR_RNDN); /* about 0.8 */
4a238c70SJohn Marino  else if (p <= 1000)
4a238c70SJohn Marino    mpfr_set_ui_2exp (s, 1331, -10, MPFR_RNDN); /* about 1.3 */
4a238c70SJohn Marino  else if (p <= 2000)
4a238c70SJohn Marino    mpfr_set_ui_2exp (s, 1741, -10, MPFR_RNDN); /* about 1.7 */
4a238c70SJohn Marino  else if (p <= 5000)
4a238c70SJohn Marino    mpfr_set_ui_2exp (s, 2253, -10, MPFR_RNDN); /* about 2.2 */
4a238c70SJohn Marino  else if (p <= 10000)
4a238c70SJohn Marino    mpfr_set_ui_2exp (s, 3482, -10, MPFR_RNDN); /* about 3.4 */
4a238c70SJohn Marino  else
4a238c70SJohn Marino    mpfr_set_ui_2exp (s, 9, -1, MPFR_RNDN); /* 4.5 */
4a238c70SJohn Marino}
4a238c70SJohn Marino
*ab6d115fSJohn Marino#ifdef IS_GAMMA
*ab6d115fSJohn Marino
*ab6d115fSJohn Marino/* This function is called in case of intermediate overflow/underflow.
*ab6d115fSJohn Marino   The s1 and s2 arguments are temporary MPFR numbers, having the
*ab6d115fSJohn Marino   working precision. If the result could be determined, then the
*ab6d115fSJohn Marino   flags are updated via pexpo, y is set to the result, and the
*ab6d115fSJohn Marino   (non-zero) ternary value is returned. Otherwise 0 is returned
*ab6d115fSJohn Marino   in order to perform the next Ziv iteration. */
4a238c70SJohn Marinostatic int
*ab6d115fSJohn Marinompfr_explgamma (mpfr_ptr y, mpfr_srcptr x, mpfr_save_expo_t *pexpo,
*ab6d115fSJohn Marino                mpfr_ptr s1, mpfr_ptr s2, mpfr_rnd_t rnd)
*ab6d115fSJohn Marino{
*ab6d115fSJohn Marino  mpfr_t t1, t2;
*ab6d115fSJohn Marino  int inex1, inex2, sign;
*ab6d115fSJohn Marino  MPFR_BLOCK_DECL (flags1);
*ab6d115fSJohn Marino  MPFR_BLOCK_DECL (flags2);
*ab6d115fSJohn Marino  MPFR_GROUP_DECL (group);
*ab6d115fSJohn Marino
*ab6d115fSJohn Marino  MPFR_BLOCK (flags1, inex1 = mpfr_lgamma (s1, &sign, x, MPFR_RNDD));
*ab6d115fSJohn Marino  MPFR_ASSERTN (inex1 != 0);
*ab6d115fSJohn Marino  /* s1 = RNDD(lngamma(x)), inexact */
*ab6d115fSJohn Marino  if (MPFR_UNLIKELY (MPFR_OVERFLOW (flags1)))
*ab6d115fSJohn Marino    {
*ab6d115fSJohn Marino      if (MPFR_SIGN (s1) > 0)
*ab6d115fSJohn Marino        {
*ab6d115fSJohn Marino          MPFR_SAVE_EXPO_UPDATE_FLAGS (*pexpo, MPFR_FLAGS_OVERFLOW);
*ab6d115fSJohn Marino          return mpfr_overflow (y, rnd, sign);
*ab6d115fSJohn Marino        }
*ab6d115fSJohn Marino      else
*ab6d115fSJohn Marino        {
*ab6d115fSJohn Marino          MPFR_SAVE_EXPO_UPDATE_FLAGS (*pexpo, MPFR_FLAGS_UNDERFLOW);
*ab6d115fSJohn Marino          return mpfr_underflow (y, rnd == MPFR_RNDN ? MPFR_RNDZ : rnd, sign);
*ab6d115fSJohn Marino        }
*ab6d115fSJohn Marino    }
*ab6d115fSJohn Marino
*ab6d115fSJohn Marino  mpfr_set (s2, s1, MPFR_RNDN);     /* exact */
*ab6d115fSJohn Marino  mpfr_nextabove (s2);              /* v = RNDU(lngamma(z0)) */
*ab6d115fSJohn Marino
*ab6d115fSJohn Marino  if (sign < 0)
*ab6d115fSJohn Marino    rnd = MPFR_INVERT_RND (rnd);  /* since the result with be negated */
*ab6d115fSJohn Marino  MPFR_GROUP_INIT_2 (group, MPFR_PREC (y), t1, t2);
*ab6d115fSJohn Marino  MPFR_BLOCK (flags1, inex1 = mpfr_exp (t1, s1, rnd));
*ab6d115fSJohn Marino  MPFR_BLOCK (flags2, inex2 = mpfr_exp (t2, s2, rnd));
*ab6d115fSJohn Marino  /* t1 is the rounding with mode 'rnd' of a lower bound on |Gamma(x)|,
*ab6d115fSJohn Marino     t2 is the rounding with mode 'rnd' of an upper bound, thus if both
*ab6d115fSJohn Marino     are equal, so is the wanted result. If t1 and t2 differ or the flags
*ab6d115fSJohn Marino     differ, at some point of Ziv's loop they should agree. */
*ab6d115fSJohn Marino  if (mpfr_equal_p (t1, t2) && flags1 == flags2)
*ab6d115fSJohn Marino    {
*ab6d115fSJohn Marino      MPFR_ASSERTN ((inex1 > 0 && inex2 > 0) || (inex1 < 0 && inex2 < 0));
*ab6d115fSJohn Marino      mpfr_set4 (y, t1, MPFR_RNDN, sign);  /* exact */
*ab6d115fSJohn Marino      if (sign < 0)
*ab6d115fSJohn Marino        inex1 = - inex1;
*ab6d115fSJohn Marino      MPFR_SAVE_EXPO_UPDATE_FLAGS (*pexpo, flags1);
*ab6d115fSJohn Marino    }
*ab6d115fSJohn Marino  else
*ab6d115fSJohn Marino    inex1 = 0;  /* couldn't determine the result */
*ab6d115fSJohn Marino  MPFR_GROUP_CLEAR (group);
*ab6d115fSJohn Marino
*ab6d115fSJohn Marino  return inex1;
*ab6d115fSJohn Marino}
*ab6d115fSJohn Marino
*ab6d115fSJohn Marino#else
*ab6d115fSJohn Marino
*ab6d115fSJohn Marinostatic int
*ab6d115fSJohn Marinounit_bit (mpfr_srcptr x)
4a238c70SJohn Marino{
4a238c70SJohn Marino  mpfr_exp_t expo;
4a238c70SJohn Marino  mpfr_prec_t prec;
4a238c70SJohn Marino  mp_limb_t x0;
4a238c70SJohn Marino
4a238c70SJohn Marino  expo = MPFR_GET_EXP (x);
4a238c70SJohn Marino  if (expo <= 0)
4a238c70SJohn Marino    return 0;  /* |x| < 1 */
4a238c70SJohn Marino
4a238c70SJohn Marino  prec = MPFR_PREC (x);
4a238c70SJohn Marino  if (expo > prec)
4a238c70SJohn Marino    return 0;  /* y is a multiple of 2^(expo-prec), thus an even integer */
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Now, the unit bit is represented. */
4a238c70SJohn Marino
*ab6d115fSJohn Marino  prec = MPFR_PREC2LIMBS (prec) * GMP_NUMB_BITS - expo;
4a238c70SJohn Marino  /* number of represented fractional bits (including the trailing 0's) */
4a238c70SJohn Marino
4a238c70SJohn Marino  x0 = *(MPFR_MANT (x) + prec / GMP_NUMB_BITS);
4a238c70SJohn Marino  /* limb containing the unit bit */
4a238c70SJohn Marino
4a238c70SJohn Marino  return (x0 >> (prec % GMP_NUMB_BITS)) & 1;
4a238c70SJohn Marino}
*ab6d115fSJohn Marino
4a238c70SJohn Marino#endif
4a238c70SJohn Marino
4a238c70SJohn Marino/* lngamma(x) = log(gamma(x)).
4a238c70SJohn Marino   We use formula [6.1.40] from Abramowitz&Stegun:
4a238c70SJohn Marino   lngamma(z) = (z-1/2)*log(z) - z + 1/2*log(2*Pi)
4a238c70SJohn Marino              + sum (Bernoulli[2m]/(2m)/(2m-1)/z^(2m-1),m=1..infinity)
4a238c70SJohn Marino   According to [6.1.42], if the sum is truncated after m=n, the error
4a238c70SJohn Marino   R_n(z) is bounded by |B[2n+2]|*K(z)/(2n+1)/(2n+2)/|z|^(2n+1)
4a238c70SJohn Marino   where K(z) = max (z^2/(u^2+z^2)) for u >= 0.
4a238c70SJohn Marino   For z real, |K(z)| <= 1 thus R_n(z) is bounded by the first neglected term.
4a238c70SJohn Marino */
4a238c70SJohn Marino#ifdef IS_GAMMA
4a238c70SJohn Marino#define GAMMA_FUNC mpfr_gamma_aux
4a238c70SJohn Marino#else
4a238c70SJohn Marino#define GAMMA_FUNC mpfr_lngamma_aux
4a238c70SJohn Marino#endif
4a238c70SJohn Marino
4a238c70SJohn Marinostatic int
4a238c70SJohn MarinoGAMMA_FUNC (mpfr_ptr y, mpfr_srcptr z0, mpfr_rnd_t rnd)
4a238c70SJohn Marino{
4a238c70SJohn Marino  mpfr_prec_t precy, w; /* working precision */
4a238c70SJohn Marino  mpfr_t s, t, u, v, z;
4a238c70SJohn Marino  unsigned long m, k, maxm;
4a238c70SJohn Marino  mpz_t *INITIALIZED(B);  /* variable B declared as initialized */
*ab6d115fSJohn Marino  int compared;
*ab6d115fSJohn Marino  int inexact = 0;  /* 0 means: result y not set yet */
4a238c70SJohn Marino  mpfr_exp_t err_s, err_t;
4a238c70SJohn Marino  unsigned long Bm = 0; /* number of allocated B[] */
4a238c70SJohn Marino  unsigned long oldBm;
4a238c70SJohn Marino  double d;
4a238c70SJohn Marino  MPFR_SAVE_EXPO_DECL (expo);
*ab6d115fSJohn Marino  MPFR_ZIV_DECL (loop);
4a238c70SJohn Marino
4a238c70SJohn Marino  compared = mpfr_cmp_ui (z0, 1);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_SAVE_EXPO_MARK (expo);
4a238c70SJohn Marino
4a238c70SJohn Marino#ifndef IS_GAMMA /* lngamma or lgamma */
4a238c70SJohn Marino  if (compared == 0 || (compared > 0 && mpfr_cmp_ui (z0, 2) == 0))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino      return mpfr_set_ui (y, 0, MPFR_RNDN);  /* lngamma(1 or 2) = +0 */
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Deal here with tiny inputs. We have for -0.3 <= x <= 0.3:
4a238c70SJohn Marino     - log|x| - gamma*x <= log|gamma(x)| <= - log|x| - gamma*x + x^2 */
4a238c70SJohn Marino  if (MPFR_EXP(z0) <= - (mpfr_exp_t) MPFR_PREC(y))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      mpfr_t l, h, g;
*ab6d115fSJohn Marino      int ok, inex1, inex2;
4a238c70SJohn Marino      mpfr_prec_t prec = MPFR_PREC(y) + 14;
4a238c70SJohn Marino      MPFR_ZIV_DECL (loop);
4a238c70SJohn Marino
4a238c70SJohn Marino      MPFR_ZIV_INIT (loop, prec);
4a238c70SJohn Marino      do
4a238c70SJohn Marino        {
4a238c70SJohn Marino          mpfr_init2 (l, prec);
4a238c70SJohn Marino          if (MPFR_IS_POS(z0))
4a238c70SJohn Marino            {
4a238c70SJohn Marino              mpfr_log (l, z0, MPFR_RNDU); /* upper bound for log(z0) */
4a238c70SJohn Marino              mpfr_init2 (h, MPFR_PREC(l));
4a238c70SJohn Marino            }
4a238c70SJohn Marino          else
4a238c70SJohn Marino            {
4a238c70SJohn Marino              mpfr_init2 (h, MPFR_PREC(z0));
4a238c70SJohn Marino              mpfr_neg (h, z0, MPFR_RNDN); /* exact */
4a238c70SJohn Marino              mpfr_log (l, h, MPFR_RNDU); /* upper bound for log(-z0) */
4a238c70SJohn Marino              mpfr_set_prec (h, MPFR_PREC(l));
4a238c70SJohn Marino            }
4a238c70SJohn Marino          mpfr_neg (l, l, MPFR_RNDD); /* lower bound for -log(|z0|) */
4a238c70SJohn Marino          mpfr_set (h, l, MPFR_RNDD); /* exact */
4a238c70SJohn Marino          mpfr_nextabove (h); /* upper bound for -log(|z0|), avoids two calls
4a238c70SJohn Marino                                 to mpfr_log */
4a238c70SJohn Marino          mpfr_init2 (g, MPFR_PREC(l));
4a238c70SJohn Marino          /* if z0>0, we need an upper approximation of Euler's constant
4a238c70SJohn Marino             for the left bound */
4a238c70SJohn Marino          mpfr_const_euler (g, MPFR_IS_POS(z0) ? MPFR_RNDU : MPFR_RNDD);
4a238c70SJohn Marino          mpfr_mul (g, g, z0, MPFR_RNDD);
4a238c70SJohn Marino          mpfr_sub (l, l, g, MPFR_RNDD);
4a238c70SJohn Marino          mpfr_const_euler (g, MPFR_IS_POS(z0) ? MPFR_RNDD : MPFR_RNDU); /* cached */
4a238c70SJohn Marino          mpfr_mul (g, g, z0, MPFR_RNDU);
4a238c70SJohn Marino          mpfr_sub (h, h, g, MPFR_RNDD);
4a238c70SJohn Marino          mpfr_mul (g, z0, z0, MPFR_RNDU);
4a238c70SJohn Marino          mpfr_add (h, h, g, MPFR_RNDU);
*ab6d115fSJohn Marino          inex1 = mpfr_prec_round (l, MPFR_PREC(y), rnd);
4a238c70SJohn Marino          inex2 = mpfr_prec_round (h, MPFR_PREC(y), rnd);
4a238c70SJohn Marino          /* Caution: we not only need l = h, but both inexact flags should
4a238c70SJohn Marino             agree. Indeed, one of the inexact flags might be zero. In that
4a238c70SJohn Marino             case if we assume lngamma(z0) cannot be exact, the other flag
4a238c70SJohn Marino             should be correct. We are conservative here and request that both
4a238c70SJohn Marino             inexact flags agree. */
*ab6d115fSJohn Marino          ok = SAME_SIGN (inex1, inex2) && mpfr_cmp (l, h) == 0;
4a238c70SJohn Marino          if (ok)
4a238c70SJohn Marino            mpfr_set (y, h, rnd); /* exact */
4a238c70SJohn Marino          mpfr_clear (l);
4a238c70SJohn Marino          mpfr_clear (h);
4a238c70SJohn Marino          mpfr_clear (g);
4a238c70SJohn Marino          if (ok)
4a238c70SJohn Marino            {
*ab6d115fSJohn Marino              MPFR_ZIV_FREE (loop);
4a238c70SJohn Marino              MPFR_SAVE_EXPO_FREE (expo);
*ab6d115fSJohn Marino              return mpfr_check_range (y, inex1, rnd);
4a238c70SJohn Marino            }
4a238c70SJohn Marino          /* since we have log|gamma(x)| = - log|x| - gamma*x + O(x^2),
4a238c70SJohn Marino             if x ~ 2^(-n), then we have a n-bit approximation, thus
4a238c70SJohn Marino             we can try again with a working precision of n bits,
4a238c70SJohn Marino             especially when n >> PREC(y).
4a238c70SJohn Marino             Otherwise we would use the reflection formula evaluating x-1,
4a238c70SJohn Marino             which would need precision n. */
4a238c70SJohn Marino          MPFR_ZIV_NEXT (loop, prec);
4a238c70SJohn Marino        }
4a238c70SJohn Marino      while (prec <= -MPFR_EXP(z0));
4a238c70SJohn Marino      MPFR_ZIV_FREE (loop);
4a238c70SJohn Marino    }
4a238c70SJohn Marino#endif
4a238c70SJohn Marino
4a238c70SJohn Marino  precy = MPFR_PREC(y);
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_init2 (s, MPFR_PREC_MIN);
4a238c70SJohn Marino  mpfr_init2 (t, MPFR_PREC_MIN);
4a238c70SJohn Marino  mpfr_init2 (u, MPFR_PREC_MIN);
4a238c70SJohn Marino  mpfr_init2 (v, MPFR_PREC_MIN);
4a238c70SJohn Marino  mpfr_init2 (z, MPFR_PREC_MIN);
4a238c70SJohn Marino
4a238c70SJohn Marino  if (compared < 0)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      mpfr_exp_t err_u;
4a238c70SJohn Marino
4a238c70SJohn Marino      /* use reflection formula:
4a238c70SJohn Marino         gamma(x) = Pi*(x-1)/sin(Pi*(2-x))/gamma(2-x)
4a238c70SJohn Marino         thus lngamma(x) = log(Pi*(x-1)/sin(Pi*(2-x))) - lngamma(2-x) */
4a238c70SJohn Marino
4a238c70SJohn Marino      w = precy + MPFR_INT_CEIL_LOG2 (precy);
*ab6d115fSJohn Marino      w += MPFR_INT_CEIL_LOG2 (w) + 14;
*ab6d115fSJohn Marino      MPFR_ZIV_INIT (loop, w);
4a238c70SJohn Marino      while (1)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_ASSERTD(w >= 3);
4a238c70SJohn Marino          mpfr_set_prec (s, w);
4a238c70SJohn Marino          mpfr_set_prec (t, w);
4a238c70SJohn Marino          mpfr_set_prec (u, w);
4a238c70SJohn Marino          mpfr_set_prec (v, w);
4a238c70SJohn Marino          /* In the following, we write r for a real of absolute value
4a238c70SJohn Marino             at most 2^(-w). Different instances of r may represent different
4a238c70SJohn Marino             values. */
4a238c70SJohn Marino          mpfr_ui_sub (s, 2, z0, MPFR_RNDD); /* s = (2-z0) * (1+2r) >= 1 */
4a238c70SJohn Marino          mpfr_const_pi (t, MPFR_RNDN);      /* t = Pi * (1+r) */
4a238c70SJohn Marino          mpfr_lngamma (u, s, MPFR_RNDN); /* lngamma(2-x) */
4a238c70SJohn Marino          /* Let s = (2-z0) + h. By construction, -(2-z0)*2^(1-w) <= h <= 0.
4a238c70SJohn Marino             We have lngamma(s) = lngamma(2-z0) + h*Psi(z), z in [2-z0+h,2-z0].
4a238c70SJohn Marino             Since 2-z0+h = s >= 1 and |Psi(x)| <= max(1,log(x)) for x >= 1,
4a238c70SJohn Marino             the error on u is bounded by
4a238c70SJohn Marino             ulp(u)/2 + (2-z0)*max(1,log(2-z0))*2^(1-w)
4a238c70SJohn Marino             = (1/2 + (2-z0)*max(1,log(2-z0))*2^(1-E(u))) ulp(u) */
4a238c70SJohn Marino          d = (double) MPFR_GET_EXP(s) * 0.694; /* upper bound for log(2-z0) */
4a238c70SJohn Marino          err_u = MPFR_GET_EXP(s) + __gmpfr_ceil_log2 (d) + 1 - MPFR_GET_EXP(u);
4a238c70SJohn Marino          err_u = (err_u >= 0) ? err_u + 1 : 0;
4a238c70SJohn Marino          /* now the error on u is bounded by 2^err_u ulps */
4a238c70SJohn Marino
4a238c70SJohn Marino          mpfr_mul (s, s, t, MPFR_RNDN); /* Pi*(2-x) * (1+r)^4 */
4a238c70SJohn Marino          err_s = MPFR_GET_EXP(s); /* 2-x <= 2^err_s */
4a238c70SJohn Marino          mpfr_sin (s, s, MPFR_RNDN); /* sin(Pi*(2-x)) */
4a238c70SJohn Marino          /* the error on s is bounded by 1/2*ulp(s) + [(1+2^(-w))^4-1]*(2-x)
4a238c70SJohn Marino             <= 1/2*ulp(s) + 5*2^(-w)*(2-x) for w >= 3
4a238c70SJohn Marino             <= (1/2 + 5 * 2^(-E(s)) * (2-x)) ulp(s) */
4a238c70SJohn Marino          err_s += 3 - MPFR_GET_EXP(s);
4a238c70SJohn Marino          err_s = (err_s >= 0) ? err_s + 1 : 0;
4a238c70SJohn Marino          /* the error on s is bounded by 2^err_s ulp(s), thus by
4a238c70SJohn Marino             2^(err_s+1)*2^(-w)*|s| since ulp(s) <= 2^(1-w)*|s|.
4a238c70SJohn Marino             Now n*2^(-w) can always be written |(1+r)^n-1| for some
4a238c70SJohn Marino             |r|<=2^(-w), thus taking n=2^(err_s+1) we see that
4a238c70SJohn Marino             |S - s| <= |(1+r)^(2^(err_s+1))-1| * |s|, where S is the
4a238c70SJohn Marino             true value.
4a238c70SJohn Marino             In fact if ulp(s) <= ulp(S) the same inequality holds for
4a238c70SJohn Marino             |S| instead of |s| in the right hand side, i.e., we can
4a238c70SJohn Marino             write s = (1+r)^(2^(err_s+1)) * S.
4a238c70SJohn Marino             But if ulp(S) < ulp(s), we need to add one ``bit'' to the error,
4a238c70SJohn Marino             to get s = (1+r)^(2^(err_s+2)) * S. This is true since with
4a238c70SJohn Marino             E = n*2^(-w) we have |s - S| <= E * |s|, thus
4a238c70SJohn Marino             |s - S| <= E/(1-E) * |S|.
4a238c70SJohn Marino             Now E/(1-E) is bounded by 2E as long as E<=1/2,
4a238c70SJohn Marino             and 2E can be written (1+r)^(2n)-1 as above.
4a238c70SJohn Marino          */
4a238c70SJohn Marino          err_s += 2; /* exponent of relative error */
4a238c70SJohn Marino
4a238c70SJohn Marino          mpfr_sub_ui (v, z0, 1, MPFR_RNDN); /* v = (x-1) * (1+r) */
4a238c70SJohn Marino          mpfr_mul (v, v, t, MPFR_RNDN); /* v = Pi*(x-1) * (1+r)^3 */
4a238c70SJohn Marino          mpfr_div (v, v, s, MPFR_RNDN); /* Pi*(x-1)/sin(Pi*(2-x)) */
4a238c70SJohn Marino          mpfr_abs (v, v, MPFR_RNDN);
4a238c70SJohn Marino          /* (1+r)^(3+2^err_s+1) */
4a238c70SJohn Marino          err_s = (err_s <= 1) ? 3 : err_s + 1;
4a238c70SJohn Marino          /* now (1+r)^M with M <= 2^err_s */
4a238c70SJohn Marino          mpfr_log (v, v, MPFR_RNDN);
4a238c70SJohn Marino          /* log(v*(1+e)) = log(v)+log(1+e) where |e| <= 2^(err_s-w).
4a238c70SJohn Marino             Since |log(1+e)| <= 2*e for |e| <= 1/4, the error on v is
4a238c70SJohn Marino             bounded by ulp(v)/2 + 2^(err_s+1-w). */
4a238c70SJohn Marino          if (err_s + 2 > w)
4a238c70SJohn Marino            {
4a238c70SJohn Marino              w += err_s + 2;
4a238c70SJohn Marino            }
4a238c70SJohn Marino          else
4a238c70SJohn Marino            {
4a238c70SJohn Marino              err_s += 1 - MPFR_GET_EXP(v);
4a238c70SJohn Marino              err_s = (err_s >= 0) ? err_s + 1 : 0;
4a238c70SJohn Marino              /* the error on v is bounded by 2^err_s ulps */
4a238c70SJohn Marino              err_u += MPFR_GET_EXP(u); /* absolute error on u */
4a238c70SJohn Marino              err_s += MPFR_GET_EXP(v); /* absolute error on v */
4a238c70SJohn Marino              mpfr_sub (s, v, u, MPFR_RNDN);
4a238c70SJohn Marino              /* the total error on s is bounded by ulp(s)/2 + 2^(err_u-w)
4a238c70SJohn Marino                 + 2^(err_s-w) <= ulp(s)/2 + 2^(max(err_u,err_s)+1-w) */
4a238c70SJohn Marino              err_s = (err_s >= err_u) ? err_s : err_u;
4a238c70SJohn Marino              err_s += 1 - MPFR_GET_EXP(s); /* error is 2^err_s ulp(s) */
4a238c70SJohn Marino              err_s = (err_s >= 0) ? err_s + 1 : 0;
4a238c70SJohn Marino              if (mpfr_can_round (s, w - err_s, MPFR_RNDN, MPFR_RNDZ, precy
4a238c70SJohn Marino                                  + (rnd == MPFR_RNDN)))
4a238c70SJohn Marino                goto end;
4a238c70SJohn Marino            }
*ab6d115fSJohn Marino          MPFR_ZIV_NEXT (loop, w);
4a238c70SJohn Marino        }
*ab6d115fSJohn Marino      MPFR_ZIV_FREE (loop);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  /* now z0 > 1 */
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_ASSERTD (compared > 0);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* since k is O(w), the value of log(z0*...*(z0+k-1)) is about w*log(w),
4a238c70SJohn Marino     so there is a cancellation of ~log(w) in the argument reconstruction */
4a238c70SJohn Marino  w = precy + MPFR_INT_CEIL_LOG2 (precy);
4a238c70SJohn Marino  w += MPFR_INT_CEIL_LOG2 (w) + 13;
*ab6d115fSJohn Marino  MPFR_ZIV_INIT (loop, w);
*ab6d115fSJohn Marino  while (1)
*ab6d115fSJohn Marino    {
4a238c70SJohn Marino      MPFR_ASSERTD (w >= 3);
4a238c70SJohn Marino
4a238c70SJohn Marino      /* argument reduction: we compute gamma(z0 + k), where the series
4a238c70SJohn Marino         has error term B_{2n}/(z0+k)^(2n) ~ (n/(Pi*e*(z0+k)))^(2n)
4a238c70SJohn Marino         and we need k steps of argument reconstruction. Assuming k is large
4a238c70SJohn Marino         with respect to z0, and k = n, we get 1/(Pi*e)^(2n) ~ 2^(-w), i.e.,
4a238c70SJohn Marino         k ~ w*log(2)/2/log(Pi*e) ~ 0.1616 * w.
4a238c70SJohn Marino         However, since the series is more expensive to compute, the optimal
4a238c70SJohn Marino         value seems to be k ~ 4.5 * w experimentally. */
4a238c70SJohn Marino      mpfr_set_prec (s, 53);
4a238c70SJohn Marino      mpfr_gamma_alpha (s, w);
4a238c70SJohn Marino      mpfr_set_ui_2exp (s, 9, -1, MPFR_RNDU);
4a238c70SJohn Marino      mpfr_mul_ui (s, s, w, MPFR_RNDU);
4a238c70SJohn Marino      if (mpfr_cmp (z0, s) < 0)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          mpfr_sub (s, s, z0, MPFR_RNDU);
4a238c70SJohn Marino          k = mpfr_get_ui (s, MPFR_RNDU);
4a238c70SJohn Marino          if (k < 3)
4a238c70SJohn Marino            k = 3;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else
4a238c70SJohn Marino        k = 3;
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_set_prec (s, w);
4a238c70SJohn Marino      mpfr_set_prec (t, w);
4a238c70SJohn Marino      mpfr_set_prec (u, w);
4a238c70SJohn Marino      mpfr_set_prec (v, w);
4a238c70SJohn Marino      mpfr_set_prec (z, w);
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_add_ui (z, z0, k, MPFR_RNDN);
4a238c70SJohn Marino      /* z = (z0+k)*(1+t1) with |t1| <= 2^(-w) */
4a238c70SJohn Marino
4a238c70SJohn Marino      /* z >= 4 ensures the relative error on log(z) is small,
4a238c70SJohn Marino         and also (z-1/2)*log(z)-z >= 0 */
4a238c70SJohn Marino      MPFR_ASSERTD (mpfr_cmp_ui (z, 4) >= 0);
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_log (s, z, MPFR_RNDN); /* log(z) */
4a238c70SJohn Marino      /* we have s = log((z0+k)*(1+t1))*(1+t2) with |t1|, |t2| <= 2^(-w).
4a238c70SJohn Marino         Since w >= 2 and z0+k >= 4, we can write log((z0+k)*(1+t1))
4a238c70SJohn Marino         = log(z0+k) * (1+t3) with |t3| <= 2^(-w), thus we have
4a238c70SJohn Marino         s = log(z0+k) * (1+t4)^2 with |t4| <= 2^(-w) */
4a238c70SJohn Marino      mpfr_mul_2ui (t, z, 1, MPFR_RNDN); /* t = 2z * (1+t5) */
4a238c70SJohn Marino      mpfr_sub_ui (t, t, 1, MPFR_RNDN); /* t = 2z-1 * (1+t6)^3 */
4a238c70SJohn Marino      /* since we can write 2z*(1+t5) = (2z-1)*(1+t5') with
4a238c70SJohn Marino         t5' = 2z/(2z-1) * t5, thus |t5'| <= 8/7 * t5 */
4a238c70SJohn Marino      mpfr_mul (s, s, t, MPFR_RNDN); /* (2z-1)*log(z) * (1+t7)^6 */
4a238c70SJohn Marino      mpfr_div_2ui (s, s, 1, MPFR_RNDN); /* (z-1/2)*log(z) * (1+t7)^6 */
4a238c70SJohn Marino      mpfr_sub (s, s, z, MPFR_RNDN); /* (z-1/2)*log(z)-z */
4a238c70SJohn Marino      /* s = [(z-1/2)*log(z)-z]*(1+u)^14, s >= 1/2 */
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_ui_div (u, 1, z, MPFR_RNDN); /* 1/z * (1+u), u <= 1/4 since z >= 4 */
4a238c70SJohn Marino
4a238c70SJohn Marino      /* the first term is B[2]/2/z = 1/12/z: t=1/12/z, C[2]=1 */
4a238c70SJohn Marino      mpfr_div_ui (t, u, 12, MPFR_RNDN); /* 1/(12z) * (1+u)^2, t <= 3/128 */
4a238c70SJohn Marino      mpfr_set (v, t, MPFR_RNDN);        /* (1+u)^2, v < 2^(-5) */
4a238c70SJohn Marino      mpfr_add (s, s, v, MPFR_RNDN);     /* (1+u)^15 */
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_mul (u, u, u, MPFR_RNDN); /* 1/z^2 * (1+u)^3 */
4a238c70SJohn Marino
4a238c70SJohn Marino      if (Bm == 0)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          B = mpfr_bernoulli_internal ((mpz_t *) 0, 0);
4a238c70SJohn Marino          B = mpfr_bernoulli_internal (B, 1);
4a238c70SJohn Marino          Bm = 2;
4a238c70SJohn Marino        }
4a238c70SJohn Marino
4a238c70SJohn Marino      /* m <= maxm ensures that 2*m*(2*m+1) <= ULONG_MAX */
4a238c70SJohn Marino      maxm = 1UL << (GMP_NUMB_BITS / 2 - 1);
4a238c70SJohn Marino
4a238c70SJohn Marino      /* s:(1+u)^15, t:(1+u)^2, t <= 3/128 */
4a238c70SJohn Marino
4a238c70SJohn Marino      for (m = 2; MPFR_GET_EXP(v) + (mpfr_exp_t) w >= MPFR_GET_EXP(s); m++)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          mpfr_mul (t, t, u, MPFR_RNDN); /* (1+u)^(10m-14) */
4a238c70SJohn Marino          if (m <= maxm)
4a238c70SJohn Marino            {
4a238c70SJohn Marino              mpfr_mul_ui (t, t, 2*(m-1)*(2*m-3), MPFR_RNDN);
4a238c70SJohn Marino              mpfr_div_ui (t, t, 2*m*(2*m-1), MPFR_RNDN);
4a238c70SJohn Marino              mpfr_div_ui (t, t, 2*m*(2*m+1), MPFR_RNDN);
4a238c70SJohn Marino            }
4a238c70SJohn Marino          else
4a238c70SJohn Marino            {
4a238c70SJohn Marino              mpfr_mul_ui (t, t, 2*(m-1), MPFR_RNDN);
4a238c70SJohn Marino              mpfr_mul_ui (t, t, 2*m-3, MPFR_RNDN);
4a238c70SJohn Marino              mpfr_div_ui (t, t, 2*m, MPFR_RNDN);
4a238c70SJohn Marino              mpfr_div_ui (t, t, 2*m-1, MPFR_RNDN);
4a238c70SJohn Marino              mpfr_div_ui (t, t, 2*m, MPFR_RNDN);
4a238c70SJohn Marino              mpfr_div_ui (t, t, 2*m+1, MPFR_RNDN);
4a238c70SJohn Marino            }
4a238c70SJohn Marino          /* (1+u)^(10m-8) */
4a238c70SJohn Marino          /* invariant: t=1/(2m)/(2m-1)/z^(2m-1)/(2m+1)! */
4a238c70SJohn Marino          if (Bm <= m)
4a238c70SJohn Marino            {
4a238c70SJohn Marino              B = mpfr_bernoulli_internal (B, m); /* B[2m]*(2m+1)!, exact */
4a238c70SJohn Marino              Bm ++;
4a238c70SJohn Marino            }
4a238c70SJohn Marino          mpfr_mul_z (v, t, B[m], MPFR_RNDN); /* (1+u)^(10m-7) */
4a238c70SJohn Marino          MPFR_ASSERTD(MPFR_GET_EXP(v) <= - (2 * m + 3));
4a238c70SJohn Marino          mpfr_add (s, s, v, MPFR_RNDN);
4a238c70SJohn Marino        }
4a238c70SJohn Marino      /* m <= 1/2*Pi*e*z ensures that |v[m]| < 1/2^(2m+3) */
4a238c70SJohn Marino      MPFR_ASSERTD ((double) m <= 4.26 * mpfr_get_d (z, MPFR_RNDZ));
4a238c70SJohn Marino
4a238c70SJohn Marino      /* We have sum([(1+u)^(10m-7)-1]*1/2^(2m+3), m=2..infinity)
4a238c70SJohn Marino         <= 1.46*u for u <= 2^(-3).
4a238c70SJohn Marino         We have 0 < lngamma(z) - [(z - 1/2) ln(z) - z + 1/2 ln(2 Pi)] < 0.021
4a238c70SJohn Marino         for z >= 4, thus since the initial s >= 0.85, the different values of
4a238c70SJohn Marino         s differ by at most one binade, and the total rounding error on s
4a238c70SJohn Marino         in the for-loop is bounded by 2*(m-1)*ulp(final_s).
4a238c70SJohn Marino         The error coming from the v's is bounded by
4a238c70SJohn Marino         1.46*2^(-w) <= 2*ulp(final_s).
4a238c70SJohn Marino         Thus the total error so far is bounded by [(1+u)^15-1]*s+2m*ulp(s)
4a238c70SJohn Marino         <= (2m+47)*ulp(s).
4a238c70SJohn Marino         Taking into account the truncation error (which is bounded by the last
4a238c70SJohn Marino         term v[] according to 6.1.42 in A&S), the bound is (2m+48)*ulp(s).
4a238c70SJohn Marino      */
4a238c70SJohn Marino
4a238c70SJohn Marino      /* add 1/2*log(2*Pi) and subtract log(z0*(z0+1)*...*(z0+k-1)) */
4a238c70SJohn Marino      mpfr_const_pi (v, MPFR_RNDN); /* v = Pi*(1+u) */
4a238c70SJohn Marino      mpfr_mul_2ui (v, v, 1, MPFR_RNDN); /* v = 2*Pi * (1+u) */
4a238c70SJohn Marino      if (k)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          unsigned long l;
4a238c70SJohn Marino          mpfr_set (t, z0, MPFR_RNDN); /* t = z0*(1+u) */
4a238c70SJohn Marino          for (l = 1; l < k; l++)
4a238c70SJohn Marino            {
4a238c70SJohn Marino              mpfr_add_ui (u, z0, l, MPFR_RNDN); /* u = (z0+l)*(1+u) */
4a238c70SJohn Marino              mpfr_mul (t, t, u, MPFR_RNDN);     /* (1+u)^(2l+1) */
4a238c70SJohn Marino            }
4a238c70SJohn Marino          /* now t: (1+u)^(2k-1) */
4a238c70SJohn Marino          /* instead of computing log(sqrt(2*Pi)/t), we compute
4a238c70SJohn Marino             1/2*log(2*Pi/t^2), which trades a square root for a square */
4a238c70SJohn Marino          mpfr_mul (t, t, t, MPFR_RNDN); /* (z0*...*(z0+k-1))^2, (1+u)^(4k-1) */
4a238c70SJohn Marino          mpfr_div (v, v, t, MPFR_RNDN);
4a238c70SJohn Marino          /* 2*Pi/(z0*...*(z0+k-1))^2 (1+u)^(4k+1) */
4a238c70SJohn Marino        }
4a238c70SJohn Marino#ifdef IS_GAMMA
4a238c70SJohn Marino      err_s = MPFR_GET_EXP(s);
4a238c70SJohn Marino      mpfr_exp (s, s, MPFR_RNDN);
*ab6d115fSJohn Marino      /* If s is +Inf, we compute exp(lngamma(z0)). */
*ab6d115fSJohn Marino      if (mpfr_inf_p (s))
*ab6d115fSJohn Marino        {
*ab6d115fSJohn Marino          inexact = mpfr_explgamma (y, z0, &expo, s, t, rnd);
*ab6d115fSJohn Marino          if (inexact)
*ab6d115fSJohn Marino            goto end0;
*ab6d115fSJohn Marino          else
*ab6d115fSJohn Marino            goto ziv_next;
*ab6d115fSJohn Marino        }
4a238c70SJohn Marino      /* before the exponential, we have s = s0 + h where
4a238c70SJohn Marino         |h| <= (2m+48)*ulp(s), thus exp(s0) = exp(s) * exp(-h).
4a238c70SJohn Marino         For |h| <= 1/4, we have |exp(h)-1| <= 1.2*|h| thus
4a238c70SJohn Marino         |exp(s) - exp(s0)| <= 1.2 * exp(s) * (2m+48)* 2^(EXP(s)-w). */
4a238c70SJohn Marino      d = 1.2 * (2.0 * (double) m + 48.0);
4a238c70SJohn Marino      /* the error on s is bounded by d*2^err_s * 2^(-w) */
4a238c70SJohn Marino      mpfr_sqrt (t, v, MPFR_RNDN);
4a238c70SJohn Marino      /* let v0 be the exact value of v. We have v = v0*(1+u)^(4k+1),
4a238c70SJohn Marino         thus t = sqrt(v0)*(1+u)^(2k+3/2). */
4a238c70SJohn Marino      mpfr_mul (s, s, t, MPFR_RNDN);
4a238c70SJohn Marino      /* the error on input s is bounded by (1+u)^(d*2^err_s),
4a238c70SJohn Marino         and that on t is (1+u)^(2k+3/2), thus the
4a238c70SJohn Marino         total error is (1+u)^(d*2^err_s+2k+5/2) */
4a238c70SJohn Marino      err_s += __gmpfr_ceil_log2 (d);
4a238c70SJohn Marino      err_t = __gmpfr_ceil_log2 (2.0 * (double) k + 2.5);
4a238c70SJohn Marino      err_s = (err_s >= err_t) ? err_s + 1 : err_t + 1;
4a238c70SJohn Marino#else
4a238c70SJohn Marino      mpfr_log (t, v, MPFR_RNDN);
4a238c70SJohn Marino      /* let v0 be the exact value of v. We have v = v0*(1+u)^(4k+1),
4a238c70SJohn Marino         thus log(v) = log(v0) + (4k+1)*log(1+u). Since |log(1+u)/u| <= 1.07
4a238c70SJohn Marino         for |u| <= 2^(-3), the absolute error on log(v) is bounded by
4a238c70SJohn Marino         1.07*(4k+1)*u, and the rounding error by ulp(t). */
4a238c70SJohn Marino      mpfr_div_2ui (t, t, 1, MPFR_RNDN);
4a238c70SJohn Marino      /* the error on t is now bounded by ulp(t) + 0.54*(4k+1)*2^(-w).
4a238c70SJohn Marino         We have sqrt(2*Pi)/(z0*(z0+1)*...*(z0+k-1)) <= sqrt(2*Pi)/k! <= 0.5
4a238c70SJohn Marino         since k>=3, thus t <= -0.5 and ulp(t) >= 2^(-w).
4a238c70SJohn Marino         Thus the error on t is bounded by (2.16*k+1.54)*ulp(t). */
4a238c70SJohn Marino      err_t = MPFR_GET_EXP(t) + (mpfr_exp_t)
4a238c70SJohn Marino        __gmpfr_ceil_log2 (2.2 * (double) k + 1.6);
4a238c70SJohn Marino      err_s = MPFR_GET_EXP(s) + (mpfr_exp_t)
4a238c70SJohn Marino        __gmpfr_ceil_log2 (2.0 * (double) m + 48.0);
4a238c70SJohn Marino      mpfr_add (s, s, t, MPFR_RNDN); /* this is a subtraction in fact */
4a238c70SJohn Marino      /* the final error in ulp(s) is
4a238c70SJohn Marino         <= 1 + 2^(err_t-EXP(s)) + 2^(err_s-EXP(s))
4a238c70SJohn Marino         <= 2^(1+max(err_t,err_s)-EXP(s)) if err_t <> err_s
4a238c70SJohn Marino         <= 2^(2+max(err_t,err_s)-EXP(s)) if err_t = err_s */
4a238c70SJohn Marino      err_s = (err_t == err_s) ? 1 + err_s : ((err_t > err_s) ? err_t : err_s);
4a238c70SJohn Marino      err_s += 1 - MPFR_GET_EXP(s);
4a238c70SJohn Marino#endif
*ab6d115fSJohn Marino      if (MPFR_LIKELY (MPFR_CAN_ROUND (s, w - err_s, precy, rnd)))
*ab6d115fSJohn Marino        break;
*ab6d115fSJohn Marino#ifdef IS_GAMMA
*ab6d115fSJohn Marino    ziv_next:
*ab6d115fSJohn Marino#endif
*ab6d115fSJohn Marino      MPFR_ZIV_NEXT (loop, w);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
*ab6d115fSJohn Marino#ifdef IS_GAMMA
*ab6d115fSJohn Marino end0:
*ab6d115fSJohn Marino#endif
4a238c70SJohn Marino  oldBm = Bm;
4a238c70SJohn Marino  while (Bm--)
4a238c70SJohn Marino    mpz_clear (B[Bm]);
4a238c70SJohn Marino  (*__gmp_free_func) (B, oldBm * sizeof (mpz_t));
4a238c70SJohn Marino
4a238c70SJohn Marino end:
*ab6d115fSJohn Marino  if (inexact == 0)
4a238c70SJohn Marino    inexact = mpfr_set (y, s, rnd);
*ab6d115fSJohn Marino  MPFR_ZIV_FREE (loop);
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_clear (s);
4a238c70SJohn Marino  mpfr_clear (t);
4a238c70SJohn Marino  mpfr_clear (u);
4a238c70SJohn Marino  mpfr_clear (v);
4a238c70SJohn Marino  mpfr_clear (z);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino  return mpfr_check_range (y, inexact, rnd);
4a238c70SJohn Marino}
4a238c70SJohn Marino
4a238c70SJohn Marino#ifndef IS_GAMMA
4a238c70SJohn Marino
4a238c70SJohn Marinoint
4a238c70SJohn Marinompfr_lngamma (mpfr_ptr y, mpfr_srcptr x, mpfr_rnd_t rnd)
4a238c70SJohn Marino{
4a238c70SJohn Marino  int inex;
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_LOG_FUNC
4a238c70SJohn Marino    (("x[%Pu]=%.*Rg rnd=%d", mpfr_get_prec (x), mpfr_log_prec, x, rnd),
4a238c70SJohn Marino     ("y[%Pu]=%.*Rg inexact=%d",
4a238c70SJohn Marino      mpfr_get_prec (y), mpfr_log_prec, y, inex));
4a238c70SJohn Marino
4a238c70SJohn Marino  /* special cases */
4a238c70SJohn Marino  if (MPFR_UNLIKELY (MPFR_IS_SINGULAR (x)))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      if (MPFR_IS_NAN (x) || MPFR_IS_NEG (x))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_SET_NAN (y);
4a238c70SJohn Marino          MPFR_RET_NAN;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else /* lngamma(+Inf) = lngamma(+0) = +Inf */
4a238c70SJohn Marino        {
4a238c70SJohn Marino          if (MPFR_IS_ZERO (x))
4a238c70SJohn Marino            mpfr_set_divby0 ();
4a238c70SJohn Marino          MPFR_SET_INF (y);
4a238c70SJohn Marino          MPFR_SET_POS (y);
4a238c70SJohn Marino          MPFR_RET (0);  /* exact */
4a238c70SJohn Marino        }
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  /* if x < 0 and -2k-1 <= x <= -2k, then lngamma(x) = NaN */
4a238c70SJohn Marino  if (MPFR_IS_NEG (x) && (unit_bit (x) == 0 || mpfr_integer_p (x)))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      MPFR_SET_NAN (y);
4a238c70SJohn Marino      MPFR_RET_NAN;
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  inex = mpfr_lngamma_aux (y, x, rnd);
4a238c70SJohn Marino  return inex;
4a238c70SJohn Marino}
4a238c70SJohn Marino
4a238c70SJohn Marinoint
4a238c70SJohn Marinompfr_lgamma (mpfr_ptr y, int *signp, mpfr_srcptr x, mpfr_rnd_t rnd)
4a238c70SJohn Marino{
4a238c70SJohn Marino  int inex;
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_LOG_FUNC
4a238c70SJohn Marino    (("x[%Pu]=%.*Rg rnd=%d", mpfr_get_prec (x), mpfr_log_prec, x, rnd),
4a238c70SJohn Marino     ("y[%Pu]=%.*Rg signp=%d inexact=%d",
4a238c70SJohn Marino      mpfr_get_prec (y), mpfr_log_prec, y, *signp, inex));
4a238c70SJohn Marino
4a238c70SJohn Marino  *signp = 1;  /* most common case */
4a238c70SJohn Marino
4a238c70SJohn Marino  if (MPFR_UNLIKELY (MPFR_IS_SINGULAR (x)))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      if (MPFR_IS_NAN (x))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_SET_NAN (y);
4a238c70SJohn Marino          MPFR_RET_NAN;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else
4a238c70SJohn Marino        {
4a238c70SJohn Marino          if (MPFR_IS_ZERO (x))
4a238c70SJohn Marino            mpfr_set_divby0 ();
4a238c70SJohn Marino          *signp = MPFR_INT_SIGN (x);
4a238c70SJohn Marino          MPFR_SET_INF (y);
4a238c70SJohn Marino          MPFR_SET_POS (y);
4a238c70SJohn Marino          MPFR_RET (0);
4a238c70SJohn Marino        }
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  if (MPFR_IS_NEG (x))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      if (mpfr_integer_p (x))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_SET_INF (y);
4a238c70SJohn Marino          MPFR_SET_POS (y);
4a238c70SJohn Marino          mpfr_set_divby0 ();
4a238c70SJohn Marino          MPFR_RET (0);
4a238c70SJohn Marino        }
4a238c70SJohn Marino
4a238c70SJohn Marino      if (unit_bit (x) == 0)
4a238c70SJohn Marino        *signp = -1;
4a238c70SJohn Marino
4a238c70SJohn Marino      /* For tiny negative x, we have gamma(x) = 1/x - euler + O(x),
4a238c70SJohn Marino         thus |gamma(x)| = -1/x + euler + O(x), and
4a238c70SJohn Marino         log |gamma(x)| = -log(-x) - euler*x + O(x^2).
4a238c70SJohn Marino         More precisely we have for -0.4 <= x < 0:
4a238c70SJohn Marino         -log(-x) <= log |gamma(x)| <= -log(-x) - x.
4a238c70SJohn Marino         Since log(x) is not representable, we may have an instance of the
4a238c70SJohn Marino         Table Maker Dilemma. The only way to ensure correct rounding is to
4a238c70SJohn Marino         compute an interval [l,h] such that l <= -log(-x) and
4a238c70SJohn Marino         -log(-x) - x <= h, and check whether l and h round to the same number
4a238c70SJohn Marino         for the target precision and rounding modes. */
4a238c70SJohn Marino      if (MPFR_EXP(x) + 1 <= - (mpfr_exp_t) MPFR_PREC(y))
4a238c70SJohn Marino        /* since PREC(y) >= 1, this ensures EXP(x) <= -2,
4a238c70SJohn Marino           thus |x| <= 0.25 < 0.4 */
4a238c70SJohn Marino        {
4a238c70SJohn Marino          mpfr_t l, h;
4a238c70SJohn Marino          int ok, inex2;
4a238c70SJohn Marino          mpfr_prec_t w = MPFR_PREC (y) + 14;
4a238c70SJohn Marino          mpfr_exp_t expl;
4a238c70SJohn Marino
4a238c70SJohn Marino          while (1)
4a238c70SJohn Marino            {
4a238c70SJohn Marino              mpfr_init2 (l, w);
4a238c70SJohn Marino              mpfr_init2 (h, w);
4a238c70SJohn Marino              /* we want a lower bound on -log(-x), thus an upper bound
4a238c70SJohn Marino                 on log(-x), thus an upper bound on -x. */
4a238c70SJohn Marino              mpfr_neg (l, x, MPFR_RNDU); /* upper bound on -x */
4a238c70SJohn Marino              mpfr_log (l, l, MPFR_RNDU); /* upper bound for log(-x) */
4a238c70SJohn Marino              mpfr_neg (l, l, MPFR_RNDD); /* lower bound for -log(-x) */
4a238c70SJohn Marino              mpfr_neg (h, x, MPFR_RNDD); /* lower bound on -x */
4a238c70SJohn Marino              mpfr_log (h, h, MPFR_RNDD); /* lower bound on log(-x) */
4a238c70SJohn Marino              mpfr_neg (h, h, MPFR_RNDU); /* upper bound for -log(-x) */
4a238c70SJohn Marino              mpfr_sub (h, h, x, MPFR_RNDU); /* upper bound for -log(-x) - x */
4a238c70SJohn Marino              inex = mpfr_prec_round (l, MPFR_PREC (y), rnd);
4a238c70SJohn Marino              inex2 = mpfr_prec_round (h, MPFR_PREC (y), rnd);
4a238c70SJohn Marino              /* Caution: we not only need l = h, but both inexact flags
4a238c70SJohn Marino                 should agree. Indeed, one of the inexact flags might be
4a238c70SJohn Marino                 zero. In that case if we assume ln|gamma(x)| cannot be
4a238c70SJohn Marino                 exact, the other flag should be correct. We are conservative
4a238c70SJohn Marino                 here and request that both inexact flags agree. */
4a238c70SJohn Marino              ok = SAME_SIGN (inex, inex2) && mpfr_equal_p (l, h);
4a238c70SJohn Marino              if (ok)
4a238c70SJohn Marino                mpfr_set (y, h, rnd); /* exact */
4a238c70SJohn Marino              else
4a238c70SJohn Marino                expl = MPFR_EXP (l);
4a238c70SJohn Marino              mpfr_clear (l);
4a238c70SJohn Marino              mpfr_clear (h);
4a238c70SJohn Marino              if (ok)
4a238c70SJohn Marino                return inex;
4a238c70SJohn Marino              /* if ulp(log(-x)) <= |x| there is no reason to loop,
4a238c70SJohn Marino                 since the width of [l, h] will be at least |x| */
4a238c70SJohn Marino              if (expl < MPFR_EXP(x) + (mpfr_exp_t) w)
4a238c70SJohn Marino                break;
4a238c70SJohn Marino              w += MPFR_INT_CEIL_LOG2(w) + 3;
4a238c70SJohn Marino            }
4a238c70SJohn Marino        }
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  inex = mpfr_lngamma_aux (y, x, rnd);
4a238c70SJohn Marino  return inex;
4a238c70SJohn Marino}
4a238c70SJohn Marino
4a238c70SJohn Marino#endif