gmp/mpf/sqrt.c

*86d7f5d3SJohn Marino/* mpf_sqrt -- Compute the square root of a float.
*86d7f5d3SJohn Marino
*86d7f5d3SJohn MarinoCopyright 1993, 1994, 1996, 2000, 2001, 2004, 2005 Free Software Foundation,
*86d7f5d3SJohn MarinoInc.
*86d7f5d3SJohn Marino
*86d7f5d3SJohn MarinoThis file is part of the GNU MP Library.
*86d7f5d3SJohn Marino
*86d7f5d3SJohn MarinoThe GNU MP Library is free software; you can redistribute it and/or modify
*86d7f5d3SJohn Marinoit under the terms of the GNU Lesser General Public License as published by
*86d7f5d3SJohn Marinothe Free Software Foundation; either version 3 of the License, or (at your
*86d7f5d3SJohn Marinooption) any later version.
*86d7f5d3SJohn Marino
*86d7f5d3SJohn MarinoThe GNU MP Library is distributed in the hope that it will be useful, but
*86d7f5d3SJohn MarinoWITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
*86d7f5d3SJohn Marinoor FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
*86d7f5d3SJohn MarinoLicense for more details.
*86d7f5d3SJohn Marino
*86d7f5d3SJohn MarinoYou should have received a copy of the GNU Lesser General Public License
*86d7f5d3SJohn Marinoalong with the GNU MP Library.  If not, see http://www.gnu.org/licenses/.  */
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino#include <stdio.h> /* for NULL */
*86d7f5d3SJohn Marino#include "gmp.h"
*86d7f5d3SJohn Marino#include "gmp-impl.h"
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino
/* As usual, the aim is to produce PREC(r) limbs of result, with the high
   limb non-zero.  This is accomplished by applying mpn_sqrtrem to either
   2*prec or 2*prec-1 limbs, both such sizes resulting in prec limbs.

   The choice between 2*prec or 2*prec-1 limbs is based on the input
   exponent.  With b=2^GMP_NUMB_BITS as the limb base, we can think of
   effectively taking out a factor b^(2k), for suitable k, to get to an
   integer input of the desired size ready for mpn_sqrtrem.  It must be an
   even power taken out, i.e. an even number of limbs, so the square root
   gives factor b^k and the radix point is still on a limb boundary.  So if
   EXP(u) is even we'll get an even number of input limbs 2*prec, or if
   EXP(u) is odd we get an odd number 2*prec-1.

   Further limbs below the 2*prec or 2*prec-1 used don't affect the result
   and are simply truncated.  This can be seen by considering an integer x,
   with s=floor(sqrt(x)).  s is the unique integer satisfying s^2 <= x <
   (s+1)^2.  Notice that adding a fraction part to x (i.e. some further bits)
   doesn't change the inequality, s remains the unique solution.  Working
   suitable factors of 2 into this argument lets it apply to an intended
   precision at any position for any x, not just the integer binary point.

   If the input is smaller than 2*prec or 2*prec-1, then we just pad with
   zeros, that of course being our usual interpretation of short inputs.
   The effect is to extend the root beyond the size of the input (for
   instance into fractional limbs if u is an integer).  */
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marinovoid
*86d7f5d3SJohn Marinompf_sqrt (mpf_ptr r, mpf_srcptr u)
*86d7f5d3SJohn Marino{
*86d7f5d3SJohn Marino  mp_size_t usize;
*86d7f5d3SJohn Marino  mp_ptr up, tp;
*86d7f5d3SJohn Marino  mp_size_t prec, tsize;
*86d7f5d3SJohn Marino  mp_exp_t uexp, expodd;
*86d7f5d3SJohn Marino  TMP_DECL;
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  usize = u->_mp_size;
*86d7f5d3SJohn Marino  if (usize <= 0)
*86d7f5d3SJohn Marino    {
*86d7f5d3SJohn Marino      if (usize < 0)
*86d7f5d3SJohn Marino        SQRT_OF_NEGATIVE;
*86d7f5d3SJohn Marino      r->_mp_size = 0;
*86d7f5d3SJohn Marino      r->_mp_exp = 0;
*86d7f5d3SJohn Marino      return;
*86d7f5d3SJohn Marino    }
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  TMP_MARK;
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  uexp = u->_mp_exp;
*86d7f5d3SJohn Marino  prec = r->_mp_prec;
*86d7f5d3SJohn Marino  up = u->_mp_d;
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  expodd = (uexp & 1);
*86d7f5d3SJohn Marino  tsize = 2 * prec - expodd;
*86d7f5d3SJohn Marino  r->_mp_size = prec;
*86d7f5d3SJohn Marino  r->_mp_exp = (uexp + expodd) / 2;    /* ceil(uexp/2) */
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  /* root size is ceil(tsize/2), this will be our desired "prec" limbs */
*86d7f5d3SJohn Marino  ASSERT ((tsize + 1) / 2 == prec);
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  tp = TMP_ALLOC_LIMBS (tsize);
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  if (usize > tsize)
*86d7f5d3SJohn Marino    {
*86d7f5d3SJohn Marino      up += usize - tsize;
*86d7f5d3SJohn Marino      usize = tsize;
*86d7f5d3SJohn Marino      MPN_COPY (tp, up, tsize);
*86d7f5d3SJohn Marino    }
*86d7f5d3SJohn Marino  else
*86d7f5d3SJohn Marino    {
*86d7f5d3SJohn Marino      MPN_ZERO (tp, tsize - usize);
*86d7f5d3SJohn Marino      MPN_COPY (tp + (tsize - usize), up, usize);
*86d7f5d3SJohn Marino    }
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  mpn_sqrtrem (r->_mp_d, NULL, tp, tsize);
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  TMP_FREE;
*86d7f5d3SJohn Marino}