dist/mpz/cfdiv_r_2exp.c

4a1767b4Smrg/* mpz_cdiv_r_2exp, mpz_fdiv_r_2exp -- remainder from mpz divided by 2^n.
4a1767b4Smrg
d25e02daSmrgCopyright 2001, 2002, 2004, 2012 Free Software Foundation, Inc.
4a1767b4Smrg
4a1767b4SmrgThis file is part of the GNU MP Library.
4a1767b4Smrg
4a1767b4SmrgThe GNU MP Library is free software; you can redistribute it and/or modify
*f81b1c5bSmrgit under the terms of either:
*f81b1c5bSmrg
*f81b1c5bSmrg  * the GNU Lesser General Public License as published by the Free
*f81b1c5bSmrg    Software Foundation; either version 3 of the License, or (at your
4a1767b4Smrg    option) any later version.
4a1767b4Smrg
*f81b1c5bSmrgor
*f81b1c5bSmrg
*f81b1c5bSmrg  * the GNU General Public License as published by the Free Software
*f81b1c5bSmrg    Foundation; either version 2 of the License, or (at your option) any
*f81b1c5bSmrg    later version.
*f81b1c5bSmrg
*f81b1c5bSmrgor both in parallel, as here.
*f81b1c5bSmrg
4a1767b4SmrgThe GNU MP Library is distributed in the hope that it will be useful, but
4a1767b4SmrgWITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
*f81b1c5bSmrgor FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
*f81b1c5bSmrgfor more details.
4a1767b4Smrg
*f81b1c5bSmrgYou should have received copies of the GNU General Public License and the
*f81b1c5bSmrgGNU Lesser General Public License along with the GNU MP Library.  If not,
*f81b1c5bSmrgsee https://www.gnu.org/licenses/.  */
4a1767b4Smrg
4a1767b4Smrg#include "gmp-impl.h"
4a1767b4Smrg
4a1767b4Smrg
4a1767b4Smrg/* Bit mask of "n" least significant bits of a limb.  "n" is used directly
   as a shift count, so it must be smaller than the width of a limb; the
   uses below always pass cnt after it has been reduced modulo
   GMP_NUMB_BITS, giving an empty mask (0) when n is 0. */
4a1767b4Smrg#define LOW_MASK(n)   ((CNST_LIMB(1) << (n)) - 1)
4a1767b4Smrg
4a1767b4Smrg
4a1767b4Smrg/* dir==1 for ceil, dir==-1 for floor.

   The worker is declared as __gmpz_cfdiv_r_2exp and reached through the
   cfdiv_r_2exp() macro, which passes its four arguments through
   REGPARM_3_1.  NOTE(review): REGPARM_3_1 and REGPARM_ATTR are defined
   outside this file (presumably in gmp-impl.h) and look like they select a
   register-argument calling convention where available -- confirm there
   before changing the argument list or order. */
4a1767b4Smrg
d25e02daSmrgstatic void __gmpz_cfdiv_r_2exp (REGPARM_3_1 (mpz_ptr, mpz_srcptr, mp_bitcnt_t, int)) REGPARM_ATTR (1);
4a1767b4Smrg#define cfdiv_r_2exp(w,u,cnt,dir)  __gmpz_cfdiv_r_2exp (REGPARM_3_1 (w, u, cnt, dir))
4a1767b4Smrg
/* Set w to the remainder of u divided by 2^cnt, with the quotient rounded
   towards +infinity (dir==1) or towards -infinity (dir==-1).

   w may be the same object as u; that case is handled in place.

   Outline:
     - u == 0 gives w = 0.
     - If the sign of u and dir differ, rounding is towards zero: the result
       is the low cnt bits of |u|, carrying the sign of u.
     - Otherwise rounding is away from zero: if the low cnt bits of |u| are
       all zero the result is 0, else the result has magnitude
       2^cnt - (|u| mod 2^cnt) and the opposite sign to u.
   Both non-trivial paths finish in the common tail that masks the top limb
   to cnt%GMP_NUMB_BITS bits and strips high zero limbs. */
4a1767b4SmrgREGPARM_ATTR (1) static void
4a1767b4Smrgcfdiv_r_2exp (mpz_ptr w, mpz_srcptr u, mp_bitcnt_t cnt, int dir)
4a1767b4Smrg{
4a1767b4Smrg  mp_size_t  usize, abs_usize, limb_cnt, i;
4a1767b4Smrg  mp_srcptr  up;
4a1767b4Smrg  mp_ptr     wp;
4a1767b4Smrg  mp_limb_t  high;
4a1767b4Smrg
4a1767b4Smrg  usize = SIZ(u);
4a1767b4Smrg  if (usize == 0)
4a1767b4Smrg    {
4a1767b4Smrg      SIZ(w) = 0;
4a1767b4Smrg      return;
4a1767b4Smrg    }
4a1767b4Smrg
  /* Split the bit count into whole limbs (limb_cnt) and the leftover bits
     in the next limb (cnt, now in the range 0 .. GMP_NUMB_BITS-1). */
4a1767b4Smrg  limb_cnt = cnt / GMP_NUMB_BITS;
4a1767b4Smrg  cnt %= GMP_NUMB_BITS;
4a1767b4Smrg  abs_usize = ABS (usize);
4a1767b4Smrg
4a1767b4Smrg  /* The truncate path only allocates w when w!=u, and the negate path
4a1767b4Smrg     fetches PTR(u) again after its MPZ_REALLOC, so fetch PTR(u) early */
4a1767b4Smrg  up = PTR(u);
4a1767b4Smrg
  /* The xor is negative exactly when usize and dir have opposite signs */
4a1767b4Smrg  if ((usize ^ dir) < 0)
4a1767b4Smrg    {
4a1767b4Smrg      /* Round towards zero, means just truncate */
4a1767b4Smrg
4a1767b4Smrg      if (w == u)
4a1767b4Smrg	{
4a1767b4Smrg	  /* if already smaller than limb_cnt then do nothing */
4a1767b4Smrg	  if (abs_usize <= limb_cnt)
4a1767b4Smrg	    return;
	  /* operate in place on u's limbs; w and u are the same object, so
	     writing through the source pointer is intended here */
*f81b1c5bSmrg	  wp = (mp_ptr) up;
4a1767b4Smrg	}
4a1767b4Smrg      else
4a1767b4Smrg	{
	  /* at most limb_cnt+1 limbs of u can contribute to the result */
4a1767b4Smrg	  i = MIN (abs_usize, limb_cnt+1);
*f81b1c5bSmrg	  wp = MPZ_NEWALLOC (w, i);
4a1767b4Smrg	  MPN_COPY (wp, up, i);
4a1767b4Smrg
4a1767b4Smrg	  /* if smaller than limb_cnt then only the copy is needed */
4a1767b4Smrg	  if (abs_usize <= limb_cnt)
4a1767b4Smrg	    {
4a1767b4Smrg	      SIZ(w) = usize;
4a1767b4Smrg	      return;
4a1767b4Smrg	    }
4a1767b4Smrg	}
4a1767b4Smrg    }
4a1767b4Smrg  else
4a1767b4Smrg    {
4a1767b4Smrg      /* Round away from zero, means twos complement if non-zero */
4a1767b4Smrg
4a1767b4Smrg      /* if u!=0 and smaller than divisor, then must negate */
4a1767b4Smrg      if (abs_usize <= limb_cnt)
4a1767b4Smrg	goto negate;
4a1767b4Smrg
4a1767b4Smrg      /* if non-zero low limb, then must negate */
4a1767b4Smrg      for (i = 0; i < limb_cnt; i++)
4a1767b4Smrg	if (up[i] != 0)
4a1767b4Smrg	  goto negate;
4a1767b4Smrg
4a1767b4Smrg      /* if non-zero partial limb, then must negate */
4a1767b4Smrg      if ((up[limb_cnt] & LOW_MASK (cnt)) != 0)
4a1767b4Smrg	goto negate;
4a1767b4Smrg
4a1767b4Smrg      /* otherwise low bits of u are zero, so that's the result */
4a1767b4Smrg      SIZ(w) = 0;
4a1767b4Smrg      return;
4a1767b4Smrg
4a1767b4Smrg    negate:
4a1767b4Smrg      /* twos complement negation to get 2**cnt-u */
4a1767b4Smrg
      /* w needs limb_cnt+1 limbs.  PTR(u) is fetched again afterwards
	 because w may be u, in which case the earlier pointer may no longer
	 be valid (presumably MPZ_REALLOC can move the limbs -- it is
	 defined outside this file). */
d25e02daSmrg      wp = MPZ_REALLOC (w, limb_cnt+1);
4a1767b4Smrg      up = PTR(u);
4a1767b4Smrg
4a1767b4Smrg      /* Negate the limbs u has, then set any limbs above them to GMP_NUMB_MAX */
4a1767b4Smrg      i = MIN (abs_usize, limb_cnt+1);
      /* NOTE(review): ASSERT_CARRY presumably checks for a non-zero return
	 from mpn_neg; every path to "negate" has found (or, for a
	 normalized u shorter than limb_cnt limbs, implies) a non-zero limb
	 among the low i limbs -- confirm against gmp-impl.h. */
*f81b1c5bSmrg      ASSERT_CARRY (mpn_neg (wp, up, i));
4a1767b4Smrg      for ( ; i <= limb_cnt; i++)
4a1767b4Smrg	wp[i] = GMP_NUMB_MAX;
4a1767b4Smrg
      /* the result takes the opposite sign to u */
4a1767b4Smrg      usize = -usize;
4a1767b4Smrg    }
4a1767b4Smrg
4a1767b4Smrg  /* Mask the high limb */
4a1767b4Smrg  high = wp[limb_cnt];
4a1767b4Smrg  high &= LOW_MASK (cnt);
4a1767b4Smrg  wp[limb_cnt] = high;
4a1767b4Smrg
4a1767b4Smrg  /* Strip any consequent high zeros */
4a1767b4Smrg  while (high == 0)
4a1767b4Smrg    {
4a1767b4Smrg      limb_cnt--;
      /* every limb was zero, so the result is zero */
4a1767b4Smrg      if (limb_cnt < 0)
4a1767b4Smrg	{
4a1767b4Smrg	  SIZ(w) = 0;
4a1767b4Smrg	  return;
4a1767b4Smrg	}
4a1767b4Smrg      high = wp[limb_cnt];
4a1767b4Smrg    }
4a1767b4Smrg
  /* limb_cnt indexes the highest non-zero limb; convert it to a limb count
     and store it with the sign chosen above */
4a1767b4Smrg  limb_cnt++;
4a1767b4Smrg  SIZ(w) = (usize >= 0 ? limb_cnt : -limb_cnt);
4a1767b4Smrg}
4a1767b4Smrg
4a1767b4Smrg
/* Set w to the remainder of u divided by 2^cnt, rounding the quotient
   towards +infinity (ceiling); calls cfdiv_r_2exp with dir==1. */
4a1767b4Smrgvoid
4a1767b4Smrgmpz_cdiv_r_2exp (mpz_ptr w, mpz_srcptr u, mp_bitcnt_t cnt)
4a1767b4Smrg{
4a1767b4Smrg  cfdiv_r_2exp (w, u, cnt, 1);
4a1767b4Smrg}
4a1767b4Smrg
/* Set w to the remainder of u divided by 2^cnt, rounding the quotient
   towards -infinity (floor); calls cfdiv_r_2exp with dir==-1. */
4a1767b4Smrgvoid
4a1767b4Smrgmpz_fdiv_r_2exp (mpz_ptr w, mpz_srcptr u, mp_bitcnt_t cnt)
4a1767b4Smrg{
4a1767b4Smrg  cfdiv_r_2exp (w, u, cnt, -1);
4a1767b4Smrg}