src/ld128/e_hypotl.c

/* @(#)e_hypot.c 5.1 93/09/24 */
/*
 * ====================================================
 * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
 *
 * Developed at SunPro, a Sun Microsystems, Inc. business.
 * Permission to use, copy, modify, and distribute this
 * software is freely granted, provided that this notice
 * is preserved.
 * ====================================================
 */
49393c00Smartynas
/* hypotl(x,y)
 *
 * Method :
 *	If (assume round-to-nearest) z=x*x+y*y
 *	has error less than sqrtl(2)/2 ulp, then
 *	sqrtl(z) has error less than 1 ulp (exercise).
 *
 *	So, compute sqrtl(x*x+y*y) with some care as
 *	follows to get the error below 1 ulp:
 *
 *	Assume x>y>0;
 *	(if possible, set rounding to round-to-nearest)
 *	1. if x > 2y  use
 *		x1*x1+(y*y+(x2*(x+x1))) for x*x+y*y
 *	where x1 = x with lower 64 bits cleared, x2 = x-x1; else
 *	2. if x <= 2y use
 *		t1*yy1+((x-y)*(x-y)+(t1*y2+t2*y))
 *	where t1 = 2x with lower 64 bits cleared, t2 = 2x-t1,
 *	yy1= y with lower 64 bits chopped, y2 = y-yy1.
 *
 *	NOTE: scaling may be necessary if some argument is too
 *	      large or too tiny
 *
 * Special cases:
 *	hypotl(x,y) is INF if x or y is +INF or -INF; else
 *	hypotl(x,y) is NAN if x or y is NAN.
 *
 * Accuracy:
 * 	hypotl(x,y) returns sqrtl(x^2+y^2) with error less
 * 	than 1 ulp (unit in the last place)
 */
49393c00Smartynas
49393c00Smartynas#include <math.h>
49393c00Smartynas
49393c00Smartynas#include "math_private.h"
49393c00Smartynas
/*
 * hypotl(x, y): sqrtl(x*x + y*y) for a 128-bit long double, arranged so
 * that the intermediate squares neither overflow nor underflow.
 *
 * Outline:
 *   1. Order the arguments by their sign-stripped high 64-bit words so that
 *      a is the larger magnitude and b the smaller, and make both
 *      non-negative.
 *   2. If b is negligible next to a (ratio above 2**120), return a+b.
 *   3. Rescale by a power of two when a > 2**8000 or b < 2**-8000,
 *      remembering the exponent adjustment in k.
 *   4. Evaluate a*a + b*b with the split-product formulas described in the
 *      comment at the top of this file, then take sqrtl().
 *   5. Undo the scaling by multiplying with 2**k.
 *
 * Special cases (handled in the Inf/NaN branch below): the result is +Inf
 * when either argument is infinite, even if the other is a NaN; otherwise
 * it is a NaN when either argument is a NaN.
 *
 * GET_LDOUBLE_MSW64, SET_LDOUBLE_MSW64 and GET_LDOUBLE_LSW64 come from
 * math_private.h; they are used here to read and write the upper and lower
 * 64-bit halves of the long double encoding.
 */
long double
hypotl(long double x, long double y)
{
	long double a, b, t1, t2, yy1, y2, w;
	int64_t j, k, ha, hb;

	/* High words with the sign bit masked off. */
	GET_LDOUBLE_MSW64(ha, x);
	ha &= 0x7fffffffffffffffLL;
	GET_LDOUBLE_MSW64(hb, y);
	hb &= 0x7fffffffffffffffLL;

	/* Make a the operand with the larger high word. */
	if (hb > ha) {
		a = y;
		b = x;
		j = ha;
		ha = hb;
		hb = j;
	} else {
		a = x;
		b = y;
	}
	SET_LDOUBLE_MSW64(a, ha);	/* a <- |a| */
	SET_LDOUBLE_MSW64(b, hb);	/* b <- |b| */

	/* x/y > 2**120: b cannot affect the rounded result beyond a+b. */
	if ((ha - hb) > 0x78000000000000LL)
		return a + b;

	k = 0;
	if (ha > 0x5f3f000000000000LL) {	/* a > 2**8000 */
		if (ha >= 0x7fff000000000000LL) {	/* Inf or NaN */
			u_int64_t low;

			w = a + b;		/* for sNaN */
			/* An infinite operand overrides a NaN in the other. */
			GET_LDOUBLE_LSW64(low, a);
			if (((ha & 0xffffffffffffLL) | low) == 0)
				w = a;
			GET_LDOUBLE_LSW64(low, b);
			if (((hb ^ 0x7fff000000000000LL) | low) == 0)
				w = b;
			return w;
		}
		/* scale a and b by 2**-9600 (0x2580 == 9600 in the exponent) */
		ha -= 0x2580000000000000LL;
		hb -= 0x2580000000000000LL;
		k += 9600;
		SET_LDOUBLE_MSW64(a, ha);
		SET_LDOUBLE_MSW64(b, hb);
	}
	if (hb < 0x20bf000000000000LL) {	/* b < 2**-8000 */
		if (hb <= 0x0000ffffffffffffLL) {	/* subnormal b or 0 */
			u_int64_t low;

			GET_LDOUBLE_LSW64(low, b);
			if ((hb | low) == 0)
				return a;	/* b == 0 */
			/*
			 * The exponent field cannot simply be bumped for a
			 * subnormal, so scale by an actual multiplication.
			 */
			t1 = 0;
			SET_LDOUBLE_MSW64(t1, 0x7ffd000000000000LL); /* t1=2^16382 */
			b *= t1;
			a *= t1;
			k -= 16382;
			/*
			 * The multiplications changed the encodings, so the
			 * cached high words are stale.  Reload them: the
			 * splitting step below builds t1 and yy1 from ha/hb
			 * and needs the exponents of the scaled values.
			 */
			GET_LDOUBLE_MSW64(ha, a);
			GET_LDOUBLE_MSW64(hb, b);
			/*
			 * Two subnormals with equal high words may have had
			 * a < b in the low word; after normalisation that
			 * shows up in the high words, so restore a >= b.
			 */
			if (hb > ha) {
				t1 = a;
				a = b;
				b = t1;
				j = ha;
				ha = hb;
				hb = j;
			}
		} else {		/* scale a and b by 2^9600 */
			ha += 0x2580000000000000LL;	/* a *= 2^9600 */
			hb += 0x2580000000000000LL;	/* b *= 2^9600 */
			k -= 9600;
			SET_LDOUBLE_MSW64(a, ha);
			SET_LDOUBLE_MSW64(b, hb);
		}
	}

	/* medium size a and b */
	w = a - b;
	if (w > b) {
		/* a > 2b: split a into t1 (low 64 bits cleared) + t2. */
		t1 = 0;
		SET_LDOUBLE_MSW64(t1, ha);
		t2 = a - t1;
		w = sqrtl(t1 * t1 - (b * (-b) - t2 * (a + t1)));
	} else {
		/* a <= 2b: split 2a into t1 + t2 and b into yy1 + y2. */
		a = a + a;
		yy1 = 0;
		SET_LDOUBLE_MSW64(yy1, hb);
		y2 = b - yy1;
		t1 = 0;
		/* ha plus one exponent step is the high word of 2a. */
		SET_LDOUBLE_MSW64(t1, ha + 0x0001000000000000LL);
		t2 = a - t1;
		w = sqrtl(t1 * yy1 - (w * (-w) - (t1 * y2 + t2 * b)));
	}

	if (k != 0) {
		u_int64_t high;

		/* Build 2**k by adding k to the exponent field of 1.0L. */
		t1 = 1.0L;
		GET_LDOUBLE_MSW64(high, t1);
		/*
		 * k is negative on the small-argument paths; shift it as an
		 * unsigned value because left-shifting a negative signed
		 * integer is undefined behaviour.
		 */
		SET_LDOUBLE_MSW64(t1, high + ((u_int64_t)k << 48));
		return t1 * w;
	}
	return w;
}
/* DEF_STD is provided by the project's headers, not by this file. */
DEF_STD(hypotl);