1*05a0b428SJohn Marino /* @(#)e_hypot.c 5.1 93/09/24 */
2*05a0b428SJohn Marino /*
3*05a0b428SJohn Marino  * ====================================================
4*05a0b428SJohn Marino  * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
5*05a0b428SJohn Marino  *
6*05a0b428SJohn Marino  * Developed at SunPro, a Sun Microsystems, Inc. business.
7*05a0b428SJohn Marino  * Permission to use, copy, modify, and distribute this
8*05a0b428SJohn Marino  * software is freely granted, provided that this notice
9*05a0b428SJohn Marino  * is preserved.
10*05a0b428SJohn Marino  * ====================================================
11*05a0b428SJohn Marino  */
12*05a0b428SJohn Marino 
/* hypotl(x,y)
 *
 * Method :
 *	If (assume round-to-nearest) z=x*x+y*y
 *	has error less than sqrt(2)/2 ulp, then
 *	sqrt(z) has error less than 1 ulp (exercise).
 *
 *	So, compute sqrt(x*x+y*y) with some care as
 *	follows to get the error below 1 ulp:
 *
 *	Assume x>y>0;
 *	(if possible, set rounding to round-to-nearest)
 *	1. if x > 2y  use
 *		x1*x1+(y*y+(x2*(x+x1))) for x*x+y*y
 *	where x1 = x with lower 32 bits cleared, x2 = x-x1; else
 *	2. if x <= 2y use
 *		t1*yy1+((x-y)*(x-y)+(t1*y2+t2*y))
 *	where t1 = 2x with lower 32 bits cleared, t2 = 2x-t1,
 *	yy1= y with lower 32 bits chopped, y2 = y-yy1.
 *
 *	NOTE: scaling may be necessary if some argument is too
 *	      large or too tiny
 *
 * Special cases:
 *	hypotl(x,y) is INF if x or y is +INF or -INF; else
 *	hypotl(x,y) is NAN if x or y is NAN.
 *
 * Accuracy:
 *	hypotl(x,y) returns sqrt(x^2+y^2) with error less
 *	than 1 ulp (unit in the last place)
 */
44*05a0b428SJohn Marino 
45*05a0b428SJohn Marino #include <math.h>
46*05a0b428SJohn Marino 
47*05a0b428SJohn Marino #include "math_private.h"
48*05a0b428SJohn Marino 
/*
 * hypotl(x, y): sqrt(x*x + y*y) for the 80-bit extended long double,
 * arranged so that the intermediate squares neither overflow nor
 * underflow.
 *
 * The operands are ordered by exponent (a gets the larger one, b the
 * smaller, both made non-negative), rescaled by a power of two when
 * they are very large or very small, combined with a split
 * multiplication, and the result is scaled back at the end.
 *
 * Returns +Inf when either argument is infinite (even if the other is
 * a NaN); otherwise a NaN when either argument is a NaN.
 *
 * NOTE(review): the GET_/SET_LDOUBLE_* accessors come from
 * math_private.h; this code assumes the layout (16-bit sign+exponent,
 * 32-bit high mantissa with explicit integer bit in bit 31, 32-bit low
 * mantissa) -- confirm against that header.
 */
long double
hypotl(long double x, long double y)
{
	long double a,b,t1,t2,yy1,y2,w;
	u_int32_t j,k,ea,eb;

	/* Biased exponents with the sign bit masked off. */
	GET_LDOUBLE_EXP(ea,x);
	ea &= 0x7fff;
	GET_LDOUBLE_EXP(eb,y);
	eb &= 0x7fff;
	/* a takes the operand with the larger exponent field. */
	if(eb > ea) {a=y;b=x;j=ea; ea=eb;eb=j;} else {a=x;b=y;}
	SET_LDOUBLE_EXP(a,ea);	/* a <- |a| */
	SET_LDOUBLE_EXP(b,eb);	/* b <- |b| */
	if((ea-eb)>0x46) {return a+b;} /* x/y > 2**70 */
	/*
	 * k is the power of two by which the result must be multiplied
	 * at the end.  It is unsigned, so negative scalings are held
	 * modulo 2^32; the final "es+k" wraps back to the right value.
	 */
	k=0;
	if(ea > 0x5f3f) {	/* a>2**8000 */
	   if(ea == 0x7fff) {	/* Inf or NaN */
	       u_int32_t es,high,low;
	       w = a+b;			/* for sNaN */
	       /* An all-zero fraction (integer bit ignored) means Inf. */
	       GET_LDOUBLE_WORDS(es,high,low,a);
	       if(((high&0x7fffffff)|low)==0) w = a;
	       GET_LDOUBLE_WORDS(es,high,low,b);
	       if(((eb^0x7fff)|(high&0x7fffffff)|low)==0) w = b;
	       return w;
	   }
	   /* scale a and b by 2**-9600 */
	   ea -= 0x2580; eb -= 0x2580;	k += 9600;
	   SET_LDOUBLE_EXP(a,ea);
	   SET_LDOUBLE_EXP(b,eb);
	}
	if(eb < 0x20bf) {	/* b < 2**-8000 */
	    if(eb == 0) {	/* subnormal b or 0 */
		u_int32_t es,high,low;
		GET_LDOUBLE_WORDS(es,high,low,b);
		if((high|low)==0) return a;
		/*
		 * t1 = 2^16382.  The explicit integer bit (bit 31 of
		 * the high mantissa word) must be set: a non-zero
		 * exponent with that bit clear is an unsupported
		 * "unnormal" encoding and the multiplications below
		 * would produce NaN.
		 */
		SET_LDOUBLE_WORDS(t1, 0x7ffd, 0x80000000, 0);
		b *= t1;
		a *= t1;
		k -= 16382;
		/*
		 * The multiplications changed the exponents behind the
		 * back of ea/eb, which are used below to rebuild the
		 * truncated operands, so re-read them (a and b are
		 * non-negative, so no sign bit to mask).  If both
		 * inputs were subnormal their exponent fields tied at
		 * zero and a may actually be the smaller one; restore
		 * the a >= b ordering by exponent.
		 */
		GET_LDOUBLE_EXP(ea,a);
		GET_LDOUBLE_EXP(eb,b);
		if(eb > ea) {t1=a;a=b;b=t1;j=ea;ea=eb;eb=j;}
	    } else {		/* scale a and b by 2^9600 */
		ea += 0x2580;	/* a *= 2^9600 */
		eb += 0x2580;	/* b *= 2^9600 */
		k -= 9600;
		SET_LDOUBLE_EXP(a,ea);
		SET_LDOUBLE_EXP(b,eb);
	    }
	}
    /* medium size a and b */
	w = a-b;
	if (w>b) {
	    /* a > 2b: t1 = a with the low 32 mantissa bits cleared. */
	    u_int32_t high;
	    GET_LDOUBLE_MSW(high,a);
	    SET_LDOUBLE_WORDS(t1,ea,high,0);
	    t2 = a-t1;
	    /* t1*t1 + b*b + t2*(a+t1)  ==  a*a + b*b */
	    w  = sqrtl(t1*t1-(b*(-b)-t2*(a+t1)));
	} else {
	    /*
	     * a <= 2b: yy1 = b with the low 32 mantissa bits cleared,
	     * t1 = 2a with the low 32 mantissa bits cleared.
	     */
	    u_int32_t high;
	    GET_LDOUBLE_MSW(high,b);
	    a  = a+a;
	    SET_LDOUBLE_WORDS(yy1,eb,high,0);
	    y2 = b - yy1;
	    GET_LDOUBLE_MSW(high,a);
	    SET_LDOUBLE_WORDS(t1,ea+1,high,0);	/* doubling bumped the exponent */
	    t2 = a - t1;
	    /* 2a*b + (a-b)^2  ==  a*a + b*b, with 2a*b split up */
	    w  = sqrtl(t1*yy1-(w*(-w)-(t1*y2+t2*b)));
	}
	if(k!=0) {
	    /* Undo the scaling: multiply by 2^k built from 1.0. */
	    u_int32_t es;
	    t1 = 1.0;
	    GET_LDOUBLE_EXP(es,t1);
	    SET_LDOUBLE_EXP(t1,es+k);
	    return t1*w;
	} else return w;
}
123