1 1.1 mrg /* e_hypotl.c -- long double version of e_hypot.c. 2 1.1 mrg * Conversion to long double by Jakub Jelinek, jakub (at) redhat.com. 3 1.1 mrg */ 4 1.1 mrg 5 1.1 mrg /* 6 1.1 mrg * ==================================================== 7 1.1 mrg * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved. 8 1.1 mrg * 9 1.1 mrg * Developed at SunPro, a Sun Microsystems, Inc. business. 10 1.1 mrg * Permission to use, copy, modify, and distribute this 11 1.1 mrg * software is freely granted, provided that this notice 12 1.1 mrg * is preserved. 13 1.1 mrg * ==================================================== 14 1.1 mrg */ 15 1.1 mrg 16 1.1 mrg /* hypotq(x,y) 17 1.1 mrg * 18 1.1 mrg * Method : 19 1.1 mrg * If (assume round-to-nearest) z=x*x+y*y 20 1.1 mrg * has error less than sqrtq(2)/2 ulp, than 21 1.1 mrg * sqrtq(z) has error less than 1 ulp (exercise). 22 1.1 mrg * 23 1.1 mrg * So, compute sqrtq(x*x+y*y) with some care as 24 1.1 mrg * follows to get the error below 1 ulp: 25 1.1 mrg * 26 1.1 mrg * Assume x>y>0; 27 1.1 mrg * (if possible, set rounding to round-to-nearest) 28 1.1 mrg * 1. if x > 2y use 29 1.1 mrg * x1*x1+(y*y+(x2*(x+x1))) for x*x+y*y 30 1.1 mrg * where x1 = x with lower 64 bits cleared, x2 = x-x1; else 31 1.1 mrg * 2. if x <= 2y use 32 1.1 mrg * t1*y1+((x-y)*(x-y)+(t1*y2+t2*y)) 33 1.1 mrg * where t1 = 2x with lower 64 bits cleared, t2 = 2x-t1, 34 1.1 mrg * y1= y with lower 64 bits chopped, y2 = y-y1. 35 1.1 mrg * 36 1.1 mrg * NOTE: scaling may be necessary if some argument is too 37 1.1 mrg * large or too tiny 38 1.1 mrg * 39 1.1 mrg * Special cases: 40 1.1 mrg * hypotl(x,y) is INF if x or y is +INF or -INF; else 41 1.1 mrg * hypotl(x,y) is NAN if x or y is NAN. 42 1.1 mrg * 43 1.1 mrg * Accuracy: 44 1.1 mrg * hypotl(x,y) returns sqrtq(x^2+y^2) with error less 45 1.1 mrg * than 1 ulps (units in the last place) 46 1.1 mrg */ 47 1.1 mrg 48 1.1 mrg #include "quadmath-imp.h" 49 1.1 mrg 50 1.1 mrg __float128 51 1.1 mrg hypotq(__float128 x, __float128 y) 52 1.1 mrg { 53 1.1 mrg __float128 a,b,t1,t2,y1,y2,w; 54 1.1 mrg int64_t j,k,ha,hb; 55 1.1 mrg 56 1.1 mrg GET_FLT128_MSW64(ha,x); 57 1.1 mrg ha &= 0x7fffffffffffffffLL; 58 1.1 mrg GET_FLT128_MSW64(hb,y); 59 1.1 mrg hb &= 0x7fffffffffffffffLL; 60 1.1 mrg if(hb > ha) {a=y;b=x;j=ha; ha=hb;hb=j;} else {a=x;b=y;} 61 1.1 mrg SET_FLT128_MSW64(a,ha); /* a <- |a| */ 62 1.1 mrg SET_FLT128_MSW64(b,hb); /* b <- |b| */ 63 1.1 mrg if((ha-hb)>0x78000000000000LL) {return a+b;} /* x/y > 2**120 */ 64 1.1 mrg k=0; 65 1.1 mrg if(ha > 0x5f3f000000000000LL) { /* a>2**8000 */ 66 1.1 mrg if(ha >= 0x7fff000000000000LL) { /* Inf or NaN */ 67 1.1 mrg uint64_t low; 68 1.1 mrg w = a+b; /* for sNaN */ 69 1.1 mrg if (issignalingq (a) || issignalingq (b)) 70 1.1 mrg return w; 71 1.1 mrg GET_FLT128_LSW64(low,a); 72 1.1 mrg if(((ha&0xffffffffffffLL)|low)==0) w = a; 73 1.1 mrg GET_FLT128_LSW64(low,b); 74 1.1 mrg if(((hb^0x7fff000000000000LL)|low)==0) w = b; 75 1.1 mrg return w; 76 1.1 mrg } 77 1.1 mrg /* scale a and b by 2**-9600 */ 78 1.1 mrg ha -= 0x2580000000000000LL; 79 1.1 mrg hb -= 0x2580000000000000LL; k += 9600; 80 1.1 mrg SET_FLT128_MSW64(a,ha); 81 1.1 mrg SET_FLT128_MSW64(b,hb); 82 1.1 mrg } 83 1.1 mrg if(hb < 0x20bf000000000000LL) { /* b < 2**-8000 */ 84 1.1 mrg if(hb <= 0x0000ffffffffffffLL) { /* subnormal b or 0 */ 85 1.1 mrg uint64_t low; 86 1.1 mrg GET_FLT128_LSW64(low,b); 87 1.1 mrg if((hb|low)==0) return a; 88 1.1 mrg t1=0; 89 1.1 mrg SET_FLT128_MSW64(t1,0x7ffd000000000000LL); /* t1=2^16382 */ 90 1.1 mrg b *= t1; 91 1.1 mrg a *= t1; 92 1.1 mrg k -= 16382; 93 1.1 mrg GET_FLT128_MSW64 (ha, a); 94 1.1 mrg GET_FLT128_MSW64 (hb, b); 95 1.1 mrg if (hb > ha) 96 1.1 mrg { 97 1.1 mrg t1 = a; 98 1.1 mrg a = b; 99 1.1 mrg b = t1; 100 1.1 mrg j = ha; 101 1.1 mrg ha = hb; 102 1.1 mrg hb = j; 103 1.1 mrg } 104 1.1 mrg } else { /* scale a and b by 2^9600 */ 105 1.1 mrg ha += 0x2580000000000000LL; /* a *= 2^9600 */ 106 1.1 mrg hb += 0x2580000000000000LL; /* b *= 2^9600 */ 107 1.1 mrg k -= 9600; 108 1.1 mrg SET_FLT128_MSW64(a,ha); 109 1.1 mrg SET_FLT128_MSW64(b,hb); 110 1.1 mrg } 111 1.1 mrg } 112 1.1 mrg /* medium size a and b */ 113 1.1 mrg w = a-b; 114 1.1 mrg if (w>b) { 115 1.1 mrg t1 = 0; 116 1.1 mrg SET_FLT128_MSW64(t1,ha); 117 1.1 mrg t2 = a-t1; 118 1.1 mrg w = sqrtq(t1*t1-(b*(-b)-t2*(a+t1))); 119 1.1 mrg } else { 120 1.1 mrg a = a+a; 121 1.1 mrg y1 = 0; 122 1.1 mrg SET_FLT128_MSW64(y1,hb); 123 1.1 mrg y2 = b - y1; 124 1.1 mrg t1 = 0; 125 1.1 mrg SET_FLT128_MSW64(t1,ha+0x0001000000000000LL); 126 1.1 mrg t2 = a - t1; 127 1.1 mrg w = sqrtq(t1*y1-(w*(-w)-(t1*y2+t2*b))); 128 1.1 mrg } 129 1.1 mrg if(k!=0) { 130 1.1 mrg uint64_t high; 131 1.1 mrg t1 = 1; 132 1.1 mrg GET_FLT128_MSW64(high,t1); 133 1.1 mrg SET_FLT128_MSW64(t1,high+(k<<48)); 134 1.1 mrg w *= t1; 135 1.1 mrg math_check_force_underflow_nonneg (w); 136 1.1 mrg return w; 137 1.1 mrg } else return w; 138 1.1 mrg } 139