/*	$NetBSD: n_support.c,v 1.3.10.1 2002/06/18 13:41:24 lukem Exp $	*/
/*
 * Copyright (c) 1985, 1993
 *	The Regents of the University of California.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. All advertising materials mentioning features or use of this software
 *    must display the following acknowledgement:
 *	This product includes software developed by the University of
 *	California, Berkeley and its contributors.
 * 4. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

#ifndef lint
static char sccsid[] = "@(#)support.c	8.1 (Berkeley) 6/4/93";
#endif /* not lint */

/*
 * Some IEEE standard 754 recommended functions and remainder and sqrt for
 * supporting the C elementary functions.
 ******************************************************************************
 * WARNING:
 *	These routines were developed (in double precision) to support the C
 * elementary functions temporarily.  They are not universal, and some of them
 * are very slow (in particular, drem and sqrt are extremely inefficient).
 * Each computer system should have its own implementation of these functions,
 * written in its own assembler.
 ******************************************************************************
 *
 * IEEE 754 required operations:
 *     drem(x,p)
 *              returns  x REM p  =  x - [x/p]*p , where [x/p] is the integer
 *              nearest x/p; in the halfway case, choose the even one.
 *     sqrt(x)
 *              returns the square root of x correctly rounded according to
 *              the rounding mode.
 *
 * IEEE 754 recommended functions:
 * (a) copysign(x,y)
 *              returns x with the sign of y.
 * (b) scalb(x,N)
 *              returns  x * (2**N), for integer values N.
 * (c) logb(x)
 *              returns the unbiased exponent of x, a signed integer in
 *              double precision, except that logb(0) is -INF, logb(INF)
 *              is +INF, and logb(NAN) is that NAN.
 * (d) finite(x)
 *              returns the value TRUE if -INF < x < +INF and returns
 *              FALSE otherwise.
 *
 *
 * CODED IN C BY K.C. NG, 11/25/84;
 * REVISED BY K.C. NG on 1/22/85, 2/13/85, 3/24/85.
 */
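
/*
 * Illustrative usage sketch, kept out of the build with #if 0: the calls
 * below follow directly from the definitions above.  The function name
 * "example_usage" is hypothetical and not part of this library.
 */
#if 0
static void
example_usage(void)
{
        double r;

        r = copysign(3.0, -0.5);        /* -3.0: magnitude of x, sign of y */
        r = scalb(1.5, 4);              /* 24.0: 1.5 * 2**4 */
        r = logb(24.0);                 /* 4.0:  24 = 1.5 * 2**4 */
        r = drem(5.0, 2.0);             /* 1.0:  [5/2] rounds to the even 2, 5 - 2*2 */
        (void)finite(r);                /* 1 for finite r, 0 for +-INF (and NaN) */
}
#endif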

#include "mathimpl.h"
#include "trig.h"

#if defined(__vax__)||defined(tahoe)	/* VAX D format */
#include <errno.h>
static const unsigned short msign=0x7fff , mexp =0x7f80 ;
static const short  prep1=57, gap=7, bias=129           ;
static const double novf=1.7E38, nunf=3.0E-39 ;
#else	/* defined(__vax__)||defined(tahoe) */
static const unsigned short msign=0x7fff, mexp =0x7ff0  ;
static const short prep1=54, gap=4, bias=1023           ;
static const double novf=1.7E308, nunf=3.0E-308;
#endif	/* defined(__vax__)||defined(tahoe) */
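
/*
 * Sketch (not compiled) of what the constants above encode, shown for the
 * IEEE case: mexp masks the exponent bits in the 16-bit word holding the
 * sign and exponent, gap is the shift down to that field, and bias is the
 * exponent bias (the VAX D-format block is analogous).  Like the code
 * below, the sketch assumes this word is the first unsigned short of the
 * double in memory; "example_exponent" is a hypothetical helper.
 */
#if 0
static int
example_exponent(double x)              /* cf. logb() below */
{
        unsigned short w = *(unsigned short *)&x;

        return (int)((w & mexp) >> gap) - bias; /* unbiased exponent */
}
#endif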

double
scalb(double x, int N)
{
        int k;

#ifdef national
        unsigned short *px=(unsigned short *) &x + 3;
#else	/* national */
        unsigned short *px=(unsigned short *) &x;
#endif	/* national */

        if( x == __zero )  return(x);

#if defined(__vax__)||defined(tahoe)
        if( (k= *px & mexp ) != ~msign ) {
            if (N < -260)
                return(nunf*nunf);
            else if (N > 260) {
                return(copysign(infnan(ERANGE),x));
            }
#else	/* defined(__vax__)||defined(tahoe) */
        if( (k= *px & mexp ) != mexp ) {
            if( N<-2100) return(nunf*nunf); else if(N>2100) return(novf+novf);
            if( k == 0 ) {
                 x *= scalb(1.0,(int)prep1);  N -= prep1; return(scalb(x,N));}
#endif	/* defined(__vax__)||defined(tahoe) */

            if((k = (k>>gap)+ N) > 0 )
                if( k < (mexp>>gap) ) *px = (*px&~mexp) | (k<<gap);
                else x=novf+novf;               /* overflow */
            else
                if( k > -prep1 )
                                        /* gradual underflow */
                        {*px=(*px&~mexp)|(short)(1<<gap); x *= scalb(1.0,k-1);}
                else
                return(nunf*nunf);
            }
        return(x);
}


double
copysign(double x, double y)
{
#ifdef national
        unsigned short  *px=(unsigned short *) &x+3,
                        *py=(unsigned short *) &y+3;
#else	/* national */
        unsigned short  *px=(unsigned short *) &x,
                        *py=(unsigned short *) &y;
#endif	/* national */

#if defined(__vax__)||defined(tahoe)
        if ( (*px & mexp) == 0 ) return(x);
#endif	/* defined(__vax__)||defined(tahoe) */

        *px = ( *px & msign ) | ( *py & ~msign );
        return(x);
}

double
logb(double x)
{

#ifdef national
        short *px=(short *) &x+3, k;
#else	/* national */
        short *px=(short *) &x, k;
#endif	/* national */

#if defined(__vax__)||defined(tahoe)
        return (int)(((*px&mexp)>>gap)-bias);
#else	/* defined(__vax__)||defined(tahoe) */
        if( (k= *px & mexp ) != mexp )
            if ( k != 0 )
                return ( (k>>gap) - bias );
            else if( x != __zero)
                return ( -1022.0 );
            else
                return(-(1.0/__zero));
        else if(x != x)
            return(x);
        else
            {*px &= msign; return(x);}
#endif	/* defined(__vax__)||defined(tahoe) */
}

int
finite(double x)
{
#if defined(__vax__)||defined(tahoe)
        return(1);
#else	/* defined(__vax__)||defined(tahoe) */
#ifdef national
        return( (*((short *) &x+3 ) & mexp ) != mexp );
#else	/* national */
        return( (*((short *) &x ) & mexp ) != mexp );
#endif	/* national */
#endif	/* defined(__vax__)||defined(tahoe) */
}

double
drem(double x, double p)
{
        short sign;
        double hp,dp,tmp;
        unsigned short  k;
#ifdef national
        unsigned short
              *px=(unsigned short *) &x  +3,
              *pp=(unsigned short *) &p  +3,
              *pd=(unsigned short *) &dp +3,
              *pt=(unsigned short *) &tmp+3;
#else	/* national */
        unsigned short
              *px=(unsigned short *) &x  ,
              *pp=(unsigned short *) &p  ,
              *pd=(unsigned short *) &dp ,
              *pt=(unsigned short *) &tmp;
#endif	/* national */

        *pp &= msign ;

#if defined(__vax__)||defined(tahoe)
        if( ( *px & mexp ) == ~msign )	/* is x a reserved operand? */
#else	/* defined(__vax__)||defined(tahoe) */
        if( ( *px & mexp ) == mexp )
#endif	/* defined(__vax__)||defined(tahoe) */
                return  (x-p)-(x-p);	/* create nan if x is inf */
        if (p == __zero) {
#if defined(__vax__)||defined(tahoe)
                return(infnan(EDOM));
#else	/* defined(__vax__)||defined(tahoe) */
                return __zero/__zero;
#endif	/* defined(__vax__)||defined(tahoe) */
        }

#if defined(__vax__)||defined(tahoe)
        if( ( *pp & mexp ) == ~msign )	/* is p a reserved operand? */
#else	/* defined(__vax__)||defined(tahoe) */
        if( ( *pp & mexp ) == mexp )
#endif	/* defined(__vax__)||defined(tahoe) */
                { if (p != p) return p; else return x;}

        else  if ( ((*pp & mexp)>>gap) <= 1 )
                /* subnormal p, or almost subnormal p */
            { double b; b=scalb(1.0,(int)prep1);
              p *= b; x = drem(x,p); x *= b; return(drem(x,p)/b);}
        else  if ( p >= novf/2)
            { p /= 2 ; x /= 2; return(drem(x,p)*2);}
        else
            {
                dp=p+p; hp=p/2;
                sign= *px & ~msign ;
                *px &= msign       ;
                while ( x > dp )
                    {
                        k=(*px & mexp) - (*pd & mexp) ;
                        tmp = dp ;
                        *pt += k ;

#if defined(__vax__)||defined(tahoe)
                        if( x < tmp ) *pt -= 128 ;
#else	/* defined(__vax__)||defined(tahoe) */
                        if( x < tmp ) *pt -= 16 ;
#endif	/* defined(__vax__)||defined(tahoe) */

                        x -= tmp ;
                    }
                if ( x > hp )
                    { x -= p ;  if ( x >= hp ) x -= p ; }

#if defined(__vax__)||defined(tahoe)
                if (x)
#endif	/* defined(__vax__)||defined(tahoe) */
                        *px ^= sign;
                return( x);

            }
}
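
/*
 * Sketch (not compiled): the defining property of the routine above is that
 * the result never exceeds half of |p| in magnitude.  "check_drem" is a
 * hypothetical helper used only for illustration; fabs() is assumed to be
 * available from the rest of the library.
 */
#if 0
static int
check_drem(double x, double p)
{
        double r = drem(x, p);

        return fabs(r) <= fabs(p) / 2;  /* holds for all finite x and p != 0 */
}
#endif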


double
sqrt(double x)
{
        double q,s,b,r;
        double t;
        int m,n,i;
#if defined(__vax__)||defined(tahoe)
        int k=54;
#else	/* defined(__vax__)||defined(tahoe) */
        int k=51;
#endif	/* defined(__vax__)||defined(tahoe) */

    /* sqrt(NaN) is NaN, sqrt(+-0) = +-0 */
        if(x!=x||x==__zero) return(x);

    /* sqrt(negative) is invalid */
        if(x<__zero) {
#if defined(__vax__)||defined(tahoe)
                return (infnan(EDOM));	/* NaN */
#else	/* defined(__vax__)||defined(tahoe) */
                return(__zero/__zero);
#endif	/* defined(__vax__)||defined(tahoe) */
        }

    /* sqrt(INF) is INF */
        if(!finite(x)) return(x);

    /* scale x to [1,4) */
        n=logb(x);
        x=scalb(x,-n);
        if((m=logb(x))!=0) x=scalb(x,-m);	/* subnormal number */
        m += n;
        n = m/2;
        if((n+n)!=m) {x *= 2; m -=1; n=m/2;}

    /* generate sqrt(x) bit by bit (accumulating in q) */
        q=1.0; s=4.0; x -= 1.0; r=1;
        for(i=1;i<=k;i++) {
            t=s+1; x *= 4; r /= 2;
            if(t<=x) {
                s=t+t+2, x -= t; q += r;}
            else
                s *= 2;
            }

    /* generate the last bit and determine the final rounding */
        r/=2; x *= 4;
        if(x==__zero) goto end; 100+r; /* trigger inexact flag */
        if(s<x) {
            q+=r; x -=s; s += 2; s *= 2; x *= 4;
            t = (x-s)-5;
            b=1.0+3*r/4;	if(b==1.0) goto end; /* b==1 : Round-to-zero */
            b=1.0+r/4;		if(b>1.0) t=1;	     /* b>1 : Round-to-(+INF) */
            if(t>=0) q+=r; }	      /* else: Round-to-nearest */
        else {
            s *= 2; x *= 4;
            t = (x-s)-1;
            b=1.0+3*r/4;	if(b==1.0) goto end;
            b=1.0+r/4;		if(b>1.0) t=1;
            if(t>=0) q+=r; }

end:        return(scalb(q,n));
}
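
/*
 * Sketch (not compiled): the same digit-by-digit idea as the loop above,
 * shown on 32-bit unsigned integers.  Each pass decides one bit of the
 * root, just as q above accumulates one binary digit per iteration.  The
 * name "isqrt_bitwise" is hypothetical and only illustrative.
 */
#if 0
static unsigned int
isqrt_bitwise(unsigned int x)
{
        unsigned int root = 0, bit = 1u << 30;  /* highest power of 4 in range */

        while (bit > x)
                bit >>= 2;
        while (bit != 0) {
                if (x >= root + bit) {          /* this bit belongs in the root */
                        x -= root + bit;
                        root = (root >> 1) + bit;
                } else
                        root >>= 1;
                bit >>= 2;
        }
        return root;                            /* floor(sqrt(x)) */
}
#endif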

#if 0
/* DREM(X,Y)
 * RETURN X REM Y =X-N*Y, N=[X/Y] ROUNDED (ROUNDED TO EVEN IN THE HALF WAY CASE)
 * DOUBLE PRECISION (VAX D format 56 bits, IEEE DOUBLE 53 BITS)
 * INTENDED FOR ASSEMBLY LANGUAGE
 * CODED IN C BY K.C. NG, 3/23/85, 4/8/85.
 *
 * Warning: this code should not get compiled in unless ALL of
 * the following machine-dependent routines are supplied.
 *
 * Required machine dependent functions (not on a VAX):
 *	swapINX(i): save inexact flag and reset it to "i"
 *	swapENI(e): save inexact enable and reset it to "e"
 */
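
/*
 * Sketch of one of the required routines on a machine with C99 <fenv.h>:
 * swapINX saves the inexact flag and resets it to "i".  The inexact
 * *enable* (swapENI) is a trap-enable bit with no portable C counterpart,
 * so it is not sketched here.  This is an illustrative stand-in, not the
 * intended machine-specific implementation.
 */
#include <fenv.h>

static int
swapINX(int i)
{
        int old = fetestexcept(FE_INEXACT) != 0;        /* save current flag */

        feclearexcept(FE_INEXACT);
        if (i)
                feraiseexcept(FE_INEXACT);              /* reset it to "i" */
        return old;
}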

double
drem(double x, double y)
{

#ifdef national		/* order of words in floating point number */
        static const int n0=3,n1=2,n2=1,n3=0;
#else	/* VAX, SUN, ZILOG, TAHOE */
        static const int n0=0,n1=1,n2=2,n3=3;
#endif

        static const unsigned short mexp =0x7ff0, m25 =0x0190, m57 =0x0390;
        double hy,y1,t,t1;
        short k;
        long n;
        int i,e;
        unsigned short xexp,yexp, *px =(unsigned short *) &x  ,
              nx,nf,      *py =(unsigned short *) &y  ,
              sign,       *pt =(unsigned short *) &t  ,
                          *pt1 =(unsigned short *) &t1 ;

        xexp = px[n0] & mexp ;	/* exponent of x */
        yexp = py[n0] & mexp ;	/* exponent of y */
        sign = px[n0] &0x8000;	/* sign of x */

/* return NaN if x is NaN, or y is NaN, or x is INF, or y is zero */
        if(x!=x) return(x); if(y!=y) return(y);	     /* x or y is NaN */
        if( xexp == mexp )   return(__zero/__zero);  /* x is INF */
        if(y==__zero) return(y/y);

/* save the inexact flag and inexact enable in i and e respectively
 * and reset them to zero
 */
        i=swapINX(0);	e=swapENI(0);

/* subnormal number */
        nx=0;
        if(yexp==0) {t=1.0,pt[n0]+=m57; y*=t; nx=m57;}

/* if y is tiny (biased exponent <= 57), scale up y to y*2**57 */
        if( yexp <= m57 ) {py[n0]+=m57; nx+=m57; yexp+=m57;}

        nf=nx;
        py[n0] &= 0x7fff;
        px[n0] &= 0x7fff;

/* mask off the least significant 27 bits of y */
        t=y; pt[n3]=0; pt[n2]&=0xf800; y1=t;

/* LOOP: argument reduction on x whenever x > y */
loop:
        while ( x > y )
        {
            t=y;
            t1=y1;
            xexp=px[n0]&mexp;	/* exponent of x */
            k=xexp-yexp-m25;
            if(k>0) 	/* if x/y >= 2**26, scale up y so that x/y < 2**26 */
                {pt[n0]+=k;pt1[n0]+=k;}
            n=x/t; x=(x-n*t1)-n*(t-t1);
        }
    /* end while (x > y) */

        if(nx!=0) {t=1.0; pt[n0]+=nx; x*=t; nx=0; goto loop;}

/* final adjustment */

        hy=y/2.0;
        if(x>hy||((x==hy)&&n%2==1)) x-=y;
        px[n0] ^= sign;
        if(nf!=0) { t=1.0; pt[n0]-=nf; x*=t;}

/* restore inexact flag and inexact enable */
        swapINX(i); swapENI(e);

        return(x);
}
#endif
429 1.1 ragge
430 1.1 ragge #if 0
431 1.1 ragge /* SQRT
432 1.1 ragge * RETURN CORRECTLY ROUNDED (ACCORDING TO THE ROUNDING MODE) SQRT
433 1.1 ragge * FOR IEEE DOUBLE PRECISION ONLY, INTENDED FOR ASSEMBLY LANGUAGE
434 1.1 ragge * CODED IN C BY K.C. NG, 3/22/85.
435 1.1 ragge *
436 1.1 ragge * Warning: this code should not get compiled in unless ALL of
437 1.1 ragge * the following machine-dependent routines are supplied.
438 1.3 simonb *
439 1.1 ragge * Required machine dependent functions:
440 1.1 ragge * swapINX(i) ...return the status of INEXACT flag and reset it to "i"
441 1.1 ragge * swapRM(r) ...return the current Rounding Mode and reset it to "r"
442 1.1 ragge * swapENI(e) ...return the status of inexact enable and reset it to "e"
443 1.1 ragge * addc(t) ...perform t=t+1 regarding t as a 64 bit unsigned integer
444 1.1 ragge * subc(t) ...perform t=t-1 regarding t as a 64 bit unsigned integer
445 1.1 ragge */
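
/*
 * Sketch of two of the required routines in portable C, as illustrative
 * stand-ins only: swapRM via the C99 <fenv.h> rounding-mode interface
 * (note the RN/RZ/RP/RM codes used below would still have to be mapped to
 * the corresponding FE_* macros), and addc by incrementing the 64-bit
 * pattern of the double; subc would decrement it analogously.
 */
#include <fenv.h>
#include <stdint.h>
#include <string.h>

static int
swapRM(int r)
{
        int old = fegetround();         /* save current rounding mode */

        fesetround(r);                  /* reset it to "r" (an FE_* value) */
        return old;
}

static double
addc(double t)                          /* t+1 with t viewed as a 64-bit integer */
{
        uint64_t u;

        memcpy(&u, &t, sizeof u);
        u++;
        memcpy(&t, &u, sizeof t);
        return t;
}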

static const unsigned long table[] = {
        0, 1204, 3062, 5746, 9193, 13348, 18162, 23592, 29598, 36145, 43202, 50740,
        58733, 67158, 75992, 85215, 83599, 71378, 60428, 50647, 41945, 34246, 27478,
        21581, 16499, 12183, 8588, 5674, 3403, 1742, 661, 130, };

double
newsqrt(double x)
{
        double y,z,t,addc(),subc();
        double const    b54=134217728.*134217728.; /* b54=2**54 */
        long mx,scalx;
        long const      mexp=0x7ff00000;
        int i,j,r,e,swapINX(),swapRM(),swapENI();
        unsigned long *py=(unsigned long *) &y   ,
                      *pt=(unsigned long *) &t   ,
                      *px=(unsigned long *) &x   ;
#ifdef national         /* ordering of word in a floating point number */
        const int n0=1, n1=0;
#else
        const int n0=0, n1=1;
#endif
/* Rounding Mode:  RN ...round-to-nearest
 *                 RZ ...round-towards 0
 *                 RP ...round-towards +INF
 *                 RM ...round-towards -INF
 */
        const int RN=0,RZ=1,RP=2,RM=3;
                                /* machine dependent: work on a Zilog Z8070
                                 * and a National 32081 & 16081
                                 */

/* exceptions */
        if(x!=x||x==0.0) return(x);  /* sqrt(NaN) is NaN, sqrt(+-0) = +-0 */
        if(x<0) return((x-x)/(x-x)); /* sqrt(negative) is invalid */
        if((mx=px[n0]&mexp)==mexp) return(x);  /* sqrt(+INF) is +INF */

/* save, reset, initialize */
        e=swapENI(0);   /* ...save and reset the inexact enable */
        i=swapINX(0);   /* ...save INEXACT flag */
        r=swapRM(RN);   /* ...save and reset the Rounding Mode to RN */
        scalx=0;

/* subnormal number, scale up x to x*2**54 */
        if(mx==0) {x *= b54 ; scalx-=0x01b00000;}

/* scale x to avoid intermediate over/underflow:
 * if (x > 2**512) x=x/2**512; if (x < 2**-512) x=x*2**512 */
        if(mx>0x5ff00000) {px[n0] -= 0x20000000; scalx+= 0x10000000;}
        if(mx<0x1ff00000) {px[n0] += 0x20000000; scalx-= 0x10000000;}

/* magic initial approximation to almost 8 sig. bits */
        py[n0]=(px[n0]>>1)+0x1ff80000;
        py[n0]=py[n0]-table[(py[n0]>>15)&31];

/* Heron's rule once with correction to improve y to almost 18 sig. bits */
        t=x/y; y=y+t; py[n0]=py[n0]-0x00100006; py[n1]=0;

/* triple to almost 56 sig. bits; now y approx. sqrt(x) to within 1 ulp */
        t=y*y; z=t; pt[n0]+=0x00100000; t+=z; z=(x-z)*y;
        t=z/(t+x) ;  pt[n0]+=0x00100000; y+=t;

/* twiddle last bit to force y correctly rounded */
        swapRM(RZ);     /* ...set Rounding Mode to round-toward-zero */
        swapINX(0);     /* ...clear INEXACT flag */
        swapENI(e);     /* ...restore inexact enable status */
        t=x/y;          /* ...chopped quotient, possibly inexact */
        j=swapINX(i);   /* ...read and restore inexact flag */
        if(j==0) { if(t==y) goto end; else t=subc(t); }  /* ...t=t-ulp */
        b54+0.1;        /* ..trigger inexact flag, sqrt(x) is inexact */
        if(r==RN) t=addc(t);            /* ...t=t+ulp */
        else if(r==RP) { t=addc(t);y=addc(y);}  /* ...t=t+ulp;y=y+ulp; */
        y=y+t;                          /* ...chopped sum */
        py[n0]=py[n0]-0x00100000;       /* ...correctly rounded sqrt(x) */
end:    py[n0]=py[n0]+scalx;    /* ...scale back y */
        swapRM(r);              /* ...restore Rounding Mode */
        return(y);
}
#endif
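
/*
 * Sketch (not compiled): the refinement step used in newsqrt above is
 * Heron's rule (Newton's iteration for y*y = x), which roughly doubles the
 * number of correct digits per step for a reasonable initial guess.
 * "heron_sqrt" is a hypothetical name used only to illustrate the idea.
 */
#if 0
static double
heron_sqrt(double x, double y0)         /* y0: initial guess, x > 0 */
{
        double y = y0;
        int i;

        for (i = 0; i < 6; i++)         /* a few steps are ample for double */
                y = 0.5 * (y + x / y);  /* y <- average of y and x/y */
        return y;
}
#endif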