msun/src/e_sqrt.c

141296Sdas
141296Sdas/* @(#)e_sqrt.c 1.3 95/01/18 */
2116Sjkh/*
2116Sjkh * ====================================================
2116Sjkh * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
2116Sjkh *
141296Sdas * Developed at SunSoft, a Sun Microsystems, Inc. business.
2116Sjkh * Permission to use, copy, modify, and distribute this
141296Sdas * software is freely granted, provided that this notice
2116Sjkh * is preserved.
2116Sjkh * ====================================================
2116Sjkh */
2116Sjkh
176720Sdas#include <sys/cdefs.h>
176720Sdas__FBSDID("$FreeBSD$");
2116Sjkh
2116Sjkh/* __ieee754_sqrt(x)
2116Sjkh * Return correctly rounded sqrt.
2116Sjkh *           ------------------------------------------
2116Sjkh *	     |  Use the hardware sqrt if you have one |
2116Sjkh *           ------------------------------------------
141296Sdas * Method:
141296Sdas *   Bit by bit method using integer arithmetic. (Slow, but portable)
2116Sjkh *   1. Normalization
141296Sdas *	Scale x to y in [1,4) with even powers of 2:
2116Sjkh *	find an integer k such that  1 <= (y=x*2^(2k)) < 4, then
2116Sjkh *		sqrt(x) = 2^k * sqrt(y)
2116Sjkh *   2. Bit by bit computation
2116Sjkh *	Let q  = sqrt(y) truncated to i bit after binary point (q = 1),
2116Sjkh *	     i							 0
2116Sjkh *                                     i+1         2
2116Sjkh *	    s  = 2*q , and	y  =  2   * ( y - q  ).		(1)
2116Sjkh *	     i      i            i                 i
141296Sdas *
141296Sdas *	To compute q    from q , one checks whether
141296Sdas *		    i+1       i
2116Sjkh *
2116Sjkh *			      -(i+1) 2
2116Sjkh *			(q + 2      ) <= y.			(2)
2116Sjkh *     			  i
2116Sjkh *							      -(i+1)
2116Sjkh *	If (2) is false, then q   = q ; otherwise q   = q  + 2      .
2116Sjkh *		 	       i+1   i             i+1   i
2116Sjkh *
2116Sjkh *	With some algebraic manipulation, it is not difficult to see
141296Sdas *	that (2) is equivalent to
2116Sjkh *                             -(i+1)
2116Sjkh *			s  +  2       <= y			(3)
2116Sjkh *			 i                i
2116Sjkh *
141296Sdas *	The advantage of (3) is that s  and y  can be computed by
2116Sjkh *				      i      i
2116Sjkh *	the following recurrence formula:
2116Sjkh *	    if (3) is false
2116Sjkh *
2116Sjkh *	    s     =  s  ,	y    = y   ;			(4)
2116Sjkh *	     i+1      i		 i+1    i
2116Sjkh *
2116Sjkh *	    otherwise,
2116Sjkh *                         -i                     -(i+1)
2116Sjkh *	    s	  =  s  + 2  ,  y    = y  -  s  - 2  		(5)
2116Sjkh *           i+1      i          i+1    i     i
141296Sdas *
141296Sdas *	One may easily use induction to prove (4) and (5).
2116Sjkh *	Note. Since the left hand side of (3) contains only i+2 bits,
141296Sdas *	      it is not necessary to do a full (53-bit) comparison
2116Sjkh *	      in (3).
2116Sjkh *   3. Final rounding
2116Sjkh *	After generating the 53 bits result, we compute one more bit.
2116Sjkh *	Together with the remainder, we can decide whether the
2116Sjkh *	result is exact, bigger than 1/2ulp, or less than 1/2ulp
2116Sjkh *	(it will never be equal to 1/2ulp).
2116Sjkh *	The rounding mode can be detected by checking whether
2116Sjkh *	huge + tiny is equal to huge, and whether huge - tiny is
2116Sjkh *	equal to huge for some floating point number "huge" and "tiny".
141296Sdas *
2116Sjkh * Special cases:
2116Sjkh *	sqrt(+-0) = +-0 	... exact
2116Sjkh *	sqrt(inf) = inf
2116Sjkh *	sqrt(-ve) = NaN		... with invalid signal
2116Sjkh *	sqrt(NaN) = NaN		... with invalid signal for signaling NaN
2116Sjkh *
2116Sjkh * Other methods : see the appended file at the end of the program below.
2116Sjkh *---------------
2116Sjkh */
2116Sjkh
176720Sdas#include <float.h>
176720Sdas
2116Sjkh#include "math.h"
2116Sjkh#include "math_private.h"
2116Sjkh
/*
 * Floating-point probes: "one - tiny" and "one + tiny" are evaluated at run
 * time to raise the inexact flag and to sense the current rounding mode.
 */
static	const double	one	= 1.0, tiny=1.0e-300;

/*
 * __ieee754_sqrt(x)
 *
 * Return the square root of x, computed bit by bit with 32-bit integer
 * arithmetic on the two words of x and rounded according to the rounding
 * mode detected with the "one"/"tiny" probes.
 *
 *	x	the operand
 *
 * Returns x*x+x when the exponent field is all ones (Inf or NaN),
 * x itself for +-0, and (x-x)/(x-x) (a NaN) for any other negative x.
 *
 * Locals:
 *	ix0,ix1	high and low words of x; later the running remainder
 *	q,q1	high and low words of the result being generated
 *	s0,s1	high and low words of the running "2*q" term
 *	m	exponent of x, halved before it is applied to the result
 *	r	the single result bit currently being tried
 */
double
__ieee754_sqrt(double x)
{
	double z;
	int32_t sign = (int)0x80000000;
	int32_t ix0,s0,q,m,t,i;
	u_int32_t r,t1,s1,ix1,q1;

	EXTRACT_WORDS(ix0,ix1,x);

    /* take care of Inf and NaN */
	if((ix0&0x7ff00000)==0x7ff00000) {
	    return x*x+x;		/* sqrt(NaN)=NaN, sqrt(+inf)=+inf
					   sqrt(-inf)=NaN (inf-inf) */
	}
    /* take care of zero and of negative arguments */
	if(ix0<=0) {
	    if(((ix0&(~sign))|ix1)==0) return x;/* sqrt(+-0) = +-0 */
	    else if(ix0<0)
		return (x-x)/(x-x);		/* sqrt(-ve) = NaN (0/0) */
	}
    /* normalize x */
	m = (ix0>>20);
	if(m==0) {				/* subnormal x */
	    /* high word empty: pull bits up from the low word, 21 at a time */
	    while(ix0==0) {
		m -= 21;
		ix0 |= (ix1>>11); ix1 <<= 21;
	    }
	    /* shift left until the implicit-one position (bit 20) is set */
	    for(i=0;(ix0&0x00100000)==0;i++) ix0<<=1;
	    m -= i-1;
	    /*
	     * Refill the i vacated low bits of ix0 from the top of ix1.
	     * When i is 0 nothing was vacated, and shifting a 32-bit value
	     * by 32 would be undefined behavior, so skip the refill.
	     */
	    if(i!=0) ix0 |= (ix1>>(32-i));
	    ix1 <<= i;
	}
	m -= 1023;	/* unbias exponent */
	ix0 = (ix0&0x000fffff)|0x00100000;
	if(m&1){	/* odd m, double x to make it even */
	    ix0 += ix0 + ((ix1&sign)>>31);
	    ix1 += ix1;
	}
	m >>= 1;	/* m = [m/2] */

    /* generate sqrt(x) bit by bit */
	ix0 += ix0 + ((ix1&sign)>>31);
	ix1 += ix1;
	q = q1 = s0 = s1 = 0;	/* [q,q1] = sqrt(x) */
	r = 0x00200000;		/* r = moving bit from right to left */

    /* bits of the result that live in the high word q */
	while(r!=0) {
	    t = s0+r;
	    if(t<=ix0) {
		s0   = t+r;
		ix0 -= t;
		q   += r;
	    }
	    /* shift the two-word remainder left by one bit */
	    ix0 += ix0 + ((ix1&sign)>>31);
	    ix1 += ix1;
	    r>>=1;
	}

    /* bits of the result that live in the low word q1 */
	r = sign;
	while(r!=0) {
	    t1 = s1+r;
	    t  = s0;
	    /* two-word comparison [t,t1] <= [ix0,ix1] */
	    if((t<ix0)||((t==ix0)&&(t1<=ix1))) {
		s1  = t1+r;
		/* carry out of s1 into s0 */
		if(((t1&sign)==sign)&&(s1&sign)==0) s0 += 1;
		ix0 -= t;
		if (ix1 < t1) ix0 -= 1;	/* borrow from the high word */
		ix1 -= t1;
		q1  += r;
	    }
	    ix0 += ix0 + ((ix1&sign)>>31);
	    ix1 += ix1;
	    r>>=1;
	}

    /* use floating add to find out rounding direction */
	if((ix0|ix1)!=0) {		/* nonzero remainder: result is inexact */
	    z = one-tiny; /* trigger inexact flag */
	    if (z>=one) {		/* not rounding downward */
	        z = one+tiny;
	        if (q1==(u_int32_t)0xffffffff) { q1=0; q += 1;}
		else if (z>one) {	/* rounding upward */
		    if (q1==(u_int32_t)0xfffffffe) q+=1;
		    q1+=2;
		} else			/* rounding to nearest */
	            q1 += (q1&1);
	    }
	}
    /* drop the extra low bit and assemble the result words */
	ix0 = (q>>1)+0x3fe00000;
	ix1 =  q1>>1;
	if ((q&1)==1) ix1 |= sign;
	/*
	 * Add m into the exponent field.  m is negative for small results,
	 * and left-shifting a negative value is undefined behavior, so
	 * scale by 2^20 with a multiplication instead of "m << 20".
	 */
	ix0 += m * 0x00100000;
	INSERT_WORDS(z,ix0,ix1);
	return z;
}
2116Sjkh
/*
 * Only when long double has a 53-bit mantissa (LDBL_MANT_DIG == 53), tie the
 * name sqrtl to sqrt through __weak_reference.
 * NOTE(review): __weak_reference is presumably the <sys/cdefs.h> macro that
 * emits a weak alias, and sqrt is not defined in this file -- confirm both.
 */
176720Sdas#if (LDBL_MANT_DIG == 53)
176720Sdas__weak_reference(sqrt, sqrtl);
176720Sdas#endif
176720Sdas
2116Sjkh/*
2116SjkhOther methods  (use floating-point arithmetic)
2116Sjkh-------------
141296Sdas(This is a copy of a drafted paper by Prof W. Kahan
2116Sjkhand K.C. Ng, written in May, 1986)
2116Sjkh
141296Sdas	Two algorithms are given here to implement sqrt(x)
2116Sjkh	(IEEE double precision arithmetic) in software.
2116Sjkh	Both supply sqrt(x) correctly rounded. The first algorithm (in
2116Sjkh	Section A) uses newton iterations and involves four divisions.
2116Sjkh	The second one uses reciproot iterations to avoid division, but
2116Sjkh	requires more multiplications. Both algorithms need the ability
141296Sdas	to chop results of arithmetic operations instead of rounding them,
2116Sjkh	and the INEXACT flag to indicate when an arithmetic operation
141296Sdas	is executed exactly with no roundoff error, all part of the
2116Sjkh	standard (IEEE 754-1985). The ability to perform shift, add,
2116Sjkh	subtract and logical AND operations upon 32-bit words is needed
2116Sjkh	too, though not part of the standard.
2116Sjkh
2116SjkhA.  sqrt(x) by Newton Iteration
2116Sjkh
2116Sjkh   (1)	Initial approximation
2116Sjkh
2116Sjkh	Let x0 and x1 be the leading and the trailing 32-bit words of
141296Sdas	a floating point number x (in IEEE double format) respectively
2116Sjkh
2116Sjkh	    1    11		     52				  ...widths
2116Sjkh	   ------------------------------------------------------
2116Sjkh	x: |s|	  e     |	      f				|
2116Sjkh	   ------------------------------------------------------
2116Sjkh	      msb    lsb  msb				      lsb ...order
2116Sjkh
141296Sdas
2116Sjkh	     ------------------------  	     ------------------------
2116Sjkh	x0:  |s|   e    |    f1     |	 x1: |          f2           |
2116Sjkh	     ------------------------  	     ------------------------
2116Sjkh
2116Sjkh	By performing shifts and subtracts on x0 and x1 (both regarded
2116Sjkh	as integers), we obtain an 8-bit approximation of sqrt(x) as
2116Sjkh	follows.
2116Sjkh
2116Sjkh		k  := (x0>>1) + 0x1ff80000;
2116Sjkh		y0 := k - T1[31&(k>>15)].	... y ~ sqrt(x) to 8 bits
2116Sjkh	Here k is a 32-bit integer and T1[] is an integer array containing
2116Sjkh	correction terms. Now magically the floating value of y (y's
2116Sjkh	leading 32-bit word is y0, the value of its trailing word is 0)
2116Sjkh	approximates sqrt(x) to almost 8-bit.
2116Sjkh
2116Sjkh	Value of T1:
2116Sjkh	static int T1[32]= {
2116Sjkh	0,	1024,	3062,	5746,	9193,	13348,	18162,	23592,
2116Sjkh	29598,	36145,	43202,	50740,	58733,	67158,	75992,	85215,
2116Sjkh	83599,	71378,	60428,	50647,	41945,	34246,	27478,	21581,
2116Sjkh	16499,	12183,	8588,	5674,	3403,	1742,	661,	130,};
2116Sjkh
2116Sjkh    (2)	Iterative refinement
2116Sjkh
141296Sdas	Applying Heron's rule three times to y, we have y approximating
2116Sjkh	sqrt(x) to within 1 ulp (Unit in the Last Place):
2116Sjkh
2116Sjkh		y := (y+x/y)/2		... almost 17 sig. bits
2116Sjkh		y := (y+x/y)/2		... almost 35 sig. bits
2116Sjkh		y := y-(y-x/y)/2	... within 1 ulp
2116Sjkh
2116Sjkh
2116Sjkh	Remark 1.
2116Sjkh	    Another way to improve y to within 1 ulp is:
2116Sjkh
2116Sjkh		y := (y+x/y)		... almost 17 sig. bits to 2*sqrt(x)
2116Sjkh		y := y - 0x00100006	... almost 18 sig. bits to sqrt(x)
2116Sjkh
2116Sjkh				2
2116Sjkh			    (x-y )*y
2116Sjkh		y := y + 2* ----------	...within 1 ulp
2116Sjkh			       2
2116Sjkh			     3y  + x
2116Sjkh
2116Sjkh
2116Sjkh	This formula has one division fewer than the one above; however,
2116Sjkh	it requires more multiplications and additions. Also x must be
2116Sjkh	scaled in advance to avoid spurious overflow in evaluating the
2116Sjkh	expression 3y*y+x. Hence it is not recommended unless division
141296Sdas	is slow. If division is very slow, then one should use the
2116Sjkh	reciproot algorithm given in section B.
2116Sjkh
2116Sjkh    (3) Final adjustment
2116Sjkh
141296Sdas	By twiddling y's last bit it is possible to force y to be
2116Sjkh	correctly rounded according to the prevailing rounding mode
2116Sjkh	as follows. Let r and i be copies of the rounding mode and
2116Sjkh	inexact flag before entering the square root program. Also we
2116Sjkh	use the expression y+-ulp for the next representable floating
2116Sjkh	numbers (up and down) of y. Note that y+-ulp = either fixed
2116Sjkh	point y+-1, or multiply y by nextafter(1,+-inf) in chopped
2116Sjkh	mode.
2116Sjkh
2116Sjkh		I := FALSE;	... reset INEXACT flag I
2116Sjkh		R := RZ;	... set rounding mode to round-toward-zero
2116Sjkh		z := x/y;	... chopped quotient, possibly inexact
2116Sjkh		If(not I) then {	... if the quotient is exact
2116Sjkh		    if(z=y) {
2116Sjkh		        I := i;	 ... restore inexact flag
2116Sjkh		        R := r;  ... restore rounded mode
2116Sjkh		        return sqrt(x):=y.
2116Sjkh		    } else {
2116Sjkh			z := z - ulp;	... special rounding
2116Sjkh		    }
2116Sjkh		}
2116Sjkh		i := TRUE;		... sqrt(x) is inexact
2116Sjkh		If (r=RN) then z=z+ulp	... rounded-to-nearest
2116Sjkh		If (r=RP) then {	... round-toward-+inf
2116Sjkh		    y = y+ulp; z=z+ulp;
2116Sjkh		}
2116Sjkh		y := y+z;		... chopped sum
2116Sjkh		y0:=y0-0x00100000;	... y := y/2 is correctly rounded.
2116Sjkh	        I := i;	 		... restore inexact flag
2116Sjkh	        R := r;  		... restore rounded mode
2116Sjkh	        return sqrt(x):=y.
141296Sdas
2116Sjkh    (4)	Special cases
2116Sjkh
2116Sjkh	Square root of +inf, +-0, or NaN is itself;
2116Sjkh	Square root of a negative number is NaN with invalid signal.
2116Sjkh
2116Sjkh
2116SjkhB.  sqrt(x) by Reciproot Iteration
2116Sjkh
2116Sjkh   (1)	Initial approximation
2116Sjkh
2116Sjkh	Let x0 and x1 be the leading and the trailing 32-bit words of
2116Sjkh	a floating point number x (in IEEE double format) respectively
2116Sjkh	(see section A). By performing shifts and subtracts on x0 and y0,
2116Sjkh	we obtain a 7.8-bit approximation of 1/sqrt(x) as follows.
2116Sjkh
2116Sjkh	    k := 0x5fe80000 - (x0>>1);
2116Sjkh	    y0:= k - T2[63&(k>>14)].	... y ~ 1/sqrt(x) to 7.8 bits
2116Sjkh
141296Sdas	Here k is a 32-bit integer and T2[] is an integer array
2116Sjkh	containing correction terms. Now magically the floating
2116Sjkh	value of y (y's leading 32-bit word is y0, the value of
2116Sjkh	its trailing word y1 is set to zero) approximates 1/sqrt(x)
2116Sjkh	to almost 7.8-bit.
2116Sjkh
2116Sjkh	Value of T2:
2116Sjkh	static int T2[64]= {
2116Sjkh	0x1500,	0x2ef8,	0x4d67,	0x6b02,	0x87be,	0xa395,	0xbe7a,	0xd866,
2116Sjkh	0xf14a,	0x1091b,0x11fcd,0x13552,0x14999,0x15c98,0x16e34,0x17e5f,
2116Sjkh	0x18d03,0x19a01,0x1a545,0x1ae8a,0x1b5c4,0x1bb01,0x1bfde,0x1c28d,
2116Sjkh	0x1c2de,0x1c0db,0x1ba73,0x1b11c,0x1a4b5,0x1953d,0x18266,0x16be0,
2116Sjkh	0x1683e,0x179d8,0x18a4d,0x19992,0x1a789,0x1b445,0x1bf61,0x1c989,
2116Sjkh	0x1d16d,0x1d77b,0x1dddf,0x1e2ad,0x1e5bf,0x1e6e8,0x1e654,0x1e3cd,
2116Sjkh	0x1df2a,0x1d635,0x1cb16,0x1be2c,0x1ae4e,0x19bde,0x1868e,0x16e2e,
2116Sjkh	0x1527f,0x1334a,0x11051,0xe951,	0xbe01,	0x8e0d,	0x5924,	0x1edd,};
2116Sjkh
2116Sjkh    (2)	Iterative refinement
2116Sjkh
2116Sjkh	Apply Reciproot iteration three times to y and multiply the
2116Sjkh	result by x to get an approximation z that matches sqrt(x)
141296Sdas	to about 1 ulp. To be exact, we will have
2116Sjkh		-1ulp < sqrt(x)-z<1.0625ulp.
141296Sdas
2116Sjkh	... set rounding mode to Round-to-nearest
2116Sjkh	   y := y*(1.5-0.5*x*y*y)	... almost 15 sig. bits to 1/sqrt(x)
2116Sjkh	   y := y*((1.5-2^-30)-0.5*x*y*y)... about 29 sig. bits to 1/sqrt(x)
2116Sjkh	... special arrangement for better accuracy
2116Sjkh	   z := x*y			... 29 bits to sqrt(x), with z*y<1
2116Sjkh	   z := z + 0.5*z*(1-z*y)	... about 1 ulp to sqrt(x)
2116Sjkh
2116Sjkh	Remark 2. The constant 1.5-2^-30 is chosen to bias the error so that
141296Sdas	(a) the term z*y in the final iteration is always less than 1;
2116Sjkh	(b) the error in the final result is biased upward so that
2116Sjkh		-1 ulp < sqrt(x) - z < 1.0625 ulp
2116Sjkh	    instead of |sqrt(x)-z|<1.03125ulp.
2116Sjkh
2116Sjkh    (3)	Final adjustment
2116Sjkh
141296Sdas	By twiddling y's last bit it is possible to force y to be
2116Sjkh	correctly rounded according to the prevailing rounding mode
2116Sjkh	as follows. Let r and i be copies of the rounding mode and
2116Sjkh	inexact flag before entering the square root program. Also we
2116Sjkh	use the expression y+-ulp for the next representable floating
2116Sjkh	numbers (up and down) of y. Note that y+-ulp = either fixed
2116Sjkh	point y+-1, or multiply y by nextafter(1,+-inf) in chopped
2116Sjkh	mode.
2116Sjkh
2116Sjkh	R := RZ;		... set rounding mode to round-toward-zero
2116Sjkh	switch(r) {
2116Sjkh	    case RN:		... round-to-nearest
2116Sjkh	       if(x<= z*(z-ulp)...chopped) z = z - ulp; else
2116Sjkh	       if(x<= z*(z+ulp)...chopped) z = z; else z = z+ulp;
2116Sjkh	       break;
2116Sjkh	    case RZ:case RM:	... round-to-zero or round-to--inf
2116Sjkh	       R:=RP;		... reset rounding mode to round-to-+inf
2116Sjkh	       if(x<z*z ... rounded up) z = z - ulp; else
2116Sjkh	       if(x>=(z+ulp)*(z+ulp) ...rounded up) z = z+ulp;
2116Sjkh	       break;
2116Sjkh	    case RP:		... round-to-+inf
2116Sjkh	       if(x>(z+ulp)*(z+ulp)...chopped) z = z+2*ulp; else
2116Sjkh	       if(x>z*z ...chopped) z = z+ulp;
2116Sjkh	       break;
2116Sjkh	}
2116Sjkh
2116Sjkh	Remark 3. The above comparisons can be done in fixed point. For
2116Sjkh	example, to compare x and w=z*z chopped, it suffices to compare
2116Sjkh	x1 and w1 (the trailing parts of x and w), regarding them as
2116Sjkh	two's complement integers.
2116Sjkh
2116Sjkh	...Is z an exact square root?
2116Sjkh	To determine whether z is an exact square root of x, let z1 be the
2116Sjkh	trailing part of z, and also let x0 and x1 be the leading and
2116Sjkh	trailing parts of x.
2116Sjkh
2116Sjkh	If ((z1&0x03ffffff)!=0)	... not exact if trailing 26 bits of z!=0
2116Sjkh	    I := 1;		... Raise Inexact flag: z is not exact
2116Sjkh	else {
2116Sjkh	    j := 1 - [(x0>>20)&1]	... j = logb(x) mod 2
141296Sdas	    k := z1 >> 26;		... get z's 25-th and 26-th
2116Sjkh					    fraction bits
2116Sjkh	    I := i or (k&j) or ((k&(j+j+1))!=(x1&3));
2116Sjkh	}
2116Sjkh	R:= r		... restore rounded mode
2116Sjkh	return sqrt(x):=z.
2116Sjkh
141296Sdas	If multiplication is cheaper than the foregoing red tape, the
2116Sjkh	Inexact flag can be evaluated by
2116Sjkh
2116Sjkh	    I := i;
2116Sjkh	    I := (z*z!=x) or I.
2116Sjkh
141296Sdas	Note that z*z can overwrite I; this value must be sensed if it is
2116Sjkh	True.
2116Sjkh
2116Sjkh	Remark 4. If z*z = x exactly, then bit 25 to bit 0 of z1 must be
2116Sjkh	zero.
2116Sjkh
2116Sjkh		    --------------------
141296Sdas		z1: |        f2        |
2116Sjkh		    --------------------
2116Sjkh		bit 31		   bit 0
2116Sjkh
2116Sjkh	Furthermore, bit 27 and 26 of z1, bit 0 and 1 of x1, and the odd
2116Sjkh	or even of logb(x) have the following relations:
2116Sjkh
2116Sjkh	-------------------------------------------------
2116Sjkh	bit 27,26 of z1		bit 1,0 of x1	logb(x)
2116Sjkh	-------------------------------------------------
2116Sjkh	00			00		odd and even
2116Sjkh	01			01		even
2116Sjkh	10			10		odd
2116Sjkh	10			00		even
2116Sjkh	11			01		even
2116Sjkh	-------------------------------------------------
2116Sjkh
141296Sdas    (4)	Special cases (see (4) of Section A).
141296Sdas
2116Sjkh */
141296Sdas