msun/src/s_cbrt.c

/* @(#)s_cbrt.c 5.1 93/09/24 */
/*
 * ====================================================
 * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
 *
 * Developed at SunPro, a Sun Microsystems, Inc. business.
 * Permission to use, copy, modify, and distribute this
 * software is freely granted, provided that this notice
 * is preserved.
 * ====================================================
 */
210284Sjmallett
/* Revision identification string; omitted when `lint` is defined. */
#ifndef lint
static char rcsid[] = "$FreeBSD: head/lib/msun/src/s_cbrt.c 153306 2005-12-11 19:51:30Z bde $";
#endif
215990Sjmallett
215990Sjmallett#include "math.h"
232812Sjmallett#include "math_private.h"
215990Sjmallett
/* cbrt(x)
 * Return cube root of x
 */
/*
 * Integer biases that cbrt() adds to (high word)/3 to build the high
 * word of its initial estimate.  B1 is used for normal inputs; B2 is
 * used for subnormal inputs after they have been scaled by 2**54, and
 * therefore differs from B1 by (54/3)*2**20.
 */
static const u_int32_t
	B1 = 715094163, /* B1 = (1023-1023/3-0.03306235651)*2**20 */
	B2 = 696219795; /* B2 = (1023-1023/3-54/3-0.03306235651)*2**20 */
215990Sjmallett
/*
 * Coefficients of the rational refinement step in cbrt():
 *	t *= G + F/(s + E + D/s),  with  s = C + r*t.
 * Each value is the double nearest to the fraction shown; the two hex
 * words are the high and low 32 bits of its representation.
 */
static const double
C =  5.42857142857142815906e-01, /* 19/35     = 0x3FE15F15, 0xF15F15F1 */
D = -7.05306122448979611050e-01, /* -864/1225 = 0xBFE691DE, 0x2532C834 */
E =  1.41428571428571436819e+00, /* 99/70     = 0x3FF6A0EA, 0x0EA0EA0F */
F =  1.60714285714285720630e+00, /* 45/28     = 0x3FF9B6DB, 0x6DB6DB6E */
G =  3.57142857142857150787e-01; /* 5/14      = 0x3FD6DB6D, 0xB6DB6DB7 */
215990Sjmallett
215990Sjmallettdouble
215990Sjmallettcbrt(double x)
215990Sjmallett{
215990Sjmallett	int32_t	hx;
210284Sjmallett	double r,s,t=0.0,w;
210284Sjmallett	u_int32_t sign;
215990Sjmallett	u_int32_t high,low;
210284Sjmallett
210284Sjmallett	GET_HIGH_WORD(hx,x);
210284Sjmallett	sign=hx&0x80000000; 		/* sign= sign(x) */
210284Sjmallett	hx  ^=sign;
210284Sjmallett	if(hx>=0x7ff00000) return(x+x); /* cbrt(NaN,INF) is itself */
210284Sjmallett	GET_LOW_WORD(low,x);
210284Sjmallett	if((hx|low)==0)
210284Sjmallett	    return(x);		/* cbrt(0) is itself */
232812Sjmallett
210284Sjmallett	SET_HIGH_WORD(x,hx);	/* x <- |x| */
210284Sjmallett    /*
210284Sjmallett     * Rough cbrt to 5 bits:
210284Sjmallett     *    cbrt(2**e*(1+m) ~= 2**(e/3)*(1+(e%3+m)/3)
215990Sjmallett     * where e is integral and >= 0, m is real and in [0, 1), and "/" and
215990Sjmallett     * "%" are integer division and modulus with rounding towards minus
215990Sjmallett     * infinity.  The RHS is always >= the LHS and has a maximum relative
232812Sjmallett     * error of about 1 in 16.  Adding a bias of -0.03306235651 to the
215990Sjmallett     * (e%3+m)/3 term reduces the error to about 1 in 32. With the IEEE
215990Sjmallett     * floating point representation, for finite positive normal values,
215990Sjmallett     * ordinary integer divison of the value in bits magically gives
215990Sjmallett     * almost exactly the RHS of the above provided we first subtract the
215990Sjmallett     * exponent bias (1023 for doubles) and later add it back.  We do the
232812Sjmallett     * subtraction virtually to keep e >= 0 so that ordinary integer
232812Sjmallett     * division rounds towards minus infinity; this is also efficient.
215990Sjmallett     */
215990Sjmallett	if(hx<0x00100000) 		/* subnormal number */
215990Sjmallett	  {SET_HIGH_WORD(t,0x43500000);	/* set t= 2**54 */
232812Sjmallett	   t*=x; GET_HIGH_WORD(high,t); SET_HIGH_WORD(t,high/3+B2);
232812Sjmallett	  }
215990Sjmallett	else
215990Sjmallett	  SET_HIGH_WORD(t,hx/3+B1);
215990Sjmallett
215990Sjmallett    /* new cbrt to 23 bits; may be implemented in single precision */
215990Sjmallett	r=t*t/x;
215990Sjmallett	s=C+r*t;
215990Sjmallett	t*=G+F/(s+E+D/s);
215990Sjmallett
215990Sjmallett    /* chop t to 20 bits and make it larger than cbrt(x) */
215990Sjmallett	GET_HIGH_WORD(high,t);
215990Sjmallett	INSERT_WORDS(t,high+0x00000001,0);
215990Sjmallett
215990Sjmallett    /* one step Newton iteration to 53 bits with error less than 0.667 ulps */
215990Sjmallett	s=t*t;		/* t*t is exact */
215990Sjmallett	r=x/s;
215990Sjmallett	w=t+t;
215990Sjmallett	r=(r-t)/(w+r);	/* r-t is exact */
215990Sjmallett	t=t+t*r;
215990Sjmallett
215990Sjmallett    /* restore the sign bit */
215990Sjmallett	GET_HIGH_WORD(high,t);
215990Sjmallett	SET_HIGH_WORD(t,high|sign);
215990Sjmallett	return(t);
215990Sjmallett}
215990Sjmallett