msun/src/e_logf.c

0Sduke/* e_logf.c -- float version of e_log.c.
11884Sykantser * Conversion to float by Ian Lance Taylor, Cygnus Support, ian@cygnus.com.
0Sduke */
0Sduke
0Sduke/*
0Sduke * ====================================================
0Sduke * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
0Sduke *
0Sduke * Developed at SunPro, a Sun Microsystems, Inc. business.
0Sduke * Permission to use, copy, modify, and distribute this
0Sduke * software is freely granted, provided that this notice
0Sduke * is preserved.
0Sduke * ====================================================
0Sduke */
0Sduke
0Sduke#include <sys/cdefs.h>
0Sduke__FBSDID("$FreeBSD: head/lib/msun/src/e_logf.c 241755 2012-10-19 22:46:48Z imp $");
0Sduke
2362Sohair#include "math.h"
2362Sohair#include "math_private.h"
2362Sohair
/* __ieee754_logf(x)
 * Return the logarithm of x
0Sduke *
0Sduke * Method :
0Sduke *   1. Argument Reduction: find k and f such that
0Sduke *                      x = 2^k * (1+f),
0Sduke *         where  sqrt(2)/2 < 1+f < sqrt(2) .
16958Siignatyev *
0Sduke *   2. Approximation of log(1+f).
0Sduke *      Let s = f/(2+f) ; based on log(1+f) = log(1+s) - log(1-s)
0Sduke *               = 2s + 2/3 s**3 + 2/5 s**5 + .....,
0Sduke *               = 2s + s*R
 *      We use a special Remez algorithm on [0,0.1716] to generate
 *      a polynomial of degree 8 to approximate R. The maximum error
 *      of this polynomial approximation is bounded by 2**-34.24. In
 *      other words,
 *                      2      4      6      8
 *          R(z) ~ Lg1*s +Lg2*s +Lg3*s +Lg4*s
 *      (the values of Lg1 to Lg4 are listed in the program)
0Sduke *      and
0Sduke *          |      2          8           |     -34.24
0Sduke *          | Lg1*s +...+Lg4*s    -  R(z) | <= 2
0Sduke *          |                             |
0Sduke *      Note that 2s = f - s*f = f - hfsq + s*hfsq, where hfsq = f*f/2.
0Sduke *      In order to guarantee error in log below 1ulp, we compute log
0Sduke *      by
0Sduke *              log(1+f) = f - s*(f - R)        (if f is not too large)
0Sduke *              log(1+f) = f - (hfsq - s*(hfsq+R)).     (better accuracy)
0Sduke *
0Sduke *      3. Finally,  log(x) = k*ln2 + log(1+f).
0Sduke *                          = k*ln2_hi+(f-(hfsq-(s*(hfsq+R)+k*ln2_lo)))
 *         Here ln2 is split into two floating point numbers:
0Sduke *                      ln2_hi + ln2_lo,
0Sduke *         where n*ln2_hi is always exact for |n| < 2000.
0Sduke *
0Sduke * Special cases:
0Sduke *      log(x) is NaN with signal if x < 0 (including -INF) ;
0Sduke *      log(+INF) is +INF; log(0) is -INF with signal;
0Sduke *      log(NaN) is that NaN with no signal.
0Sduke *
0Sduke * Accuracy:
0Sduke *      according to an error analysis, the error is always less than
0Sduke *      1 ulp (unit in the last place).
0Sduke *
0Sduke * Constants:
0Sduke * The hexadecimal values are the intended ones for the following
0Sduke * constants. The decimal values may be used, provided that the
0Sduke * compiler will convert from decimal to binary accurately enough
0Sduke * to produce the hexadecimal values shown.
0Sduke */
0Sduke
/*
 * Constants used by __ieee754_logf().
 *
 * ln2_hi + ln2_lo together represent ln(2); the split lets k*ln2 be
 * accumulated as k*ln2_hi plus a small correction k*ln2_lo.
 * two25 is 2**25 and is used to scale subnormal inputs up into the
 * normal range (and to build -inf as -two25/zero).
 * Lg1..Lg4 are the coefficients of the polynomial approximating R.
 */
static const float
ln2_hi =   6.9313812256e-01,	/* 0x3f317180 */
ln2_lo =   9.0580006145e-06,	/* 0x3717f7d1 */
two25 =    3.355443200e+07,	/* 0x4c000000 */
/* |(log(1+s)-log(1-s))/s - Lg(s)| < 2**-34.24 (~[-4.95e-11, 4.97e-11]). */
Lg1 =      0xaaaaaa.0p-24,	/* 0.66666662693 */
Lg2 =      0xccce13.0p-25,	/* 0.40000972152 */
Lg3 =      0x91e9ee.0p-25,	/* 0.28498786688 */
Lg4 =      0xf89e26.0p-26;	/* 0.24279078841 */

/* Kept as a named object so that x/zero is evaluated as a real division. */
static const float zero   =  0.0;
0Sduke
0Sdukefloat
0Sduke__ieee754_logf(float x)
0Sduke{
0Sduke	float hfsq,f,s,z,R,w,t1,t2,dk;
0Sduke	int32_t k,ix,i,j;
0Sduke
0Sduke	GET_FLOAT_WORD(ix,x);
0Sduke
0Sduke	k=0;
0Sduke	if (ix < 0x00800000) {			/* x < 2**-126  */
0Sduke	    if ((ix&0x7fffffff)==0)
0Sduke		return -two25/zero;		/* log(+-0)=-inf */
0Sduke	    if (ix<0) return (x-x)/zero;	/* log(-#) = NaN */
0Sduke	    k -= 25; x *= two25; /* subnormal number, scale up x */
	    GET_FLOAT_WORD(ix,x);
	}
	if (ix >= 0x7f800000) return x+x;
	k += (ix>>23)-127;
	ix &= 0x007fffff;
	i = (ix+(0x95f64<<3))&0x800000;
	SET_FLOAT_WORD(x,ix|(i^0x3f800000));	/* normalize x or x/2 */
	k += (i>>23);
	f = x-(float)1.0;
	if((0x007fffff&(0x8000+ix))<0xc000) {	/* -2**-9 <= f < 2**-9 */
	    if(f==zero) {
		if(k==0) {
		    return zero;
		} else {
		    dk=(float)k;
		    return dk*ln2_hi+dk*ln2_lo;
		}
	    }
	    R = f*f*((float)0.5-(float)0.33333333333333333*f);
	    if(k==0) return f-R; else {dk=(float)k;
	    	     return dk*ln2_hi-((R-dk*ln2_lo)-f);}
	}
 	s = f/((float)2.0+f);
	dk = (float)k;
	z = s*s;
	i = ix-(0x6147a<<3);
	w = z*z;
	j = (0x6b851<<3)-ix;
	t1= w*(Lg2+w*Lg4);
	t2= z*(Lg1+w*Lg3);
	i |= j;
	R = t2+t1;
	if(i>0) {
	    hfsq=(float)0.5*f*f;
	    if(k==0) return f-(hfsq-s*(hfsq+R)); else
		     return dk*ln2_hi-((hfsq-(s*(hfsq+R)+dk*ln2_lo))-f);
	} else {
	    if(k==0) return f-s*(f-R); else
		     return dk*ln2_hi-((s*(f-R)-dk*ln2_lo)-f);
	}
}