e_rem_pio2.c revision 176467
145096Simp
/* @(#)e_rem_pio2.c 1.4 95/01/18 */
/*
 * ====================================================
 * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
 *
 * Developed at SunSoft, a Sun Microsystems, Inc. business.
 * Permission to use, copy, modify, and distribute this
 * software is freely granted, provided that this notice
 * is preserved.
 * ====================================================
 *
 */
14100280Sgordon
15100280Sgordon#include <sys/cdefs.h>
16100280Sgordon__FBSDID("$FreeBSD: head/lib/msun/src/e_rem_pio2.c 176467 2008-02-22 18:43:23Z bde $");
17103019Sgordon
/* __ieee754_rem_pio2(x,y)
 *
 * Returns the remainder of x rem pi/2 in y[0]+y[1].
 * Uses __kernel_rem_pio2() for large arguments.
 */
23100280Sgordon
24100280Sgordon#include <float.h>
25100280Sgordon
26100280Sgordon#include "math.h"
27100280Sgordon#include "math_private.h"
28100280Sgordon
/*
 * invpio2:  53 bits of 2/pi
 * pio2_1:   first  33 bits of pi/2
 * pio2_1t:  pi/2 - pio2_1
 * pio2_2:   second 33 bits of pi/2
 * pio2_2t:  pi/2 - (pio2_1+pio2_2)
 * pio2_3:   third  33 bits of pi/2
 * pio2_3t:  pi/2 - (pio2_1+pio2_2+pio2_3)
 */
38100280Sgordon
/*
 * Constant table for the pi/2 argument reduction.  The trailing comment on
 * each entry gives the high and low 32-bit words of the double.
 *
 * zero, half, two24 are plain helper values (0, 1/2, 2^24); two24 is the
 * scale factor used when a large argument is split into 24-bit pieces.
 * invpio2 is 2/pi; the pio2_N / pio2_Nt pairs are successive leading pieces
 * of pi/2 and the corresponding remaining tails.
 */
static const double
zero =  0.00000000000000000000e+00, /* 0x00000000, 0x00000000 */
half =  5.00000000000000000000e-01, /* 0x3FE00000, 0x00000000 */
two24 =  1.67772160000000000000e+07, /* 0x41700000, 0x00000000 */
invpio2 =  6.36619772367581382433e-01, /* 0x3FE45F30, 0x6DC9C883 */
pio2_1  =  1.57079632673412561417e+00, /* 0x3FF921FB, 0x54400000 */
pio2_1t =  6.07710050650619224932e-11, /* 0x3DD0B461, 0x1A626331 */
pio2_2  =  6.07710050630396597660e-11, /* 0x3DD0B461, 0x1A600000 */
pio2_2t =  2.02226624879595063154e-21, /* 0x3BA3198A, 0x2E037073 */
pio2_3  =  2.02226624871116645580e-21, /* 0x3BA3198A, 0x2E000000 */
pio2_3t =  8.47842766036889956997e-32; /* 0x397B839A, 0x252049C1 */
50100280Sgordon
51100280Sgordon#ifdef INLINE_REM_PIO2
52105968Sfennerextern inline
53105968Sfenner#endif
54100280Sgordonint
55100280Sgordon__ieee754_rem_pio2(double x, double *y)
56100280Sgordon{
57100280Sgordon	double z,w,t,r,fn;
58100280Sgordon	double tx[3];
59100280Sgordon	int32_t e0,i,j,nx,n,ix,hx;
60100280Sgordon	u_int32_t low;
61100280Sgordon
62100280Sgordon	GET_HIGH_WORD(hx,x);		/* high word of x */
63100280Sgordon	ix = hx&0x7fffffff;
64100280Sgordon#if 0 /* Must be handled in caller. */
65100280Sgordon	if(ix<=0x3fe921fb)   /* |x| ~<= pi/4 , no need for reduction */
66100280Sgordon	    {y[0] = x; y[1] = 0; return 0;}
67100280Sgordon#endif
68100280Sgordon	if (ix <= 0x400f6a7a) {		/* |x| ~<= 5pi/4 */
69100280Sgordon	    if ((ix & 0xfffff) == 0x921fb)  /* |x| ~= pi/2 or 2pi/2 */
70100280Sgordon		goto medium;		/* cancellation -- use medium case */
71	    if (ix <= 0x4002d97c) {	/* |x| ~<= 3pi/4 */
72		if (hx > 0) {
73		    z = x - pio2_1;	/* one round good to 85 bits */
74		    y[0] = z - pio2_1t;
75		    y[1] = (z-y[0])-pio2_1t;
76		    return 1;
77		} else {
78		    z = x + pio2_1;
79		    y[0] = z + pio2_1t;
80		    y[1] = (z-y[0])+pio2_1t;
81		    return -1;
82		}
83	    } else {
84		if (hx > 0) {
85		    z = x - 2*pio2_1;
86		    y[0] = z - 2*pio2_1t;
87		    y[1] = (z-y[0])-2*pio2_1t;
88		    return 2;
89		} else {
90		    z = x + 2*pio2_1;
91		    y[0] = z + 2*pio2_1t;
92		    y[1] = (z-y[0])+2*pio2_1t;
93		    return -2;
94		}
95	    }
96	}
97	if (ix <= 0x401c463b) {		/* |x| ~<= 9pi/4 */
98	    if (ix <= 0x4015fdbc) {	/* |x| ~<= 7pi/4 */
99		if (ix == 0x4012d97c)	/* |x| ~= 3pi/2 */
100		    goto medium;
101		if (hx > 0) {
102		    z = x - 3*pio2_1;
103		    y[0] = z - 3*pio2_1t;
104		    y[1] = (z-y[0])-3*pio2_1t;
105		    return 3;
106		} else {
107		    z = x + 3*pio2_1;
108		    y[0] = z + 3*pio2_1t;
109		    y[1] = (z-y[0])+3*pio2_1t;
110		    return -3;
111		}
112	    } else {
113		if (ix == 0x401921fb)	/* |x| ~= 4pi/2 */
114		    goto medium;
115		if (hx > 0) {
116		    z = x - 4*pio2_1;
117		    y[0] = z - 4*pio2_1t;
118		    y[1] = (z-y[0])-4*pio2_1t;
119		    return 4;
120		} else {
121		    z = x + 4*pio2_1;
122		    y[0] = z + 4*pio2_1t;
123		    y[1] = (z-y[0])+4*pio2_1t;
124		    return -4;
125		}
126	    }
127	}
128	if(ix<=0x413921fb) { /* |x| ~<= 2^19*(pi/2), medium size */
129medium:
130	    t  = fabs(x);
131	    /* Use a specialized rint() to get fn.  Assume round-to-nearest. */
132	    STRICT_ASSIGN(double,fn,t*invpio2+0x1.8p52);
133	    fn = fn-0x1.8p52;
134#ifdef HAVE_EFFICIENT_IRINT
135	    n  = irint(fn);
136#else
137	    n  = (int32_t)fn;
138#endif
139	    r  = t-fn*pio2_1;
140	    w  = fn*pio2_1t;	/* 1st round good to 85 bit */
141	    {
142	        u_int32_t high;
143	        j  = ix>>20;
144	        y[0] = r-w;
145		GET_HIGH_WORD(high,y[0]);
146	        i = j-((high>>20)&0x7ff);
147	        if(i>16) {  /* 2nd iteration needed, good to 118 */
148		    t  = r;
149		    w  = fn*pio2_2;
150		    r  = t-w;
151		    w  = fn*pio2_2t-((t-r)-w);
152		    y[0] = r-w;
153		    GET_HIGH_WORD(high,y[0]);
154		    i = j-((high>>20)&0x7ff);
155		    if(i>49)  {	/* 3rd iteration need, 151 bits acc */
156		    	t  = r;	/* will cover all possible cases */
157		    	w  = fn*pio2_3;
158		    	r  = t-w;
159		    	w  = fn*pio2_3t-((t-r)-w);
160		    	y[0] = r-w;
161		    }
162		}
163	    }
164	    y[1] = (r-y[0])-w;
165	    if(hx<0) 	{y[0] = -y[0]; y[1] = -y[1]; return -n;}
166	    else	 return n;
167	}
168    /*
169     * all other (large) arguments
170     */
171	if(ix>=0x7ff00000) {		/* x is inf or NaN */
172	    y[0]=y[1]=x-x; return 0;
173	}
174    /* set z = scalbn(|x|,ilogb(x)-23) */
175	GET_LOW_WORD(low,x);
176	SET_LOW_WORD(z,low);
177	e0 	= (ix>>20)-1046;	/* e0 = ilogb(z)-23; */
178	SET_HIGH_WORD(z, ix - ((int32_t)(e0<<20)));
179	for(i=0;i<2;i++) {
180		tx[i] = (double)((int32_t)(z));
181		z     = (z-tx[i])*two24;
182	}
183	tx[2] = z;
184	nx = 3;
185	while(tx[nx-1]==zero) nx--;	/* skip zero term */
186	n  =  __kernel_rem_pio2(tx,y,e0,nx,2);
187	if(hx<0) {y[0] = -y[0]; y[1] = -y[1]; return -n;}
188	return n;
189}
190