/* softfloat.h revision 1.1 */
/* $NetBSD: softfloat.h,v 1.1 2014/08/10 05:47:37 matt Exp $ */

/* This is a derivative work. */

/*
===============================================================================

This C header file is part of the SoftFloat IEC/IEEE Floating-point
Arithmetic Package, Release 2a.

Written by John R. Hauser.  This work was made possible in part by the
International Computer Science Institute, located at Suite 600, 1947 Center
Street, Berkeley, California 94704.  Funding was partially provided by the
National Science Foundation under grant MIP-9311980.  The original version
of this code was written as part of a project to build a fixed-point vector
processor in collaboration with the University of California at Berkeley,
overseen by Profs. Nelson Morgan and John Wawrzynek.  More information
is available through the Web page `http://HTTP.CS.Berkeley.EDU/~jhauser/
arithmetic/SoftFloat.html'.

THIS SOFTWARE IS DISTRIBUTED AS IS, FOR FREE.  Although reasonable effort
has been made to avoid it, THIS SOFTWARE MAY CONTAIN FAULTS THAT WILL AT
TIMES RESULT IN INCORRECT BEHAVIOR.  USE OF THIS SOFTWARE IS RESTRICTED TO
PERSONS AND ORGANIZATIONS WHO CAN AND WILL TAKE FULL RESPONSIBILITY FOR ANY
AND ALL LOSSES, COSTS, OR OTHER PROBLEMS ARISING FROM ITS USE.

Derivative works are acceptable, even for commercial purposes, so long as
(1) they include prominent notice that the work is derivative, and (2) they
include prominent notice akin to these four paragraphs for those parts of
this code that are retained.

===============================================================================
*/

/*
-------------------------------------------------------------------------------
The macro `FLOATX80' must be defined to enable the extended double-precision
floating-point format `floatx80'.  If this macro is not defined, the
`floatx80' type will not be defined, and none of the functions that either
input or output the `floatx80' type will be defined.  The same applies to
the `FLOAT128' macro and the quadruple-precision format `float128'.

In this configuration `FLOATX80' is left undefined (its definition below is
deliberately kept commented out as the switch to enable it) and `FLOAT128'
is defined.
-------------------------------------------------------------------------------
*/
/* #define FLOATX80 */
#define FLOAT128

47#include "softfloat-qp.h"
48
49#include <machine/ieeefp.h>
50
/*
-------------------------------------------------------------------------------
Software IEC/IEEE floating-point types.

Each format is held in plain unsigned integer storage: `float32' in an
`unsigned int', `float64' in an `unsigned long long', and the wider formats
in structs of integer fields named `high' and `low'.  `floatx80' exists only
when `FLOATX80' is defined, and `float128' only when `FLOAT128' is defined.
NOTE(review): the bit layout inside these containers is not specified in
this header -- confirm against the implementation before relying on it.
-------------------------------------------------------------------------------
*/
typedef unsigned int float32;
typedef unsigned long long float64;
#ifdef FLOATX80
typedef struct {
    unsigned short high;
    unsigned long long low;
} floatx80;
#endif
#ifdef FLOAT128
typedef struct {
    unsigned long long high, low;
} float128;
#endif

70/*
71-------------------------------------------------------------------------------
72Software IEC/IEEE floating-point underflow tininess-detection mode.
73-------------------------------------------------------------------------------
74*/
75#ifndef SOFTFLOAT_FOR_GCC
76extern int8 float_detect_tininess;
77#endif
/* Named values for the underflow tininess-detection mode. */
enum {
    float_tininess_after_rounding  = 0,
    float_tininess_before_rounding = 1
};

83/*
84-------------------------------------------------------------------------------
85Software IEC/IEEE floating-point rounding mode.
86-------------------------------------------------------------------------------
87*/
88extern fp_rnd float_rounding_mode;
89#define float_round_nearest_even FP_RN
90#define float_round_to_zero      FP_RZ
91#define float_round_down         FP_RM
92#define float_round_up           FP_RP
93
94/*
95-------------------------------------------------------------------------------
96Software IEC/IEEE floating-point exception flags.
97-------------------------------------------------------------------------------
98*/
99extern fp_except float_exception_flags;
100extern fp_except float_exception_mask;
101enum {
102    float_flag_inexact   = FP_X_IMP,
103    float_flag_underflow = FP_X_UFL,
104    float_flag_overflow  = FP_X_OFL,
105    float_flag_divbyzero = FP_X_DZ,
106    float_flag_invalid   = FP_X_INV
107};
108
/*
-------------------------------------------------------------------------------
Routine to raise any or all of the software IEC/IEEE floating-point
exception flags.

NOTE(review): the `fp_except' argument is presumably a bitwise OR of
`float_flag_*' values -- confirm against the implementation.
-------------------------------------------------------------------------------
*/
void float_raise( fp_except );

117/*
118-------------------------------------------------------------------------------
119Software IEC/IEEE integer-to-floating-point conversion routines.
120-------------------------------------------------------------------------------
121*/
122float32 int32_to_float32( int32 );
123float32 uint32_to_float32( uint32 );
124float64 int32_to_float64( int32 );
125float64 uint32_to_float64( uint32 );
126#ifdef FLOATX80
127floatx80 int32_to_floatx80( int32 );
128floatx80 uint32_to_floatx80( uint32 );
129#endif
130#ifdef FLOAT128
131float128 int32_to_float128( int32 );
132float128 uint32_to_float128( uint32 );
133#endif
134float32 int64_to_float32( long long );
135float64 int64_to_float64( long long );
136#ifdef FLOATX80
137floatx80 int64_to_floatx80( long long );
138#endif
139#ifdef FLOAT128
140float128 int64_to_float128( long long );
141#endif
142
143/*
144-------------------------------------------------------------------------------
145Software IEC/IEEE single-precision conversion routines.
146-------------------------------------------------------------------------------
147*/
148int float32_to_int32( float32 );
149int float32_to_int32_round_to_zero( float32 );
150unsigned int float32_to_uint32_round_to_zero( float32 );
151long long float32_to_int64( float32 );
152long long float32_to_int64_round_to_zero( float32 );
153float64 float32_to_float64( float32 );
154#ifdef FLOATX80
155floatx80 float32_to_floatx80( float32 );
156#endif
157#ifdef FLOAT128
158float128 float32_to_float128( float32 );
159#endif
160
161/*
162-------------------------------------------------------------------------------
163Software IEC/IEEE single-precision operations.
164-------------------------------------------------------------------------------
165*/
166float32 float32_round_to_int( float32 );
167float32 float32_add( float32, float32 );
168float32 float32_sub( float32, float32 );
169float32 float32_mul( float32, float32 );
170float32 float32_div( float32, float32 );
171float32 float32_rem( float32, float32 );
172float32 float32_sqrt( float32 );
173flag float32_eq( float32, float32 );
174flag float32_le( float32, float32 );
175flag float32_lt( float32, float32 );
176flag float32_eq_signaling( float32, float32 );
177flag float32_le_quiet( float32, float32 );
178flag float32_lt_quiet( float32, float32 );
179flag float32_is_signaling_nan( float32 );
180
181/*
182-------------------------------------------------------------------------------
183Software IEC/IEEE double-precision conversion routines.
184-------------------------------------------------------------------------------
185*/
186int float64_to_int32( float64 );
187int float64_to_int32_round_to_zero( float64 );
188unsigned int float64_to_uint32_round_to_zero( float64 );
189long long float64_to_int64( float64 );
190long long float64_to_int64_round_to_zero( float64 );
191float32 float64_to_float32( float64 );
192#ifdef FLOATX80
193floatx80 float64_to_floatx80( float64 );
194#endif
195#ifdef FLOAT128
196float128 float64_to_float128( float64 );
197#endif
198
199/*
200-------------------------------------------------------------------------------
201Software IEC/IEEE double-precision operations.
202-------------------------------------------------------------------------------
203*/
204float64 float64_round_to_int( float64 );
205float64 float64_add( float64, float64 );
206float64 float64_sub( float64, float64 );
207float64 float64_mul( float64, float64 );
208float64 float64_div( float64, float64 );
209float64 float64_rem( float64, float64 );
210float64 float64_sqrt( float64 );
211flag float64_eq( float64, float64 );
212flag float64_le( float64, float64 );
213flag float64_lt( float64, float64 );
214flag float64_eq_signaling( float64, float64 );
215flag float64_le_quiet( float64, float64 );
216flag float64_lt_quiet( float64, float64 );
217flag float64_is_signaling_nan( float64 );
218
/* Everything up to the matching #endif is declared only when FLOATX80 is defined. */
#ifdef FLOATX80

/*
-------------------------------------------------------------------------------
Software IEC/IEEE extended double-precision conversion routines.

No unsigned integer conversions are declared for this format.
-------------------------------------------------------------------------------
*/
int floatx80_to_int32( floatx80 );
int floatx80_to_int32_round_to_zero( floatx80 );
long long floatx80_to_int64( floatx80 );
long long floatx80_to_int64_round_to_zero( floatx80 );
float32 floatx80_to_float32( floatx80 );
float64 floatx80_to_float64( floatx80 );
#ifdef FLOAT128
float128 floatx80_to_float128( floatx80 );
#endif

/*
-------------------------------------------------------------------------------
Software IEC/IEEE extended double-precision rounding precision.  Valid
values are 32, 64, and 80.
-------------------------------------------------------------------------------
*/
extern int floatx80_rounding_precision;

/*
-------------------------------------------------------------------------------
Software IEC/IEEE extended double-precision operations.

Arithmetic routines take and return `floatx80'; the comparison and
classification routines return `flag'.
-------------------------------------------------------------------------------
*/
floatx80 floatx80_round_to_int( floatx80 );
floatx80 floatx80_add( floatx80, floatx80 );
floatx80 floatx80_sub( floatx80, floatx80 );
floatx80 floatx80_mul( floatx80, floatx80 );
floatx80 floatx80_div( floatx80, floatx80 );
floatx80 floatx80_rem( floatx80, floatx80 );
floatx80 floatx80_sqrt( floatx80 );
flag floatx80_eq( floatx80, floatx80 );
flag floatx80_le( floatx80, floatx80 );
flag floatx80_lt( floatx80, floatx80 );
flag floatx80_eq_signaling( floatx80, floatx80 );
flag floatx80_le_quiet( floatx80, floatx80 );
flag floatx80_lt_quiet( floatx80, floatx80 );
flag floatx80_is_signaling_nan( floatx80 );

#endif /* FLOATX80 */

/* Everything up to the matching #endif is declared only when FLOAT128 is defined. */
#ifdef FLOAT128

/*
-------------------------------------------------------------------------------
Software IEC/IEEE quadruple-precision conversion routines.

The only unsigned integer conversion declared for this format is the
round-to-zero 64-bit one.
-------------------------------------------------------------------------------
*/
int float128_to_int32( float128 );
int float128_to_int32_round_to_zero( float128 );
long long float128_to_int64( float128 );
long long float128_to_int64_round_to_zero( float128 );
unsigned long long float128_to_uint64_round_to_zero( float128 );
float32 float128_to_float32( float128 );
float64 float128_to_float64( float128 );
#ifdef FLOATX80
floatx80 float128_to_floatx80( float128 );
#endif

/*
-------------------------------------------------------------------------------
Software IEC/IEEE quadruple-precision operations.

Arithmetic routines take and return `float128'; the comparison and
classification routines return `flag'.  `float128_is_nan' is declared for
this format only; the other formats in this header declare just the
`_is_signaling_nan' test.
-------------------------------------------------------------------------------
*/
float128 float128_round_to_int( float128 );
float128 float128_add( float128, float128 );
float128 float128_sub( float128, float128 );
float128 float128_mul( float128, float128 );
float128 float128_div( float128, float128 );
float128 float128_rem( float128, float128 );
float128 float128_sqrt( float128 );
flag float128_eq( float128, float128 );
flag float128_le( float128, float128 );
flag float128_lt( float128, float128 );
flag float128_eq_signaling( float128, float128 );
flag float128_le_quiet( float128, float128 );
flag float128_lt_quiet( float128, float128 );
flag float128_is_signaling_nan( float128 );
flag float128_is_nan( float128 );

#endif /* FLOAT128 */
