1 /* $NetBSD: softfloat.h,v 1.10 2013/04/24 18:04:46 matt Exp $ */
3 /* This is a derivative work. */
6 ===============================================================================
8 This C header file is part of the SoftFloat IEC/IEEE Floating-point
9 Arithmetic Package, Release 2a.
11 Written by John R. Hauser. This work was made possible in part by the
12 International Computer Science Institute, located at Suite 600, 1947 Center
13 Street, Berkeley, California 94704. Funding was partially provided by the
14 National Science Foundation under grant MIP-9311980. The original version
15 of this code was written as part of a project to build a fixed-point vector
16 processor in collaboration with the University of California at Berkeley,
17 overseen by Profs. Nelson Morgan and John Wawrzynek. More information
18 is available through the Web page `http://HTTP.CS.Berkeley.EDU/~jhauser/
19 arithmetic/SoftFloat.html'.
21 THIS SOFTWARE IS DISTRIBUTED AS IS, FOR FREE. Although reasonable effort
22 has been made to avoid it, THIS SOFTWARE MAY CONTAIN FAULTS THAT WILL AT
23 TIMES RESULT IN INCORRECT BEHAVIOR. USE OF THIS SOFTWARE IS RESTRICTED TO
24 PERSONS AND ORGANIZATIONS WHO CAN AND WILL TAKE FULL RESPONSIBILITY FOR ANY
25 AND ALL LOSSES, COSTS, OR OTHER PROBLEMS ARISING FROM ITS USE.
27 Derivative works are acceptable, even for commercial purposes, so long as
28 (1) they include prominent notice that the work is derivative, and (2) they
29 include prominent notice akin to these four paragraphs for those parts of
30 this code that are retained.
32 ===============================================================================
36 -------------------------------------------------------------------------------
37 The macro `FLOATX80' must be defined to enable the extended double-precision
38 floating-point format `floatx80'. If this macro is not defined, the
39 `floatx80' type will not be defined, and none of the functions that either
40 input or output the `floatx80' type will be defined. The same applies to
41 the `FLOAT128' macro and the quadruple-precision format `float128'.
42 -------------------------------------------------------------------------------
44 /* #define FLOATX80 */
45 /* #define FLOAT128 */
/*
 * Exception flag bits.  Every FE_* flag below occupies its own bit, and
 * FE_ALL_EXCEPT (0x1f) is the bitwise OR of all five of them.
 */
47 #define FE_INVALID 0x01 /* invalid operation exception */
48 #define FE_DIVBYZERO 0x02 /* divide-by-zero exception */
49 #define FE_OVERFLOW 0x04 /* overflow exception */
50 #define FE_UNDERFLOW 0x08 /* underflow exception */
51 #define FE_INEXACT 0x10 /* imprecise (loss of precision; "inexact") */
53 #define FE_ALL_EXCEPT 0x1f
/*
 * Rounding-direction selectors, numbered 0 through 3.  These are plain
 * small integers, not bit flags, so they must not be OR-ed together.
 */
55 #define FE_TONEAREST 0 /* round to nearest representable number */
56 #define FE_UPWARD 1 /* round toward positive infinity */
57 #define FE_DOWNWARD 2 /* round toward negative infinity */
58 #define FE_TOWARDZERO 3 /* round to zero (truncate) */
/*
 * Integer type for exception values.  float_exception_flags,
 * float_exception_mask and the parameter of float_raise() are all
 * declared with this type further down.
 */
60 typedef int fp_except
;
62 /* Bit defines for fp_except */
/* Each FP_X_* name expands to the FE_* flag carrying the same description. */
64 #define FP_X_INV FE_INVALID /* invalid operation exception */
65 #define FP_X_DZ FE_DIVBYZERO /* divide-by-zero exception */
66 #define FP_X_OFL FE_OVERFLOW /* overflow exception */
67 #define FP_X_UFL FE_UNDERFLOW /* underflow exception */
68 #define FP_X_IMP FE_INEXACT /* imprecise (prec. loss; "inexact") */
/*
 * Rounding-mode enumerators; each one is assigned the FE_* selector with
 * the matching description.
 * NOTE(review): the lines that open and close the enclosing declaration
 * are not visible here.  Presumably this is the enumerator list of the
 * fp_rnd type used by float_rounding_mode -- confirm against the full
 * header.
 */
73 FP_RN
=FE_TONEAREST
, /* round to nearest representable number */
74 FP_RP
=FE_UPWARD
, /* round toward positive infinity */
75 FP_RM
=FE_DOWNWARD
, /* round toward negative infinity */
76 FP_RZ
=FE_TOWARDZERO
/* round to zero (truncate) */
80 -------------------------------------------------------------------------------
81 Software IEC/IEEE floating-point types.
82 -------------------------------------------------------------------------------
/*
 * The software floating-point values are carried in unsigned integer
 * types: float32 in an unsigned int, float64 in an unsigned long long.
 * NOTE(review): assumes unsigned int is 32 bits and unsigned long long is
 * 64 bits on every supported target -- confirm.
 */
84 typedef unsigned int float32
;
85 typedef unsigned long long float64
;
/*
 * NOTE(review): these are bare member declarations; the aggregate
 * declarations that enclose them are not visible in this view.  They
 * presumably belong to the floatx80 and float128 types used by the
 * prototypes further down -- confirm against the full header.
 */
89 unsigned long long low
;
94 unsigned long long high
, low
;
99 -------------------------------------------------------------------------------
100 Software IEC/IEEE floating-point underflow tininess-detection mode.
101 -------------------------------------------------------------------------------
/*
 * float_detect_tininess is declared under #ifndef SOFTFLOAT_FOR_GCC.
 * The two enumerators name its values: after-rounding is 0 and
 * before-rounding is 1.
 * NOTE(review): the matching #endif and the declaration enclosing the
 * enumerators are not visible in this view -- confirm where the
 * conditional ends.
 */
103 #ifndef SOFTFLOAT_FOR_GCC
104 extern int float_detect_tininess
;
107 float_tininess_after_rounding
= 0,
108 float_tininess_before_rounding
= 1
112 -------------------------------------------------------------------------------
113 Software IEC/IEEE floating-point rounding mode.
114 -------------------------------------------------------------------------------
/*
 * Global holding the current rounding mode, typed as fp_rnd.  The
 * float_round_* macros are alternative spellings of the FP_R* enumerators
 * and can be used interchangeably with them.
 */
116 extern fp_rnd float_rounding_mode
;
117 #define float_round_nearest_even FP_RN
118 #define float_round_to_zero FP_RZ
119 #define float_round_down FP_RM
120 #define float_round_up FP_RP
123 -------------------------------------------------------------------------------
124 Software IEC/IEEE floating-point exception flags.
125 -------------------------------------------------------------------------------
/*
 * Two fp_except globals: float_exception_flags and float_exception_mask.
 * NOTE(review): presumably the first accumulates raised exceptions and
 * the second selects which ones are acted upon -- confirm against the
 * implementation; only the declarations are visible here.
 */
127 extern fp_except float_exception_flags
;
128 extern fp_except float_exception_mask
;
/*
 * Each float_flag_* enumerator is assigned the FP_X_* bit of the same
 * meaning.
 * NOTE(review): the lines that open and close the enclosing declaration
 * are not visible in this view.
 */
130 float_flag_inexact
= FP_X_IMP
,
131 float_flag_underflow
= FP_X_UFL
,
132 float_flag_overflow
= FP_X_OFL
,
133 float_flag_divbyzero
= FP_X_DZ
,
134 float_flag_invalid
= FP_X_INV
138 -------------------------------------------------------------------------------
139 Routine to raise any or all of the software IEC/IEEE floating-point exception flags.
141 -------------------------------------------------------------------------------
/*
 * Takes a single fp_except value and returns nothing.
 * NOTE(review): presumably the argument is an OR of FP_X_* / float_flag_*
 * bits to raise -- confirm against the implementation.
 */
143 void float_raise( fp_except
);
146 -------------------------------------------------------------------------------
147 Software IEC/IEEE integer-to-floating-point conversion routines.
148 -------------------------------------------------------------------------------
/*
 * Prototypes named <source>_to_<result>: each takes one integer argument
 * (int32, uint32, or long long for the int64_* forms) and returns the
 * floating-point type named in the suffix.
 * The int32 and uint32 types are not declared in the visible part of this
 * header -- presumably they come from a header included before this one.
 * NOTE(review): the floatx80 / float128 variants are presumably wrapped in
 * FLOATX80 / FLOAT128 conditionals, as the note near the top of the file
 * describes; those preprocessor lines are not visible in this view.
 */
150 float32
int32_to_float32( int32
);
151 float32
uint32_to_float32( uint32
);
152 float64
int32_to_float64( int32
);
153 float64
uint32_to_float64( uint32
);
155 floatx80
int32_to_floatx80( int32
);
156 floatx80
uint32_to_floatx80( uint32
);
159 float128
int32_to_float128( int32
);
160 float128
uint32_to_float128( uint32
);
/*
 * The 64-bit integer conversions are only declared when SOFTFLOAT_FOR_GCC
 * is not defined.  NOTE(review): the matching #endif is not visible here.
 */
162 #ifndef SOFTFLOAT_FOR_GCC /* __floatdi?f is in libgcc2.c */
163 float32
int64_to_float32( long long );
164 float64
int64_to_float64( long long );
166 floatx80
int64_to_floatx80( long long );
169 float128
int64_to_float128( long long );
174 -------------------------------------------------------------------------------
175 Software IEC/IEEE single-precision conversion routines.
176 -------------------------------------------------------------------------------
/*
 * Conversions out of float32.  Every prototype takes one float32; the
 * result type is int, unsigned int, long long, float64, floatx80 or
 * float128 as named in the function suffix.
 * NOTE(review): the *_round_to_zero forms presumably truncate regardless
 * of float_rounding_mode while the plain forms honour it -- confirm
 * against the implementation.
 * NOTE(review): the #endif lines matching the two conditionals below, and
 * any FLOATX80 / FLOAT128 guards, are not visible in this view.
 */
178 int float32_to_int32( float32
);
179 int float32_to_int32_round_to_zero( float32
);
/* Unsigned conversion: declared only for GCC builds that request it. */
180 #if defined(SOFTFLOAT_FOR_GCC) && defined(SOFTFLOAT_NEED_FIXUNS)
181 unsigned int float32_to_uint32_round_to_zero( float32
);
183 #ifndef SOFTFLOAT_FOR_GCC /* __fix?fdi provided by libgcc2.c */
184 long long float32_to_int64( float32
);
185 long long float32_to_int64_round_to_zero( float32
);
187 float64
float32_to_float64( float32
);
189 floatx80
float32_to_floatx80( float32
);
192 float128
float32_to_float128( float32
);
196 -------------------------------------------------------------------------------
197 Software IEC/IEEE single-precision operations.
198 -------------------------------------------------------------------------------
/*
 * float32 operations.  round_to_int and sqrt take one float32 and return
 * a float32; add, sub, mul, div and rem take two float32 values and return
 * a float32; the comparison prototypes take two float32 values and return
 * an int.
 * NOTE(review): the plain eq/le/lt forms and their *_signaling / *_quiet
 * counterparts presumably differ only in when a NaN operand raises the
 * invalid exception -- confirm against the implementation.
 */
200 float32
float32_round_to_int( float32
);
201 float32
float32_add( float32
, float32
);
202 float32
float32_sub( float32
, float32
);
203 float32
float32_mul( float32
, float32
);
204 float32
float32_div( float32
, float32
);
205 float32
float32_rem( float32
, float32
);
206 float32
float32_sqrt( float32
);
207 int float32_eq( float32
, float32
);
208 int float32_le( float32
, float32
);
209 int float32_lt( float32
, float32
);
210 int float32_eq_signaling( float32
, float32
);
211 int float32_le_quiet( float32
, float32
);
212 int float32_lt_quiet( float32
, float32
);
/*
 * Declared only when SOFTFLOAT_FOR_GCC is not defined.
 * NOTE(review): the matching #endif is not visible in this view.
 */
213 #ifndef SOFTFLOAT_FOR_GCC
214 int float32_is_signaling_nan( float32
);
218 -------------------------------------------------------------------------------
219 Software IEC/IEEE double-precision conversion routines.
220 -------------------------------------------------------------------------------
/*
 * Conversions out of float64.  Every prototype takes one float64; the
 * result type is int, unsigned int, long long, float32, floatx80 or
 * float128 as named in the function suffix.  The layout mirrors the
 * float32 conversion prototypes, including the same two conditionals.
 * NOTE(review): the #endif lines matching the conditionals below, and any
 * FLOATX80 / FLOAT128 guards, are not visible in this view.
 */
222 int float64_to_int32( float64
);
223 int float64_to_int32_round_to_zero( float64
);
/* Unsigned conversion: declared only for GCC builds that request it. */
224 #if defined(SOFTFLOAT_FOR_GCC) && defined(SOFTFLOAT_NEED_FIXUNS)
225 unsigned int float64_to_uint32_round_to_zero( float64
);
227 #ifndef SOFTFLOAT_FOR_GCC /* __fix?fdi provided by libgcc2.c */
228 long long float64_to_int64( float64
);
229 long long float64_to_int64_round_to_zero( float64
);
231 float32
float64_to_float32( float64
);
233 floatx80
float64_to_floatx80( float64
);
236 float128
float64_to_float128( float64
);
240 -------------------------------------------------------------------------------
241 Software IEC/IEEE double-precision operations.
242 -------------------------------------------------------------------------------
/*
 * float64 operations, parallel to the float32 set: round_to_int and sqrt
 * take one float64; add, sub, mul, div and rem take two and return a
 * float64; the comparison prototypes take two float64 values and return
 * an int.
 * NOTE(review): the plain eq/le/lt forms and their *_signaling / *_quiet
 * counterparts presumably differ only in NaN exception behaviour --
 * confirm against the implementation.
 */
244 float64
float64_round_to_int( float64
);
245 float64
float64_add( float64
, float64
);
246 float64
float64_sub( float64
, float64
);
247 float64
float64_mul( float64
, float64
);
248 float64
float64_div( float64
, float64
);
249 float64
float64_rem( float64
, float64
);
250 float64
float64_sqrt( float64
);
251 int float64_eq( float64
, float64
);
252 int float64_le( float64
, float64
);
253 int float64_lt( float64
, float64
);
254 int float64_eq_signaling( float64
, float64
);
255 int float64_le_quiet( float64
, float64
);
256 int float64_lt_quiet( float64
, float64
);
/*
 * Declared only when SOFTFLOAT_FOR_GCC is not defined.
 * NOTE(review): the matching #endif is not visible in this view.
 */
257 #ifndef SOFTFLOAT_FOR_GCC
258 int float64_is_signaling_nan( float64
);
264 -------------------------------------------------------------------------------
265 Software IEC/IEEE extended double-precision conversion routines.
266 -------------------------------------------------------------------------------
/*
 * Conversions out of floatx80.  Every prototype takes one floatx80 by
 * value; the result type is int, long long, float32, float64 or float128
 * as named in the function suffix.
 * NOTE(review): per the note near the top of the file these are only
 * meant to exist when FLOATX80 is defined (and the float128 one when
 * FLOAT128 is too); the guarding preprocessor lines are not visible here.
 */
268 int floatx80_to_int32( floatx80
);
269 int floatx80_to_int32_round_to_zero( floatx80
);
270 long long floatx80_to_int64( floatx80
);
271 long long floatx80_to_int64_round_to_zero( floatx80
);
272 float32
floatx80_to_float32( floatx80
);
273 float64
floatx80_to_float64( floatx80
);
275 float128
floatx80_to_float128( floatx80
);
279 -------------------------------------------------------------------------------
280 Software IEC/IEEE extended double-precision rounding precision. Valid
281 values are 32, 64, and 80.
282 -------------------------------------------------------------------------------
/*
 * Global int selecting the rounding precision for floatx80 results.  The
 * section heading above lists 32, 64 and 80 as the valid values.
 */
284 extern int floatx80_rounding_precision
;
287 -------------------------------------------------------------------------------
288 Software IEC/IEEE extended double-precision operations.
289 -------------------------------------------------------------------------------
/*
 * floatx80 operations, parallel to the float32 / float64 sets:
 * round_to_int and sqrt take one floatx80; add, sub, mul, div and rem take
 * two and return a floatx80; the comparison prototypes and
 * is_signaling_nan return an int.  All operands are passed by value.
 * Unlike the float32 / float64 sets, is_signaling_nan has no
 * SOFTFLOAT_FOR_GCC conditional in front of it here.
 */
291 floatx80
floatx80_round_to_int( floatx80
);
292 floatx80
floatx80_add( floatx80
, floatx80
);
293 floatx80
floatx80_sub( floatx80
, floatx80
);
294 floatx80
floatx80_mul( floatx80
, floatx80
);
295 floatx80
floatx80_div( floatx80
, floatx80
);
296 floatx80
floatx80_rem( floatx80
, floatx80
);
297 floatx80
floatx80_sqrt( floatx80
);
298 int floatx80_eq( floatx80
, floatx80
);
299 int floatx80_le( floatx80
, floatx80
);
300 int floatx80_lt( floatx80
, floatx80
);
301 int floatx80_eq_signaling( floatx80
, floatx80
);
302 int floatx80_le_quiet( floatx80
, floatx80
);
303 int floatx80_lt_quiet( floatx80
, floatx80
);
304 int floatx80_is_signaling_nan( floatx80
);
311 -------------------------------------------------------------------------------
312 Software IEC/IEEE quadruple-precision conversion routines.
313 -------------------------------------------------------------------------------
/*
 * Conversions out of float128.  Every prototype takes one float128 by
 * value; the result type is int, long long, float32, float64 or floatx80
 * as named in the function suffix.
 * NOTE(review): per the note near the top of the file these are only
 * meant to exist when FLOAT128 is defined (and the floatx80 one when
 * FLOATX80 is too); the guarding preprocessor lines are not visible here.
 */
315 int float128_to_int32( float128
);
316 int float128_to_int32_round_to_zero( float128
);
317 long long float128_to_int64( float128
);
318 long long float128_to_int64_round_to_zero( float128
);
319 float32
float128_to_float32( float128
);
320 float64
float128_to_float64( float128
);
322 floatx80
float128_to_floatx80( float128
);
326 -------------------------------------------------------------------------------
327 Software IEC/IEEE quadruple-precision operations.
328 -------------------------------------------------------------------------------
/*
 * float128 operations, parallel to the other precisions: round_to_int and
 * sqrt take one float128; add, sub, mul, div and rem take two and return a
 * float128; the comparison prototypes and is_signaling_nan return an int.
 * All operands are passed by value.
 */
330 float128
float128_round_to_int( float128
);
331 float128
float128_add( float128
, float128
);
332 float128
float128_sub( float128
, float128
);
333 float128
float128_mul( float128
, float128
);
334 float128
float128_div( float128
, float128
);
335 float128
float128_rem( float128
, float128
);
336 float128
float128_sqrt( float128
);
337 int float128_eq( float128
, float128
);
338 int float128_le( float128
, float128
);
339 int float128_lt( float128
, float128
);
340 int float128_eq_signaling( float128
, float128
);
341 int float128_le_quiet( float128
, float128
);
342 int float128_lt_quiet( float128
, float128
);
343 int float128_is_signaling_nan( float128
);