/*  $NetBSD: softfloat.h,v 1.10 2013/04/24 18:04:46 matt Exp $  */

/* This is a derivative work. */

/*
===============================================================================

This C header file is part of the SoftFloat IEC/IEEE Floating-point
Arithmetic Package, Release 2a.

Written by John R. Hauser.  This work was made possible in part by the
International Computer Science Institute, located at Suite 600, 1947 Center
Street, Berkeley, California 94704.  Funding was partially provided by the
National Science Foundation under grant MIP-9311980.  The original version
of this code was written as part of a project to build a fixed-point vector
processor in collaboration with the University of California at Berkeley,
overseen by Profs. Nelson Morgan and John Wawrzynek.  More information
is available through the Web page `http://HTTP.CS.Berkeley.EDU/~jhauser/
arithmetic/SoftFloat.html'.

THIS SOFTWARE IS DISTRIBUTED AS IS, FOR FREE.  Although reasonable effort
has been made to avoid it, THIS SOFTWARE MAY CONTAIN FAULTS THAT WILL AT
TIMES RESULT IN INCORRECT BEHAVIOR.  USE OF THIS SOFTWARE IS RESTRICTED TO
PERSONS AND ORGANIZATIONS WHO CAN AND WILL TAKE FULL RESPONSIBILITY FOR ANY
AND ALL LOSSES, COSTS, OR OTHER PROBLEMS ARISING FROM ITS USE.

Derivative works are acceptable, even for commercial purposes, so long as
(1) they include prominent notice that the work is derivative, and (2) they
include prominent notice akin to these four paragraphs for those parts of
this code that are retained.

===============================================================================
*/

/*
-------------------------------------------------------------------------------
The macro `FLOATX80' must be defined to enable the extended double-precision
floating-point format `floatx80'.  If this macro is not defined, the
`floatx80' type will not be defined, and none of the functions that either
input or output the `floatx80' type will be defined.  The same applies to
the `FLOAT128' macro and the quadruple-precision format `float128'.
-------------------------------------------------------------------------------
*/
/* #define FLOATX80 */
/* #define FLOAT128 */

/*
 * Exception flag bits.  Each flag occupies its own bit, so any combination
 * of them fits in a single fp_except value.
 */
#define FE_INVALID      0x01    /* invalid operation exception */
#define FE_DIVBYZERO    0x02    /* divide-by-zero exception */
#define FE_OVERFLOW     0x04    /* overflow exception */
#define FE_UNDERFLOW    0x08    /* underflow exception */
#define FE_INEXACT      0x10    /* imprecise (loss of precision; "inexact") */

/* All five exception bits above OR-ed together. */
#define FE_ALL_EXCEPT   0x1f

/* Rounding-direction codes; the fp_rnd enumerators below reuse these values. */
#define FE_TONEAREST    0   /* round to nearest representable number */
#define FE_UPWARD       1   /* round toward positive infinity */
#define FE_DOWNWARD     2   /* round toward negative infinity */
#define FE_TOWARDZERO   3   /* round to zero (truncate) */

/* Integer type that holds a set of exception flag bits. */
typedef int fp_except;

/* Bit defines for fp_except */

#define FP_X_INV    FE_INVALID      /* invalid operation exception */
#define FP_X_DZ     FE_DIVBYZERO    /* divide-by-zero exception */
#define FP_X_OFL    FE_OVERFLOW     /* overflow exception */
#define FP_X_UFL    FE_UNDERFLOW    /* underflow exception */
#define FP_X_IMP    FE_INEXACT      /* imprecise (prec. loss; "inexact") */

/* Rounding modes */

typedef enum {
    FP_RN=FE_TONEAREST,     /* round to nearest representable number */
    FP_RP=FE_UPWARD,        /* round toward positive infinity */
    FP_RM=FE_DOWNWARD,      /* round toward negative infinity */
    FP_RZ=FE_TOWARDZERO     /* round to zero (truncate) */
} fp_rnd;

/*
-------------------------------------------------------------------------------
Software IEC/IEEE floating-point types.
-------------------------------------------------------------------------------
*/
/*
 * Single- and double-precision values are held in plain unsigned integers
 * rather than in the compiler's native float/double types.
 * NOTE(review): the type names imply 32- and 64-bit storage, which assumes
 * `unsigned int' is 32 bits and `unsigned long long' is 64 bits on the
 * target -- confirm.
 */
typedef unsigned int float32;
typedef unsigned long long float64;
#ifdef FLOATX80
/*
 * Extended double-precision value; only declared when FLOATX80 is defined.
 * NOTE(review): presumably `high' carries the sign and exponent and `low'
 * the 64-bit significand -- confirm against the implementation.
 */
typedef struct {
    unsigned short high;
    unsigned long long low;
} floatx80;
#endif
#ifdef FLOAT128
/*
 * Quadruple-precision value; only declared when FLOAT128 is defined.
 * The value is split across two unsigned long long halves.
 * NOTE(review): presumably `high' is the most significant half -- confirm
 * against the implementation.
 */
typedef struct {
    unsigned long long high, low;
} float128;
#endif

/*
-------------------------------------------------------------------------------
Software IEC/IEEE floating-point underflow tininess-detection mode.
-------------------------------------------------------------------------------
*/
#ifndef SOFTFLOAT_FOR_GCC
/*
 * Not declared when SOFTFLOAT_FOR_GCC is defined.
 * NOTE(review): presumably holds one of the float_tininess_* values below --
 * confirm against the definition.
 */
extern int float_detect_tininess;
#endif
/* Tininess-detection mode values; declared in every configuration. */
enum {
    float_tininess_after_rounding  = 0,
    float_tininess_before_rounding = 1
};

111 /*
112 -------------------------------------------------------------------------------
113 Software IEC/IEEE floating-point rounding mode.
114 -------------------------------------------------------------------------------
115 */
116 extern fp_rnd float_rounding_mode;
117 #define float_round_nearest_even FP_RN
118 #define float_round_to_zero      FP_RZ
119 #define float_round_down         FP_RM
120 #define float_round_up           FP_RP
121 
122 /*
123 -------------------------------------------------------------------------------
124 Software IEC/IEEE floating-point exception flags.
125 -------------------------------------------------------------------------------
126 */
127 extern fp_except float_exception_flags;
128 extern fp_except float_exception_mask;
129 enum {
130     float_flag_inexact   = FP_X_IMP,
131     float_flag_underflow = FP_X_UFL,
132     float_flag_overflow  = FP_X_OFL,
133     float_flag_divbyzero = FP_X_DZ,
134     float_flag_invalid   = FP_X_INV
135 };
136 
/*
-------------------------------------------------------------------------------
Routine to raise any or all of the software IEC/IEEE floating-point
exception flags.
-------------------------------------------------------------------------------
*/
/* The argument is a set of exception bits (one or more float_flag_* values). */
void float_raise( fp_except );

145 /*
146 -------------------------------------------------------------------------------
147 Software IEC/IEEE integer-to-floating-point conversion routines.
148 -------------------------------------------------------------------------------
149 */
150 float32 int32_to_float32( int32 );
151 float32 uint32_to_float32( uint32 );
152 float64 int32_to_float64( int32 );
153 float64 uint32_to_float64( uint32 );
154 #ifdef FLOATX80
155 floatx80 int32_to_floatx80( int32 );
156 floatx80 uint32_to_floatx80( uint32 );
157 #endif
158 #ifdef FLOAT128
159 float128 int32_to_float128( int32 );
160 float128 uint32_to_float128( uint32 );
161 #endif
162 #ifndef SOFTFLOAT_FOR_GCC /* __floatdi?f is in libgcc2.c */
163 float32 int64_to_float32( long long );
164 float64 int64_to_float64( long long );
165 #ifdef FLOATX80
166 floatx80 int64_to_floatx80( long long );
167 #endif
168 #ifdef FLOAT128
169 float128 int64_to_float128( long long );
170 #endif
171 #endif
172 
173 /*
174 -------------------------------------------------------------------------------
175 Software IEC/IEEE single-precision conversion routines.
176 -------------------------------------------------------------------------------
177 */
178 int float32_to_int32( float32 );
179 int float32_to_int32_round_to_zero( float32 );
180 #if defined(SOFTFLOAT_FOR_GCC) && defined(SOFTFLOAT_NEED_FIXUNS)
181 unsigned int float32_to_uint32_round_to_zero( float32 );
182 #endif
183 #ifndef SOFTFLOAT_FOR_GCC /* __fix?fdi provided by libgcc2.c */
184 long long float32_to_int64( float32 );
185 long long float32_to_int64_round_to_zero( float32 );
186 #endif
187 float64 float32_to_float64( float32 );
188 #ifdef FLOATX80
189 floatx80 float32_to_floatx80( float32 );
190 #endif
191 #ifdef FLOAT128
192 float128 float32_to_float128( float32 );
193 #endif
194 
195 /*
196 -------------------------------------------------------------------------------
197 Software IEC/IEEE single-precision operations.
198 -------------------------------------------------------------------------------
199 */
200 float32 float32_round_to_int( float32 );
201 float32 float32_add( float32, float32 );
202 float32 float32_sub( float32, float32 );
203 float32 float32_mul( float32, float32 );
204 float32 float32_div( float32, float32 );
205 float32 float32_rem( float32, float32 );
206 float32 float32_sqrt( float32 );
207 int float32_eq( float32, float32 );
208 int float32_le( float32, float32 );
209 int float32_lt( float32, float32 );
210 int float32_eq_signaling( float32, float32 );
211 int float32_le_quiet( float32, float32 );
212 int float32_lt_quiet( float32, float32 );
213 #ifndef SOFTFLOAT_FOR_GCC
214 int float32_is_signaling_nan( float32 );
215 #endif
216 
217 /*
218 -------------------------------------------------------------------------------
219 Software IEC/IEEE double-precision conversion routines.
220 -------------------------------------------------------------------------------
221 */
222 int float64_to_int32( float64 );
223 int float64_to_int32_round_to_zero( float64 );
224 #if defined(SOFTFLOAT_FOR_GCC) && defined(SOFTFLOAT_NEED_FIXUNS)
225 unsigned int float64_to_uint32_round_to_zero( float64 );
226 #endif
227 #ifndef SOFTFLOAT_FOR_GCC /* __fix?fdi provided by libgcc2.c */
228 long long float64_to_int64( float64 );
229 long long float64_to_int64_round_to_zero( float64 );
230 #endif
231 float32 float64_to_float32( float64 );
232 #ifdef FLOATX80
233 floatx80 float64_to_floatx80( float64 );
234 #endif
235 #ifdef FLOAT128
236 float128 float64_to_float128( float64 );
237 #endif
238 
239 /*
240 -------------------------------------------------------------------------------
241 Software IEC/IEEE double-precision operations.
242 -------------------------------------------------------------------------------
243 */
244 float64 float64_round_to_int( float64 );
245 float64 float64_add( float64, float64 );
246 float64 float64_sub( float64, float64 );
247 float64 float64_mul( float64, float64 );
248 float64 float64_div( float64, float64 );
249 float64 float64_rem( float64, float64 );
250 float64 float64_sqrt( float64 );
251 int float64_eq( float64, float64 );
252 int float64_le( float64, float64 );
253 int float64_lt( float64, float64 );
254 int float64_eq_signaling( float64, float64 );
255 int float64_le_quiet( float64, float64 );
256 int float64_lt_quiet( float64, float64 );
257 #ifndef SOFTFLOAT_FOR_GCC
258 int float64_is_signaling_nan( float64 );
259 #endif
260 
/* Everything up to the matching #endif is declared only when FLOATX80 is defined. */
#ifdef FLOATX80

/*
-------------------------------------------------------------------------------
Software IEC/IEEE extended double-precision conversion routines.
-------------------------------------------------------------------------------
*/
/*
 * Conversions from floatx80 to integers and to the other floating-point
 * formats.  Unlike the float32/float64 sections, the 64-bit integer
 * conversions here are not conditional on SOFTFLOAT_FOR_GCC.
 */
int floatx80_to_int32( floatx80 );
int floatx80_to_int32_round_to_zero( floatx80 );
long long floatx80_to_int64( floatx80 );
long long floatx80_to_int64_round_to_zero( floatx80 );
float32 floatx80_to_float32( floatx80 );
float64 floatx80_to_float64( floatx80 );
#ifdef FLOAT128
float128 floatx80_to_float128( floatx80 );
#endif

/*
-------------------------------------------------------------------------------
Software IEC/IEEE extended double-precision rounding precision.  Valid
values are 32, 64, and 80.
-------------------------------------------------------------------------------
*/
extern int floatx80_rounding_precision;

/*
-------------------------------------------------------------------------------
Software IEC/IEEE extended double-precision operations.
-------------------------------------------------------------------------------
*/
/* Rounding and arithmetic: operands and results are floatx80 values. */
floatx80 floatx80_round_to_int( floatx80 );
floatx80 floatx80_add( floatx80, floatx80 );
floatx80 floatx80_sub( floatx80, floatx80 );
floatx80 floatx80_mul( floatx80, floatx80 );
floatx80 floatx80_div( floatx80, floatx80 );
floatx80 floatx80_rem( floatx80, floatx80 );
floatx80 floatx80_sqrt( floatx80 );
/*
 * Comparisons and the signaling-NaN test return an int.
 * NOTE(review): presumably nonzero means the relation holds -- confirm
 * against the SoftFloat documentation.
 */
int floatx80_eq( floatx80, floatx80 );
int floatx80_le( floatx80, floatx80 );
int floatx80_lt( floatx80, floatx80 );
int floatx80_eq_signaling( floatx80, floatx80 );
int floatx80_le_quiet( floatx80, floatx80 );
int floatx80_lt_quiet( floatx80, floatx80 );
int floatx80_is_signaling_nan( floatx80 );

#endif /* FLOATX80 */

/* Everything up to the matching #endif is declared only when FLOAT128 is defined. */
#ifdef FLOAT128

/*
-------------------------------------------------------------------------------
Software IEC/IEEE quadruple-precision conversion routines.
-------------------------------------------------------------------------------
*/
/*
 * Conversions from float128 to integers and to the other floating-point
 * formats.  Unlike the float32/float64 sections, the 64-bit integer
 * conversions here are not conditional on SOFTFLOAT_FOR_GCC.
 */
int float128_to_int32( float128 );
int float128_to_int32_round_to_zero( float128 );
long long float128_to_int64( float128 );
long long float128_to_int64_round_to_zero( float128 );
float32 float128_to_float32( float128 );
float64 float128_to_float64( float128 );
#ifdef FLOATX80
floatx80 float128_to_floatx80( float128 );
#endif

/*
-------------------------------------------------------------------------------
Software IEC/IEEE quadruple-precision operations.
-------------------------------------------------------------------------------
*/
/* Rounding and arithmetic: operands and results are float128 values. */
float128 float128_round_to_int( float128 );
float128 float128_add( float128, float128 );
float128 float128_sub( float128, float128 );
float128 float128_mul( float128, float128 );
float128 float128_div( float128, float128 );
float128 float128_rem( float128, float128 );
float128 float128_sqrt( float128 );
/*
 * Comparisons and the signaling-NaN test return an int.
 * NOTE(review): presumably nonzero means the relation holds -- confirm
 * against the SoftFloat documentation.
 */
int float128_eq( float128, float128 );
int float128_le( float128, float128 );
int float128_lt( float128, float128 );
int float128_eq_signaling( float128, float128 );
int float128_le_quiet( float128, float128 );
int float128_lt_quiet( float128, float128 );
int float128_is_signaling_nan( float128 );

#endif /* FLOAT128 */