comparison gcc/config/soft-fp/op-common.h @ 0:a06113de4d67

first commit
author kent <kent@cr.ie.u-ryukyu.ac.jp>
date Fri, 17 Jul 2009 14:47:48 +0900
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:a06113de4d67
1 /* Software floating-point emulation. Common operations.
2 Copyright (C) 1997,1998,1999,2006,2007 Free Software Foundation, Inc.
3 This file is part of the GNU C Library.
4 Contributed by Richard Henderson (rth@cygnus.com),
5 Jakub Jelinek (jj@ultra.linux.cz),
6 David S. Miller (davem@redhat.com) and
7 Peter Maydell (pmaydell@chiark.greenend.org.uk).
8
9 The GNU C Library is free software; you can redistribute it and/or
10 modify it under the terms of the GNU Lesser General Public
11 License as published by the Free Software Foundation; either
12 version 2.1 of the License, or (at your option) any later version.
13
14 In addition to the permissions in the GNU Lesser General Public
15 License, the Free Software Foundation gives you unlimited
16 permission to link the compiled version of this file into
17 combinations with other programs, and to distribute those
18 combinations without any restriction coming from the use of this
19 file. (The Lesser General Public License restrictions do apply in
20 other respects; for example, they cover modification of the file,
21 and distribution when not linked into a combine executable.)
22
23 The GNU C Library is distributed in the hope that it will be useful,
24 but WITHOUT ANY WARRANTY; without even the implied warranty of
25 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
26 Lesser General Public License for more details.
27
28 You should have received a copy of the GNU Lesser General Public
29 License along with the GNU C Library; if not, write to the Free
30 Software Foundation, 51 Franklin Street, Fifth Floor, Boston,
31 MA 02110-1301, USA. */
32
33 #define _FP_DECL(wc, X) \
34 _FP_I_TYPE X##_c __attribute__((unused)), X##_s, X##_e; \
35 _FP_FRAC_DECL_##wc(X)
36
37 /*
38 * Finish truely unpacking a native fp value by classifying the kind
39 * of fp value and normalizing both the exponent and the fraction.
40 */
41
42 #define _FP_UNPACK_CANONICAL(fs, wc, X) \
43 do { \
44 switch (X##_e) \
45 { \
46 default: \
47 _FP_FRAC_HIGH_RAW_##fs(X) |= _FP_IMPLBIT_##fs; \
48 _FP_FRAC_SLL_##wc(X, _FP_WORKBITS); \
49 X##_e -= _FP_EXPBIAS_##fs; \
50 X##_c = FP_CLS_NORMAL; \
51 break; \
52 \
53 case 0: \
54 if (_FP_FRAC_ZEROP_##wc(X)) \
55 X##_c = FP_CLS_ZERO; \
56 else \
57 { \
58 /* a denormalized number */ \
59 _FP_I_TYPE _shift; \
60 _FP_FRAC_CLZ_##wc(_shift, X); \
61 _shift -= _FP_FRACXBITS_##fs; \
62 _FP_FRAC_SLL_##wc(X, (_shift+_FP_WORKBITS)); \
63 X##_e -= _FP_EXPBIAS_##fs - 1 + _shift; \
64 X##_c = FP_CLS_NORMAL; \
65 FP_SET_EXCEPTION(FP_EX_DENORM); \
66 } \
67 break; \
68 \
69 case _FP_EXPMAX_##fs: \
70 if (_FP_FRAC_ZEROP_##wc(X)) \
71 X##_c = FP_CLS_INF; \
72 else \
73 { \
74 X##_c = FP_CLS_NAN; \
75 /* Check for signaling NaN */ \
76 if (!(_FP_FRAC_HIGH_RAW_##fs(X) & _FP_QNANBIT_##fs)) \
77 FP_SET_EXCEPTION(FP_EX_INVALID); \
78 } \
79 break; \
80 } \
81 } while (0)
82
83 /* Finish unpacking an fp value in semi-raw mode: the mantissa is
84 shifted by _FP_WORKBITS but the implicit MSB is not inserted and
85 other classification is not done. */
86 #define _FP_UNPACK_SEMIRAW(fs, wc, X) _FP_FRAC_SLL_##wc(X, _FP_WORKBITS)
87
88 /* A semi-raw value has overflowed to infinity. Adjust the mantissa
89 and exponent appropriately. */
90 #define _FP_OVERFLOW_SEMIRAW(fs, wc, X) \
91 do { \
92 if (FP_ROUNDMODE == FP_RND_NEAREST \
93 || (FP_ROUNDMODE == FP_RND_PINF && !X##_s) \
94 || (FP_ROUNDMODE == FP_RND_MINF && X##_s)) \
95 { \
96 X##_e = _FP_EXPMAX_##fs; \
97 _FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc); \
98 } \
99 else \
100 { \
101 X##_e = _FP_EXPMAX_##fs - 1; \
102 _FP_FRAC_SET_##wc(X, _FP_MAXFRAC_##wc); \
103 } \
104 FP_SET_EXCEPTION(FP_EX_INEXACT); \
105 FP_SET_EXCEPTION(FP_EX_OVERFLOW); \
106 } while (0)
107
108 /* Check for a semi-raw value being a signaling NaN and raise the
109 invalid exception if so. */
110 #define _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, X) \
111 do { \
112 if (X##_e == _FP_EXPMAX_##fs \
113 && !_FP_FRAC_ZEROP_##wc(X) \
114 && !(_FP_FRAC_HIGH_##fs(X) & _FP_QNANBIT_SH_##fs)) \
115 FP_SET_EXCEPTION(FP_EX_INVALID); \
116 } while (0)
117
118 /* Choose a NaN result from an operation on two semi-raw NaN
119 values. */
120 #define _FP_CHOOSENAN_SEMIRAW(fs, wc, R, X, Y, OP) \
121 do { \
122 /* _FP_CHOOSENAN expects raw values, so shift as required. */ \
123 _FP_FRAC_SRL_##wc(X, _FP_WORKBITS); \
124 _FP_FRAC_SRL_##wc(Y, _FP_WORKBITS); \
125 _FP_CHOOSENAN(fs, wc, R, X, Y, OP); \
126 _FP_FRAC_SLL_##wc(R, _FP_WORKBITS); \
127 } while (0)
128
129 /* Test whether a biased exponent is normal (not zero or maximum). */
130 #define _FP_EXP_NORMAL(fs, wc, X) (((X##_e + 1) & _FP_EXPMAX_##fs) > 1)
131
132 /* Prepare to pack an fp value in semi-raw mode: the mantissa is
133 rounded and shifted right, with the rounding possibly increasing
134 the exponent (including changing a finite value to infinity). */
135 #define _FP_PACK_SEMIRAW(fs, wc, X) \
136 do { \
137 _FP_ROUND(wc, X); \
138 if (_FP_FRAC_HIGH_##fs(X) \
139 & (_FP_OVERFLOW_##fs >> 1)) \
140 { \
141 _FP_FRAC_HIGH_##fs(X) &= ~(_FP_OVERFLOW_##fs >> 1); \
142 X##_e++; \
143 if (X##_e == _FP_EXPMAX_##fs) \
144 _FP_OVERFLOW_SEMIRAW(fs, wc, X); \
145 } \
146 _FP_FRAC_SRL_##wc(X, _FP_WORKBITS); \
147 if (!_FP_EXP_NORMAL(fs, wc, X) && !_FP_FRAC_ZEROP_##wc(X)) \
148 { \
149 if (X##_e == 0) \
150 FP_SET_EXCEPTION(FP_EX_UNDERFLOW); \
151 else \
152 { \
153 if (!_FP_KEEPNANFRACP) \
154 { \
155 _FP_FRAC_SET_##wc(X, _FP_NANFRAC_##fs); \
156 X##_s = _FP_NANSIGN_##fs; \
157 } \
158 else \
159 _FP_FRAC_HIGH_RAW_##fs(X) |= _FP_QNANBIT_##fs; \
160 } \
161 } \
162 } while (0)
163
164 /*
165 * Before packing the bits back into the native fp result, take care
166 * of such mundane things as rounding and overflow. Also, for some
167 * kinds of fp values, the original parts may not have been fully
168 * extracted -- but that is ok, we can regenerate them now.
169 */
170
171 #define _FP_PACK_CANONICAL(fs, wc, X) \
172 do { \
173 switch (X##_c) \
174 { \
175 case FP_CLS_NORMAL: \
176 X##_e += _FP_EXPBIAS_##fs; \
177 if (X##_e > 0) \
178 { \
179 _FP_ROUND(wc, X); \
180 if (_FP_FRAC_OVERP_##wc(fs, X)) \
181 { \
182 _FP_FRAC_CLEAR_OVERP_##wc(fs, X); \
183 X##_e++; \
184 } \
185 _FP_FRAC_SRL_##wc(X, _FP_WORKBITS); \
186 if (X##_e >= _FP_EXPMAX_##fs) \
187 { \
188 /* overflow */ \
189 switch (FP_ROUNDMODE) \
190 { \
191 case FP_RND_NEAREST: \
192 X##_c = FP_CLS_INF; \
193 break; \
194 case FP_RND_PINF: \
195 if (!X##_s) X##_c = FP_CLS_INF; \
196 break; \
197 case FP_RND_MINF: \
198 if (X##_s) X##_c = FP_CLS_INF; \
199 break; \
200 } \
201 if (X##_c == FP_CLS_INF) \
202 { \
203 /* Overflow to infinity */ \
204 X##_e = _FP_EXPMAX_##fs; \
205 _FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc); \
206 } \
207 else \
208 { \
209 /* Overflow to maximum normal */ \
210 X##_e = _FP_EXPMAX_##fs - 1; \
211 _FP_FRAC_SET_##wc(X, _FP_MAXFRAC_##wc); \
212 } \
213 FP_SET_EXCEPTION(FP_EX_OVERFLOW); \
214 FP_SET_EXCEPTION(FP_EX_INEXACT); \
215 } \
216 } \
217 else \
218 { \
219 /* we've got a denormalized number */ \
220 X##_e = -X##_e + 1; \
221 if (X##_e <= _FP_WFRACBITS_##fs) \
222 { \
223 _FP_FRAC_SRS_##wc(X, X##_e, _FP_WFRACBITS_##fs); \
224 _FP_ROUND(wc, X); \
225 if (_FP_FRAC_HIGH_##fs(X) \
226 & (_FP_OVERFLOW_##fs >> 1)) \
227 { \
228 X##_e = 1; \
229 _FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc); \
230 } \
231 else \
232 { \
233 X##_e = 0; \
234 _FP_FRAC_SRL_##wc(X, _FP_WORKBITS); \
235 FP_SET_EXCEPTION(FP_EX_UNDERFLOW); \
236 } \
237 } \
238 else \
239 { \
240 /* underflow to zero */ \
241 X##_e = 0; \
242 if (!_FP_FRAC_ZEROP_##wc(X)) \
243 { \
244 _FP_FRAC_SET_##wc(X, _FP_MINFRAC_##wc); \
245 _FP_ROUND(wc, X); \
246 _FP_FRAC_LOW_##wc(X) >>= (_FP_WORKBITS); \
247 } \
248 FP_SET_EXCEPTION(FP_EX_UNDERFLOW); \
249 } \
250 } \
251 break; \
252 \
253 case FP_CLS_ZERO: \
254 X##_e = 0; \
255 _FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc); \
256 break; \
257 \
258 case FP_CLS_INF: \
259 X##_e = _FP_EXPMAX_##fs; \
260 _FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc); \
261 break; \
262 \
263 case FP_CLS_NAN: \
264 X##_e = _FP_EXPMAX_##fs; \
265 if (!_FP_KEEPNANFRACP) \
266 { \
267 _FP_FRAC_SET_##wc(X, _FP_NANFRAC_##fs); \
268 X##_s = _FP_NANSIGN_##fs; \
269 } \
270 else \
271 _FP_FRAC_HIGH_RAW_##fs(X) |= _FP_QNANBIT_##fs; \
272 break; \
273 } \
274 } while (0)
275
276 /* This one accepts raw argument and not cooked, returns
277 * 1 if X is a signaling NaN.
278 */
279 #define _FP_ISSIGNAN(fs, wc, X) \
280 ({ \
281 int __ret = 0; \
282 if (X##_e == _FP_EXPMAX_##fs) \
283 { \
284 if (!_FP_FRAC_ZEROP_##wc(X) \
285 && !(_FP_FRAC_HIGH_RAW_##fs(X) & _FP_QNANBIT_##fs)) \
286 __ret = 1; \
287 } \
288 __ret; \
289 })
290
291
292
293
294
295 /* Addition on semi-raw values. */
296 #define _FP_ADD_INTERNAL(fs, wc, R, X, Y, OP) \
297 do { \
298 if (X##_s == Y##_s) \
299 { \
300 /* Addition. */ \
301 R##_s = X##_s; \
302 int ediff = X##_e - Y##_e; \
303 if (ediff > 0) \
304 { \
305 R##_e = X##_e; \
306 if (Y##_e == 0) \
307 { \
308 /* Y is zero or denormalized. */ \
309 if (_FP_FRAC_ZEROP_##wc(Y)) \
310 { \
311 _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, X); \
312 _FP_FRAC_COPY_##wc(R, X); \
313 goto add_done; \
314 } \
315 else \
316 { \
317 FP_SET_EXCEPTION(FP_EX_DENORM); \
318 ediff--; \
319 if (ediff == 0) \
320 { \
321 _FP_FRAC_ADD_##wc(R, X, Y); \
322 goto add3; \
323 } \
324 if (X##_e == _FP_EXPMAX_##fs) \
325 { \
326 _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, X); \
327 _FP_FRAC_COPY_##wc(R, X); \
328 goto add_done; \
329 } \
330 goto add1; \
331 } \
332 } \
333 else if (X##_e == _FP_EXPMAX_##fs) \
334 { \
335 /* X is NaN or Inf, Y is normal. */ \
336 _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, X); \
337 _FP_FRAC_COPY_##wc(R, X); \
338 goto add_done; \
339 } \
340 \
341 /* Insert implicit MSB of Y. */ \
342 _FP_FRAC_HIGH_##fs(Y) |= _FP_IMPLBIT_SH_##fs; \
343 \
344 add1: \
345 /* Shift the mantissa of Y to the right EDIFF steps; \
346 remember to account later for the implicit MSB of X. */ \
347 if (ediff <= _FP_WFRACBITS_##fs) \
348 _FP_FRAC_SRS_##wc(Y, ediff, _FP_WFRACBITS_##fs); \
349 else if (!_FP_FRAC_ZEROP_##wc(Y)) \
350 _FP_FRAC_SET_##wc(Y, _FP_MINFRAC_##wc); \
351 _FP_FRAC_ADD_##wc(R, X, Y); \
352 } \
353 else if (ediff < 0) \
354 { \
355 ediff = -ediff; \
356 R##_e = Y##_e; \
357 if (X##_e == 0) \
358 { \
359 /* X is zero or denormalized. */ \
360 if (_FP_FRAC_ZEROP_##wc(X)) \
361 { \
362 _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, Y); \
363 _FP_FRAC_COPY_##wc(R, Y); \
364 goto add_done; \
365 } \
366 else \
367 { \
368 FP_SET_EXCEPTION(FP_EX_DENORM); \
369 ediff--; \
370 if (ediff == 0) \
371 { \
372 _FP_FRAC_ADD_##wc(R, Y, X); \
373 goto add3; \
374 } \
375 if (Y##_e == _FP_EXPMAX_##fs) \
376 { \
377 _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, Y); \
378 _FP_FRAC_COPY_##wc(R, Y); \
379 goto add_done; \
380 } \
381 goto add2; \
382 } \
383 } \
384 else if (Y##_e == _FP_EXPMAX_##fs) \
385 { \
386 /* Y is NaN or Inf, X is normal. */ \
387 _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, Y); \
388 _FP_FRAC_COPY_##wc(R, Y); \
389 goto add_done; \
390 } \
391 \
392 /* Insert implicit MSB of X. */ \
393 _FP_FRAC_HIGH_##fs(X) |= _FP_IMPLBIT_SH_##fs; \
394 \
395 add2: \
396 /* Shift the mantissa of X to the right EDIFF steps; \
397 remember to account later for the implicit MSB of Y. */ \
398 if (ediff <= _FP_WFRACBITS_##fs) \
399 _FP_FRAC_SRS_##wc(X, ediff, _FP_WFRACBITS_##fs); \
400 else if (!_FP_FRAC_ZEROP_##wc(X)) \
401 _FP_FRAC_SET_##wc(X, _FP_MINFRAC_##wc); \
402 _FP_FRAC_ADD_##wc(R, Y, X); \
403 } \
404 else \
405 { \
406 /* ediff == 0. */ \
407 if (!_FP_EXP_NORMAL(fs, wc, X)) \
408 { \
409 if (X##_e == 0) \
410 { \
411 /* X and Y are zero or denormalized. */ \
412 R##_e = 0; \
413 if (_FP_FRAC_ZEROP_##wc(X)) \
414 { \
415 if (!_FP_FRAC_ZEROP_##wc(Y)) \
416 FP_SET_EXCEPTION(FP_EX_DENORM); \
417 _FP_FRAC_COPY_##wc(R, Y); \
418 goto add_done; \
419 } \
420 else if (_FP_FRAC_ZEROP_##wc(Y)) \
421 { \
422 FP_SET_EXCEPTION(FP_EX_DENORM); \
423 _FP_FRAC_COPY_##wc(R, X); \
424 goto add_done; \
425 } \
426 else \
427 { \
428 FP_SET_EXCEPTION(FP_EX_DENORM); \
429 _FP_FRAC_ADD_##wc(R, X, Y); \
430 if (_FP_FRAC_HIGH_##fs(R) & _FP_IMPLBIT_SH_##fs) \
431 { \
432 /* Normalized result. */ \
433 _FP_FRAC_HIGH_##fs(R) \
434 &= ~(_FP_W_TYPE)_FP_IMPLBIT_SH_##fs; \
435 R##_e = 1; \
436 } \
437 goto add_done; \
438 } \
439 } \
440 else \
441 { \
442 /* X and Y are NaN or Inf. */ \
443 _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, X); \
444 _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, Y); \
445 R##_e = _FP_EXPMAX_##fs; \
446 if (_FP_FRAC_ZEROP_##wc(X)) \
447 _FP_FRAC_COPY_##wc(R, Y); \
448 else if (_FP_FRAC_ZEROP_##wc(Y)) \
449 _FP_FRAC_COPY_##wc(R, X); \
450 else \
451 _FP_CHOOSENAN_SEMIRAW(fs, wc, R, X, Y, OP); \
452 goto add_done; \
453 } \
454 } \
455 /* The exponents of X and Y, both normal, are equal. The \
456 implicit MSBs will always add to increase the \
457 exponent. */ \
458 _FP_FRAC_ADD_##wc(R, X, Y); \
459 R##_e = X##_e + 1; \
460 _FP_FRAC_SRS_##wc(R, 1, _FP_WFRACBITS_##fs); \
461 if (R##_e == _FP_EXPMAX_##fs) \
462 /* Overflow to infinity (depending on rounding mode). */ \
463 _FP_OVERFLOW_SEMIRAW(fs, wc, R); \
464 goto add_done; \
465 } \
466 add3: \
467 if (_FP_FRAC_HIGH_##fs(R) & _FP_IMPLBIT_SH_##fs) \
468 { \
469 /* Overflow. */ \
470 _FP_FRAC_HIGH_##fs(R) &= ~(_FP_W_TYPE)_FP_IMPLBIT_SH_##fs; \
471 R##_e++; \
472 _FP_FRAC_SRS_##wc(R, 1, _FP_WFRACBITS_##fs); \
473 if (R##_e == _FP_EXPMAX_##fs) \
474 /* Overflow to infinity (depending on rounding mode). */ \
475 _FP_OVERFLOW_SEMIRAW(fs, wc, R); \
476 } \
477 add_done: ; \
478 } \
479 else \
480 { \
481 /* Subtraction. */ \
482 int ediff = X##_e - Y##_e; \
483 if (ediff > 0) \
484 { \
485 R##_e = X##_e; \
486 R##_s = X##_s; \
487 if (Y##_e == 0) \
488 { \
489 /* Y is zero or denormalized. */ \
490 if (_FP_FRAC_ZEROP_##wc(Y)) \
491 { \
492 _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, X); \
493 _FP_FRAC_COPY_##wc(R, X); \
494 goto sub_done; \
495 } \
496 else \
497 { \
498 FP_SET_EXCEPTION(FP_EX_DENORM); \
499 ediff--; \
500 if (ediff == 0) \
501 { \
502 _FP_FRAC_SUB_##wc(R, X, Y); \
503 goto sub3; \
504 } \
505 if (X##_e == _FP_EXPMAX_##fs) \
506 { \
507 _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, X); \
508 _FP_FRAC_COPY_##wc(R, X); \
509 goto sub_done; \
510 } \
511 goto sub1; \
512 } \
513 } \
514 else if (X##_e == _FP_EXPMAX_##fs) \
515 { \
516 /* X is NaN or Inf, Y is normal. */ \
517 _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, X); \
518 _FP_FRAC_COPY_##wc(R, X); \
519 goto sub_done; \
520 } \
521 \
522 /* Insert implicit MSB of Y. */ \
523 _FP_FRAC_HIGH_##fs(Y) |= _FP_IMPLBIT_SH_##fs; \
524 \
525 sub1: \
526 /* Shift the mantissa of Y to the right EDIFF steps; \
527 remember to account later for the implicit MSB of X. */ \
528 if (ediff <= _FP_WFRACBITS_##fs) \
529 _FP_FRAC_SRS_##wc(Y, ediff, _FP_WFRACBITS_##fs); \
530 else if (!_FP_FRAC_ZEROP_##wc(Y)) \
531 _FP_FRAC_SET_##wc(Y, _FP_MINFRAC_##wc); \
532 _FP_FRAC_SUB_##wc(R, X, Y); \
533 } \
534 else if (ediff < 0) \
535 { \
536 ediff = -ediff; \
537 R##_e = Y##_e; \
538 R##_s = Y##_s; \
539 if (X##_e == 0) \
540 { \
541 /* X is zero or denormalized. */ \
542 if (_FP_FRAC_ZEROP_##wc(X)) \
543 { \
544 _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, Y); \
545 _FP_FRAC_COPY_##wc(R, Y); \
546 goto sub_done; \
547 } \
548 else \
549 { \
550 FP_SET_EXCEPTION(FP_EX_DENORM); \
551 ediff--; \
552 if (ediff == 0) \
553 { \
554 _FP_FRAC_SUB_##wc(R, Y, X); \
555 goto sub3; \
556 } \
557 if (Y##_e == _FP_EXPMAX_##fs) \
558 { \
559 _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, Y); \
560 _FP_FRAC_COPY_##wc(R, Y); \
561 goto sub_done; \
562 } \
563 goto sub2; \
564 } \
565 } \
566 else if (Y##_e == _FP_EXPMAX_##fs) \
567 { \
568 /* Y is NaN or Inf, X is normal. */ \
569 _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, Y); \
570 _FP_FRAC_COPY_##wc(R, Y); \
571 goto sub_done; \
572 } \
573 \
574 /* Insert implicit MSB of X. */ \
575 _FP_FRAC_HIGH_##fs(X) |= _FP_IMPLBIT_SH_##fs; \
576 \
577 sub2: \
578 /* Shift the mantissa of X to the right EDIFF steps; \
579 remember to account later for the implicit MSB of Y. */ \
580 if (ediff <= _FP_WFRACBITS_##fs) \
581 _FP_FRAC_SRS_##wc(X, ediff, _FP_WFRACBITS_##fs); \
582 else if (!_FP_FRAC_ZEROP_##wc(X)) \
583 _FP_FRAC_SET_##wc(X, _FP_MINFRAC_##wc); \
584 _FP_FRAC_SUB_##wc(R, Y, X); \
585 } \
586 else \
587 { \
588 /* ediff == 0. */ \
589 if (!_FP_EXP_NORMAL(fs, wc, X)) \
590 { \
591 if (X##_e == 0) \
592 { \
593 /* X and Y are zero or denormalized. */ \
594 R##_e = 0; \
595 if (_FP_FRAC_ZEROP_##wc(X)) \
596 { \
597 _FP_FRAC_COPY_##wc(R, Y); \
598 if (_FP_FRAC_ZEROP_##wc(Y)) \
599 R##_s = (FP_ROUNDMODE == FP_RND_MINF); \
600 else \
601 { \
602 FP_SET_EXCEPTION(FP_EX_DENORM); \
603 R##_s = Y##_s; \
604 } \
605 goto sub_done; \
606 } \
607 else if (_FP_FRAC_ZEROP_##wc(Y)) \
608 { \
609 FP_SET_EXCEPTION(FP_EX_DENORM); \
610 _FP_FRAC_COPY_##wc(R, X); \
611 R##_s = X##_s; \
612 goto sub_done; \
613 } \
614 else \
615 { \
616 FP_SET_EXCEPTION(FP_EX_DENORM); \
617 _FP_FRAC_SUB_##wc(R, X, Y); \
618 R##_s = X##_s; \
619 if (_FP_FRAC_HIGH_##fs(R) & _FP_IMPLBIT_SH_##fs) \
620 { \
621 /* |X| < |Y|, negate result. */ \
622 _FP_FRAC_SUB_##wc(R, Y, X); \
623 R##_s = Y##_s; \
624 } \
625 else if (_FP_FRAC_ZEROP_##wc(R)) \
626 R##_s = (FP_ROUNDMODE == FP_RND_MINF); \
627 goto sub_done; \
628 } \
629 } \
630 else \
631 { \
632 /* X and Y are NaN or Inf, of opposite signs. */ \
633 _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, X); \
634 _FP_CHECK_SIGNAN_SEMIRAW(fs, wc, Y); \
635 R##_e = _FP_EXPMAX_##fs; \
636 if (_FP_FRAC_ZEROP_##wc(X)) \
637 { \
638 if (_FP_FRAC_ZEROP_##wc(Y)) \
639 { \
640 /* Inf - Inf. */ \
641 R##_s = _FP_NANSIGN_##fs; \
642 _FP_FRAC_SET_##wc(R, _FP_NANFRAC_##fs); \
643 _FP_FRAC_SLL_##wc(R, _FP_WORKBITS); \
644 FP_SET_EXCEPTION(FP_EX_INVALID); \
645 } \
646 else \
647 { \
648 /* Inf - NaN. */ \
649 R##_s = Y##_s; \
650 _FP_FRAC_COPY_##wc(R, Y); \
651 } \
652 } \
653 else \
654 { \
655 if (_FP_FRAC_ZEROP_##wc(Y)) \
656 { \
657 /* NaN - Inf. */ \
658 R##_s = X##_s; \
659 _FP_FRAC_COPY_##wc(R, X); \
660 } \
661 else \
662 { \
663 /* NaN - NaN. */ \
664 _FP_CHOOSENAN_SEMIRAW(fs, wc, R, X, Y, OP); \
665 } \
666 } \
667 goto sub_done; \
668 } \
669 } \
670 /* The exponents of X and Y, both normal, are equal. The \
671 implicit MSBs cancel. */ \
672 R##_e = X##_e; \
673 _FP_FRAC_SUB_##wc(R, X, Y); \
674 R##_s = X##_s; \
675 if (_FP_FRAC_HIGH_##fs(R) & _FP_IMPLBIT_SH_##fs) \
676 { \
677 /* |X| < |Y|, negate result. */ \
678 _FP_FRAC_SUB_##wc(R, Y, X); \
679 R##_s = Y##_s; \
680 } \
681 else if (_FP_FRAC_ZEROP_##wc(R)) \
682 { \
683 R##_e = 0; \
684 R##_s = (FP_ROUNDMODE == FP_RND_MINF); \
685 goto sub_done; \
686 } \
687 goto norm; \
688 } \
689 sub3: \
690 if (_FP_FRAC_HIGH_##fs(R) & _FP_IMPLBIT_SH_##fs) \
691 { \
692 int diff; \
693 /* Carry into most significant bit of larger one of X and Y, \
694 canceling it; renormalize. */ \
695 _FP_FRAC_HIGH_##fs(R) &= _FP_IMPLBIT_SH_##fs - 1; \
696 norm: \
697 _FP_FRAC_CLZ_##wc(diff, R); \
698 diff -= _FP_WFRACXBITS_##fs; \
699 _FP_FRAC_SLL_##wc(R, diff); \
700 if (R##_e <= diff) \
701 { \
702 /* R is denormalized. */ \
703 diff = diff - R##_e + 1; \
704 _FP_FRAC_SRS_##wc(R, diff, _FP_WFRACBITS_##fs); \
705 R##_e = 0; \
706 } \
707 else \
708 { \
709 R##_e -= diff; \
710 _FP_FRAC_HIGH_##fs(R) &= ~(_FP_W_TYPE)_FP_IMPLBIT_SH_##fs; \
711 } \
712 } \
713 sub_done: ; \
714 } \
715 } while (0)
716
717 #define _FP_ADD(fs, wc, R, X, Y) _FP_ADD_INTERNAL(fs, wc, R, X, Y, '+')
718 #define _FP_SUB(fs, wc, R, X, Y) \
719 do { \
720 if (!(Y##_e == _FP_EXPMAX_##fs && !_FP_FRAC_ZEROP_##wc(Y))) Y##_s ^= 1; \
721 _FP_ADD_INTERNAL(fs, wc, R, X, Y, '-'); \
722 } while (0)
723
724
725 /*
726 * Main negation routine. FIXME -- when we care about setting exception
727 * bits reliably, this will not do. We should examine all of the fp classes.
728 */
729
730 #define _FP_NEG(fs, wc, R, X) \
731 do { \
732 _FP_FRAC_COPY_##wc(R, X); \
733 R##_c = X##_c; \
734 R##_e = X##_e; \
735 R##_s = 1 ^ X##_s; \
736 } while (0)
737
738
739 /*
740 * Main multiplication routine. The input values should be cooked.
741 */
742
743 #define _FP_MUL(fs, wc, R, X, Y) \
744 do { \
745 R##_s = X##_s ^ Y##_s; \
746 switch (_FP_CLS_COMBINE(X##_c, Y##_c)) \
747 { \
748 case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_NORMAL): \
749 R##_c = FP_CLS_NORMAL; \
750 R##_e = X##_e + Y##_e + 1; \
751 \
752 _FP_MUL_MEAT_##fs(R,X,Y); \
753 \
754 if (_FP_FRAC_OVERP_##wc(fs, R)) \
755 _FP_FRAC_SRS_##wc(R, 1, _FP_WFRACBITS_##fs); \
756 else \
757 R##_e--; \
758 break; \
759 \
760 case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_NAN): \
761 _FP_CHOOSENAN(fs, wc, R, X, Y, '*'); \
762 break; \
763 \
764 case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_NORMAL): \
765 case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_INF): \
766 case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_ZERO): \
767 R##_s = X##_s; \
768 \
769 case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_INF): \
770 case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_NORMAL): \
771 case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_NORMAL): \
772 case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_ZERO): \
773 _FP_FRAC_COPY_##wc(R, X); \
774 R##_c = X##_c; \
775 break; \
776 \
777 case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_NAN): \
778 case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_NAN): \
779 case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_NAN): \
780 R##_s = Y##_s; \
781 \
782 case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_INF): \
783 case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_ZERO): \
784 _FP_FRAC_COPY_##wc(R, Y); \
785 R##_c = Y##_c; \
786 break; \
787 \
788 case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_ZERO): \
789 case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_INF): \
790 R##_s = _FP_NANSIGN_##fs; \
791 R##_c = FP_CLS_NAN; \
792 _FP_FRAC_SET_##wc(R, _FP_NANFRAC_##fs); \
793 FP_SET_EXCEPTION(FP_EX_INVALID); \
794 break; \
795 \
796 default: \
797 abort(); \
798 } \
799 } while (0)
800
801
802 /*
803 * Main division routine. The input values should be cooked.
804 */
805
806 #define _FP_DIV(fs, wc, R, X, Y) \
807 do { \
808 R##_s = X##_s ^ Y##_s; \
809 switch (_FP_CLS_COMBINE(X##_c, Y##_c)) \
810 { \
811 case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_NORMAL): \
812 R##_c = FP_CLS_NORMAL; \
813 R##_e = X##_e - Y##_e; \
814 \
815 _FP_DIV_MEAT_##fs(R,X,Y); \
816 break; \
817 \
818 case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_NAN): \
819 _FP_CHOOSENAN(fs, wc, R, X, Y, '/'); \
820 break; \
821 \
822 case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_NORMAL): \
823 case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_INF): \
824 case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_ZERO): \
825 R##_s = X##_s; \
826 _FP_FRAC_COPY_##wc(R, X); \
827 R##_c = X##_c; \
828 break; \
829 \
830 case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_NAN): \
831 case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_NAN): \
832 case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_NAN): \
833 R##_s = Y##_s; \
834 _FP_FRAC_COPY_##wc(R, Y); \
835 R##_c = Y##_c; \
836 break; \
837 \
838 case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_INF): \
839 case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_INF): \
840 case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_NORMAL): \
841 R##_c = FP_CLS_ZERO; \
842 break; \
843 \
844 case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_ZERO): \
845 FP_SET_EXCEPTION(FP_EX_DIVZERO); \
846 case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_ZERO): \
847 case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_NORMAL): \
848 R##_c = FP_CLS_INF; \
849 break; \
850 \
851 case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_INF): \
852 case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_ZERO): \
853 R##_s = _FP_NANSIGN_##fs; \
854 R##_c = FP_CLS_NAN; \
855 _FP_FRAC_SET_##wc(R, _FP_NANFRAC_##fs); \
856 FP_SET_EXCEPTION(FP_EX_INVALID); \
857 break; \
858 \
859 default: \
860 abort(); \
861 } \
862 } while (0)
863
864
865 /*
866 * Main differential comparison routine. The inputs should be raw not
867 * cooked. The return is -1,0,1 for normal values, 2 otherwise.
868 */
869
870 #define _FP_CMP(fs, wc, ret, X, Y, un) \
871 do { \
872 /* NANs are unordered */ \
873 if ((X##_e == _FP_EXPMAX_##fs && !_FP_FRAC_ZEROP_##wc(X)) \
874 || (Y##_e == _FP_EXPMAX_##fs && !_FP_FRAC_ZEROP_##wc(Y))) \
875 { \
876 ret = un; \
877 } \
878 else \
879 { \
880 int __is_zero_x; \
881 int __is_zero_y; \
882 \
883 __is_zero_x = (!X##_e && _FP_FRAC_ZEROP_##wc(X)) ? 1 : 0; \
884 __is_zero_y = (!Y##_e && _FP_FRAC_ZEROP_##wc(Y)) ? 1 : 0; \
885 \
886 if (__is_zero_x && __is_zero_y) \
887 ret = 0; \
888 else if (__is_zero_x) \
889 ret = Y##_s ? 1 : -1; \
890 else if (__is_zero_y) \
891 ret = X##_s ? -1 : 1; \
892 else if (X##_s != Y##_s) \
893 ret = X##_s ? -1 : 1; \
894 else if (X##_e > Y##_e) \
895 ret = X##_s ? -1 : 1; \
896 else if (X##_e < Y##_e) \
897 ret = X##_s ? 1 : -1; \
898 else if (_FP_FRAC_GT_##wc(X, Y)) \
899 ret = X##_s ? -1 : 1; \
900 else if (_FP_FRAC_GT_##wc(Y, X)) \
901 ret = X##_s ? 1 : -1; \
902 else \
903 ret = 0; \
904 } \
905 } while (0)
906
907
908 /* Simplification for strict equality. */
909
910 #define _FP_CMP_EQ(fs, wc, ret, X, Y) \
911 do { \
912 /* NANs are unordered */ \
913 if ((X##_e == _FP_EXPMAX_##fs && !_FP_FRAC_ZEROP_##wc(X)) \
914 || (Y##_e == _FP_EXPMAX_##fs && !_FP_FRAC_ZEROP_##wc(Y))) \
915 { \
916 ret = 1; \
917 } \
918 else \
919 { \
920 ret = !(X##_e == Y##_e \
921 && _FP_FRAC_EQ_##wc(X, Y) \
922 && (X##_s == Y##_s || (!X##_e && _FP_FRAC_ZEROP_##wc(X)))); \
923 } \
924 } while (0)
925
926 /* Version to test unordered. */
927
928 #define _FP_CMP_UNORD(fs, wc, ret, X, Y) \
929 do { \
930 ret = ((X##_e == _FP_EXPMAX_##fs && !_FP_FRAC_ZEROP_##wc(X)) \
931 || (Y##_e == _FP_EXPMAX_##fs && !_FP_FRAC_ZEROP_##wc(Y))); \
932 } while (0)
933
934 /*
935 * Main square root routine. The input value should be cooked.
936 */
937
938 #define _FP_SQRT(fs, wc, R, X) \
939 do { \
940 _FP_FRAC_DECL_##wc(T); _FP_FRAC_DECL_##wc(S); \
941 _FP_W_TYPE q; \
942 switch (X##_c) \
943 { \
944 case FP_CLS_NAN: \
945 _FP_FRAC_COPY_##wc(R, X); \
946 R##_s = X##_s; \
947 R##_c = FP_CLS_NAN; \
948 break; \
949 case FP_CLS_INF: \
950 if (X##_s) \
951 { \
952 R##_s = _FP_NANSIGN_##fs; \
953 R##_c = FP_CLS_NAN; /* NAN */ \
954 _FP_FRAC_SET_##wc(R, _FP_NANFRAC_##fs); \
955 FP_SET_EXCEPTION(FP_EX_INVALID); \
956 } \
957 else \
958 { \
959 R##_s = 0; \
960 R##_c = FP_CLS_INF; /* sqrt(+inf) = +inf */ \
961 } \
962 break; \
963 case FP_CLS_ZERO: \
964 R##_s = X##_s; \
965 R##_c = FP_CLS_ZERO; /* sqrt(+-0) = +-0 */ \
966 break; \
967 case FP_CLS_NORMAL: \
968 R##_s = 0; \
969 if (X##_s) \
970 { \
971 R##_c = FP_CLS_NAN; /* sNAN */ \
972 R##_s = _FP_NANSIGN_##fs; \
973 _FP_FRAC_SET_##wc(R, _FP_NANFRAC_##fs); \
974 FP_SET_EXCEPTION(FP_EX_INVALID); \
975 break; \
976 } \
977 R##_c = FP_CLS_NORMAL; \
978 if (X##_e & 1) \
979 _FP_FRAC_SLL_##wc(X, 1); \
980 R##_e = X##_e >> 1; \
981 _FP_FRAC_SET_##wc(S, _FP_ZEROFRAC_##wc); \
982 _FP_FRAC_SET_##wc(R, _FP_ZEROFRAC_##wc); \
983 q = _FP_OVERFLOW_##fs >> 1; \
984 _FP_SQRT_MEAT_##wc(R, S, T, X, q); \
985 } \
986 } while (0)
987
988 /*
989 * Convert from FP to integer. Input is raw.
990 */
991
992 /* RSIGNED can have following values:
993 * 0: the number is required to be 0..(2^rsize)-1, if not, NV is set plus
994 * the result is either 0 or (2^rsize)-1 depending on the sign in such
995 * case.
996 * 1: the number is required to be -(2^(rsize-1))..(2^(rsize-1))-1, if not,
997 * NV is set plus the result is either -(2^(rsize-1)) or (2^(rsize-1))-1
998 * depending on the sign in such case.
999 * -1: the number is required to be -(2^(rsize-1))..(2^rsize)-1, if not, NV is
1000 * set plus the result is either -(2^(rsize-1)) or (2^(rsize-1))-1
1001 * depending on the sign in such case.
1002 */
1003 #define _FP_TO_INT(fs, wc, r, X, rsize, rsigned) \
1004 do { \
1005 if (X##_e < _FP_EXPBIAS_##fs) \
1006 { \
1007 r = 0; \
1008 if (X##_e == 0) \
1009 { \
1010 if (!_FP_FRAC_ZEROP_##wc(X)) \
1011 { \
1012 FP_SET_EXCEPTION(FP_EX_INEXACT); \
1013 FP_SET_EXCEPTION(FP_EX_DENORM); \
1014 } \
1015 } \
1016 else \
1017 FP_SET_EXCEPTION(FP_EX_INEXACT); \
1018 } \
1019 else if (X##_e >= _FP_EXPBIAS_##fs + rsize - (rsigned > 0 || X##_s) \
1020 || (!rsigned && X##_s)) \
1021 { \
1022 /* Overflow or converting to the most negative integer. */ \
1023 if (rsigned) \
1024 { \
1025 r = 1; \
1026 r <<= rsize - 1; \
1027 r -= 1 - X##_s; \
1028 } else { \
1029 r = 0; \
1030 if (X##_s) \
1031 r = ~r; \
1032 } \
1033 \
1034 if (rsigned && X##_s && X##_e == _FP_EXPBIAS_##fs + rsize - 1) \
1035 { \
1036 /* Possibly converting to most negative integer; check the \
1037 mantissa. */ \
1038 int inexact = 0; \
1039 (void)((_FP_FRACBITS_##fs > rsize) \
1040 ? ({ _FP_FRAC_SRST_##wc(X, inexact, \
1041 _FP_FRACBITS_##fs - rsize, \
1042 _FP_FRACBITS_##fs); 0; }) \
1043 : 0); \
1044 if (!_FP_FRAC_ZEROP_##wc(X)) \
1045 FP_SET_EXCEPTION(FP_EX_INVALID); \
1046 else if (inexact) \
1047 FP_SET_EXCEPTION(FP_EX_INEXACT); \
1048 } \
1049 else \
1050 FP_SET_EXCEPTION(FP_EX_INVALID); \
1051 } \
1052 else \
1053 { \
1054 _FP_FRAC_HIGH_RAW_##fs(X) |= _FP_IMPLBIT_##fs; \
1055 if (X##_e >= _FP_EXPBIAS_##fs + _FP_FRACBITS_##fs - 1) \
1056 { \
1057 _FP_FRAC_ASSEMBLE_##wc(r, X, rsize); \
1058 r <<= X##_e - _FP_EXPBIAS_##fs - _FP_FRACBITS_##fs + 1; \
1059 } \
1060 else \
1061 { \
1062 int inexact; \
1063 _FP_FRAC_SRST_##wc(X, inexact, \
1064 (_FP_FRACBITS_##fs + _FP_EXPBIAS_##fs - 1 \
1065 - X##_e), \
1066 _FP_FRACBITS_##fs); \
1067 if (inexact) \
1068 FP_SET_EXCEPTION(FP_EX_INEXACT); \
1069 _FP_FRAC_ASSEMBLE_##wc(r, X, rsize); \
1070 } \
1071 if (rsigned && X##_s) \
1072 r = -r; \
1073 } \
1074 } while (0)
1075
1076 /* Convert integer to fp. Output is raw. RTYPE is unsigned even if
1077 input is signed. */
1078 #define _FP_FROM_INT(fs, wc, X, r, rsize, rtype) \
1079 do { \
1080 if (r) \
1081 { \
1082 rtype ur_; \
1083 \
1084 if ((X##_s = (r < 0))) \
1085 r = -(rtype)r; \
1086 \
1087 ur_ = (rtype) r; \
1088 (void)((rsize <= _FP_W_TYPE_SIZE) \
1089 ? ({ \
1090 int lz_; \
1091 __FP_CLZ(lz_, (_FP_W_TYPE)ur_); \
1092 X##_e = _FP_EXPBIAS_##fs + _FP_W_TYPE_SIZE - 1 - lz_; \
1093 }) \
1094 : ((rsize <= 2 * _FP_W_TYPE_SIZE) \
1095 ? ({ \
1096 int lz_; \
1097 __FP_CLZ_2(lz_, (_FP_W_TYPE)(ur_ >> _FP_W_TYPE_SIZE), \
1098 (_FP_W_TYPE)ur_); \
1099 X##_e = (_FP_EXPBIAS_##fs + 2 * _FP_W_TYPE_SIZE - 1 \
1100 - lz_); \
1101 }) \
1102 : (abort(), 0))); \
1103 \
1104 if (rsize - 1 + _FP_EXPBIAS_##fs >= _FP_EXPMAX_##fs \
1105 && X##_e >= _FP_EXPMAX_##fs) \
1106 { \
1107 /* Exponent too big; overflow to infinity. (May also \
1108 happen after rounding below.) */ \
1109 _FP_OVERFLOW_SEMIRAW(fs, wc, X); \
1110 goto pack_semiraw; \
1111 } \
1112 \
1113 if (rsize <= _FP_FRACBITS_##fs \
1114 || X##_e < _FP_EXPBIAS_##fs + _FP_FRACBITS_##fs) \
1115 { \
1116 /* Exactly representable; shift left. */ \
1117 _FP_FRAC_DISASSEMBLE_##wc(X, ur_, rsize); \
1118 _FP_FRAC_SLL_##wc(X, (_FP_EXPBIAS_##fs \
1119 + _FP_FRACBITS_##fs - 1 - X##_e)); \
1120 } \
1121 else \
1122 { \
1123 /* More bits in integer than in floating type; need to \
1124 round. */ \
1125 if (_FP_EXPBIAS_##fs + _FP_WFRACBITS_##fs - 1 < X##_e) \
1126 ur_ = ((ur_ >> (X##_e - _FP_EXPBIAS_##fs \
1127 - _FP_WFRACBITS_##fs + 1)) \
1128 | ((ur_ << (rsize - (X##_e - _FP_EXPBIAS_##fs \
1129 - _FP_WFRACBITS_##fs + 1))) \
1130 != 0)); \
1131 _FP_FRAC_DISASSEMBLE_##wc(X, ur_, rsize); \
1132 if ((_FP_EXPBIAS_##fs + _FP_WFRACBITS_##fs - 1 - X##_e) > 0) \
1133 _FP_FRAC_SLL_##wc(X, (_FP_EXPBIAS_##fs \
1134 + _FP_WFRACBITS_##fs - 1 - X##_e)); \
1135 _FP_FRAC_HIGH_##fs(X) &= ~(_FP_W_TYPE)_FP_IMPLBIT_SH_##fs; \
1136 pack_semiraw: \
1137 _FP_PACK_SEMIRAW(fs, wc, X); \
1138 } \
1139 } \
1140 else \
1141 { \
1142 X##_s = 0; \
1143 X##_e = 0; \
1144 _FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc); \
1145 } \
1146 } while (0)
1147
1148
1149 /* Extend from a narrower floating-point format to a wider one. Input
1150 and output are raw. */
1151 #define FP_EXTEND(dfs,sfs,dwc,swc,D,S) \
1152 do { \
1153 if (_FP_FRACBITS_##dfs < _FP_FRACBITS_##sfs \
1154 || (_FP_EXPMAX_##dfs - _FP_EXPBIAS_##dfs \
1155 < _FP_EXPMAX_##sfs - _FP_EXPBIAS_##sfs) \
1156 || (_FP_EXPBIAS_##dfs < _FP_EXPBIAS_##sfs + _FP_FRACBITS_##sfs - 1 \
1157 && _FP_EXPBIAS_##dfs != _FP_EXPBIAS_##sfs)) \
1158 abort(); \
1159 D##_s = S##_s; \
1160 _FP_FRAC_COPY_##dwc##_##swc(D, S); \
1161 if (_FP_EXP_NORMAL(sfs, swc, S)) \
1162 { \
1163 D##_e = S##_e + _FP_EXPBIAS_##dfs - _FP_EXPBIAS_##sfs; \
1164 _FP_FRAC_SLL_##dwc(D, (_FP_FRACBITS_##dfs - _FP_FRACBITS_##sfs)); \
1165 } \
1166 else \
1167 { \
1168 if (S##_e == 0) \
1169 { \
1170 if (_FP_FRAC_ZEROP_##swc(S)) \
1171 D##_e = 0; \
1172 else if (_FP_EXPBIAS_##dfs \
1173 < _FP_EXPBIAS_##sfs + _FP_FRACBITS_##sfs - 1) \
1174 { \
1175 FP_SET_EXCEPTION(FP_EX_DENORM); \
1176 _FP_FRAC_SLL_##dwc(D, (_FP_FRACBITS_##dfs \
1177 - _FP_FRACBITS_##sfs)); \
1178 D##_e = 0; \
1179 } \
1180 else \
1181 { \
1182 int _lz; \
1183 FP_SET_EXCEPTION(FP_EX_DENORM); \
1184 _FP_FRAC_CLZ_##swc(_lz, S); \
1185 _FP_FRAC_SLL_##dwc(D, \
1186 _lz + _FP_FRACBITS_##dfs \
1187 - _FP_FRACTBITS_##sfs); \
1188 D##_e = (_FP_EXPBIAS_##dfs - _FP_EXPBIAS_##sfs + 1 \
1189 + _FP_FRACXBITS_##sfs - _lz); \
1190 } \
1191 } \
1192 else \
1193 { \
1194 D##_e = _FP_EXPMAX_##dfs; \
1195 if (!_FP_FRAC_ZEROP_##swc(S)) \
1196 { \
1197 if (!(_FP_FRAC_HIGH_RAW_##sfs(S) & _FP_QNANBIT_##sfs)) \
1198 FP_SET_EXCEPTION(FP_EX_INVALID); \
1199 _FP_FRAC_SLL_##dwc(D, (_FP_FRACBITS_##dfs \
1200 - _FP_FRACBITS_##sfs)); \
1201 } \
1202 } \
1203 } \
1204 } while (0)
1205
1206 /* Truncate from a wider floating-point format to a narrower one.
1207 Input and output are semi-raw. */
1208 #define FP_TRUNC(dfs,sfs,dwc,swc,D,S) \
1209 do { \
1210 if (_FP_FRACBITS_##sfs < _FP_FRACBITS_##dfs \
1211 || (_FP_EXPBIAS_##sfs < _FP_EXPBIAS_##dfs + _FP_FRACBITS_##dfs - 1 \
1212 && _FP_EXPBIAS_##sfs != _FP_EXPBIAS_##dfs)) \
1213 abort(); \
1214 D##_s = S##_s; \
1215 if (_FP_EXP_NORMAL(sfs, swc, S)) \
1216 { \
1217 D##_e = S##_e + _FP_EXPBIAS_##dfs - _FP_EXPBIAS_##sfs; \
1218 if (D##_e >= _FP_EXPMAX_##dfs) \
1219 _FP_OVERFLOW_SEMIRAW(dfs, dwc, D); \
1220 else \
1221 { \
1222 if (D##_e <= 0) \
1223 { \
1224 if (D##_e < 1 - _FP_FRACBITS_##dfs) \
1225 { \
1226 _FP_FRAC_SET_##swc(S, _FP_ZEROFRAC_##swc); \
1227 _FP_FRAC_LOW_##swc(S) |= 1; \
1228 } \
1229 else \
1230 { \
1231 _FP_FRAC_HIGH_##sfs(S) |= _FP_IMPLBIT_SH_##sfs; \
1232 _FP_FRAC_SRS_##swc(S, (_FP_WFRACBITS_##sfs \
1233 - _FP_WFRACBITS_##dfs + 1 - D##_e), \
1234 _FP_WFRACBITS_##sfs); \
1235 } \
1236 D##_e = 0; \
1237 } \
1238 else \
1239 _FP_FRAC_SRS_##swc(S, (_FP_WFRACBITS_##sfs \
1240 - _FP_WFRACBITS_##dfs), \
1241 _FP_WFRACBITS_##sfs); \
1242 _FP_FRAC_COPY_##dwc##_##swc(D, S); \
1243 } \
1244 } \
1245 else \
1246 { \
1247 if (S##_e == 0) \
1248 { \
1249 D##_e = 0; \
1250 if (_FP_FRAC_ZEROP_##swc(S)) \
1251 _FP_FRAC_SET_##dwc(D, _FP_ZEROFRAC_##dwc); \
1252 else \
1253 { \
1254 FP_SET_EXCEPTION(FP_EX_DENORM); \
1255 if (_FP_EXPBIAS_##sfs \
1256 < _FP_EXPBIAS_##dfs + _FP_FRACBITS_##dfs - 1) \
1257 { \
1258 _FP_FRAC_SRS_##swc(S, (_FP_WFRACBITS_##sfs \
1259 - _FP_WFRACBITS_##dfs), \
1260 _FP_WFRACBITS_##sfs); \
1261 _FP_FRAC_COPY_##dwc##_##swc(D, S); \
1262 } \
1263 else \
1264 { \
1265 _FP_FRAC_SET_##dwc(D, _FP_ZEROFRAC_##dwc); \
1266 _FP_FRAC_LOW_##dwc(D) |= 1; \
1267 } \
1268 } \
1269 } \
1270 else \
1271 { \
1272 D##_e = _FP_EXPMAX_##dfs; \
1273 if (_FP_FRAC_ZEROP_##swc(S)) \
1274 _FP_FRAC_SET_##dwc(D, _FP_ZEROFRAC_##dwc); \
1275 else \
1276 { \
1277 _FP_CHECK_SIGNAN_SEMIRAW(sfs, swc, S); \
1278 _FP_FRAC_SRL_##swc(S, (_FP_WFRACBITS_##sfs \
1279 - _FP_WFRACBITS_##dfs)); \
1280 _FP_FRAC_COPY_##dwc##_##swc(D, S); \
1281 /* Semi-raw NaN must have all workbits cleared. */ \
1282 _FP_FRAC_LOW_##dwc(D) \
1283 &= ~(_FP_W_TYPE) ((1 << _FP_WORKBITS) - 1); \
1284 _FP_FRAC_HIGH_##dfs(D) |= _FP_QNANBIT_SH_##dfs; \
1285 } \
1286 } \
1287 } \
1288 } while (0)
1289
1290 /*
1291 * Helper primitives.
1292 */
1293
1294 /* Count leading zeros in a word. */
1295
1296 #ifndef __FP_CLZ
1297 /* GCC 3.4 and later provide the builtins for us. */
1298 #define __FP_CLZ(r, x) \
1299 do { \
1300 if (sizeof (_FP_W_TYPE) == sizeof (unsigned int)) \
1301 r = __builtin_clz (x); \
1302 else if (sizeof (_FP_W_TYPE) == sizeof (unsigned long)) \
1303 r = __builtin_clzl (x); \
1304 else if (sizeof (_FP_W_TYPE) == sizeof (unsigned long long)) \
1305 r = __builtin_clzll (x); \
1306 else \
1307 abort (); \
1308 } while (0)
1309 #endif /* ndef __FP_CLZ */
1310
1311 #define _FP_DIV_HELP_imm(q, r, n, d) \
1312 do { \
1313 q = n / d, r = n % d; \
1314 } while (0)
1315
1316
1317 /* A restoring bit-by-bit division primitive. */
1318
1319 #define _FP_DIV_MEAT_N_loop(fs, wc, R, X, Y) \
1320 do { \
1321 int count = _FP_WFRACBITS_##fs; \
1322 _FP_FRAC_DECL_##wc (u); \
1323 _FP_FRAC_DECL_##wc (v); \
1324 _FP_FRAC_COPY_##wc (u, X); \
1325 _FP_FRAC_COPY_##wc (v, Y); \
1326 _FP_FRAC_SET_##wc (R, _FP_ZEROFRAC_##wc); \
1327 /* Normalize U and V. */ \
1328 _FP_FRAC_SLL_##wc (u, _FP_WFRACXBITS_##fs); \
1329 _FP_FRAC_SLL_##wc (v, _FP_WFRACXBITS_##fs); \
1330 /* First round. Since the operands are normalized, either the \
1331 first or second bit will be set in the fraction. Produce a \
1332 normalized result by checking which and adjusting the loop \
1333 count and exponent accordingly. */ \
1334 if (_FP_FRAC_GE_1 (u, v)) \
1335 { \
1336 _FP_FRAC_SUB_##wc (u, u, v); \
1337 _FP_FRAC_LOW_##wc (R) |= 1; \
1338 count--; \
1339 } \
1340 else \
1341 R##_e--; \
1342 /* Subsequent rounds. */ \
1343 do { \
1344 int msb = (_FP_WS_TYPE) _FP_FRAC_HIGH_##wc (u) < 0; \
1345 _FP_FRAC_SLL_##wc (u, 1); \
1346 _FP_FRAC_SLL_##wc (R, 1); \
1347 if (msb || _FP_FRAC_GE_1 (u, v)) \
1348 { \
1349 _FP_FRAC_SUB_##wc (u, u, v); \
1350 _FP_FRAC_LOW_##wc (R) |= 1; \
1351 } \
1352 } while (--count > 0); \
1353 /* If there's anything left in U, the result is inexact. */ \
1354 _FP_FRAC_LOW_##wc (R) |= !_FP_FRAC_ZEROP_##wc (u); \
1355 } while (0)
1356
1357 #define _FP_DIV_MEAT_1_loop(fs, R, X, Y) _FP_DIV_MEAT_N_loop (fs, 1, R, X, Y)
1358 #define _FP_DIV_MEAT_2_loop(fs, R, X, Y) _FP_DIV_MEAT_N_loop (fs, 2, R, X, Y)
1359 #define _FP_DIV_MEAT_4_loop(fs, R, X, Y) _FP_DIV_MEAT_N_loop (fs, 4, R, X, Y)