annotate libgfortran/config/fpu-387.h @ 158:494b0b89df80 default tip

...
author Shinji KONO <kono@ie.u-ryukyu.ac.jp>
date Mon, 25 May 2020 18:13:55 +0900
parents 1830386684a0
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
111
kono
parents:
diff changeset
1 /* FPU-related code for x86 and x86_64 processors.
145
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
2 Copyright (C) 2005-2020 Free Software Foundation, Inc.
111
kono
parents:
diff changeset
3 Contributed by Francois-Xavier Coudert <coudert@clipper.ens.fr>
kono
parents:
diff changeset
4
kono
parents:
diff changeset
5 This file is part of the GNU Fortran 95 runtime library (libgfortran).
kono
parents:
diff changeset
6
kono
parents:
diff changeset
7 Libgfortran is free software; you can redistribute it and/or
kono
parents:
diff changeset
8 modify it under the terms of the GNU General Public
kono
parents:
diff changeset
9 License as published by the Free Software Foundation; either
kono
parents:
diff changeset
10 version 3 of the License, or (at your option) any later version.
kono
parents:
diff changeset
11
kono
parents:
diff changeset
12 Libgfortran is distributed in the hope that it will be useful,
kono
parents:
diff changeset
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
kono
parents:
diff changeset
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
kono
parents:
diff changeset
15 GNU General Public License for more details.
kono
parents:
diff changeset
16
kono
parents:
diff changeset
17 Under Section 7 of GPL version 3, you are granted additional
kono
parents:
diff changeset
18 permissions described in the GCC Runtime Library Exception, version
kono
parents:
diff changeset
19 3.1, as published by the Free Software Foundation.
kono
parents:
diff changeset
20
kono
parents:
diff changeset
21 You should have received a copy of the GNU General Public License and
kono
parents:
diff changeset
22 a copy of the GCC Runtime Library Exception along with this program;
kono
parents:
diff changeset
23 see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
kono
parents:
diff changeset
24 <http://www.gnu.org/licenses/>. */
kono
parents:
diff changeset
25
kono
parents:
diff changeset
26 #ifndef __SSE_MATH__
kono
parents:
diff changeset
27 #include "cpuid.h"
kono
parents:
diff changeset
28 #endif
kono
parents:
diff changeset
29
kono
parents:
diff changeset
/* Report whether SSE can be used.

   When the translation unit is compiled with SSE math (__SSE_MATH__ is
   defined) the answer is unconditionally 1.  Otherwise CPUID leaf 1 is
   queried: the function returns 0 if __get_cpuid reports failure, and
   the bit_SSE bit of EDX (nonzero when set) otherwise.  */
static int
has_sse (void)
{
#ifdef __SSE_MATH__
  return 1;
#else
  unsigned int eax, ebx, ecx, edx;

  if (__get_cpuid (1, &eax, &ebx, &ecx, &edx))
    return edx & bit_SSE;

  return 0;
#endif
}
kono
parents:
diff changeset
44
kono
parents:
diff changeset
/* i387 exception bits -- see linux <fpu_control.h> header file for
   details.  This file uses the same six bits both as trap masks in the
   x87 control word and as raised-exception flags in the x87 status
   word; the corresponding MXCSR mask bits sit 7 positions higher.  */
#define _FPU_MASK_IM  0x01	/* Invalid operation.  */
#define _FPU_MASK_DM  0x02	/* Denormal operand.  */
#define _FPU_MASK_ZM  0x04	/* Division by zero.  */
#define _FPU_MASK_OM  0x08	/* Overflow.  */
#define _FPU_MASK_UM  0x10	/* Underflow.  */
#define _FPU_MASK_PM  0x20	/* Inexact (precision).  */
#define _FPU_MASK_ALL 0x3f	/* All six mask bits.  */

/* All six exception flag bits.  */
#define _FPU_EX_ALL   0x3f

/* i387 rounding modes: values of the two-bit rounding-control field.
   The field is placed at bit 10 of the x87 control word and at bit 13
   of MXCSR by the rounding-mode routines in this file.  */

#define _FPU_RC_NEAREST 0x0
#define _FPU_RC_DOWN    0x1
#define _FPU_RC_UP      0x2
#define _FPU_RC_ZERO    0x3

/* Width mask of the (unshifted) rounding-control field.  */
#define _FPU_RC_MASK    0x3

/* MXCSR bit that enables flush to zero mode.  */

#define MXCSR_FTZ (1 << 15)
kono
parents:
diff changeset
68
kono
parents:
diff changeset
69
kono
parents:
diff changeset
/* Image of the environment block written by FSTENV, with one trailing
   word (__mxcsr) in which get_fpu_state additionally stores the SSE
   MXCSR register.  The field order and sizes must not be changed: the
   structure is used directly as the memory operand of fnstenv/fldenv.  */
typedef struct
{
  unsigned short __control_word;	/* x87 control word.  */
  unsigned short __unused1;
  unsigned short __status_word;		/* x87 status word.  */
  unsigned short __unused2;
  unsigned short __tags;
  unsigned short __unused3;
  unsigned int __eip;
  unsigned short __cs_selector;
  unsigned short __opcode;
  unsigned int __data_offset;
  unsigned short __data_selector;
  unsigned short __unused5;
  unsigned int __mxcsr;			/* Not part of the FSTENV image.  */
}
my_fenv_t;
kono
parents:
diff changeset
89
kono
parents:
diff changeset
90 /* Check we can actually store the FPU state in the allocated size. */
kono
parents:
diff changeset
91 _Static_assert (sizeof(my_fenv_t) <= (size_t) GFC_FPE_STATE_BUFFER_SIZE,
kono
parents:
diff changeset
92 "GFC_FPE_STATE_BUFFER_SIZE is too small");
kono
parents:
diff changeset
93
kono
parents:
diff changeset
94
kono
parents:
diff changeset
95 /* Raise the supported floating-point exceptions from EXCEPTS. Other
kono
parents:
diff changeset
96 bits in EXCEPTS are ignored. Code originally borrowed from
kono
parents:
diff changeset
97 libatomic/config/x86/fenv.c. */
kono
parents:
diff changeset
98
kono
parents:
diff changeset
99 static void
kono
parents:
diff changeset
100 local_feraiseexcept (int excepts)
kono
parents:
diff changeset
101 {
kono
parents:
diff changeset
102 if (excepts & _FPU_MASK_IM)
kono
parents:
diff changeset
103 {
kono
parents:
diff changeset
104 float f = 0.0f;
kono
parents:
diff changeset
105 #ifdef __SSE_MATH__
kono
parents:
diff changeset
106 volatile float r __attribute__ ((unused));
kono
parents:
diff changeset
107 __asm__ __volatile__ ("%vdivss\t{%0, %d0|%d0, %0}" : "+x" (f));
kono
parents:
diff changeset
108 r = f; /* Needed to trigger exception. */
kono
parents:
diff changeset
109 #else
kono
parents:
diff changeset
110 __asm__ __volatile__ ("fdiv\t{%y0, %0|%0, %y0}" : "+t" (f));
kono
parents:
diff changeset
111 /* No need for fwait, exception is triggered by emitted fstp. */
kono
parents:
diff changeset
112 #endif
kono
parents:
diff changeset
113 }
kono
parents:
diff changeset
114 if (excepts & _FPU_MASK_DM)
kono
parents:
diff changeset
115 {
kono
parents:
diff changeset
116 my_fenv_t temp;
kono
parents:
diff changeset
117 __asm__ __volatile__ ("fnstenv\t%0" : "=m" (temp));
kono
parents:
diff changeset
118 temp.__status_word |= _FPU_MASK_DM;
kono
parents:
diff changeset
119 __asm__ __volatile__ ("fldenv\t%0" : : "m" (temp));
kono
parents:
diff changeset
120 __asm__ __volatile__ ("fwait");
kono
parents:
diff changeset
121 }
kono
parents:
diff changeset
122 if (excepts & _FPU_MASK_ZM)
kono
parents:
diff changeset
123 {
kono
parents:
diff changeset
124 float f = 1.0f, g = 0.0f;
kono
parents:
diff changeset
125 #ifdef __SSE_MATH__
kono
parents:
diff changeset
126 volatile float r __attribute__ ((unused));
kono
parents:
diff changeset
127 __asm__ __volatile__ ("%vdivss\t{%1, %d0|%d0, %1}" : "+x" (f) : "xm" (g));
kono
parents:
diff changeset
128 r = f; /* Needed to trigger exception. */
kono
parents:
diff changeset
129 #else
kono
parents:
diff changeset
130 __asm__ __volatile__ ("fdivs\t%1" : "+t" (f) : "m" (g));
kono
parents:
diff changeset
131 /* No need for fwait, exception is triggered by emitted fstp. */
kono
parents:
diff changeset
132 #endif
kono
parents:
diff changeset
133 }
kono
parents:
diff changeset
134 if (excepts & _FPU_MASK_OM)
kono
parents:
diff changeset
135 {
kono
parents:
diff changeset
136 my_fenv_t temp;
kono
parents:
diff changeset
137 __asm__ __volatile__ ("fnstenv\t%0" : "=m" (temp));
kono
parents:
diff changeset
138 temp.__status_word |= _FPU_MASK_OM;
kono
parents:
diff changeset
139 __asm__ __volatile__ ("fldenv\t%0" : : "m" (temp));
kono
parents:
diff changeset
140 __asm__ __volatile__ ("fwait");
kono
parents:
diff changeset
141 }
kono
parents:
diff changeset
142 if (excepts & _FPU_MASK_UM)
kono
parents:
diff changeset
143 {
kono
parents:
diff changeset
144 my_fenv_t temp;
kono
parents:
diff changeset
145 __asm__ __volatile__ ("fnstenv\t%0" : "=m" (temp));
kono
parents:
diff changeset
146 temp.__status_word |= _FPU_MASK_UM;
kono
parents:
diff changeset
147 __asm__ __volatile__ ("fldenv\t%0" : : "m" (temp));
kono
parents:
diff changeset
148 __asm__ __volatile__ ("fwait");
kono
parents:
diff changeset
149 }
kono
parents:
diff changeset
150 if (excepts & _FPU_MASK_PM)
kono
parents:
diff changeset
151 {
kono
parents:
diff changeset
152 float f = 1.0f, g = 3.0f;
kono
parents:
diff changeset
153 #ifdef __SSE_MATH__
kono
parents:
diff changeset
154 volatile float r __attribute__ ((unused));
kono
parents:
diff changeset
155 __asm__ __volatile__ ("%vdivss\t{%1, %d0|%d0, %1}" : "+x" (f) : "xm" (g));
kono
parents:
diff changeset
156 r = f; /* Needed to trigger exception. */
kono
parents:
diff changeset
157 #else
kono
parents:
diff changeset
158 __asm__ __volatile__ ("fdivs\t%1" : "+t" (f) : "m" (g));
kono
parents:
diff changeset
159 /* No need for fwait, exception is triggered by emitted fstp. */
kono
parents:
diff changeset
160 #endif
kono
parents:
diff changeset
161 }
kono
parents:
diff changeset
162 }
kono
parents:
diff changeset
163
kono
parents:
diff changeset
164
kono
parents:
diff changeset
165 void
kono
parents:
diff changeset
166 set_fpu_trap_exceptions (int trap, int notrap)
kono
parents:
diff changeset
167 {
kono
parents:
diff changeset
168 int exc_set = 0, exc_clr = 0;
kono
parents:
diff changeset
169 unsigned short cw;
kono
parents:
diff changeset
170
kono
parents:
diff changeset
171 if (trap & GFC_FPE_INVALID) exc_set |= _FPU_MASK_IM;
kono
parents:
diff changeset
172 if (trap & GFC_FPE_DENORMAL) exc_set |= _FPU_MASK_DM;
kono
parents:
diff changeset
173 if (trap & GFC_FPE_ZERO) exc_set |= _FPU_MASK_ZM;
kono
parents:
diff changeset
174 if (trap & GFC_FPE_OVERFLOW) exc_set |= _FPU_MASK_OM;
kono
parents:
diff changeset
175 if (trap & GFC_FPE_UNDERFLOW) exc_set |= _FPU_MASK_UM;
kono
parents:
diff changeset
176 if (trap & GFC_FPE_INEXACT) exc_set |= _FPU_MASK_PM;
kono
parents:
diff changeset
177
kono
parents:
diff changeset
178 if (notrap & GFC_FPE_INVALID) exc_clr |= _FPU_MASK_IM;
kono
parents:
diff changeset
179 if (notrap & GFC_FPE_DENORMAL) exc_clr |= _FPU_MASK_DM;
kono
parents:
diff changeset
180 if (notrap & GFC_FPE_ZERO) exc_clr |= _FPU_MASK_ZM;
kono
parents:
diff changeset
181 if (notrap & GFC_FPE_OVERFLOW) exc_clr |= _FPU_MASK_OM;
kono
parents:
diff changeset
182 if (notrap & GFC_FPE_UNDERFLOW) exc_clr |= _FPU_MASK_UM;
kono
parents:
diff changeset
183 if (notrap & GFC_FPE_INEXACT) exc_clr |= _FPU_MASK_PM;
kono
parents:
diff changeset
184
kono
parents:
diff changeset
185 __asm__ __volatile__ ("fstcw\t%0" : "=m" (cw));
kono
parents:
diff changeset
186
kono
parents:
diff changeset
187 cw |= exc_clr;
kono
parents:
diff changeset
188 cw &= ~exc_set;
kono
parents:
diff changeset
189
kono
parents:
diff changeset
190 __asm__ __volatile__ ("fnclex\n\tfldcw\t%0" : : "m" (cw));
kono
parents:
diff changeset
191
kono
parents:
diff changeset
192 if (has_sse())
kono
parents:
diff changeset
193 {
kono
parents:
diff changeset
194 unsigned int cw_sse;
kono
parents:
diff changeset
195
kono
parents:
diff changeset
196 __asm__ __volatile__ ("%vstmxcsr\t%0" : "=m" (cw_sse));
kono
parents:
diff changeset
197
kono
parents:
diff changeset
198 /* The SSE exception masks are shifted by 7 bits. */
kono
parents:
diff changeset
199 cw_sse |= (exc_clr << 7);
kono
parents:
diff changeset
200 cw_sse &= ~(exc_set << 7);
kono
parents:
diff changeset
201
kono
parents:
diff changeset
202 /* Clear stalled exception flags. */
kono
parents:
diff changeset
203 cw_sse &= ~_FPU_EX_ALL;
kono
parents:
diff changeset
204
kono
parents:
diff changeset
205 __asm__ __volatile__ ("%vldmxcsr\t%0" : : "m" (cw_sse));
kono
parents:
diff changeset
206 }
kono
parents:
diff changeset
207 }
kono
parents:
diff changeset
208
kono
parents:
diff changeset
209 void
kono
parents:
diff changeset
210 set_fpu (void)
kono
parents:
diff changeset
211 {
kono
parents:
diff changeset
212 set_fpu_trap_exceptions (options.fpe, 0);
kono
parents:
diff changeset
213 }
kono
parents:
diff changeset
214
kono
parents:
diff changeset
215 int
kono
parents:
diff changeset
216 get_fpu_trap_exceptions (void)
kono
parents:
diff changeset
217 {
kono
parents:
diff changeset
218 unsigned short cw;
kono
parents:
diff changeset
219 int mask;
kono
parents:
diff changeset
220 int res = 0;
kono
parents:
diff changeset
221
kono
parents:
diff changeset
222 __asm__ __volatile__ ("fstcw\t%0" : "=m" (cw));
kono
parents:
diff changeset
223 mask = cw;
kono
parents:
diff changeset
224
kono
parents:
diff changeset
225 if (has_sse())
kono
parents:
diff changeset
226 {
kono
parents:
diff changeset
227 unsigned int cw_sse;
kono
parents:
diff changeset
228
kono
parents:
diff changeset
229 __asm__ __volatile__ ("%vstmxcsr\t%0" : "=m" (cw_sse));
kono
parents:
diff changeset
230
kono
parents:
diff changeset
231 /* The SSE exception masks are shifted by 7 bits. */
kono
parents:
diff changeset
232 mask |= (cw_sse >> 7);
kono
parents:
diff changeset
233 }
kono
parents:
diff changeset
234
kono
parents:
diff changeset
235 mask = ~mask & _FPU_MASK_ALL;
kono
parents:
diff changeset
236
kono
parents:
diff changeset
237 if (mask & _FPU_MASK_IM) res |= GFC_FPE_INVALID;
kono
parents:
diff changeset
238 if (mask & _FPU_MASK_DM) res |= GFC_FPE_DENORMAL;
kono
parents:
diff changeset
239 if (mask & _FPU_MASK_ZM) res |= GFC_FPE_ZERO;
kono
parents:
diff changeset
240 if (mask & _FPU_MASK_OM) res |= GFC_FPE_OVERFLOW;
kono
parents:
diff changeset
241 if (mask & _FPU_MASK_UM) res |= GFC_FPE_UNDERFLOW;
kono
parents:
diff changeset
242 if (mask & _FPU_MASK_PM) res |= GFC_FPE_INEXACT;
kono
parents:
diff changeset
243
kono
parents:
diff changeset
244 return res;
kono
parents:
diff changeset
245 }
kono
parents:
diff changeset
246
kono
parents:
diff changeset
/* Report whether trapping is supported for the exception FLAG.  This
   implementation returns 1 for every FLAG; the argument is not
   inspected.  */
int
support_fpu_trap (int flag __attribute__((unused)))
{
  return 1;
}
kono
parents:
diff changeset
252
kono
parents:
diff changeset
253 int
kono
parents:
diff changeset
254 get_fpu_except_flags (void)
kono
parents:
diff changeset
255 {
kono
parents:
diff changeset
256 unsigned short cw;
kono
parents:
diff changeset
257 int excepts;
kono
parents:
diff changeset
258 int res = 0;
kono
parents:
diff changeset
259
kono
parents:
diff changeset
260 __asm__ __volatile__ ("fnstsw\t%0" : "=am" (cw));
kono
parents:
diff changeset
261 excepts = cw;
kono
parents:
diff changeset
262
kono
parents:
diff changeset
263 if (has_sse())
kono
parents:
diff changeset
264 {
kono
parents:
diff changeset
265 unsigned int cw_sse;
kono
parents:
diff changeset
266
kono
parents:
diff changeset
267 __asm__ __volatile__ ("%vstmxcsr\t%0" : "=m" (cw_sse));
kono
parents:
diff changeset
268 excepts |= cw_sse;
kono
parents:
diff changeset
269 }
kono
parents:
diff changeset
270
kono
parents:
diff changeset
271 excepts &= _FPU_EX_ALL;
kono
parents:
diff changeset
272
kono
parents:
diff changeset
273 if (excepts & _FPU_MASK_IM) res |= GFC_FPE_INVALID;
kono
parents:
diff changeset
274 if (excepts & _FPU_MASK_DM) res |= GFC_FPE_DENORMAL;
kono
parents:
diff changeset
275 if (excepts & _FPU_MASK_ZM) res |= GFC_FPE_ZERO;
kono
parents:
diff changeset
276 if (excepts & _FPU_MASK_OM) res |= GFC_FPE_OVERFLOW;
kono
parents:
diff changeset
277 if (excepts & _FPU_MASK_UM) res |= GFC_FPE_UNDERFLOW;
kono
parents:
diff changeset
278 if (excepts & _FPU_MASK_PM) res |= GFC_FPE_INEXACT;
kono
parents:
diff changeset
279
kono
parents:
diff changeset
280 return res;
kono
parents:
diff changeset
281 }
kono
parents:
diff changeset
282
kono
parents:
diff changeset
283 void
kono
parents:
diff changeset
284 set_fpu_except_flags (int set, int clear)
kono
parents:
diff changeset
285 {
kono
parents:
diff changeset
286 my_fenv_t temp;
kono
parents:
diff changeset
287 int exc_set = 0, exc_clr = 0;
kono
parents:
diff changeset
288
kono
parents:
diff changeset
289 /* Translate from GFC_PE_* values to _FPU_MASK_* values. */
kono
parents:
diff changeset
290 if (set & GFC_FPE_INVALID)
kono
parents:
diff changeset
291 exc_set |= _FPU_MASK_IM;
kono
parents:
diff changeset
292 if (clear & GFC_FPE_INVALID)
kono
parents:
diff changeset
293 exc_clr |= _FPU_MASK_IM;
kono
parents:
diff changeset
294
kono
parents:
diff changeset
295 if (set & GFC_FPE_DENORMAL)
kono
parents:
diff changeset
296 exc_set |= _FPU_MASK_DM;
kono
parents:
diff changeset
297 if (clear & GFC_FPE_DENORMAL)
kono
parents:
diff changeset
298 exc_clr |= _FPU_MASK_DM;
kono
parents:
diff changeset
299
kono
parents:
diff changeset
300 if (set & GFC_FPE_ZERO)
kono
parents:
diff changeset
301 exc_set |= _FPU_MASK_ZM;
kono
parents:
diff changeset
302 if (clear & GFC_FPE_ZERO)
kono
parents:
diff changeset
303 exc_clr |= _FPU_MASK_ZM;
kono
parents:
diff changeset
304
kono
parents:
diff changeset
305 if (set & GFC_FPE_OVERFLOW)
kono
parents:
diff changeset
306 exc_set |= _FPU_MASK_OM;
kono
parents:
diff changeset
307 if (clear & GFC_FPE_OVERFLOW)
kono
parents:
diff changeset
308 exc_clr |= _FPU_MASK_OM;
kono
parents:
diff changeset
309
kono
parents:
diff changeset
310 if (set & GFC_FPE_UNDERFLOW)
kono
parents:
diff changeset
311 exc_set |= _FPU_MASK_UM;
kono
parents:
diff changeset
312 if (clear & GFC_FPE_UNDERFLOW)
kono
parents:
diff changeset
313 exc_clr |= _FPU_MASK_UM;
kono
parents:
diff changeset
314
kono
parents:
diff changeset
315 if (set & GFC_FPE_INEXACT)
kono
parents:
diff changeset
316 exc_set |= _FPU_MASK_PM;
kono
parents:
diff changeset
317 if (clear & GFC_FPE_INEXACT)
kono
parents:
diff changeset
318 exc_clr |= _FPU_MASK_PM;
kono
parents:
diff changeset
319
kono
parents:
diff changeset
320
kono
parents:
diff changeset
321 /* Change the flags. This is tricky on 387 (unlike SSE), because we have
kono
parents:
diff changeset
322 FNSTSW but no FLDSW instruction. */
kono
parents:
diff changeset
323 __asm__ __volatile__ ("fnstenv\t%0" : "=m" (temp));
kono
parents:
diff changeset
324 temp.__status_word &= ~exc_clr;
kono
parents:
diff changeset
325 __asm__ __volatile__ ("fldenv\t%0" : : "m" (temp));
kono
parents:
diff changeset
326
kono
parents:
diff changeset
327 /* Change the flags on SSE. */
kono
parents:
diff changeset
328
kono
parents:
diff changeset
329 if (has_sse())
kono
parents:
diff changeset
330 {
kono
parents:
diff changeset
331 unsigned int cw_sse;
kono
parents:
diff changeset
332
kono
parents:
diff changeset
333 __asm__ __volatile__ ("%vstmxcsr\t%0" : "=m" (cw_sse));
kono
parents:
diff changeset
334 cw_sse &= ~exc_clr;
kono
parents:
diff changeset
335 __asm__ __volatile__ ("%vldmxcsr\t%0" : : "m" (cw_sse));
kono
parents:
diff changeset
336 }
kono
parents:
diff changeset
337
kono
parents:
diff changeset
338 local_feraiseexcept (exc_set);
kono
parents:
diff changeset
339 }
kono
parents:
diff changeset
340
kono
parents:
diff changeset
/* Report whether the exception flag FLAG is supported.  This
   implementation returns 1 for every FLAG; the argument is not
   inspected.  */
int
support_fpu_flag (int flag __attribute__((unused)))
{
  return 1;
}
kono
parents:
diff changeset
346
kono
parents:
diff changeset
347 void
kono
parents:
diff changeset
348 set_fpu_rounding_mode (int round)
kono
parents:
diff changeset
349 {
kono
parents:
diff changeset
350 int round_mode;
kono
parents:
diff changeset
351 unsigned short cw;
kono
parents:
diff changeset
352
kono
parents:
diff changeset
353 switch (round)
kono
parents:
diff changeset
354 {
kono
parents:
diff changeset
355 case GFC_FPE_TONEAREST:
kono
parents:
diff changeset
356 round_mode = _FPU_RC_NEAREST;
kono
parents:
diff changeset
357 break;
kono
parents:
diff changeset
358 case GFC_FPE_UPWARD:
kono
parents:
diff changeset
359 round_mode = _FPU_RC_UP;
kono
parents:
diff changeset
360 break;
kono
parents:
diff changeset
361 case GFC_FPE_DOWNWARD:
kono
parents:
diff changeset
362 round_mode = _FPU_RC_DOWN;
kono
parents:
diff changeset
363 break;
kono
parents:
diff changeset
364 case GFC_FPE_TOWARDZERO:
kono
parents:
diff changeset
365 round_mode = _FPU_RC_ZERO;
kono
parents:
diff changeset
366 break;
kono
parents:
diff changeset
367 default:
kono
parents:
diff changeset
368 return; /* Should be unreachable. */
kono
parents:
diff changeset
369 }
kono
parents:
diff changeset
370
kono
parents:
diff changeset
371 __asm__ __volatile__ ("fnstcw\t%0" : "=m" (cw));
kono
parents:
diff changeset
372
kono
parents:
diff changeset
373 /* The x87 round control bits are shifted by 10 bits. */
kono
parents:
diff changeset
374 cw &= ~(_FPU_RC_MASK << 10);
kono
parents:
diff changeset
375 cw |= round_mode << 10;
kono
parents:
diff changeset
376
kono
parents:
diff changeset
377 __asm__ __volatile__ ("fldcw\t%0" : : "m" (cw));
kono
parents:
diff changeset
378
kono
parents:
diff changeset
379 if (has_sse())
kono
parents:
diff changeset
380 {
kono
parents:
diff changeset
381 unsigned int cw_sse;
kono
parents:
diff changeset
382
kono
parents:
diff changeset
383 __asm__ __volatile__ ("%vstmxcsr\t%0" : "=m" (cw_sse));
kono
parents:
diff changeset
384
kono
parents:
diff changeset
385 /* The SSE round control bits are shifted by 13 bits. */
kono
parents:
diff changeset
386 cw_sse &= ~(_FPU_RC_MASK << 13);
kono
parents:
diff changeset
387 cw_sse |= round_mode << 13;
kono
parents:
diff changeset
388
kono
parents:
diff changeset
389 __asm__ __volatile__ ("%vldmxcsr\t%0" : : "m" (cw_sse));
kono
parents:
diff changeset
390 }
kono
parents:
diff changeset
391 }
kono
parents:
diff changeset
392
kono
parents:
diff changeset
393 int
kono
parents:
diff changeset
394 get_fpu_rounding_mode (void)
kono
parents:
diff changeset
395 {
kono
parents:
diff changeset
396 int round_mode;
kono
parents:
diff changeset
397
kono
parents:
diff changeset
398 #ifdef __SSE_MATH__
kono
parents:
diff changeset
399 unsigned int cw;
kono
parents:
diff changeset
400
kono
parents:
diff changeset
401 __asm__ __volatile__ ("%vstmxcsr\t%0" : "=m" (cw));
kono
parents:
diff changeset
402
kono
parents:
diff changeset
403 /* The SSE round control bits are shifted by 13 bits. */
kono
parents:
diff changeset
404 round_mode = cw >> 13;
kono
parents:
diff changeset
405 #else
kono
parents:
diff changeset
406 unsigned short cw;
kono
parents:
diff changeset
407
kono
parents:
diff changeset
408 __asm__ __volatile__ ("fnstcw\t%0" : "=m" (cw));
kono
parents:
diff changeset
409
kono
parents:
diff changeset
410 /* The x87 round control bits are shifted by 10 bits. */
kono
parents:
diff changeset
411 round_mode = cw >> 10;
kono
parents:
diff changeset
412 #endif
kono
parents:
diff changeset
413
kono
parents:
diff changeset
414 round_mode &= _FPU_RC_MASK;
kono
parents:
diff changeset
415
kono
parents:
diff changeset
416 switch (round_mode)
kono
parents:
diff changeset
417 {
kono
parents:
diff changeset
418 case _FPU_RC_NEAREST:
kono
parents:
diff changeset
419 return GFC_FPE_TONEAREST;
kono
parents:
diff changeset
420 case _FPU_RC_UP:
kono
parents:
diff changeset
421 return GFC_FPE_UPWARD;
kono
parents:
diff changeset
422 case _FPU_RC_DOWN:
kono
parents:
diff changeset
423 return GFC_FPE_DOWNWARD;
kono
parents:
diff changeset
424 case _FPU_RC_ZERO:
kono
parents:
diff changeset
425 return GFC_FPE_TOWARDZERO;
kono
parents:
diff changeset
426 default:
kono
parents:
diff changeset
427 return 0; /* Should be unreachable. */
kono
parents:
diff changeset
428 }
kono
parents:
diff changeset
429 }
kono
parents:
diff changeset
430
kono
parents:
diff changeset
/* Report whether the rounding mode MODE is supported.  This
   implementation returns 1 for every MODE; the argument is not
   inspected.  */
int
support_fpu_rounding_mode (int mode __attribute__((unused)))
{
  return 1;
}
kono
parents:
diff changeset
436
kono
parents:
diff changeset
437 void
kono
parents:
diff changeset
438 get_fpu_state (void *state)
kono
parents:
diff changeset
439 {
kono
parents:
diff changeset
440 my_fenv_t *envp = state;
kono
parents:
diff changeset
441
kono
parents:
diff changeset
442 __asm__ __volatile__ ("fnstenv\t%0" : "=m" (*envp));
kono
parents:
diff changeset
443
kono
parents:
diff changeset
444 /* fnstenv has the side effect of masking all exceptions, so we need
kono
parents:
diff changeset
445 to restore the control word after that. */
kono
parents:
diff changeset
446 __asm__ __volatile__ ("fldcw\t%0" : : "m" (envp->__control_word));
kono
parents:
diff changeset
447
kono
parents:
diff changeset
448 if (has_sse())
kono
parents:
diff changeset
449 __asm__ __volatile__ ("%vstmxcsr\t%0" : "=m" (envp->__mxcsr));
kono
parents:
diff changeset
450 }
kono
parents:
diff changeset
451
kono
parents:
diff changeset
452 void
kono
parents:
diff changeset
453 set_fpu_state (void *state)
kono
parents:
diff changeset
454 {
kono
parents:
diff changeset
455 my_fenv_t *envp = state;
kono
parents:
diff changeset
456
kono
parents:
diff changeset
457 /* glibc sources (sysdeps/x86_64/fpu/fesetenv.c) do something more
kono
parents:
diff changeset
458 complex than this, but I think it suffices in our case. */
kono
parents:
diff changeset
459 __asm__ __volatile__ ("fldenv\t%0" : : "m" (*envp));
kono
parents:
diff changeset
460
kono
parents:
diff changeset
461 if (has_sse())
kono
parents:
diff changeset
462 __asm__ __volatile__ ("%vldmxcsr\t%0" : : "m" (envp->__mxcsr));
kono
parents:
diff changeset
463 }
kono
parents:
diff changeset
464
kono
parents:
diff changeset
465
kono
parents:
diff changeset
/* Report whether the underflow mode can be controlled for reals of the
   given KIND.  Returns 1 only when SSE is available and KIND is 4 or 8,
   and 0 in every other case.  */
int
support_fpu_underflow_control (int kind)
{
  return has_sse() && (kind == 4 || kind == 8);
}
kono
parents:
diff changeset
474
kono
parents:
diff changeset
475
kono
parents:
diff changeset
476 int
kono
parents:
diff changeset
477 get_fpu_underflow_mode (void)
kono
parents:
diff changeset
478 {
kono
parents:
diff changeset
479 unsigned int cw_sse;
kono
parents:
diff changeset
480
kono
parents:
diff changeset
481 if (!has_sse())
kono
parents:
diff changeset
482 return 1;
kono
parents:
diff changeset
483
kono
parents:
diff changeset
484 __asm__ __volatile__ ("%vstmxcsr\t%0" : "=m" (cw_sse));
kono
parents:
diff changeset
485
kono
parents:
diff changeset
486 /* Return 0 for abrupt underflow (flush to zero), 1 for gradual underflow. */
kono
parents:
diff changeset
487 return (cw_sse & MXCSR_FTZ) ? 0 : 1;
kono
parents:
diff changeset
488 }
kono
parents:
diff changeset
489
kono
parents:
diff changeset
490
kono
parents:
diff changeset
491 void
kono
parents:
diff changeset
492 set_fpu_underflow_mode (int gradual)
kono
parents:
diff changeset
493 {
kono
parents:
diff changeset
494 unsigned int cw_sse;
kono
parents:
diff changeset
495
kono
parents:
diff changeset
496 if (!has_sse())
kono
parents:
diff changeset
497 return;
kono
parents:
diff changeset
498
kono
parents:
diff changeset
499 __asm__ __volatile__ ("%vstmxcsr\t%0" : "=m" (cw_sse));
kono
parents:
diff changeset
500
kono
parents:
diff changeset
501 if (gradual)
kono
parents:
diff changeset
502 cw_sse &= ~MXCSR_FTZ;
kono
parents:
diff changeset
503 else
kono
parents:
diff changeset
504 cw_sse |= MXCSR_FTZ;
kono
parents:
diff changeset
505
kono
parents:
diff changeset
506 __asm__ __volatile__ ("%vldmxcsr\t%0" : : "m" (cw_sse));
kono
parents:
diff changeset
507 }
kono
parents:
diff changeset
508