]> git.ipfire.org Git - thirdparty/glibc.git/blame - sysdeps/powerpc/fpu/fenv_private.h
[powerpc] SET_RESTORE_ROUND optimizations and bug fix
[thirdparty/glibc.git] / sysdeps / powerpc / fpu / fenv_private.h
CommitLineData
41e8926a 1/* Private floating point rounding and exceptions handling. PowerPC version.
04277e02 2 Copyright (C) 2013-2019 Free Software Foundation, Inc.
41e8926a
AZ
3 This file is part of the GNU C Library.
4
5 The GNU C Library is free software; you can redistribute it and/or
6 modify it under the terms of the GNU Lesser General Public
7 License as published by the Free Software Foundation; either
8 version 2.1 of the License, or (at your option) any later version.
9
10 The GNU C Library is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 Lesser General Public License for more details.
14
15 You should have received a copy of the GNU Lesser General Public
16 License along with the GNU C Library. If not, see
5a82c748 17 <https://www.gnu.org/licenses/>. */
41e8926a 18
ff6b2450
JM
19#ifndef POWERPC_FENV_PRIVATE_H
20#define POWERPC_FENV_PRIVATE_H 1
41e8926a
AZ
21
22#include <fenv.h>
23#include <fenv_libc.h>
24#include <fpu_control.h>
25
84d74e42
PM
26/* Mask for the exception enable bits. */
27#define _FPU_ALL_TRAPS (_FPU_MASK_ZM | _FPU_MASK_OM | _FPU_MASK_UM \
41e8926a
AZ
28 | _FPU_MASK_XM | _FPU_MASK_IM)
29
84d74e42 30/* Mask the rounding mode bits. */
346729f6 31#define _FPU_MASK_RN 0xfffffffffffffffcLL
84d74e42 32
346729f6
PC
33/* Mask everything but the rounding modes and non-IEEE arithmetic flags. */
34#define _FPU_MASK_NOT_RN_NI 0xffffffff00000807LL
41e8926a
AZ
35
36/* Mask restore rounding mode and exception enabled. */
346729f6 37#define _FPU_MASK_TRAPS_RN 0xffffffffffffff00LL
41e8926a 38
346729f6
PC
39/* Mask FP result flags, preserve fraction rounded/inexact bits. */
40#define _FPU_MASK_FRAC_INEX_RET_CC 0xfffffffffff80fffLL
41e8926a
AZ
41
42static __always_inline void
84d74e42
PM
43__libc_feholdbits_ppc (fenv_t *envp, unsigned long long mask,
44 unsigned long long bits)
41e8926a
AZ
45{
46 fenv_union_t old, new;
47
48 old.fenv = *envp = fegetenv_register ();
49
84d74e42 50 new.l = (old.l & mask) | bits;
41e8926a
AZ
51
52 /* If the old env had any enabled exceptions, then mask SIGFPE in the
53 MSR FE0/FE1 bits. This may allow the FPU to run faster because it
54 always takes the default action and can not generate SIGFPE. */
84d74e42 55 if ((old.l & _FPU_ALL_TRAPS) != 0)
41e8926a
AZ
56 (void) __fe_mask_env ();
57
58 fesetenv_register (new.fenv);
59}
60
61static __always_inline void
84d74e42 62libc_feholdexcept_ppc (fenv_t *envp)
41e8926a 63{
84d74e42 64 __libc_feholdbits_ppc (envp, _FPU_MASK_NOT_RN_NI, 0LL);
41e8926a
AZ
65}
66
67static __always_inline void
68libc_feholdexcept_setround_ppc (fenv_t *envp, int r)
69{
84d74e42
PM
70 __libc_feholdbits_ppc (envp, _FPU_MASK_NOT_RN_NI & _FPU_MASK_RN, r);
71}
41e8926a 72
84d74e42
PM
73static __always_inline void
74libc_fesetround_ppc (int r)
75{
76 __fesetround_inline (r);
41e8926a
AZ
77}
78
79static __always_inline int
80libc_fetestexcept_ppc (int e)
81{
82 fenv_union_t u;
83 u.fenv = fegetenv_register ();
84 return u.l & e;
85}
86
87static __always_inline void
84d74e42
PM
88libc_feholdsetround_ppc (fenv_t *e, int r)
89{
90 __libc_feholdbits_ppc (e, _FPU_MASK_TRAPS_RN, r);
91}
92
93static __always_inline unsigned long long
94__libc_femergeenv_ppc (const fenv_t *envp, unsigned long long old_mask,
95 unsigned long long new_mask)
41e8926a
AZ
96{
97 fenv_union_t old, new;
98
99 new.fenv = *envp;
100 old.fenv = fegetenv_register ();
101
84d74e42
PM
102 /* Merge bits while masking unwanted bits from new and old env. */
103 new.l = (old.l & old_mask) | (new.l & new_mask);
104
41e8926a
AZ
105 /* If the old env has no enabled exceptions and the new env has any enabled
106 exceptions, then unmask SIGFPE in the MSR FE0/FE1 bits. This will put the
107 hardware into "precise mode" and may cause the FPU to run slower on some
108 hardware. */
84d74e42 109 if ((old.l & _FPU_ALL_TRAPS) == 0 && (new.l & _FPU_ALL_TRAPS) != 0)
bd12ab55 110 (void) __fe_nomask_env_priv ();
41e8926a
AZ
111
112 /* If the old env had any enabled exceptions and the new env has no enabled
113 exceptions, then mask SIGFPE in the MSR FE0/FE1 bits. This may allow the
114 FPU to run faster because it always takes the default action and can not
115 generate SIGFPE. */
84d74e42 116 if ((old.l & _FPU_ALL_TRAPS) != 0 && (new.l & _FPU_ALL_TRAPS) == 0)
41e8926a
AZ
117 (void) __fe_mask_env ();
118
84d74e42 119 /* Atomically enable and raise (if appropriate) exceptions set in `new'. */
41e8926a
AZ
120 fesetenv_register (new.fenv);
121
84d74e42 122 return old.l;
41e8926a
AZ
123}
124
125static __always_inline void
84d74e42 126libc_fesetenv_ppc (const fenv_t *envp)
41e8926a 127{
84d74e42
PM
128 /* Replace the entire environment. */
129 __libc_femergeenv_ppc (envp, 0LL, -1LL);
41e8926a
AZ
130}
131
132static __always_inline void
84d74e42 133libc_feresetround_ppc (fenv_t *envp)
41e8926a 134{
e9052126 135 fenv_union_t new = { .fenv = *envp };
f1c56cdf 136 fegetenv_and_set_rn (new.l & FPSCR_RN_MASK);
84d74e42 137}
41e8926a 138
84d74e42
PM
139static __always_inline int
140libc_feupdateenv_test_ppc (fenv_t *envp, int ex)
141{
142 return __libc_femergeenv_ppc (envp, _FPU_MASK_TRAPS_RN,
143 _FPU_MASK_FRAC_INEX_RET_CC) & ex;
41e8926a
AZ
144}
145
146static __always_inline void
84d74e42 147libc_feupdateenv_ppc (fenv_t *e)
41e8926a 148{
84d74e42 149 libc_feupdateenv_test_ppc (e, 0);
41e8926a
AZ
150}
151
152#define libc_feholdexceptf libc_feholdexcept_ppc
153#define libc_feholdexcept libc_feholdexcept_ppc
154#define libc_feholdexcept_setroundf libc_feholdexcept_setround_ppc
155#define libc_feholdexcept_setround libc_feholdexcept_setround_ppc
156#define libc_fetestexceptf libc_fetestexcept_ppc
157#define libc_fetestexcept libc_fetestexcept_ppc
158#define libc_fesetroundf libc_fesetround_ppc
159#define libc_fesetround libc_fesetround_ppc
160#define libc_fesetenvf libc_fesetenv_ppc
161#define libc_fesetenv libc_fesetenv_ppc
162#define libc_feupdateenv_testf libc_feupdateenv_test_ppc
163#define libc_feupdateenv_test libc_feupdateenv_test_ppc
164#define libc_feupdateenvf libc_feupdateenv_ppc
165#define libc_feupdateenv libc_feupdateenv_ppc
166#define libc_feholdsetroundf libc_feholdsetround_ppc
167#define libc_feholdsetround libc_feholdsetround_ppc
168#define libc_feresetroundf libc_feresetround_ppc
169#define libc_feresetround libc_feresetround_ppc
170
171
172/* We have support for rounding mode context. */
173#define HAVE_RM_CTX 1
174
175static __always_inline void
84d74e42 176libc_feholdsetround_ppc_ctx (struct rm_ctx *ctx, int r)
41e8926a 177{
f1c56cdf 178 fenv_union_t old;
41e8926a 179
f1c56cdf
PC
180 ctx->env = old.fenv = fegetenv_and_set_rn (r);
181 ctx->updated_status = (r != (old.l & FPSCR_RN_MASK));
e9052126
PC
182}
183
184static __always_inline void
185libc_feholdsetround_noex_ppc_ctx (struct rm_ctx *ctx, int r)
186{
187 fenv_union_t old, new;
188
41e8926a
AZ
189 old.fenv = fegetenv_register ();
190
e9052126 191 new.l = (old.l & ~(FPSCR_ENABLES_MASK|FPSCR_RN_MASK)) | r;
84d74e42 192
41e8926a
AZ
193 ctx->env = old.fenv;
194 if (__glibc_unlikely (new.l != old.l))
195 {
84d74e42 196 if ((old.l & _FPU_ALL_TRAPS) != 0)
41e8926a
AZ
197 (void) __fe_mask_env ();
198 fesetenv_register (new.fenv);
199 ctx->updated_status = true;
200 }
201 else
202 ctx->updated_status = false;
203}
204
205static __always_inline void
206libc_fesetenv_ppc_ctx (struct rm_ctx *ctx)
207{
208 libc_fesetenv_ppc (&ctx->env);
209}
210
211static __always_inline void
212libc_feupdateenv_ppc_ctx (struct rm_ctx *ctx)
213{
214 if (__glibc_unlikely (ctx->updated_status))
84d74e42 215 libc_feresetround_ppc (&ctx->env);
41e8926a
AZ
216}
217
218static __always_inline void
219libc_feresetround_ppc_ctx (struct rm_ctx *ctx)
220{
221 if (__glibc_unlikely (ctx->updated_status))
222 libc_feresetround_ppc (&ctx->env);
223}
224
41e8926a
AZ
225#define libc_fesetenv_ctx libc_fesetenv_ppc_ctx
226#define libc_fesetenvf_ctx libc_fesetenv_ppc_ctx
2cd925f7 227#define libc_fesetenvl_ctx libc_fesetenv_ppc_ctx
41e8926a
AZ
228#define libc_feholdsetround_ctx libc_feholdsetround_ppc_ctx
229#define libc_feholdsetroundf_ctx libc_feholdsetround_ppc_ctx
2cd925f7 230#define libc_feholdsetroundl_ctx libc_feholdsetround_ppc_ctx
e9052126
PC
231#define libc_feholdsetround_noex_ctx libc_feholdsetround_noex_ppc_ctx
232#define libc_feholdsetround_noexf_ctx libc_feholdsetround_noex_ppc_ctx
233#define libc_feholdsetround_noexl_ctx libc_feholdsetround_noex_ppc_ctx
41e8926a
AZ
234#define libc_feresetround_ctx libc_feresetround_ppc_ctx
235#define libc_feresetroundf_ctx libc_feresetround_ppc_ctx
2cd925f7 236#define libc_feresetroundl_ctx libc_feresetround_ppc_ctx
41e8926a 237#define libc_feupdateenv_ctx libc_feupdateenv_ppc_ctx
2cd925f7
AZ
238#define libc_feupdateenvf_ctx libc_feupdateenv_ppc_ctx
239#define libc_feupdateenvl_ctx libc_feupdateenv_ppc_ctx
41e8926a 240
ff6b2450
JM
241#include_next <fenv_private.h>
242
41e8926a 243#endif