i386-math-asm.h source code [glibc/sysdeps/i386/fpu/i386-math-asm.h]

/* Helper macros for x86 libm functions.
   Copyright (C) 2015-2022 Free Software Foundation, Inc.
   This file is part of the GNU C Library.

   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 2.1 of the License, or (at your option) any later version.

   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public
   License along with the GNU C Library; if not, see
   <https://www.gnu.org/licenses/>.  */
18
19	#ifndef _I386_MATH_ASM_H
20	#define _I386_MATH_ASM_H 1
21
/* Remove excess range and precision by storing a value on the stack
   and loading it back.  */
/* Round %st(0) to float range and precision by spilling it to a
   temporary 4-byte stack slot and reloading it.  The subl/addl pair
   modifies EFLAGS.  */
#define FLT_NARROW_EVAL \
  /* Open a 4-byte scratch slot, with the matching CFI annotation.  */ \
  subl    $4, %esp; \
  cfi_adjust_cfa_offset (4); \
  /* Store as float (popping), then push the rounded value back.  */ \
  fstps   (%esp); \
  flds    (%esp); \
  /* Close the scratch slot again.  */ \
  addl    $4, %esp; \
  cfi_adjust_cfa_offset (-4);
/* Round %st(0) to double range and precision by spilling it to a
   temporary 8-byte stack slot and reloading it.  The subl/addl pair
   modifies EFLAGS.  */
#define DBL_NARROW_EVAL \
  /* Open an 8-byte scratch slot, with the matching CFI annotation.  */ \
  subl    $8, %esp; \
  cfi_adjust_cfa_offset (8); \
  /* Store as double (popping), then push the rounded value back.  */ \
  fstpl   (%esp); \
  fldl    (%esp); \
  /* Close the scratch slot again.  */ \
  addl    $8, %esp; \
  cfi_adjust_cfa_offset (-8);
38
/* Define constants for the minimum value of a floating-point
   type.  */
/* Emit the 4-byte object flt_min, holding the float bit pattern
   0x00800000 (little-endian), into the mergeable read-only section
   .rodata.cst4.  */
#define DEFINE_FLT_MIN \
  .section .rodata.cst4,"aM",@progbits,4; \
  .balign 4; \
  .type   flt_min,@object; \
flt_min: \
  .long   0x00800000; \
  .size   flt_min, .-flt_min;
/* Emit the 8-byte object dbl_min, holding the double bit pattern
   0x0010000000000000 (little-endian, low word first), into the
   mergeable read-only section .rodata.cst8.  */
#define DEFINE_DBL_MIN \
  .section .rodata.cst8,"aM",@progbits,8; \
  .balign 8; \
  .type   dbl_min,@object; \
dbl_min: \
  .long   0x00000000, 0x00100000; \
  .size   dbl_min, .-dbl_min;
/* Emit the 16-byte object ldbl_min into the mergeable read-only
   section .rodata.cst16.  The first ten bytes are the x87 extended
   value with significand 0x8000000000000000 and sign/exponent word
   0x0001; the remaining six bytes are zero padding.  */
#define DEFINE_LDBL_MIN \
  .section .rodata.cst16,"aM",@progbits,16; \
  .balign 16; \
  .type   ldbl_min,@object; \
ldbl_min: \
  /* Significand, low word then high word.  */ \
  .long   0x00000000, 0x80000000; \
  /* Sign/exponent word 0x0001 followed by zero padding.  */ \
  .long   0x00000001, 0x00000000; \
  .size   ldbl_min, .-ldbl_min;
63
/* Remove excess range and precision by storing a value on the stack
   and loading it back.  The value is given to be nonnegative or NaN;
   if it is subnormal, also force an underflow exception.  The
   relevant constant for the minimum of the type must have been
   defined, the MO macro must have been defined for access to memory
   operands, and, if PIC, the PIC register must have been loaded.  */
/* Narrow %st(0) to float through a stack temporary.  If the value
   compares below flt_min (or unordered), first square a copy of it
   and store that as float, which forces the underflow exception for a
   subnormal value.  The value must be nonnegative or NaN.  Requires
   flt_min, MO and, if PIC, the PIC register.  Clobbers %ax and
   EFLAGS.  */
#define FLT_NARROW_EVAL_UFLOW_NONNEG_NAN \
  subl    $4, %esp; \
  cfi_adjust_cfa_offset (4); \
  /* Unordered compare of a copy of the value against flt_min.  */ \
  flds    MO(flt_min); \
  fld     %st(1); \
  fucompp; \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* Value >= flt_min: no underflow to force.  */ \
  jae     6424f; \
  /* Square a copy and store it as float into the scratch slot.  */ \
  fld     %st(0); \
  fmul    %st(0); \
  fstps   (%esp); \
6424: \
  /* Round the value itself to float and reload it.  */ \
  fstps   (%esp); \
  flds    (%esp); \
  addl    $4, %esp; \
  cfi_adjust_cfa_offset (-4);
/* Narrow %st(0) to double through a stack temporary.  If the value
   compares below dbl_min (or unordered), first square a copy of it
   and store that as double, which forces the underflow exception for
   a subnormal value.  The value must be nonnegative or NaN.  Requires
   dbl_min, MO and, if PIC, the PIC register.  Clobbers %ax and
   EFLAGS.  */
#define DBL_NARROW_EVAL_UFLOW_NONNEG_NAN \
  subl    $8, %esp; \
  cfi_adjust_cfa_offset (8); \
  /* Unordered compare of a copy of the value against dbl_min.  */ \
  fldl    MO(dbl_min); \
  fld     %st(1); \
  fucompp; \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* Value >= dbl_min: no underflow to force.  */ \
  jae     6453f; \
  /* Square a copy and store it as double into the scratch slot.  */ \
  fld     %st(0); \
  fmul    %st(0); \
  fstpl   (%esp); \
6453: \
  /* Round the value itself to double and reload it.  */ \
  fstpl   (%esp); \
  fldl    (%esp); \
  addl    $8, %esp; \
  cfi_adjust_cfa_offset (-8);
102
/* Likewise, but the argument is not a NaN (so fcom instructions,
   which support memory operands, can be used).  */
/* Narrow %st(0) to float through a stack temporary, forcing the
   underflow exception first when the value is below flt_min.  The
   value must be nonnegative and not a NaN, so it is compared directly
   against the memory operand.  Requires flt_min, MO and, if PIC, the
   PIC register.  Clobbers %ax and EFLAGS.  */
#define FLT_NARROW_EVAL_UFLOW_NONNEG \
  subl    $4, %esp; \
  cfi_adjust_cfa_offset (4); \
  /* Compare %st(0) with flt_min in memory; nothing is popped.  */ \
  fcoms   MO(flt_min); \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* Value >= flt_min: no underflow to force.  */ \
  jae     6424f; \
  /* Square a copy and store it as float into the scratch slot.  */ \
  fld     %st(0); \
  fmul    %st(0); \
  fstps   (%esp); \
6424: \
  /* Round the value itself to float and reload it.  */ \
  fstps   (%esp); \
  flds    (%esp); \
  addl    $4, %esp; \
  cfi_adjust_cfa_offset (-4);
/* Narrow %st(0) to double through a stack temporary, forcing the
   underflow exception first when the value is below dbl_min.  The
   value must be nonnegative and not a NaN, so it is compared directly
   against the memory operand.  Requires dbl_min, MO and, if PIC, the
   PIC register.  Clobbers %ax and EFLAGS.  */
#define DBL_NARROW_EVAL_UFLOW_NONNEG \
  subl    $8, %esp; \
  cfi_adjust_cfa_offset (8); \
  /* Compare %st(0) with dbl_min in memory; nothing is popped.  */ \
  fcoml   MO(dbl_min); \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* Value >= dbl_min: no underflow to force.  */ \
  jae     6453f; \
  /* Square a copy and store it as double into the scratch slot.  */ \
  fld     %st(0); \
  fmul    %st(0); \
  fstpl   (%esp); \
6453: \
  /* Round the value itself to double and reload it.  */ \
  fstpl   (%esp); \
  fldl    (%esp); \
  addl    $8, %esp; \
  cfi_adjust_cfa_offset (-8);
133
/* Likewise, but the non-NaN argument may be negative.  */
/* Narrow %st(0) to float through a stack temporary, forcing the
   underflow exception first when its absolute value is below flt_min.
   The value must not be a NaN but may be negative.  Requires flt_min,
   MO and, if PIC, the PIC register.  Clobbers %ax and EFLAGS.  */
#define FLT_NARROW_EVAL_UFLOW_NONNAN \
  subl    $4, %esp; \
  cfi_adjust_cfa_offset (4); \
  /* Compare |value| with flt_min, popping the temporary copy.  */ \
  fld     %st(0); \
  fabs; \
  fcomps  MO(flt_min); \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* |value| >= flt_min: no underflow to force.  */ \
  jae     6424f; \
  /* Square a copy and store it as float into the scratch slot.  */ \
  fld     %st(0); \
  fmul    %st(0); \
  fstps   (%esp); \
6424: \
  /* Round the value itself to float and reload it.  */ \
  fstps   (%esp); \
  flds    (%esp); \
  addl    $4, %esp; \
  cfi_adjust_cfa_offset (-4);
/* Narrow %st(0) to double through a stack temporary, forcing the
   underflow exception first when its absolute value is below dbl_min.
   The value must not be a NaN but may be negative.  Requires dbl_min,
   MO and, if PIC, the PIC register.  Clobbers %ax and EFLAGS.  */
#define DBL_NARROW_EVAL_UFLOW_NONNAN \
  subl    $8, %esp; \
  cfi_adjust_cfa_offset (8); \
  /* Compare |value| with dbl_min, popping the temporary copy.  */ \
  fld     %st(0); \
  fabs; \
  fcompl  MO(dbl_min); \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* |value| >= dbl_min: no underflow to force.  */ \
  jae     6453f; \
  /* Square a copy and store it as double into the scratch slot.  */ \
  fld     %st(0); \
  fmul    %st(0); \
  fstpl   (%esp); \
6453: \
  /* Round the value itself to double and reload it.  */ \
  fstpl   (%esp); \
  fldl    (%esp); \
  addl    $8, %esp; \
  cfi_adjust_cfa_offset (-8);
167
/* Force an underflow exception if the given value is subnormal.  The
   relevant constant for the minimum of the type must have been
   defined, the MO macro must have been defined for access to memory
   operands, and, if PIC, the PIC register must have been loaded.  */
/* Leave %st(0) unchanged, but when its absolute value compares below
   flt_min (or unordered), square a copy and store it as float to a
   scratch stack slot so that a subnormal value raises the underflow
   exception.  Requires flt_min, MO and, if PIC, the PIC register.
   Clobbers %ax and EFLAGS.  */
#define FLT_CHECK_FORCE_UFLOW \
  /* Unordered compare of |value| against flt_min.  */ \
  flds    MO(flt_min); \
  fld     %st(1); \
  fabs; \
  fucompp; \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* |value| >= flt_min: nothing to do.  */ \
  jae     6424f; \
  /* Square a copy and store it as float into a scratch slot.  */ \
  subl    $4, %esp; \
  cfi_adjust_cfa_offset (4); \
  fld     %st(0); \
  fmul    %st(0); \
  fstps   (%esp); \
  addl    $4, %esp; \
  cfi_adjust_cfa_offset (-4); \
6424:
/* Leave %st(0) unchanged, but when its absolute value compares below
   dbl_min (or unordered), square a copy and store it as double to a
   scratch stack slot so that a subnormal value raises the underflow
   exception.  Requires dbl_min, MO and, if PIC, the PIC register.
   Clobbers %ax and EFLAGS.  */
#define DBL_CHECK_FORCE_UFLOW \
  /* Unordered compare of |value| against dbl_min.  */ \
  fldl    MO(dbl_min); \
  fld     %st(1); \
  fabs; \
  fucompp; \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* |value| >= dbl_min: nothing to do.  */ \
  jae     6453f; \
  /* Square a copy and store it as double into a scratch slot.  */ \
  subl    $8, %esp; \
  cfi_adjust_cfa_offset (8); \
  fld     %st(0); \
  fmul    %st(0); \
  fstpl   (%esp); \
  addl    $8, %esp; \
  cfi_adjust_cfa_offset (-8); \
6453:
204
/* Likewise, but also remove excess range and precision if the value
   is subnormal.  */
/* When |%st(0)| compares below flt_min (or unordered), force the
   underflow exception by storing the square of a copy as float, and
   additionally round %st(0) itself to float through the same scratch
   slot.  Otherwise %st(0) is left untouched.  Requires flt_min, MO
   and, if PIC, the PIC register.  Clobbers %ax and EFLAGS.  */
#define FLT_CHECK_FORCE_UFLOW_NARROW \
  /* Unordered compare of |value| against flt_min.  */ \
  flds    MO(flt_min); \
  fld     %st(1); \
  fabs; \
  fucompp; \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* |value| >= flt_min: nothing to do.  */ \
  jae     6424f; \
  subl    $4, %esp; \
  cfi_adjust_cfa_offset (4); \
  /* Square a copy and store it as float into the scratch slot.  */ \
  fld     %st(0); \
  fmul    %st(0); \
  fstps   (%esp); \
  /* Round the value itself to float and reload it.  */ \
  fstps   (%esp); \
  flds    (%esp); \
  addl    $4, %esp; \
  cfi_adjust_cfa_offset (-4); \
6424:
/* When |%st(0)| compares below dbl_min (or unordered), force the
   underflow exception by storing the square of a copy as double, and
   additionally round %st(0) itself to double through the same scratch
   slot.  Otherwise %st(0) is left untouched.  Requires dbl_min, MO
   and, if PIC, the PIC register.  Clobbers %ax and EFLAGS.  */
#define DBL_CHECK_FORCE_UFLOW_NARROW \
  /* Unordered compare of |value| against dbl_min.  */ \
  fldl    MO(dbl_min); \
  fld     %st(1); \
  fabs; \
  fucompp; \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* |value| >= dbl_min: nothing to do.  */ \
  jae     6453f; \
  subl    $8, %esp; \
  cfi_adjust_cfa_offset (8); \
  /* Square a copy and store it as double into the scratch slot.  */ \
  fld     %st(0); \
  fmul    %st(0); \
  fstpl   (%esp); \
  /* Round the value itself to double and reload it.  */ \
  fstpl   (%esp); \
  fldl    (%esp); \
  addl    $8, %esp; \
  cfi_adjust_cfa_offset (-8); \
6453:
243
/* Force an underflow exception if the given long double value is
   subnormal; the argument is nonnegative or NaN.  */
/* Leave %st(0) unchanged, but when it compares below ldbl_min (or
   unordered), square a copy on the x87 stack and discard the product,
   so that a subnormal value raises the underflow exception.  The
   value must be nonnegative or NaN.  Requires ldbl_min, MO and, if
   PIC, the PIC register.  Clobbers %ax and EFLAGS.  */
#define LDBL_CHECK_FORCE_UFLOW_NONNEG_NAN \
  /* Unordered compare of a copy of the value against ldbl_min.  */ \
  fldt    MO(ldbl_min); \
  fld     %st(1); \
  fucompp; \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* Value >= ldbl_min: nothing to do.  */ \
  jae     6464f; \
  /* Square a copy, then drop the product.  */ \
  fld     %st(0); \
  fmul    %st(0); \
  fstp    %st(0); \
6464:
256
/* Force an underflow exception if the given value is subnormal; the
   argument is not a NaN.  */
/* Leave %st(0) unchanged, but when its absolute value is below
   flt_min, square a copy and store it as float to a scratch stack
   slot to raise the underflow exception.  The value must not be a
   NaN.  Requires flt_min, MO and, if PIC, the PIC register.  Clobbers
   %ax and EFLAGS.  */
#define FLT_CHECK_FORCE_UFLOW_NONNAN \
  /* Compare |value| with flt_min, popping the temporary copy.  */ \
  fld     %st(0); \
  fabs; \
  fcomps  MO(flt_min); \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* |value| >= flt_min: nothing to do.  */ \
  jae     6424f; \
  /* Square a copy and store it as float into a scratch slot.  */ \
  subl    $4, %esp; \
  cfi_adjust_cfa_offset (4); \
  fld     %st(0); \
  fmul    %st(0); \
  fstps   (%esp); \
  addl    $4, %esp; \
  cfi_adjust_cfa_offset (-4); \
6424:
/* Leave %st(0) unchanged, but when its absolute value is below
   dbl_min, square a copy and store it as double to a scratch stack
   slot to raise the underflow exception.  The value must not be a
   NaN.  Requires dbl_min, MO and, if PIC, the PIC register.  Clobbers
   %ax and EFLAGS.  */
#define DBL_CHECK_FORCE_UFLOW_NONNAN \
  /* Compare |value| with dbl_min, popping the temporary copy.  */ \
  fld     %st(0); \
  fabs; \
  fcompl  MO(dbl_min); \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* |value| >= dbl_min: nothing to do.  */ \
  jae     6453f; \
  /* Square a copy and store it as double into a scratch slot.  */ \
  subl    $8, %esp; \
  cfi_adjust_cfa_offset (8); \
  fld     %st(0); \
  fmul    %st(0); \
  fstpl   (%esp); \
  addl    $8, %esp; \
  cfi_adjust_cfa_offset (-8); \
6453:
/* Leave %st(0) unchanged, but when its absolute value is below
   ldbl_min, square a copy on the x87 stack and discard the product to
   raise the underflow exception.  The value must not be a NaN.
   Requires ldbl_min, MO and, if PIC, the PIC register.  Clobbers %ax
   and EFLAGS.  */
#define LDBL_CHECK_FORCE_UFLOW_NONNAN \
  /* Compare |value| with ldbl_min, popping both temporaries.  */ \
  fldt    MO(ldbl_min); \
  fld     %st(1); \
  fabs; \
  fcompp; \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* |value| >= ldbl_min: nothing to do.  */ \
  jae     6464f; \
  /* Square a copy, then drop the product.  */ \
  fld     %st(0); \
  fmul    %st(0); \
  fstp    %st(0); \
6464:
300
/* Force an underflow exception if the given value is subnormal; the
   argument is nonnegative and not a NaN.  */
/* Leave %st(0) unchanged, but when it is below flt_min, square a copy
   and store it as float to a scratch stack slot to raise the
   underflow exception.  The value must be nonnegative and not a NaN.
   Requires flt_min, MO and, if PIC, the PIC register.  Clobbers %ax
   and EFLAGS.  */
#define FLT_CHECK_FORCE_UFLOW_NONNEG \
  /* Compare %st(0) with flt_min in memory; nothing is popped.  */ \
  fcoms   MO(flt_min); \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* Value >= flt_min: nothing to do.  */ \
  jae     6424f; \
  /* Square a copy and store it as float into a scratch slot.  */ \
  subl    $4, %esp; \
  cfi_adjust_cfa_offset (4); \
  fld     %st(0); \
  fmul    %st(0); \
  fstps   (%esp); \
  addl    $4, %esp; \
  cfi_adjust_cfa_offset (-4); \
6424:
/* Leave %st(0) unchanged, but when it is below dbl_min, square a copy
   and store it as double to a scratch stack slot to raise the
   underflow exception.  The value must be nonnegative and not a NaN.
   Requires dbl_min, MO and, if PIC, the PIC register.  Clobbers %ax
   and EFLAGS.  */
#define DBL_CHECK_FORCE_UFLOW_NONNEG \
  /* Compare %st(0) with dbl_min in memory; nothing is popped.  */ \
  fcoml   MO(dbl_min); \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* Value >= dbl_min: nothing to do.  */ \
  jae     6453f; \
  /* Square a copy and store it as double into a scratch slot.  */ \
  subl    $8, %esp; \
  cfi_adjust_cfa_offset (8); \
  fld     %st(0); \
  fmul    %st(0); \
  fstpl   (%esp); \
  addl    $8, %esp; \
  cfi_adjust_cfa_offset (-8); \
6453:
/* Leave %st(0) unchanged, but when it is below ldbl_min, square a
   copy on the x87 stack and discard the product to raise the
   underflow exception.  The value must be nonnegative and not a NaN.
   Requires ldbl_min, MO and, if PIC, the PIC register.  Clobbers %ax
   and EFLAGS.  */
#define LDBL_CHECK_FORCE_UFLOW_NONNEG \
  /* Compare a copy of the value with ldbl_min, popping both.  */ \
  fldt    MO(ldbl_min); \
  fld     %st(1); \
  fcompp; \
  /* Move the x87 condition codes into EFLAGS.  */ \
  fnstsw  %ax; \
  sahf; \
  /* Value >= ldbl_min: nothing to do.  */ \
  jae     6464f; \
  /* Square a copy, then drop the product.  */ \
  fld     %st(0); \
  fmul    %st(0); \
  fstp    %st(0); \
6464:
339
340	#endif /* i386-math-asm.h. */
341

source code of glibc/sysdeps/i386/fpu/i386-math-asm.h