xref: /freebsd/lib/msun/src/math_private.h (revision 884a2a699669ec61e2366e3e358342dbc94be24a)
1 /*
2  * ====================================================
3  * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
4  *
5  * Developed at SunPro, a Sun Microsystems, Inc. business.
6  * Permission to use, copy, modify, and distribute this
7  * software is freely granted, provided that this notice
8  * is preserved.
9  * ====================================================
10  */
11 
12 /*
13  * from: @(#)fdlibm.h 5.1 93/09/24
14  * $FreeBSD$
15  */
16 
17 #ifndef _MATH_PRIVATE_H_
18 #define	_MATH_PRIVATE_H_
19 
20 #include <sys/types.h>
21 #include <machine/endian.h>
22 
23 /*
24  * The original fdlibm code used statements like:
25  *	n0 = ((*(int*)&one)>>29)^1;		* index of high word *
26  *	ix0 = *(n0+(int*)&x);			* high word of x *
27  *	ix1 = *((1-n0)+(int*)&x);		* low word of x *
28  * to dig two 32 bit words out of the 64 bit IEEE floating point
29  * value.  That is non-ANSI, and, moreover, the gcc instruction
30  * scheduler gets it wrong.  We instead use the following macros.
31  * Unlike the original code, we determine the endianness at compile
32  * time, not at run time; I don't see much benefit to selecting
33  * endianness at run time.
34  */
35 
36 /*
37  * A union which permits us to convert between a double and two 32 bit
38  * ints.
39  */
40 
41 #ifdef __arm__
42 #if defined(__VFP_FP__)
43 #define	IEEE_WORD_ORDER	BYTE_ORDER
44 #else
45 #define	IEEE_WORD_ORDER	BIG_ENDIAN
46 #endif
47 #else /* __arm__ */
48 #define	IEEE_WORD_ORDER	BYTE_ORDER
49 #endif
50 
51 #if IEEE_WORD_ORDER == BIG_ENDIAN
52 
53 typedef union
54 {
55   double value;
56   struct
57   {
58     u_int32_t msw;
59     u_int32_t lsw;
60   } parts;
61 } ieee_double_shape_type;
62 
63 #endif
64 
65 #if IEEE_WORD_ORDER == LITTLE_ENDIAN
66 
67 typedef union
68 {
69   double value;
70   struct
71   {
72     u_int32_t lsw;
73     u_int32_t msw;
74   } parts;
75 } ieee_double_shape_type;
76 
77 #endif
78 
79 /* Get two 32 bit ints from a double.  */
80 
81 #define EXTRACT_WORDS(ix0,ix1,d)				\
82 do {								\
83   ieee_double_shape_type ew_u;					\
84   ew_u.value = (d);						\
85   (ix0) = ew_u.parts.msw;					\
86   (ix1) = ew_u.parts.lsw;					\
87 } while (0)
88 
89 /* Get the more significant 32 bit int from a double.  */
90 
91 #define GET_HIGH_WORD(i,d)					\
92 do {								\
93   ieee_double_shape_type gh_u;					\
94   gh_u.value = (d);						\
95   (i) = gh_u.parts.msw;						\
96 } while (0)
97 
98 /* Get the less significant 32 bit int from a double.  */
99 
100 #define GET_LOW_WORD(i,d)					\
101 do {								\
102   ieee_double_shape_type gl_u;					\
103   gl_u.value = (d);						\
104   (i) = gl_u.parts.lsw;						\
105 } while (0)
106 
107 /* Set a double from two 32 bit ints.  */
108 
109 #define INSERT_WORDS(d,ix0,ix1)					\
110 do {								\
111   ieee_double_shape_type iw_u;					\
112   iw_u.parts.msw = (ix0);					\
113   iw_u.parts.lsw = (ix1);					\
114   (d) = iw_u.value;						\
115 } while (0)
116 
117 /* Set the more significant 32 bits of a double from an int.  */
118 
119 #define SET_HIGH_WORD(d,v)					\
120 do {								\
121   ieee_double_shape_type sh_u;					\
122   sh_u.value = (d);						\
123   sh_u.parts.msw = (v);						\
124   (d) = sh_u.value;						\
125 } while (0)
126 
127 /* Set the less significant 32 bits of a double from an int.  */
128 
129 #define SET_LOW_WORD(d,v)					\
130 do {								\
131   ieee_double_shape_type sl_u;					\
132   sl_u.value = (d);						\
133   sl_u.parts.lsw = (v);						\
134   (d) = sl_u.value;						\
135 } while (0)
136 
137 /*
138  * A union which permits us to convert between a float and a 32 bit
139  * int.
140  */
141 
142 typedef union
143 {
144   float value;
145   /* FIXME: Assumes 32 bit int.  */
146   unsigned int word;
147 } ieee_float_shape_type;
148 
149 /* Get a 32 bit int from a float.  */
150 
151 #define GET_FLOAT_WORD(i,d)					\
152 do {								\
153   ieee_float_shape_type gf_u;					\
154   gf_u.value = (d);						\
155   (i) = gf_u.word;						\
156 } while (0)
157 
158 /* Set a float from a 32 bit int.  */
159 
160 #define SET_FLOAT_WORD(d,i)					\
161 do {								\
162   ieee_float_shape_type sf_u;					\
163   sf_u.word = (i);						\
164   (d) = sf_u.value;						\
165 } while (0)
166 
167 #ifdef FLT_EVAL_METHOD
168 /*
169  * Attempt to get strict C99 semantics for assignment with non-C99 compilers.
170  */
171 #if FLT_EVAL_METHOD == 0 || __GNUC__ == 0
172 #define	STRICT_ASSIGN(type, lval, rval)	((lval) = (rval))
173 #else
174 #define	STRICT_ASSIGN(type, lval, rval) do {	\
175 	volatile type __lval;			\
176 						\
177 	if (sizeof(type) >= sizeof(double))	\
178 		(lval) = (rval);		\
179 	else {					\
180 		__lval = (rval);		\
181 		(lval) = __lval;		\
182 	}					\
183 } while (0)
184 #endif
185 #endif
186 
187 /*
188  * Common routine to process the arguments to nan(), nanf(), and nanl().
189  */
190 void _scan_nan(uint32_t *__words, int __num_words, const char *__s);
191 
192 #ifdef _COMPLEX_H
193 
194 /*
195  * C99 specifies that complex numbers have the same representation as
196  * an array of two elements, where the first element is the real part
197  * and the second element is the imaginary part.
198  */
199 typedef union {
200 	float complex f;
201 	float a[2];
202 } float_complex;
203 typedef union {
204 	double complex f;
205 	double a[2];
206 } double_complex;
207 typedef union {
208 	long double complex f;
209 	long double a[2];
210 } long_double_complex;
211 #define	REALPART(z)	((z).a[0])
212 #define	IMAGPART(z)	((z).a[1])
213 
214 /*
215  * Inline functions that can be used to construct complex values.
216  *
217  * The C99 standard intends x+I*y to be used for this, but x+I*y is
218  * currently unusable in general since gcc introduces many overflow,
219  * underflow, sign and efficiency bugs by rewriting I*y as
220  * (0.0+I)*(y+0.0*I) and laboriously computing the full complex product.
221  * In particular, I*Inf is corrupted to NaN+I*Inf, and I*-0 is corrupted
222  * to -0.0+I*0.0.
223  */
224 static __inline float complex
225 cpackf(float x, float y)
226 {
227 	float_complex z;
228 
229 	REALPART(z) = x;
230 	IMAGPART(z) = y;
231 	return (z.f);
232 }
233 
234 static __inline double complex
235 cpack(double x, double y)
236 {
237 	double_complex z;
238 
239 	REALPART(z) = x;
240 	IMAGPART(z) = y;
241 	return (z.f);
242 }
243 
244 static __inline long double complex
245 cpackl(long double x, long double y)
246 {
247 	long_double_complex z;
248 
249 	REALPART(z) = x;
250 	IMAGPART(z) = y;
251 	return (z.f);
252 }
253 #endif /* _COMPLEX_H */
254 
255 #ifdef __GNUCLIKE_ASM
256 
257 /* Asm versions of some functions. */
258 
259 #ifdef __amd64__
260 static __inline int
261 irint(double x)
262 {
263 	int n;
264 
265 	asm("cvtsd2si %1,%0" : "=r" (n) : "x" (x));
266 	return (n);
267 }
268 #define	HAVE_EFFICIENT_IRINT
269 #endif
270 
271 #ifdef __i386__
272 static __inline int
273 irint(double x)
274 {
275 	int n;
276 
277 	asm("fistl %0" : "=m" (n) : "t" (x));
278 	return (n);
279 }
280 #define	HAVE_EFFICIENT_IRINT
281 #endif
282 
283 #endif /* __GNUCLIKE_ASM */
284 
285 /*
286  * ieee style elementary functions
287  *
288  * We rename functions here to improve other sources' diffability
289  * against fdlibm.
290  */
291 #define	__ieee754_sqrt	sqrt
292 #define	__ieee754_acos	acos
293 #define	__ieee754_acosh	acosh
294 #define	__ieee754_log	log
295 #define	__ieee754_log2	log2
296 #define	__ieee754_atanh	atanh
297 #define	__ieee754_asin	asin
298 #define	__ieee754_atan2	atan2
299 #define	__ieee754_exp	exp
300 #define	__ieee754_cosh	cosh
301 #define	__ieee754_fmod	fmod
302 #define	__ieee754_pow	pow
303 #define	__ieee754_lgamma lgamma
304 #define	__ieee754_gamma	gamma
305 #define	__ieee754_lgamma_r lgamma_r
306 #define	__ieee754_gamma_r gamma_r
307 #define	__ieee754_log10	log10
308 #define	__ieee754_sinh	sinh
309 #define	__ieee754_hypot	hypot
310 #define	__ieee754_j0	j0
311 #define	__ieee754_j1	j1
312 #define	__ieee754_y0	y0
313 #define	__ieee754_y1	y1
314 #define	__ieee754_jn	jn
315 #define	__ieee754_yn	yn
316 #define	__ieee754_remainder remainder
317 #define	__ieee754_scalb	scalb
318 #define	__ieee754_sqrtf	sqrtf
319 #define	__ieee754_acosf	acosf
320 #define	__ieee754_acoshf acoshf
321 #define	__ieee754_logf	logf
322 #define	__ieee754_atanhf atanhf
323 #define	__ieee754_asinf	asinf
324 #define	__ieee754_atan2f atan2f
325 #define	__ieee754_expf	expf
326 #define	__ieee754_coshf	coshf
327 #define	__ieee754_fmodf	fmodf
328 #define	__ieee754_powf	powf
329 #define	__ieee754_lgammaf lgammaf
330 #define	__ieee754_gammaf gammaf
331 #define	__ieee754_lgammaf_r lgammaf_r
332 #define	__ieee754_gammaf_r gammaf_r
333 #define	__ieee754_log10f log10f
334 #define	__ieee754_log2f log2f
335 #define	__ieee754_sinhf	sinhf
336 #define	__ieee754_hypotf hypotf
337 #define	__ieee754_j0f	j0f
338 #define	__ieee754_j1f	j1f
339 #define	__ieee754_y0f	y0f
340 #define	__ieee754_y1f	y1f
341 #define	__ieee754_jnf	jnf
342 #define	__ieee754_ynf	ynf
343 #define	__ieee754_remainderf remainderf
344 #define	__ieee754_scalbf scalbf
345 
346 /* fdlibm kernel function */
347 int	__kernel_rem_pio2(double*,double*,int,int,int);
348 
349 /* double precision kernel functions */
350 #ifdef INLINE_REM_PIO2
351 __inline
352 #endif
353 int	__ieee754_rem_pio2(double,double*);
354 double	__kernel_sin(double,double,int);
355 double	__kernel_cos(double,double);
356 double	__kernel_tan(double,double,int);
357 
358 /* float precision kernel functions */
359 #ifdef INLINE_REM_PIO2F
360 __inline
361 #endif
362 int	__ieee754_rem_pio2f(float,double*);
363 #ifdef INLINE_KERNEL_SINDF
364 __inline
365 #endif
366 float	__kernel_sindf(double);
367 #ifdef INLINE_KERNEL_COSDF
368 __inline
369 #endif
370 float	__kernel_cosdf(double);
371 #ifdef INLINE_KERNEL_TANDF
372 __inline
373 #endif
374 float	__kernel_tandf(double,int);
375 
376 /* long double precision kernel functions */
377 long double __kernel_sinl(long double, long double, int);
378 long double __kernel_cosl(long double, long double);
379 long double __kernel_tanl(long double, long double, int);
380 
381 #endif /* !_MATH_PRIVATE_H_ */
382