/* xref: /freebsd/lib/msun/src/k_sincosl.h (revision 0dd5a5603e7a33d976f8e6015620bbc79839c609) */
/*-
 * ====================================================
 * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
 * Copyright (c) 2008 Steven G. Kargl, David Schultz, Bruce D. Evans.
 *
 * Developed at SunSoft, a Sun Microsystems, Inc. business.
 * Permission to use, copy, modify, and distribute this
 * software is freely granted, provided that this notice
 * is preserved.
 * ====================================================
 *
 * k_sinl.c and k_cosl.c merged by Steven G. Kargl
 */

#if LDBL_MANT_DIG == 64		/* ld80 version of k_sincosl.c. */

#if defined(__amd64__) || defined(__i386__)
/* Long double constants are slow on these arches, and broken on i386. */
static const volatile double
C1hi = 0.041666666666666664,		/*  0x15555555555555.0p-57 */
C1lo = 2.2598839032744733e-18,		/*  0x14d80000000000.0p-111 */
S1hi = -0.16666666666666666,		/* -0x15555555555555.0p-55 */
S1lo = -9.2563760475949941e-18;		/* -0x15580000000000.0p-109 */
/* Leading coefficients rebuilt at run time as a hi + lo sum of doubles. */
#define	S1	((long double)S1hi + S1lo)
#define	C1	((long double)C1hi + C1lo)
#else
static const long double
C1 =  0.0416666666666666666136L,	/*  0xaaaaaaaaaaaaaa9b.0p-68 */
S1 = -0.166666666666666666671L;		/* -0xaaaaaaaaaaaaaaab.0p-66 */
#endif

/* Higher-order coefficients are stored in double precision only. */
static const double
C2 = -0.0013888888888888874,		/* -0x16c16c16c16c10.0p-62 */
C3 =  0.000024801587301571716,		/*  0x1a01a01a018e22.0p-68 */
C4 = -0.00000027557319215507120,	/* -0x127e4fb7602f22.0p-74 */
C5 =  0.0000000020876754400407278,	/*  0x11eed8caaeccf1.0p-81 */
C6 = -1.1470297442401303e-11,		/* -0x19393412bd1529.0p-89 */
C7 =  4.7383039476436467e-14,		/*  0x1aac9d9af5c43e.0p-97 */
S2 =  0.0083333333333333332,		/*  0x11111111111111.0p-59 */
S3 = -0.00019841269841269427,		/* -0x1a01a01a019f81.0p-65 */
S4 =  0.0000027557319223597490,		/*  0x171de3a55560f7.0p-71 */
S5 = -0.000000025052108218074604,	/* -0x1ae64564f16cad.0p-78 */
S6 =  1.6059006598854211e-10,		/*  0x161242b90243b5.0p-85 */
S7 = -7.6429779983024564e-13,		/* -0x1ae42ebd1b2e00.0p-93 */
S8 =  2.6174587166648325e-15;		/*  0x179372ea0b3f64.0p-101 */

/*
 * Evaluate the sine and cosine kernel polynomials for the same argument
 * in one call (ld80 coefficients).
 *
 *   *sn = x + S1*x^3 + S2*x^5 + ... + S8*x^17		(iy == 0)
 *   *cs = 1 - x^2/2 + C1*x^4 + ... + C7*x^16 - x*y
 *
 * x	Argument the polynomials are expanded in.
 * y	First-order correction to x; presumably the low-order tail of a
 *	reduced argument, as in the k_sinl.c/k_cosl.c kernels this file
 *	merges (confirm against the callers).
 * iy	0: the sine ignores y.  Non-zero: the sine is evaluated with a
 *	rearranged formula that is algebraically the iy == 0 value plus
 *	y * (1 - x^2/2).  The cosine subtracts x * y in both cases.
 * sn	Receives the sine result; always written.
 * cs	Receives the cosine result; always written.
 *
 * The order of operations in every expression below is deliberate; do
 * not re-associate.
 */
static inline void
__kernel_sincosl(long double x, long double y, int iy, long double *sn,
    long double *cs)
{
	long double hz, r, v, w, z;

	z = x * x;
	v = z * x;
	/*
	 * XXX Replace Horner scheme with an algorithm suitable for CPUs
	 * with more complex pipelines.
	 */
	r = S2 + z * (S3 + z * (S4 + z * (S5 + z * (S6 + z * (S7 + z * S8)))));

	if (iy == 0)
		*sn = x + v * (S1 + z * r);
	else
		*sn = x - ((z * (y / 2 - v * r) - y) - v * S1);

	hz = z / 2;
	w = 1 - hz;
	r = z * (C1 + z * (C2 + z * (C3 + z * (C4 + z * (C5 + z * (C6 +
	    z * C7))))));
	/* (1 - w) - hz recovers the rounding error made in w = 1 - hz. */
	*cs = w + (((1 - w) - hz) + (z * r - x * y));
}

#elif LDBL_MANT_DIG == 113	/* ld128 version of k_sincosl.c. */

static const long double
S1 = -0.16666666666666666666666666666666666606732416116558L,
S2 =  0.0083333333333333333333333333333331135404851288270047L,
S3 = -0.00019841269841269841269841269839935785325638310428717L,
S4 =  0.27557319223985890652557316053039946268333231205686e-5L,
S5 = -0.25052108385441718775048214826384312253862930064745e-7L,
S6 =  0.16059043836821614596571832194524392581082444805729e-9L,
S7 = -0.76471637318198151807063387954939213287488216303768e-12L,
S8 =  0.28114572543451292625024967174638477283187397621303e-14L;

/* The highest-order sine coefficients are stored in double precision. */
static const double
S9  = -0.82206352458348947812512122163446202498005154296863e-17,
S10 =  0.19572940011906109418080609928334380560135358385256e-19,
S11 = -0.38680813379701966970673724299207480965452616911420e-22,
S12 =  0.64038150078671872796678569586315881020659912139412e-25;

static const long double
C1 =  4.16666666666666666666666666666666667e-02L,
C2 = -1.38888888888888888888888888888888834e-03L,
C3 =  2.48015873015873015873015873015446795e-05L,
C4 = -2.75573192239858906525573190949988493e-07L,
C5 =  2.08767569878680989792098886701451072e-09L,
C6 = -1.14707455977297247136657111139971865e-11L,
C7 =  4.77947733238738518870113294139830239e-14L,
C8 = -1.56192069685858079920640872925306403e-16L,
C9 =  4.11031762320473354032038893429515732e-19L,
C10= -8.89679121027589608738005163931958096e-22L,
C11=  1.61171797801314301767074036661901531e-24L,
C12= -2.46748624357670948912574279501044295e-27L;

/*
 * Evaluate the sine and cosine kernel polynomials for the same argument
 * in one call (ld128 coefficients).
 *
 *   *sn = x + S1*x^3 + S2*x^5 + ... + S12*x^25		(iy == 0)
 *   *cs = 1 - x^2/2 + C1*x^4 + ... + C12*x^26 - x*y
 *
 * x	Argument the polynomials are expanded in.
 * y	First-order correction to x; presumably the low-order tail of a
 *	reduced argument, as in the k_sinl.c/k_cosl.c kernels this file
 *	merges (confirm against the callers).
 * iy	0: the sine ignores y.  Non-zero: the sine is evaluated with a
 *	rearranged formula that is algebraically the iy == 0 value plus
 *	y * (1 - x^2/2).  The cosine subtracts x * y in both cases.
 * sn	Receives the sine result; always written.
 * cs	Receives the cosine result; always written.
 *
 * The order of operations in every expression below is deliberate; do
 * not re-associate.
 */
static inline void
__kernel_sincosl(long double x, long double y, int iy, long double *sn,
    long double *cs)
{
	long double hz, r, v, w, z;

	z = x * x;
	v = z * x;
	/*
	 * XXX Replace Horner scheme with an algorithm suitable for CPUs
	 * with more complex pipelines.
	 */
	r = S2 + z * (S3 + z * (S4 + z * (S5 + z * (S6 + z * (S7 + z * (S8 +
	    z * (S9 + z * (S10 + z * (S11 + z * S12)))))))));

	if (iy == 0)
		*sn = x + v * (S1 + z * r);
	else
		*sn = x - ((z * (y / 2 - v * r) - y) - v * S1);

	hz = z / 2;
	w = 1 - hz;
	r = z * (C1 + z * (C2 + z * (C3 + z * (C4 + z * (C5 + z * (C6 +
	    z * (C7 + z * (C8 + z * (C9 + z * (C10 + z * (C11+z*C12)))))))))));

	/* (1 - w) - hz recovers the rounding error made in w = 1 - hz. */
	*cs =  w + (((1 - w) - hz) + (z * r - x * y));
}
#else
#error "Unsupported long double format"
#endif