/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright 2011 Nexenta Systems, Inc. All rights reserved.
 */
/*
 * Copyright 2005 Sun Microsystems, Inc. All rights reserved.
 * Use is subject to license terms.
 */
28
29 #pragma weak __powf = powf
30
31 #include "libm.h"
32 #include "xpg6.h" /* __xpg6 */
33 #define _C99SUSv3_pow _C99SUSv3_pow_treats_Inf_as_an_even_int
34
35 #if defined(__i386) && !defined(__amd64)
36 extern int __swapRP(int);
37 #endif
38
/* INDENT OFF */
/*
 * Double-precision constants used by powf().
 *
 *	ln2, invln2	ln(2) and 1/ln(2), used to convert between natural
 *			and base-2 logarithms
 *	dtwo, done,
 *	dhalf, d32,
 *	d1_32		the exact values 2, 1, 1/2, 32 and 1/32
 *	A0, A1		coefficients of the odd polynomial ds*(A0 + A1*ds*ds)
 *			that approximates log((1+ds)/(1-ds)); they are close
 *			to the series values 2 and 2/3
 *	t0, t1		coefficients of the rational approximation
 *			exp(r) ~ 1 - 2r/(r*(1 - r*t1) - t0); they are close
 *			to 2 and 1/6
 */
static const double
	ln2 = 6.93147180559945286227e-01,	/* 0x3fe62e42, 0xfefa39ef */
	invln2 = 1.44269504088896338700e+00,	/* 0x3ff71547, 0x652b82fe */
	dtwo = 2.0,
	done = 1.0,
	dhalf = 0.5,
	d32 = 32.0,
	d1_32 = 0.03125,
	A0 = 1.999999999813723303647511146995966439250e+0000,
	A1 = 6.666910817935858533770138657139665608610e-0001,
	t0 = 2.000000000004777489262405315073203746943e+0000,
	t1 = 1.666663408349926379873111932994250726307e-0001;
52
/*
 * S[i] = 2**(i/32) for i = 0..31, rounded to double; the trailing comment
 * on each entry is its IEEE 754 bit pattern.  powf() uses it to supply the
 * fractional power of two when reconstructing 2**z.
 */
static const double S[] = {
	1.00000000000000000000e+00,	/* 3FF0000000000000 */
	1.02189714865411662714e+00,	/* 3FF059B0D3158574 */
	1.04427378242741375480e+00,	/* 3FF0B5586CF9890F */
	1.06714040067682369717e+00,	/* 3FF11301D0125B51 */
	1.09050773266525768967e+00,	/* 3FF172B83C7D517B */
	1.11438674259589243221e+00,	/* 3FF1D4873168B9AA */
	1.13878863475669156458e+00,	/* 3FF2387A6E756238 */
	1.16372485877757747552e+00,	/* 3FF29E9DF51FDEE1 */
	1.18920711500272102690e+00,	/* 3FF306FE0A31B715 */
	1.21524735998046895524e+00,	/* 3FF371A7373AA9CB */
	1.24185781207348400201e+00,	/* 3FF3DEA64C123422 */
	1.26905095719173321989e+00,	/* 3FF44E086061892D */
	1.29683955465100964055e+00,	/* 3FF4BFDAD5362A27 */
	1.32523664315974132322e+00,	/* 3FF5342B569D4F82 */
	1.35425554693689265129e+00,	/* 3FF5AB07DD485429 */
	1.38390988196383202258e+00,	/* 3FF6247EB03A5585 */
	1.41421356237309514547e+00,	/* 3FF6A09E667F3BCD */
	1.44518080697704665027e+00,	/* 3FF71F75E8EC5F74 */
	1.47682614593949934623e+00,	/* 3FF7A11473EB0187 */
	1.50916442759342284141e+00,	/* 3FF82589994CCE13 */
	1.54221082540794074411e+00,	/* 3FF8ACE5422AA0DB */
	1.57598084510788649659e+00,	/* 3FF93737B0CDC5E5 */
	1.61049033194925428347e+00,	/* 3FF9C49182A3F090 */
	1.64575547815396494578e+00,	/* 3FFA5503B23E255D */
	1.68179283050742900407e+00,	/* 3FFAE89F995AD3AD */
	1.71861929812247793414e+00,	/* 3FFB7F76F2FB5E47 */
	1.75625216037329945351e+00,	/* 3FFC199BDD85529C */
	1.79470907500310716820e+00,	/* 3FFCB720DCEF9069 */
	1.83400808640934243066e+00,	/* 3FFD5818DCFBA487 */
	1.87416763411029996256e+00,	/* 3FFDFC97337B9B5F */
	1.91520656139714740007e+00,	/* 3FFEA4AFA2A490DA */
	1.95714412417540017941e+00,	/* 3FFF50765B6E4540 */
};
87
/*
 * TBL[i] = ln(1 + i/32) for i = 0..31.  powf() indexes it with the five
 * leading mantissa bits of |x| (after rounding) to obtain the logarithm of
 * the nearest table point.
 */
static const double TBL[] = {
	0.00000000000000000e+00,
	3.07716586667536873e-02,
	6.06246218164348399e-02,
	8.96121586896871380e-02,
	1.17783035656383456e-01,
	1.45182009844497889e-01,
	1.71850256926659228e-01,
	1.97825743329919868e-01,
	2.23143551314209765e-01,
	2.47836163904581269e-01,
	2.71933715483641758e-01,
	2.95464212893835898e-01,
	3.18453731118534589e-01,
	3.40926586970593193e-01,
	3.62905493689368475e-01,
	3.84411698910332056e-01,
	4.05465108108164385e-01,
	4.26084395310900088e-01,
	4.46287102628419530e-01,
	4.66089729924599239e-01,
	4.85507815781700824e-01,
	5.04556010752395312e-01,
	5.23248143764547868e-01,
	5.41597282432744409e-01,
	5.59615787935422659e-01,
	5.77315365034823613e-01,
	5.94707107746692776e-01,
	6.11801541105992941e-01,
	6.28608659422374094e-01,
	6.45137961373584701e-01,
	6.61398482245365016e-01,
	6.77398823591806143e-01,
};
122
/*
 * Single-precision constants used by powf().  huge and tiny are squared at
 * run time to produce overflowed and underflowed float results.
 */
static const float zero = 0.0F, one = 1.0F, huge = 1.0e25f, tiny = 1.0e-25f;
/* INDENT ON */
125
126 float
powf(float x,float y)127 powf(float x, float y) {
128 float fx = x, fy = y;
129 float fz;
130 int ix, iy, jx, jy, k, iw, yisint;
131
132 ix = *(int *)&x;
133 iy = *(int *)&y;
134 jx = ix & ~0x80000000;
135 jy = iy & ~0x80000000;
136
137 if (jy == 0)
138 return (one); /* x**+-0 = 1 */
139 else if (ix == 0x3f800000 && (__xpg6 & _C99SUSv3_pow) != 0)
140 return (one); /* C99: 1**anything = 1 */
141 else if (((0x7f800000 - jx) | (0x7f800000 - jy)) < 0)
142 return (fx * fy); /* at least one of x or y is NaN */
143 /* includes Sun: 1**NaN = NaN */
144 /* INDENT OFF */
145 /*
146 * determine if y is an odd int
147 * yisint = 0 ... y is not an integer
148 * yisint = 1 ... y is an odd int
149 * yisint = 2 ... y is an even int
150 */
151 /* INDENT ON */
152 yisint = 0;
153 if (ix < 0) {
154 if (jy >= 0x4b800000) {
155 yisint = 2; /* |y|>=2**24: y must be even */
156 } else if (jy >= 0x3f800000) {
157 k = (jy >> 23) - 0x7f; /* exponent */
158 iw = jy >> (23 - k);
159 if ((iw << (23 - k)) == jy)
160 yisint = 2 - (iw & 1);
161 }
162 }
163
164 /* special value of y */
165 if ((jy & ~0x7f800000) == 0) {
166 if (jy == 0x7f800000) { /* y is +-inf */
167 if (jx == 0x3f800000) {
168 if ((__xpg6 & _C99SUSv3_pow) != 0)
169 fz = one;
170 /* C99: (-1)**+-inf is 1 */
171 else
172 fz = fy - fy;
173 /* Sun: (+-1)**+-inf = NaN */
174 } else if (jx > 0x3f800000) {
175 /* (|x|>1)**+,-inf = inf,0 */
176 if (iy > 0)
177 fz = fy;
178 else
179 fz = zero;
180 } else { /* (|x|<1)**-,+inf = inf,0 */
181 if (iy < 0)
182 fz = -fy;
183 else
184 fz = zero;
185 }
186 return (fz);
187 } else if (jy == 0x3f800000) { /* y is +-1 */
188 if (iy < 0)
189 fx = one / fx; /* y is -1 */
190 return (fx);
191 } else if (iy == 0x40000000) { /* y is 2 */
192 return (fx * fx);
193 } else if (iy == 0x3f000000) { /* y is 0.5 */
194 if (jx != 0 && jx != 0x7f800000)
195 return (sqrtf(x));
196 }
197 }
198
199 /* special value of x */
200 if ((jx & ~0x7f800000) == 0) {
201 if (jx == 0x7f800000 || jx == 0 || jx == 0x3f800000) {
202 /* x is +-0,+-inf,-1; set fz = |x|**y */
203 *(int *)&fz = jx;
204 if (iy < 0)
205 fz = one / fz;
206 if (ix < 0) {
207 if (jx == 0x3f800000 && yisint == 0) {
208 /* (-1)**non-int is NaN */
209 fz = zero;
210 fz /= fz;
211 } else if (yisint == 1) {
212 /* (x<0)**odd = -(|x|**odd) */
213 fz = -fz;
214 }
215 }
216 return (fz);
217 }
218 }
219
220 /* (x<0)**(non-int) is NaN */
221 if (ix < 0 && yisint == 0) {
222 fz = zero;
223 return (fz / fz);
224 }
225
226 /*
227 * compute exp(y*log(|x|))
228 * fx = *(float *) &jx;
229 * fz = (float) exp(((double) fy) * log((double) fx));
230 */
231 {
232 double dx, dy, dz, ds;
233 int *px = (int *)&dx, *pz = (int *)&dz, i, n, m;
234 #if defined(__i386) && !defined(__amd64)
235 int rp = __swapRP(fp_extended);
236 #endif
237
238 fx = *(float *)&jx;
239 dx = (double)fx;
240
241 /* compute log(x)/ln2 */
242 i = px[HIWORD] + 0x4000;
243 n = (i >> 20) - 0x3ff;
244 pz[HIWORD] = i & 0xffff8000;
245 pz[LOWORD] = 0;
246 ds = (dx - dz) / (dx + dz);
247 i = (i >> 15) & 0x1f;
248 dz = ds * ds;
249 dy = invln2 * (TBL[i] + ds * (A0 + dz * A1));
250 if (n == 0)
251 dz = (double)fy * dy;
252 else
253 dz = (double)fy * (dy + (double)n);
254
255 /* compute exp2(dz=y*ln(x)) */
256 i = pz[HIWORD];
257 if ((i & ~0x80000000) >= 0x40640000) { /* |z| >= 160.0 */
258 fz = (i > 0)? huge : tiny;
259 if (ix < 0 && yisint == 1)
260 fz *= -fz; /* (-ve)**(odd int) */
261 else
262 fz *= fz;
263 #if defined(__i386) && !defined(__amd64)
264 if (rp != fp_extended)
265 (void) __swapRP(rp);
266 #endif
267 return (fz);
268 }
269
270 n = (int)(d32 * dz + (i > 0 ? dhalf : -dhalf));
271 i = n & 0x1f;
272 m = n >> 5;
273 dy = ln2 * (dz - d1_32 * (double)n);
274 dx = S[i] * (done - (dtwo * dy) / (dy * (done - dy * t1) - t0));
275 if (m != 0)
276 px[HIWORD] += m << 20;
277 fz = (float)dx;
278 #if defined(__i386) && !defined(__amd64)
279 if (rp != fp_extended)
280 (void) __swapRP(rp);
281 #endif
282 }
283
284 /* end of computing exp(y*log(x)) */
285 if (ix < 0 && yisint == 1)
286 fz = -fz; /* (-ve)**(odd int) */
287 return (fz);
288 }
289