xref: /illumos-gate/usr/src/lib/libm/common/R/powf.c (revision cffcfaee1e6b29ef9ceb7d80e4e053ffd029906b)
1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 /*
22  * Copyright 2011 Nexenta Systems, Inc.  All rights reserved.
23  */
24 /*
25  * Copyright 2005 Sun Microsystems, Inc.  All rights reserved.
26  * Use is subject to license terms.
27  */
28 
29 #pragma weak powf = __powf
30 
31 #include "libm.h"
32 #include "xpg6.h"	/* __xpg6 */
33 #define	_C99SUSv3_pow	_C99SUSv3_pow_treats_Inf_as_an_even_int
34 
35 #if defined(__i386) && !defined(__amd64)
36 extern int __swapRP(int);
37 #endif
38 
39 /* INDENT OFF */
/*
 * Double-precision constants for the log2/exp2 evaluation in powf().
 */

/* ln(2) and 1/ln(2); the hex words are the high and low halves. */
static const double ln2 = 6.93147180559945286227e-01;
					/* 0x3fe62e42, 0xfefa39ef */
static const double invln2 = 1.44269504088896338700e+00;
					/* 0x3ff71547, 0x652b82fe */

/* Small exactly-representable values kept as named doubles. */
static const double dtwo = 2.0;
static const double done = 1.0;
static const double dhalf = 0.5;
static const double d32 = 32.0;
static const double d1_32 = 0.03125;	/* 1/32 */

/* Coefficients of ds * (A0 + ds**2 * A1), used in the log step. */
static const double A0 = 1.999999999813723303647511146995966439250e+0000;
static const double A1 = 6.666910817935858533770138657139665608610e-0001;

/* Coefficients of the rational expression used in the exp step. */
static const double t0 = 2.000000000004777489262405315073203746943e+0000;
static const double t1 = 1.666663408349926379873111932994250726307e-0001;
52 
/*
 * S[i] = 2**(i/32) for i = 0 .. 31, rounded to double.  powf() multiplies
 * by S[n & 0x1f] in its exp2 step.  The hex string beside each entry is
 * that entry's IEEE-754 bit pattern.
 */
static const double S[32] = {
	1.00000000000000000000e+00,	/* [ 0] 3FF0000000000000 */
	1.02189714865411662714e+00,	/* [ 1] 3FF059B0D3158574 */
	1.04427378242741375480e+00,	/* [ 2] 3FF0B5586CF9890F */
	1.06714040067682369717e+00,	/* [ 3] 3FF11301D0125B51 */
	1.09050773266525768967e+00,	/* [ 4] 3FF172B83C7D517B */
	1.11438674259589243221e+00,	/* [ 5] 3FF1D4873168B9AA */
	1.13878863475669156458e+00,	/* [ 6] 3FF2387A6E756238 */
	1.16372485877757747552e+00,	/* [ 7] 3FF29E9DF51FDEE1 */
	1.18920711500272102690e+00,	/* [ 8] 3FF306FE0A31B715 */
	1.21524735998046895524e+00,	/* [ 9] 3FF371A7373AA9CB */
	1.24185781207348400201e+00,	/* [10] 3FF3DEA64C123422 */
	1.26905095719173321989e+00,	/* [11] 3FF44E086061892D */
	1.29683955465100964055e+00,	/* [12] 3FF4BFDAD5362A27 */
	1.32523664315974132322e+00,	/* [13] 3FF5342B569D4F82 */
	1.35425554693689265129e+00,	/* [14] 3FF5AB07DD485429 */
	1.38390988196383202258e+00,	/* [15] 3FF6247EB03A5585 */
	1.41421356237309514547e+00,	/* [16] 3FF6A09E667F3BCD */
	1.44518080697704665027e+00,	/* [17] 3FF71F75E8EC5F74 */
	1.47682614593949934623e+00,	/* [18] 3FF7A11473EB0187 */
	1.50916442759342284141e+00,	/* [19] 3FF82589994CCE13 */
	1.54221082540794074411e+00,	/* [20] 3FF8ACE5422AA0DB */
	1.57598084510788649659e+00,	/* [21] 3FF93737B0CDC5E5 */
	1.61049033194925428347e+00,	/* [22] 3FF9C49182A3F090 */
	1.64575547815396494578e+00,	/* [23] 3FFA5503B23E255D */
	1.68179283050742900407e+00,	/* [24] 3FFAE89F995AD3AD */
	1.71861929812247793414e+00,	/* [25] 3FFB7F76F2FB5E47 */
	1.75625216037329945351e+00,	/* [26] 3FFC199BDD85529C */
	1.79470907500310716820e+00,	/* [27] 3FFCB720DCEF9069 */
	1.83400808640934243066e+00,	/* [28] 3FFD5818DCFBA487 */
	1.87416763411029996256e+00,	/* [29] 3FFDFC97337B9B5F */
	1.91520656139714740007e+00,	/* [30] 3FFEA4AFA2A490DA */
	1.95714412417540017941e+00,	/* [31] 3FFF50765B6E4540 */
};
87 
/*
 * TBL[i] = ln(1 + i/32) for i = 0 .. 31.  powf() indexes this table with
 * the five leading mantissa bits of |x| (after rounding to the nearest
 * 1/32) while forming log2(|x|).
 */
static const double TBL[32] = {
	0.00000000000000000e+00,	/* ln(32/32) */
	3.07716586667536873e-02,	/* ln(33/32) */
	6.06246218164348399e-02,	/* ln(34/32) */
	8.96121586896871380e-02,	/* ln(35/32) */
	1.17783035656383456e-01,	/* ln(36/32) */
	1.45182009844497889e-01,	/* ln(37/32) */
	1.71850256926659228e-01,	/* ln(38/32) */
	1.97825743329919868e-01,	/* ln(39/32) */
	2.23143551314209765e-01,	/* ln(40/32) */
	2.47836163904581269e-01,	/* ln(41/32) */
	2.71933715483641758e-01,	/* ln(42/32) */
	2.95464212893835898e-01,	/* ln(43/32) */
	3.18453731118534589e-01,	/* ln(44/32) */
	3.40926586970593193e-01,	/* ln(45/32) */
	3.62905493689368475e-01,	/* ln(46/32) */
	3.84411698910332056e-01,	/* ln(47/32) */
	4.05465108108164385e-01,	/* ln(48/32) */
	4.26084395310900088e-01,	/* ln(49/32) */
	4.46287102628419530e-01,	/* ln(50/32) */
	4.66089729924599239e-01,	/* ln(51/32) */
	4.85507815781700824e-01,	/* ln(52/32) */
	5.04556010752395312e-01,	/* ln(53/32) */
	5.23248143764547868e-01,	/* ln(54/32) */
	5.41597282432744409e-01,	/* ln(55/32) */
	5.59615787935422659e-01,	/* ln(56/32) */
	5.77315365034823613e-01,	/* ln(57/32) */
	5.94707107746692776e-01,	/* ln(58/32) */
	6.11801541105992941e-01,	/* ln(59/32) */
	6.28608659422374094e-01,	/* ln(60/32) */
	6.45137961373584701e-01,	/* ln(61/32) */
	6.61398482245365016e-01,	/* ln(62/32) */
	6.77398823591806143e-01,	/* ln(63/32) */
};
122 
/* Single-precision constants used by powf() for its special-case results. */
static const float zero = 0.0F;
static const float one = 1.0F;
static const float huge = 1.0e25f;	/* huge * huge overflows in float */
static const float tiny = 1.0e-25f;	/* tiny * tiny underflows in float */
124 /* INDENT ON */
125 
126 float
127 powf(float x, float y) {
128 	float	fx = x, fy = y;
129 	float	fz;
130 	int	ix, iy, jx, jy, k, iw, yisint;
131 
132 	ix = *(int *)&x;
133 	iy = *(int *)&y;
134 	jx = ix & ~0x80000000;
135 	jy = iy & ~0x80000000;
136 
137 	if (jy == 0)
138 		return (one);	/* x**+-0 = 1 */
139 	else if (ix == 0x3f800000 && (__xpg6 & _C99SUSv3_pow) != 0)
140 		return (one);	/* C99: 1**anything = 1 */
141 	else if (((0x7f800000 - jx) | (0x7f800000 - jy)) < 0)
142 		return (fx * fy);	/* at least one of x or y is NaN */
143 					/* includes Sun: 1**NaN = NaN */
144 	/* INDENT OFF */
145 	/*
146 	 * determine if y is an odd int
147 	 * yisint = 0 ... y is not an integer
148 	 * yisint = 1 ... y is an odd int
149 	 * yisint = 2 ... y is an even int
150 	 */
151 	/* INDENT ON */
152 	yisint = 0;
153 	if (ix < 0) {
154 		if (jy >= 0x4b800000) {
155 			yisint = 2;	/* |y|>=2**24: y must be even */
156 		} else if (jy >= 0x3f800000) {
157 			k = (jy >> 23) - 0x7f;	/* exponent */
158 			iw = jy >> (23 - k);
159 			if ((iw << (23 - k)) == jy)
160 				yisint = 2 - (iw & 1);
161 		}
162 	}
163 
164 	/* special value of y */
165 	if ((jy & ~0x7f800000) == 0) {
166 		if (jy == 0x7f800000) {		/* y is +-inf */
167 			if (jx == 0x3f800000) {
168 				if ((__xpg6 & _C99SUSv3_pow) != 0)
169 					fz = one;
170 						/* C99: (-1)**+-inf is 1 */
171 				else
172 					fz = fy - fy;
173 						/* Sun: (+-1)**+-inf = NaN */
174 			} else if (jx > 0x3f800000) {
175 						/* (|x|>1)**+,-inf = inf,0 */
176 				if (iy > 0)
177 					fz = fy;
178 				else
179 					fz = zero;
180 			} else {		/* (|x|<1)**-,+inf = inf,0 */
181 				if (iy < 0)
182 					fz = -fy;
183 				else
184 					fz = zero;
185 			}
186 			return (fz);
187 		} else if (jy == 0x3f800000) {	/* y is +-1 */
188 			if (iy < 0)
189 				fx = one / fx;	/* y is -1 */
190 			return (fx);
191 		} else if (iy == 0x40000000) {	/* y is 2 */
192 			return (fx * fx);
193 		} else if (iy == 0x3f000000) {	/* y is 0.5 */
194 			if (jx != 0 && jx != 0x7f800000)
195 				return (sqrtf(x));
196 		}
197 	}
198 
199 	/* special value of x */
200 	if ((jx & ~0x7f800000) == 0) {
201 		if (jx == 0x7f800000 || jx == 0 || jx == 0x3f800000) {
202 			/* x is +-0,+-inf,-1; set fz = |x|**y */
203 			*(int *)&fz = jx;
204 			if (iy < 0)
205 				fz = one / fz;
206 			if (ix < 0) {
207 				if (jx == 0x3f800000 && yisint == 0) {
208 					/* (-1)**non-int is NaN */
209 					fz = zero;
210 					fz /= fz;
211 				} else if (yisint == 1) {
212 					/* (x<0)**odd = -(|x|**odd) */
213 					fz = -fz;
214 				}
215 			}
216 			return (fz);
217 		}
218 	}
219 
220 	/* (x<0)**(non-int) is NaN */
221 	if (ix < 0 && yisint == 0) {
222 		fz = zero;
223 		return (fz / fz);
224 	}
225 
226 	/*
227 	 * compute exp(y*log(|x|))
228 	 * fx = *(float *) &jx;
229 	 * fz = (float) exp(((double) fy) * log((double) fx));
230 	 */
231 	{
232 		double	dx, dy, dz, ds;
233 		int	*px = (int *)&dx, *pz = (int *)&dz, i, n, m;
234 #if defined(__i386) && !defined(__amd64)
235 		int	rp = __swapRP(fp_extended);
236 #endif
237 
238 		fx = *(float *)&jx;
239 		dx = (double)fx;
240 
241 		/* compute log(x)/ln2 */
242 		i = px[HIWORD] + 0x4000;
243 		n = (i >> 20) - 0x3ff;
244 		pz[HIWORD] = i & 0xffff8000;
245 		pz[LOWORD] = 0;
246 		ds = (dx - dz) / (dx + dz);
247 		i = (i >> 15) & 0x1f;
248 		dz = ds * ds;
249 		dy = invln2 * (TBL[i] + ds * (A0 + dz * A1));
250 		if (n == 0)
251 			dz = (double)fy * dy;
252 		else
253 			dz = (double)fy * (dy + (double)n);
254 
255 		/* compute exp2(dz=y*ln(x)) */
256 		i = pz[HIWORD];
257 		if ((i & ~0x80000000) >= 0x40640000) {	/* |z| >= 160.0 */
258 			fz = (i > 0)? huge : tiny;
259 			if (ix < 0 && yisint == 1)
260 				fz *= -fz;	/* (-ve)**(odd int) */
261 			else
262 				fz *= fz;
263 #if defined(__i386) && !defined(__amd64)
264 			if (rp != fp_extended)
265 				(void) __swapRP(rp);
266 #endif
267 			return (fz);
268 		}
269 
270 		n = (int)(d32 * dz + (i > 0 ? dhalf : -dhalf));
271 		i = n & 0x1f;
272 		m = n >> 5;
273 		dy = ln2 * (dz - d1_32 * (double)n);
274 		dx = S[i] * (done - (dtwo * dy) / (dy * (done - dy * t1) - t0));
275 		if (m != 0)
276 			px[HIWORD] += m << 20;
277 		fz = (float)dx;
278 #if defined(__i386) && !defined(__amd64)
279 		if (rp != fp_extended)
280 			(void) __swapRP(rp);
281 #endif
282 	}
283 
284 	/* end of computing exp(y*log(x)) */
285 	if (ix < 0 && yisint == 1)
286 		fz = -fz;	/* (-ve)**(odd int) */
287 	return (fz);
288 }
289