xref: /illumos-gate/usr/src/lib/libm/common/C/exp.c (revision e86372a01d2d16a5dd4a64e144ed978ba17fe7dd)
1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 /*
22  * Copyright 2011 Nexenta Systems, Inc.  All rights reserved.
23  */
24 /*
25  * Copyright 2006 Sun Microsystems, Inc.  All rights reserved.
26  * Use is subject to license terms.
27  */
28 
29 #pragma weak __exp = exp
30 
31 /*
32  * exp(x)
33  * Hybrid algorithm of Peter Tang's Table driven method (for large
34  * arguments) and an accurate table (for small arguments).
35  * Written by K.C. Ng, November 1988.
36  * Method (large arguments):
37  *	1. Argument Reduction: given the input x, find r and integer k
38  *	   and j such that
39  *	             x = (k+j/32)*(ln2) + r,  |r| <= (1/64)*ln2
40  *
41  *	2. exp(x) = 2^k * (2^(j/32) + 2^(j/32)*expm1(r))
42  *	   a. expm1(r) is approximated by a polynomial:
43  *	      expm1(r) ~ r + t1*r^2 + t2*r^3 + ... + t5*r^6
44  *	      Here t1 = 1/2 exactly.
45  *	   b. 2^(j/32) is represented to twice double precision
46  *	      as TBL[2j]+TBL[2j+1].
47  *
48  * Note: If divide were fast enough, we could use another approximation
49  *	 in 2.a:
50  *	      expm1(r) ~ (2r)/(2-R), R = r - r^2*(t1 + t2*r^2)
51  *	      (for the same t1 and t2 as above)
52  *
53  * Special cases:
54  *	exp(INF) is INF, exp(NaN) is NaN;
55  *	exp(-INF)=  0;
56  *	for finite argument, only exp(0)=1 is exact.
57  *
58  * Accuracy:
59  *	According to an error analysis, the error is always less than
60  *	an ulp (unit in the last place).  The largest errors observed
61  *	are less than 0.55 ulp for normal results and less than 0.75 ulp
62  *	for subnormal results.
63  *
64  * Misc. info.
65  *	For IEEE double
66  *		if x >  7.09782712893383973096e+02 then exp(x) overflow
67  *		if x < -7.45133219101941108420e+02 then exp(x) underflow
68  */
69 
70 #include "libm.h"
71 
/*
 * 2^(j/32) for j = 0, ..., 31, each stored as a pair of doubles:
 * TBL[2*j] is the value rounded to double and TBL[2*j+1] is a small
 * correction term, so that TBL[2*j] + TBL[2*j+1] represents 2^(j/32)
 * to twice double precision.  exp() uses this table for arguments
 * outside the |x| < 3/2 ln 2 range.
 */
72 static const double TBL[] = {
73 	1.00000000000000000000e+00,  0.00000000000000000000e+00,
74 	1.02189714865411662714e+00,  5.10922502897344389359e-17,
75 	1.04427378242741375480e+00,  8.55188970553796365958e-17,
76 	1.06714040067682369717e+00, -7.89985396684158212226e-17,
77 	1.09050773266525768967e+00, -3.04678207981247114697e-17,
78 	1.11438674259589243221e+00,  1.04102784568455709549e-16,
79 	1.13878863475669156458e+00,  8.91281267602540777782e-17,
80 	1.16372485877757747552e+00,  3.82920483692409349872e-17,
81 	1.18920711500272102690e+00,  3.98201523146564611098e-17,
82 	1.21524735998046895524e+00, -7.71263069268148813091e-17,
83 	1.24185781207348400201e+00,  4.65802759183693679123e-17,
84 	1.26905095719173321989e+00,  2.66793213134218609523e-18,
85 	1.29683955465100964055e+00,  2.53825027948883149593e-17,
86 	1.32523664315974132322e+00, -2.85873121003886075697e-17,
87 	1.35425554693689265129e+00,  7.70094837980298946162e-17,
88 	1.38390988196383202258e+00, -6.77051165879478628716e-17,
89 	1.41421356237309514547e+00, -9.66729331345291345105e-17,
90 	1.44518080697704665027e+00, -3.02375813499398731940e-17,
91 	1.47682614593949934623e+00, -3.48399455689279579579e-17,
92 	1.50916442759342284141e+00, -1.01645532775429503911e-16,
93 	1.54221082540794074411e+00,  7.94983480969762085616e-17,
94 	1.57598084510788649659e+00, -1.01369164712783039808e-17,
95 	1.61049033194925428347e+00,  2.47071925697978878522e-17,
96 	1.64575547815396494578e+00, -1.01256799136747726038e-16,
97 	1.68179283050742900407e+00,  8.19901002058149652013e-17,
98 	1.71861929812247793414e+00, -1.85138041826311098821e-17,
99 	1.75625216037329945351e+00,  2.96014069544887330703e-17,
100 	1.79470907500310716820e+00,  1.82274584279120867698e-17,
101 	1.83400808640934243066e+00,  3.28310722424562658722e-17,
102 	1.87416763411029996256e+00, -6.12276341300414256164e-17,
103 	1.91520656139714740007e+00, -1.06199460561959626376e-16,
104 	1.95714412417540017941e+00,  8.96076779103666776760e-17,
105 };
106 
107 /*
108  * For i = 0, ..., 66,
109  *   TBL2[2*i] is a double precision number near (i+1)*2^-6, and
110  *   TBL2[2*i+1] = exp(TBL2[2*i]) to within a relative error less
111  *   than 2^-60.
112  *
113  * For i = 67, ..., 133,
114  *   TBL2[2*i] is a double precision number near -(i-66)*2^-6, and
115  *   TBL2[2*i+1] = exp(TBL2[2*i]) to within a relative error less
116  *   than 2^-60.
117  */
118 static const double TBL2[] = {
	/*
	 * Each row is one pair { point, exp(point) }.  exp() selects a
	 * pair with an even index j and adds 134 to j for negative x,
	 * which skips the 67 pairs for positive arguments.
	 */
	/* pairs 0, ..., 66: points near 1/64, 2/64, ..., 67/64 */
119 	1.56249999999984491572e-02, 1.01574770858668417262e+00,
120 	3.12499999999998716305e-02, 1.03174340749910253834e+00,
121 	4.68750000000011102230e-02, 1.04799100201663386578e+00,
122 	6.24999999999990632493e-02, 1.06449445891785843266e+00,
123 	7.81249999999999444888e-02, 1.08125780744903954300e+00,
124 	9.37500000000013322676e-02, 1.09828514030782731226e+00,
125 	1.09375000000001346145e-01, 1.11558061464248226002e+00,
126 	1.24999999999999417133e-01, 1.13314845306682565607e+00,
127 	1.40624999999995337063e-01, 1.15099294469117108264e+00,
128 	1.56249999999996141975e-01, 1.16911844616949989195e+00,
129 	1.71874999999992894573e-01, 1.18752938276309216725e+00,
130 	1.87500000000000888178e-01, 1.20623024942098178158e+00,
131 	2.03124999999361649516e-01, 1.22522561187652545556e+00,
132 	2.18750000000000416334e-01, 1.24452010776609567344e+00,
133 	2.34375000000003524958e-01, 1.26411844775347081971e+00,
134 	2.50000000000006328271e-01, 1.28402541668774961003e+00,
135 	2.65624999999982791543e-01, 1.30424587476761533189e+00,
136 	2.81249999999993727240e-01, 1.32478475872885725906e+00,
137 	2.96875000000003275158e-01, 1.34564708304941493822e+00,
138 	3.12500000000002886580e-01, 1.36683794117380030819e+00,
139 	3.28124999999993394173e-01, 1.38836250675661765364e+00,
140 	3.43749999999998612221e-01, 1.41022603492570874906e+00,
141 	3.59374999999992450483e-01, 1.43243386356506730017e+00,
142 	3.74999999999991395772e-01, 1.45499141461818881638e+00,
143 	3.90624999999997613020e-01, 1.47790419541173490003e+00,
144 	4.06249999999991895372e-01, 1.50117780000011058483e+00,
145 	4.21874999999996613820e-01, 1.52481791053132154090e+00,
146 	4.37500000000004607426e-01, 1.54883029863414023453e+00,
147 	4.53125000000004274359e-01, 1.57322082682725961078e+00,
148 	4.68750000000008326673e-01, 1.59799544995064657371e+00,
149 	4.84374999999985456078e-01, 1.62316021661928200359e+00,
150 	4.99999999999997335465e-01, 1.64872127070012375327e+00,
151 	5.15625000000000222045e-01, 1.67468485281178436352e+00,
152 	5.31250000000003441691e-01, 1.70105730184840653330e+00,
153 	5.46874999999999111822e-01, 1.72784505652716169344e+00,
154 	5.62499999999999333866e-01, 1.75505465696029738787e+00,
155 	5.78124999999993338662e-01, 1.78269274625180318417e+00,
156 	5.93749999999999666933e-01, 1.81076607211938656050e+00,
157 	6.09375000000003441691e-01, 1.83928148854178719063e+00,
158 	6.24999999999995559108e-01, 1.86824595743221411048e+00,
159 	6.40625000000009103829e-01, 1.89766655033813602671e+00,
160 	6.56249999999993782751e-01, 1.92755045016753268072e+00,
161 	6.71875000000002109424e-01, 1.95790495294292221651e+00,
162 	6.87499999999992450483e-01, 1.98873746958227681780e+00,
163 	7.03125000000004996004e-01, 2.02005552770870666635e+00,
164 	7.18750000000007105427e-01, 2.05186677348799140219e+00,
165 	7.34375000000008770762e-01, 2.08417897349558689513e+00,
166 	7.49999999999983901766e-01, 2.11700001661264058939e+00,
167 	7.65624999999997002398e-01, 2.15033791595229351046e+00,
168 	7.81250000000005884182e-01, 2.18420081081563077774e+00,
169 	7.96874999999991451283e-01, 2.21859696867912603579e+00,
170 	8.12500000000000000000e-01, 2.25353478721320854561e+00,
171 	8.28125000000008215650e-01, 2.28902279633221983346e+00,
172 	8.43749999999997890576e-01, 2.32506966027711614586e+00,
173 	8.59374999999999444888e-01, 2.36168417973090827289e+00,
174 	8.75000000000003219647e-01, 2.39887529396710563745e+00,
175 	8.90625000000013433699e-01, 2.43665208303232461162e+00,
176 	9.06249999999980571097e-01, 2.47502376996297712708e+00,
177 	9.21874999999984456878e-01, 2.51399972303748420188e+00,
178 	9.37500000000001887379e-01, 2.55358945806293169412e+00,
179 	9.53125000000003330669e-01, 2.59380264069854327147e+00,
180 	9.68749999999989119814e-01, 2.63464908881560244680e+00,
181 	9.84374999999997890576e-01, 2.67613877489447116176e+00,
182 	1.00000000000001154632e+00, 2.71828182845907662113e+00,
183 	1.01562499999999333866e+00, 2.76108853855008318234e+00,
184 	1.03124999999995980993e+00, 2.80456935623711389738e+00,
185 	1.04687499999999933387e+00, 2.84873489717039740654e+00,
	/* pairs 67, ..., 133: points near -1/64, -2/64, ..., -67/64 */
186 	-1.56249999999999514277e-02, 9.84496437005408453480e-01,
187 	-3.12499999999955972718e-02, 9.69233234476348348707e-01,
188 	-4.68749999999993824384e-02, 9.54206665969188905230e-01,
189 	-6.24999999999976130205e-02, 9.39413062813478028090e-01,
190 	-7.81249999999989314103e-02, 9.24848813216205822840e-01,
191 	-9.37499999999995975442e-02, 9.10510361380034494161e-01,
192 	-1.09374999999998584466e-01, 8.96394206635151680196e-01,
193 	-1.24999999999998556710e-01, 8.82496902584596676355e-01,
194 	-1.40624999999999361622e-01, 8.68815056262843721235e-01,
195 	-1.56249999999999111822e-01, 8.55345327307423297647e-01,
196 	-1.71874999999924144012e-01, 8.42084427143446223596e-01,
197 	-1.87499999999996752598e-01, 8.29029118180403035154e-01,
198 	-2.03124999999988037347e-01, 8.16176213022349550386e-01,
199 	-2.18749999999995947686e-01, 8.03522573689063990265e-01,
200 	-2.34374999999996419531e-01, 7.91065110850298847112e-01,
201 	-2.49999999999996280753e-01, 7.78800783071407765057e-01,
202 	-2.65624999999999888978e-01, 7.66726596070820165529e-01,
203 	-2.81249999999989397370e-01, 7.54839601989015340777e-01,
204 	-2.96874999999996114219e-01, 7.43136898668761203268e-01,
205 	-3.12499999999999555911e-01, 7.31615628946642115871e-01,
206 	-3.28124999999993782751e-01, 7.20272979955444259126e-01,
207 	-3.43749999999997946087e-01, 7.09106182437399867879e-01,
208 	-3.59374999999994337863e-01, 6.98112510068129799023e-01,
209 	-3.74999999999994615418e-01, 6.87289278790975899369e-01,
210 	-3.90624999999999000799e-01, 6.76633846161729612945e-01,
211 	-4.06249999999947264406e-01, 6.66143610703522903727e-01,
212 	-4.21874999999988453681e-01, 6.55816011271509125002e-01,
213 	-4.37499999999999111822e-01, 6.45648526427892610613e-01,
214 	-4.53124999999999278355e-01, 6.35638673826052436056e-01,
215 	-4.68749999999999278355e-01, 6.25784009604591573428e-01,
216 	-4.84374999999992894573e-01, 6.16082127790682609891e-01,
217 	-4.99999999999998168132e-01, 6.06530659712634534486e-01,
218 	-5.15625000000000000000e-01, 5.97127273421627413619e-01,
219 	-5.31249999999989785948e-01, 5.87869673122352498496e-01,
220 	-5.46874999999972688514e-01, 5.78755598612500032907e-01,
221 	-5.62500000000000000000e-01, 5.69782824730923009859e-01,
222 	-5.78124999999992339461e-01, 5.60949160814475100700e-01,
223 	-5.93749999999948707696e-01, 5.52252450163048691500e-01,
224 	-6.09374999999552580121e-01, 5.43690569513243682209e-01,
225 	-6.24999999999984789945e-01, 5.35261428518998383375e-01,
226 	-6.40624999999983457677e-01, 5.26962969243379708573e-01,
227 	-6.56249999999998334665e-01, 5.18793165653890220312e-01,
228 	-6.71874999999943378626e-01, 5.10750023129039609771e-01,
229 	-6.87499999999997002398e-01, 5.02831577970942467104e-01,
230 	-7.03124999999991118216e-01, 4.95035896926202978463e-01,
231 	-7.18749999999991340260e-01, 4.87361076713623331269e-01,
232 	-7.34374999999985678123e-01, 4.79805243559684402310e-01,
233 	-7.49999999999997335465e-01, 4.72366552741015965911e-01,
234 	-7.65624999999993782751e-01, 4.65043188134059204408e-01,
235 	-7.81249999999863220523e-01, 4.57833361771676883301e-01,
236 	-7.96874999999998112621e-01, 4.50735313406363247157e-01,
237 	-8.12499999999990119015e-01, 4.43747310081084256339e-01,
238 	-8.28124999999996003197e-01, 4.36867645705559026759e-01,
239 	-8.43749999999988120614e-01, 4.30094640640067360504e-01,
240 	-8.59374999999994115818e-01, 4.23426641285265303871e-01,
241 	-8.74999999999977129406e-01, 4.16862019678517936594e-01,
242 	-8.90624999999983346655e-01, 4.10399173096376801428e-01,
243 	-9.06249999999991784350e-01, 4.04036523663345414903e-01,
244 	-9.21874999999994004796e-01, 3.97772517966614058693e-01,
245 	-9.37499999999994337863e-01, 3.91605626676801210628e-01,
246 	-9.53124999999999444888e-01, 3.85534344174578935682e-01,
247 	-9.68749999999986677324e-01, 3.79557188183094640355e-01,
248 	-9.84374999999992339461e-01, 3.73672699406045860648e-01,
249 	-9.99999999999995892175e-01, 3.67879441171443832825e-01,
250 	-1.01562499999994315658e+00, 3.62175999080846300338e-01,
251 	-1.03124999999991096011e+00, 3.56560980663978732697e-01,
252 	-1.04687499999999067413e+00, 3.51033015038813400732e-01,
253 };
254 
/*
 * Numeric constants used by exp().  They are kept in a single array and
 * referred to only through the macro names defined after it.
 */
255 static const double C[] = {
256 	0.5,
257 	4.61662413084468283841e+01,	/* 0x40471547, 0x652b82fe */
258 	2.16608493865351192653e-02,	/* 0x3f962e42, 0xfee00000 */
259 	5.96317165397058656257e-12,	/* 0x3d9a39ef, 0x35793c76 */
260 	1.6666666666526086527e-1,	/* 3fc5555555548f7c */
261 	4.1666666666226079285e-2,	/* 3fa5555555545d4e */
262 	8.3333679843421958056e-3,	/* 3f811115b7aa905e */
263 	1.3888949086377719040e-3,	/* 3f56c1728d739765 */
264 	1.0,
265 	0.0,
266 	7.09782712893383973096e+02,	/* 0x40862E42, 0xFEFA39EF */
267 	7.45133219101941108420e+02,	/* 0x40874910, 0xD52D3051 */
268 	5.55111512312578270212e-17,	/* 0x3c900000, 0x00000000 */
269 };
270

/*
 * Names for the entries of C[]:
 *   half, one, zero	the constants 0.5, 1.0 and 0.0
 *   invln2_32		32/ln2
 *   ln2_32hi, ln2_32lo	ln2/32 split into a leading part and a small
 *			trailing part
 *   t2, t3, t4, t5	coefficients of the polynomial exp() uses to
 *			approximate expm1 (the r^2 coefficient is half)
 *   threshold1		exp() treats x > threshold1 as overflow
 *   threshold2		exp() treats -x > threshold2 as underflow
 *   twom54		2^-54, used to rescale results with very small
 *			exponents
 */
271 #define	half		C[0]
272 #define	invln2_32	C[1]
273 #define	ln2_32hi	C[2]
274 #define	ln2_32lo	C[3]
275 #define	t2		C[4]
276 #define	t3		C[5]
277 #define	t4		C[6]
278 #define	t5		C[7]
279 #define	one		C[8]
280 #define	zero		C[9]
281 #define	threshold1	C[10]
282 #define	threshold2	C[11]
283 #define	twom54		C[12]
284 
285 double
286 exp(double x) {
287 	double	y, z, t;
288 	int	hx, ix, k, j, m;
289 
290 	ix = ((int *)&x)[HIWORD];
291 	hx = ix & ~0x80000000;
292 
293 	if (hx < 0x3ff0a2b2) {	/* |x| < 3/2 ln 2 */
294 		if (hx < 0x3f862e42) {	/* |x| < 1/64 ln 2 */
295 			if (hx < 0x3ed00000) {	/* |x| < 2^-18 */
296 				volatile int dummy __unused;
297 
298 				dummy = (int)x;	/* raise inexact if x != 0 */
299 #ifdef lint
300 				dummy = dummy;
301 #endif
302 				if (hx < 0x3e300000)
303 					return (one + x);
304 				return (one + x * (one + half * x));
305 			}
306 			t = x * x;
307 			y = x + (t * (half + x * t2) +
308 			    (t * t) * (t3 + x * t4 + t * t5));
309 			return (one + y);
310 		}
311 
312 		/* find the multiple of 2^-6 nearest x */
313 		k = hx >> 20;
314 		j = (0x00100000 | (hx & 0x000fffff)) >> (0x40c - k);
315 		j = (j - 1) & ~1;
316 		if (ix < 0)
317 			j += 134;
318 		z = x - TBL2[j];
319 		t = z * z;
320 		y = z + (t * (half + z * t2) +
321 		    (t * t) * (t3 + z * t4 + t * t5));
322 		return (TBL2[j+1] + TBL2[j+1] * y);
323 	}
324 
325 	if (hx >= 0x40862e42) {	/* x is large, infinite, or nan */
326 		if (hx >= 0x7ff00000) {
327 			if (ix == 0xfff00000 && ((int *)&x)[LOWORD] == 0)
328 				return (zero);
329 			return (x * x);
330 		}
331 		if (x > threshold1)
332 			return (_SVID_libm_err(x, x, 6));
333 		if (-x > threshold2)
334 			return (_SVID_libm_err(x, x, 7));
335 	}
336 
337 	t = invln2_32 * x;
338 	if (ix < 0)
339 		t -= half;
340 	else
341 		t += half;
342 	k = (int)t;
343 	j = (k & 0x1f) << 1;
344 	m = k >> 5;
345 	z = (x - k * ln2_32hi) - k * ln2_32lo;
346 
347 	/* z is now in primary range */
348 	t = z * z;
349 	y = z + (t * (half + z * t2) + (t * t) * (t3 + z * t4 + t * t5));
350 	y = TBL[j] + (TBL[j+1] + TBL[j] * y);
351 	if (m < -1021) {
352 		((int *)&y)[HIWORD] += (m + 54) << 20;
353 		return (twom54 * y);
354 	}
355 	((int *)&y)[HIWORD] += m << 20;
356 	return (y);
357 }
358