1*12188b77SDavid Schultz /*- 2*12188b77SDavid Schultz * Copyright (c) 2011 David Schultz <das@FreeBSD.ORG> 3*12188b77SDavid Schultz * All rights reserved. 4*12188b77SDavid Schultz * 5*12188b77SDavid Schultz * Redistribution and use in source and binary forms, with or without 6*12188b77SDavid Schultz * modification, are permitted provided that the following conditions 7*12188b77SDavid Schultz * are met: 8*12188b77SDavid Schultz * 1. Redistributions of source code must retain the above copyright 9*12188b77SDavid Schultz * notice, this list of conditions and the following disclaimer. 10*12188b77SDavid Schultz * 2. Redistributions in binary form must reproduce the above copyright 11*12188b77SDavid Schultz * notice, this list of conditions and the following disclaimer in the 12*12188b77SDavid Schultz * documentation and/or other materials provided with the distribution. 13*12188b77SDavid Schultz * 14*12188b77SDavid Schultz * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 15*12188b77SDavid Schultz * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 16*12188b77SDavid Schultz * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 17*12188b77SDavid Schultz * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 18*12188b77SDavid Schultz * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 19*12188b77SDavid Schultz * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 20*12188b77SDavid Schultz * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 21*12188b77SDavid Schultz * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 22*12188b77SDavid Schultz * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 23*12188b77SDavid Schultz * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 24*12188b77SDavid Schultz * SUCH DAMAGE. 25*12188b77SDavid Schultz */ 26*12188b77SDavid Schultz 27*12188b77SDavid Schultz #include <sys/cdefs.h> 28*12188b77SDavid Schultz __FBSDID("$FreeBSD$"); 29*12188b77SDavid Schultz 30*12188b77SDavid Schultz #include <complex.h> 31*12188b77SDavid Schultz 32*12188b77SDavid Schultz #include "math.h" 33*12188b77SDavid Schultz #include "math_private.h" 34*12188b77SDavid Schultz 35*12188b77SDavid Schultz static const uint32_t k = 1799; /* constant for reduction */ 36*12188b77SDavid Schultz static const double kln2 = 1246.97177782734161156; /* k * ln2 */ 37*12188b77SDavid Schultz 38*12188b77SDavid Schultz /* 39*12188b77SDavid Schultz * Compute exp(x), scaled to avoid spurious overflow. An exponent is 40*12188b77SDavid Schultz * returned separately in 'expt'. 41*12188b77SDavid Schultz * 42*12188b77SDavid Schultz * Input: ln(DBL_MAX) <= x < ln(2 * DBL_MAX / DBL_MIN_DENORM) ~= 1454.91 43*12188b77SDavid Schultz * Output: 2**1023 <= y < 2**1024 44*12188b77SDavid Schultz */ 45*12188b77SDavid Schultz static double 46*12188b77SDavid Schultz __frexp_exp(double x, int *expt) 47*12188b77SDavid Schultz { 48*12188b77SDavid Schultz double exp_x; 49*12188b77SDavid Schultz uint32_t hx; 50*12188b77SDavid Schultz 51*12188b77SDavid Schultz /* 52*12188b77SDavid Schultz * We use exp(x) = exp(x - kln2) * 2**k, carefully chosen to 53*12188b77SDavid Schultz * minimize |exp(kln2) - 2**k|. We also scale the exponent of 54*12188b77SDavid Schultz * exp_x to MAX_EXP so that the result can be multiplied by 55*12188b77SDavid Schultz * a tiny number without losing accuracy due to denormalization. 56*12188b77SDavid Schultz */ 57*12188b77SDavid Schultz exp_x = exp(x - kln2); 58*12188b77SDavid Schultz GET_HIGH_WORD(hx, exp_x); 59*12188b77SDavid Schultz *expt = (hx >> 20) - (0x3ff + 1023) + k; 60*12188b77SDavid Schultz SET_HIGH_WORD(exp_x, (hx & 0xfffff) | ((0x3ff + 1023) << 20)); 61*12188b77SDavid Schultz return (exp_x); 62*12188b77SDavid Schultz } 63*12188b77SDavid Schultz 64*12188b77SDavid Schultz /* 65*12188b77SDavid Schultz * __ldexp_exp(x, expt) and __ldexp_cexp(x, expt) compute exp(x) * 2**expt. 66*12188b77SDavid Schultz * They are intended for large arguments (real part >= ln(DBL_MAX)) 67*12188b77SDavid Schultz * where care is needed to avoid overflow. 68*12188b77SDavid Schultz * 69*12188b77SDavid Schultz * The present implementation is narrowly tailored for our hyperbolic and 70*12188b77SDavid Schultz * exponential functions. We assume expt is small (0 or -1), and the caller 71*12188b77SDavid Schultz * has filtered out very large x, for which overflow would be inevitable. 72*12188b77SDavid Schultz */ 73*12188b77SDavid Schultz 74*12188b77SDavid Schultz double 75*12188b77SDavid Schultz __ldexp_exp(double x, int expt) 76*12188b77SDavid Schultz { 77*12188b77SDavid Schultz double exp_x, scale; 78*12188b77SDavid Schultz int ex_expt; 79*12188b77SDavid Schultz 80*12188b77SDavid Schultz exp_x = __frexp_exp(x, &ex_expt); 81*12188b77SDavid Schultz expt += ex_expt; 82*12188b77SDavid Schultz INSERT_WORDS(scale, (0x3ff + expt) << 20, 0); 83*12188b77SDavid Schultz return (exp_x * scale); 84*12188b77SDavid Schultz } 85*12188b77SDavid Schultz 86*12188b77SDavid Schultz double complex 87*12188b77SDavid Schultz __ldexp_cexp(double complex z, int expt) 88*12188b77SDavid Schultz { 89*12188b77SDavid Schultz double x, y, exp_x, scale1, scale2; 90*12188b77SDavid Schultz int ex_expt, half_expt; 91*12188b77SDavid Schultz 92*12188b77SDavid Schultz x = creal(z); 93*12188b77SDavid Schultz y = cimag(z); 94*12188b77SDavid Schultz exp_x = __frexp_exp(x, &ex_expt); 95*12188b77SDavid Schultz expt += ex_expt; 96*12188b77SDavid Schultz 97*12188b77SDavid Schultz /* 98*12188b77SDavid Schultz * Arrange so that scale1 * scale2 == 2**expt. We use this to 99*12188b77SDavid Schultz * compensate for scalbn being horrendously slow. 100*12188b77SDavid Schultz */ 101*12188b77SDavid Schultz half_expt = expt / 2; 102*12188b77SDavid Schultz INSERT_WORDS(scale1, (0x3ff + half_expt) << 20, 0); 103*12188b77SDavid Schultz half_expt = expt - half_expt; 104*12188b77SDavid Schultz INSERT_WORDS(scale2, (0x3ff + half_expt) << 20, 0); 105*12188b77SDavid Schultz 106*12188b77SDavid Schultz return (cpack(cos(y) * exp_x * scale1 * scale2, 107*12188b77SDavid Schultz sin(y) * exp_x * scale1 * scale2)); 108*12188b77SDavid Schultz } 109