xref: /titanic_44/usr/src/lib/libm/common/m9x/llrintl.c (revision ddc0e0b53c661f6e439e3b7072b3ef353eadb4af)
/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */

/*
 * Copyright 2011 Nexenta Systems, Inc.  All rights reserved.
 */
/*
 * Copyright 2006 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
 */
2925c28e83SPiotr Jasiukajtis 
30*ddc0e0b5SRichard Lowe #pragma weak __llrintl = llrintl
3125c28e83SPiotr Jasiukajtis #if defined(__sparcv9) || defined(__amd64)
32*ddc0e0b5SRichard Lowe #pragma weak lrintl = llrintl
33*ddc0e0b5SRichard Lowe #pragma weak __lrintl = llrintl
3425c28e83SPiotr Jasiukajtis #endif
3525c28e83SPiotr Jasiukajtis 
3625c28e83SPiotr Jasiukajtis #include "libm.h"
3725c28e83SPiotr Jasiukajtis 
3825c28e83SPiotr Jasiukajtis #if defined(__sparc)
3925c28e83SPiotr Jasiukajtis 
4025c28e83SPiotr Jasiukajtis #include "fma.h"
4125c28e83SPiotr Jasiukajtis #include "fenv_inlines.h"
4225c28e83SPiotr Jasiukajtis 
4325c28e83SPiotr Jasiukajtis long long
llrintl(long double x)4425c28e83SPiotr Jasiukajtis llrintl(long double x) {
4525c28e83SPiotr Jasiukajtis 	union {
4625c28e83SPiotr Jasiukajtis 		unsigned i[4];
4725c28e83SPiotr Jasiukajtis 		long double q;
4825c28e83SPiotr Jasiukajtis 	} xx;
4925c28e83SPiotr Jasiukajtis 	union {
5025c28e83SPiotr Jasiukajtis 		unsigned i[2];
5125c28e83SPiotr Jasiukajtis 		long long l;
5225c28e83SPiotr Jasiukajtis 	} zz;
5325c28e83SPiotr Jasiukajtis 	union {
5425c28e83SPiotr Jasiukajtis 		unsigned i;
5525c28e83SPiotr Jasiukajtis 		float f;
5625c28e83SPiotr Jasiukajtis 	} tt;
5725c28e83SPiotr Jasiukajtis 	unsigned int hx, sx, frac, fsr;
5825c28e83SPiotr Jasiukajtis 	int rm, j;
5925c28e83SPiotr Jasiukajtis 	volatile float dummy;
6025c28e83SPiotr Jasiukajtis 
6125c28e83SPiotr Jasiukajtis 	xx.q = x;
6225c28e83SPiotr Jasiukajtis 	sx = xx.i[0] & 0x80000000;
6325c28e83SPiotr Jasiukajtis 	hx = xx.i[0] & ~0x80000000;
6425c28e83SPiotr Jasiukajtis 
6525c28e83SPiotr Jasiukajtis 	/* handle trivial cases */
6625c28e83SPiotr Jasiukajtis 	if (hx > 0x403e0000) { /* |x| > 2^63 + ... or x is nan */
6725c28e83SPiotr Jasiukajtis 		/* convert an out-of-range float */
6825c28e83SPiotr Jasiukajtis 		tt.i = sx | 0x7f000000;
6925c28e83SPiotr Jasiukajtis 		return ((long long) tt.f);
7025c28e83SPiotr Jasiukajtis 	} else if ((hx | xx.i[1] | xx.i[2] | xx.i[3]) == 0) /* x is zero */
7125c28e83SPiotr Jasiukajtis 		return (0LL);
7225c28e83SPiotr Jasiukajtis 
7325c28e83SPiotr Jasiukajtis 	/* get the rounding mode */
7425c28e83SPiotr Jasiukajtis 	__fenv_getfsr32(&fsr);
7525c28e83SPiotr Jasiukajtis 	rm = fsr >> 30;
7625c28e83SPiotr Jasiukajtis 
7725c28e83SPiotr Jasiukajtis 	/* flip the sense of directed roundings if x is negative */
7825c28e83SPiotr Jasiukajtis 	if (sx)
7925c28e83SPiotr Jasiukajtis 		rm ^= rm >> 1;
8025c28e83SPiotr Jasiukajtis 
8125c28e83SPiotr Jasiukajtis 	/* handle |x| < 1 */
8225c28e83SPiotr Jasiukajtis 	if (hx < 0x3fff0000) {
8325c28e83SPiotr Jasiukajtis 		dummy = 1.0e30f; /* x is nonzero, so raise inexact */
8425c28e83SPiotr Jasiukajtis 		dummy += 1.0e-30f;
8525c28e83SPiotr Jasiukajtis 		if (rm == FSR_RP || (rm == FSR_RN && (hx >= 0x3ffe0000 &&
8625c28e83SPiotr Jasiukajtis 			((hx & 0xffff) | xx.i[1] | xx.i[2] | xx.i[3]))))
8725c28e83SPiotr Jasiukajtis 			return (sx ? -1LL : 1LL);
8825c28e83SPiotr Jasiukajtis 		return (0LL);
8925c28e83SPiotr Jasiukajtis 	}
9025c28e83SPiotr Jasiukajtis 
9125c28e83SPiotr Jasiukajtis 	/* extract the integer and fractional parts of x */
9225c28e83SPiotr Jasiukajtis 	j = 0x406f - (hx >> 16);
9325c28e83SPiotr Jasiukajtis 	xx.i[0] = 0x10000 | (xx.i[0] & 0xffff);
9425c28e83SPiotr Jasiukajtis 	if (j >= 96) {
9525c28e83SPiotr Jasiukajtis 		zz.i[0] = 0;
9625c28e83SPiotr Jasiukajtis 		zz.i[1] = xx.i[0] >> (j - 96);
9725c28e83SPiotr Jasiukajtis 		frac = ((xx.i[0] << 1) << (127 - j)) | (xx.i[1] >> (j - 96));
9825c28e83SPiotr Jasiukajtis 		if (((xx.i[1] << 1) << (127 - j)) | xx.i[2] | xx.i[3])
9925c28e83SPiotr Jasiukajtis 			frac |= 1;
10025c28e83SPiotr Jasiukajtis 	} else if (j >= 64) {
10125c28e83SPiotr Jasiukajtis 		zz.i[0] = xx.i[0] >> (j - 64);
10225c28e83SPiotr Jasiukajtis 		zz.i[1] = ((xx.i[0] << 1) << (95 - j)) | (xx.i[1] >> (j - 64));
10325c28e83SPiotr Jasiukajtis 		frac = ((xx.i[1] << 1) << (95 - j)) | (xx.i[2] >> (j - 64));
10425c28e83SPiotr Jasiukajtis 		if (((xx.i[2] << 1) << (95 - j)) | xx.i[3])
10525c28e83SPiotr Jasiukajtis 			frac |= 1;
10625c28e83SPiotr Jasiukajtis 	} else {
10725c28e83SPiotr Jasiukajtis 		zz.i[0] = ((xx.i[0] << 1) << (63 - j)) | (xx.i[1] >> (j - 32));
10825c28e83SPiotr Jasiukajtis 		zz.i[1] = ((xx.i[1] << 1) << (63 - j)) | (xx.i[2] >> (j - 32));
10925c28e83SPiotr Jasiukajtis 		frac = ((xx.i[2] << 1) << (63 - j)) | (xx.i[3] >> (j - 32));
11025c28e83SPiotr Jasiukajtis 		if ((xx.i[3] << 1) << (63 - j))
11125c28e83SPiotr Jasiukajtis 			frac |= 1;
11225c28e83SPiotr Jasiukajtis 	}
11325c28e83SPiotr Jasiukajtis 
11425c28e83SPiotr Jasiukajtis 	/* round */
11525c28e83SPiotr Jasiukajtis 	if (frac && (rm == FSR_RP || (rm == FSR_RN && (frac > 0x80000000u ||
11625c28e83SPiotr Jasiukajtis 		(frac == 0x80000000 && (zz.i[1] & 1)))))) {
11725c28e83SPiotr Jasiukajtis 		if (++zz.i[1] == 0)
11825c28e83SPiotr Jasiukajtis 			zz.i[0]++;
11925c28e83SPiotr Jasiukajtis 	}
12025c28e83SPiotr Jasiukajtis 
12125c28e83SPiotr Jasiukajtis 	/* check for result out of range (note that z is |x| at this point) */
12225c28e83SPiotr Jasiukajtis 	if (zz.i[0] > 0x80000000u || (zz.i[0] == 0x80000000 && (zz.i[1] ||
12325c28e83SPiotr Jasiukajtis 		!sx))) {
12425c28e83SPiotr Jasiukajtis 		tt.i = sx | 0x7f000000;
12525c28e83SPiotr Jasiukajtis 		return ((long long) tt.f);
12625c28e83SPiotr Jasiukajtis 	}
12725c28e83SPiotr Jasiukajtis 
12825c28e83SPiotr Jasiukajtis 	/* raise inexact if need be */
12925c28e83SPiotr Jasiukajtis 	if (frac) {
13025c28e83SPiotr Jasiukajtis 		dummy = 1.0e30F;
13125c28e83SPiotr Jasiukajtis 		dummy += 1.0e-30F;
13225c28e83SPiotr Jasiukajtis 	}
13325c28e83SPiotr Jasiukajtis 
13425c28e83SPiotr Jasiukajtis 	/* negate result if need be */
13525c28e83SPiotr Jasiukajtis 	if (sx) {
13625c28e83SPiotr Jasiukajtis 		zz.i[0] = ~zz.i[0];
13725c28e83SPiotr Jasiukajtis 		zz.i[1] = -zz.i[1];
13825c28e83SPiotr Jasiukajtis 		if (zz.i[1] == 0)
13925c28e83SPiotr Jasiukajtis 			zz.i[0]++;
14025c28e83SPiotr Jasiukajtis 	}
14125c28e83SPiotr Jasiukajtis 	return (zz.l);
14225c28e83SPiotr Jasiukajtis }
14325c28e83SPiotr Jasiukajtis #elif defined(__x86)
/*
 * llrintl(x), x86 variant: round the extended-precision value x to an
 * integer using the current rounding direction and return it as a
 * long long.
 *
 * The argument is viewed as three 32-bit words; the low 16 bits of i[2]
 * hold the sign bit (0x8000) and the 15-bit exponent field (0x7fff), and
 * i[1]:i[0] hold the 64-bit significand.
 *
 * For |x| < 2^63 the value is rounded in floating point by adding and then
 * subtracting 2^63 carrying the sign of x; the sum has no room left for
 * fraction bits, so the addition itself performs the rounding.  Anything
 * larger, as well as infinities and NaNs, is passed straight to the final
 * conversion, whose result for such inputs is whatever the cast yields.
 */
long long
llrintl(long double x)
{
	/*
	 * Note: The following code works on x86 (in the default rounding
	 * precision mode), but one ought to just use the fistpll instruction
	 * instead.
	 */
	union {
		unsigned i[3];
		long double e;
	} xx, yy;
	int ex;

	xx.e = x;
	ex = xx.i[2] & 0x7fff;	/* biased exponent, sign stripped */

	if (ex < 0x403e) { /* |x| < 2^63 */
		/*
		 * add and subtract a power of two to round x to an integer:
		 * yy.e is 2^63 (exponent 0x3fff + 63, explicit integer bit
		 * set, zero fraction) with the same sign as x
		 */
		yy.i[2] = (xx.i[2] & 0x8000) | 0x403e;
		yy.i[1] = 0x80000000;
		yy.i[0] = 0;
		x = (x + yy.e) - yy.e;
	}

	/* now x is nan, inf, or integral */
	return ((long long) x);
}
17125c28e83SPiotr Jasiukajtis #else
17225c28e83SPiotr Jasiukajtis #error Unknown architecture
17325c28e83SPiotr Jasiukajtis #endif
174