llrintl.c revision 25c28e83beb90e7c80452a7c818c5e6f73a07dc8
29949e866e40b95795203f3ee46f44a197c946e4stevel/*
29949e866e40b95795203f3ee46f44a197c946e4stevel * CDDL HEADER START
29949e866e40b95795203f3ee46f44a197c946e4stevel *
29949e866e40b95795203f3ee46f44a197c946e4stevel * The contents of this file are subject to the terms of the
29949e866e40b95795203f3ee46f44a197c946e4stevel * Common Development and Distribution License (the "License").
29949e866e40b95795203f3ee46f44a197c946e4stevel * You may not use this file except in compliance with the License.
29949e866e40b95795203f3ee46f44a197c946e4stevel *
29949e866e40b95795203f3ee46f44a197c946e4stevel * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
29949e866e40b95795203f3ee46f44a197c946e4stevel * or http://www.opensolaris.org/os/licensing.
29949e866e40b95795203f3ee46f44a197c946e4stevel * See the License for the specific language governing permissions
29949e866e40b95795203f3ee46f44a197c946e4stevel * and limitations under the License.
29949e866e40b95795203f3ee46f44a197c946e4stevel *
29949e866e40b95795203f3ee46f44a197c946e4stevel * When distributing Covered Code, include this CDDL HEADER in each
29949e866e40b95795203f3ee46f44a197c946e4stevel * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
29949e866e40b95795203f3ee46f44a197c946e4stevel * If applicable, add the following below this CDDL HEADER, with the
29949e866e40b95795203f3ee46f44a197c946e4stevel * fields enclosed by brackets "[]" replaced with your own identifying
29949e866e40b95795203f3ee46f44a197c946e4stevel * information: Portions Copyright [yyyy] [name of copyright owner]
29949e866e40b95795203f3ee46f44a197c946e4stevel *
29949e866e40b95795203f3ee46f44a197c946e4stevel * CDDL HEADER END
29949e866e40b95795203f3ee46f44a197c946e4stevel */
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel/*
29949e866e40b95795203f3ee46f44a197c946e4stevel * Copyright 2011 Nexenta Systems, Inc. All rights reserved.
29949e866e40b95795203f3ee46f44a197c946e4stevel */
29949e866e40b95795203f3ee46f44a197c946e4stevel/*
29949e866e40b95795203f3ee46f44a197c946e4stevel * Copyright 2006 Sun Microsystems, Inc. All rights reserved.
29949e866e40b95795203f3ee46f44a197c946e4stevel * Use is subject to license terms.
29949e866e40b95795203f3ee46f44a197c946e4stevel */
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel#if defined(ELFOBJ)
29949e866e40b95795203f3ee46f44a197c946e4stevel#pragma weak llrintl = __llrintl
29949e866e40b95795203f3ee46f44a197c946e4stevel#if defined(__sparcv9) || defined(__amd64)
29949e866e40b95795203f3ee46f44a197c946e4stevel#pragma weak lrintl = __llrintl
29949e866e40b95795203f3ee46f44a197c946e4stevel#pragma weak __lrintl = __llrintl
29949e866e40b95795203f3ee46f44a197c946e4stevel#endif
29949e866e40b95795203f3ee46f44a197c946e4stevel#endif
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel#include "libm.h"
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel#if defined(__sparc)
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel#include "fma.h"
29949e866e40b95795203f3ee46f44a197c946e4stevel#include "fenv_inlines.h"
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevellong long
29949e866e40b95795203f3ee46f44a197c946e4stevelllrintl(long double x) {
29949e866e40b95795203f3ee46f44a197c946e4stevel union {
29949e866e40b95795203f3ee46f44a197c946e4stevel unsigned i[4];
29949e866e40b95795203f3ee46f44a197c946e4stevel long double q;
29949e866e40b95795203f3ee46f44a197c946e4stevel } xx;
29949e866e40b95795203f3ee46f44a197c946e4stevel union {
29949e866e40b95795203f3ee46f44a197c946e4stevel unsigned i[2];
29949e866e40b95795203f3ee46f44a197c946e4stevel long long l;
29949e866e40b95795203f3ee46f44a197c946e4stevel } zz;
29949e866e40b95795203f3ee46f44a197c946e4stevel union {
29949e866e40b95795203f3ee46f44a197c946e4stevel unsigned i;
29949e866e40b95795203f3ee46f44a197c946e4stevel float f;
29949e866e40b95795203f3ee46f44a197c946e4stevel } tt;
29949e866e40b95795203f3ee46f44a197c946e4stevel unsigned int hx, sx, frac, fsr;
29949e866e40b95795203f3ee46f44a197c946e4stevel int rm, j;
29949e866e40b95795203f3ee46f44a197c946e4stevel volatile float dummy;
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel xx.q = x;
29949e866e40b95795203f3ee46f44a197c946e4stevel sx = xx.i[0] & 0x80000000;
29949e866e40b95795203f3ee46f44a197c946e4stevel hx = xx.i[0] & ~0x80000000;
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel /* handle trivial cases */
29949e866e40b95795203f3ee46f44a197c946e4stevel if (hx > 0x403e0000) { /* |x| > 2^63 + ... or x is nan */
29949e866e40b95795203f3ee46f44a197c946e4stevel /* convert an out-of-range float */
29949e866e40b95795203f3ee46f44a197c946e4stevel tt.i = sx | 0x7f000000;
29949e866e40b95795203f3ee46f44a197c946e4stevel return ((long long) tt.f);
29949e866e40b95795203f3ee46f44a197c946e4stevel } else if ((hx | xx.i[1] | xx.i[2] | xx.i[3]) == 0) /* x is zero */
29949e866e40b95795203f3ee46f44a197c946e4stevel return (0LL);
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel /* get the rounding mode */
29949e866e40b95795203f3ee46f44a197c946e4stevel __fenv_getfsr32(&fsr);
29949e866e40b95795203f3ee46f44a197c946e4stevel rm = fsr >> 30;
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel /* flip the sense of directed roundings if x is negative */
29949e866e40b95795203f3ee46f44a197c946e4stevel if (sx)
29949e866e40b95795203f3ee46f44a197c946e4stevel rm ^= rm >> 1;
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel /* handle |x| < 1 */
29949e866e40b95795203f3ee46f44a197c946e4stevel if (hx < 0x3fff0000) {
29949e866e40b95795203f3ee46f44a197c946e4stevel dummy = 1.0e30f; /* x is nonzero, so raise inexact */
29949e866e40b95795203f3ee46f44a197c946e4stevel dummy += 1.0e-30f;
29949e866e40b95795203f3ee46f44a197c946e4stevel if (rm == FSR_RP || (rm == FSR_RN && (hx >= 0x3ffe0000 &&
29949e866e40b95795203f3ee46f44a197c946e4stevel ((hx & 0xffff) | xx.i[1] | xx.i[2] | xx.i[3]))))
29949e866e40b95795203f3ee46f44a197c946e4stevel return (sx ? -1LL : 1LL);
29949e866e40b95795203f3ee46f44a197c946e4stevel return (0LL);
29949e866e40b95795203f3ee46f44a197c946e4stevel }
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel /* extract the integer and fractional parts of x */
29949e866e40b95795203f3ee46f44a197c946e4stevel j = 0x406f - (hx >> 16);
29949e866e40b95795203f3ee46f44a197c946e4stevel xx.i[0] = 0x10000 | (xx.i[0] & 0xffff);
29949e866e40b95795203f3ee46f44a197c946e4stevel if (j >= 96) {
29949e866e40b95795203f3ee46f44a197c946e4stevel zz.i[0] = 0;
29949e866e40b95795203f3ee46f44a197c946e4stevel zz.i[1] = xx.i[0] >> (j - 96);
29949e866e40b95795203f3ee46f44a197c946e4stevel frac = ((xx.i[0] << 1) << (127 - j)) | (xx.i[1] >> (j - 96));
29949e866e40b95795203f3ee46f44a197c946e4stevel if (((xx.i[1] << 1) << (127 - j)) | xx.i[2] | xx.i[3])
29949e866e40b95795203f3ee46f44a197c946e4stevel frac |= 1;
29949e866e40b95795203f3ee46f44a197c946e4stevel } else if (j >= 64) {
29949e866e40b95795203f3ee46f44a197c946e4stevel zz.i[0] = xx.i[0] >> (j - 64);
29949e866e40b95795203f3ee46f44a197c946e4stevel zz.i[1] = ((xx.i[0] << 1) << (95 - j)) | (xx.i[1] >> (j - 64));
29949e866e40b95795203f3ee46f44a197c946e4stevel frac = ((xx.i[1] << 1) << (95 - j)) | (xx.i[2] >> (j - 64));
29949e866e40b95795203f3ee46f44a197c946e4stevel if (((xx.i[2] << 1) << (95 - j)) | xx.i[3])
29949e866e40b95795203f3ee46f44a197c946e4stevel frac |= 1;
29949e866e40b95795203f3ee46f44a197c946e4stevel } else {
29949e866e40b95795203f3ee46f44a197c946e4stevel zz.i[0] = ((xx.i[0] << 1) << (63 - j)) | (xx.i[1] >> (j - 32));
29949e866e40b95795203f3ee46f44a197c946e4stevel zz.i[1] = ((xx.i[1] << 1) << (63 - j)) | (xx.i[2] >> (j - 32));
29949e866e40b95795203f3ee46f44a197c946e4stevel frac = ((xx.i[2] << 1) << (63 - j)) | (xx.i[3] >> (j - 32));
29949e866e40b95795203f3ee46f44a197c946e4stevel if ((xx.i[3] << 1) << (63 - j))
29949e866e40b95795203f3ee46f44a197c946e4stevel frac |= 1;
29949e866e40b95795203f3ee46f44a197c946e4stevel }
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel /* round */
29949e866e40b95795203f3ee46f44a197c946e4stevel if (frac && (rm == FSR_RP || (rm == FSR_RN && (frac > 0x80000000u ||
29949e866e40b95795203f3ee46f44a197c946e4stevel (frac == 0x80000000 && (zz.i[1] & 1)))))) {
29949e866e40b95795203f3ee46f44a197c946e4stevel if (++zz.i[1] == 0)
29949e866e40b95795203f3ee46f44a197c946e4stevel zz.i[0]++;
29949e866e40b95795203f3ee46f44a197c946e4stevel }
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel /* check for result out of range (note that z is |x| at this point) */
29949e866e40b95795203f3ee46f44a197c946e4stevel if (zz.i[0] > 0x80000000u || (zz.i[0] == 0x80000000 && (zz.i[1] ||
29949e866e40b95795203f3ee46f44a197c946e4stevel !sx))) {
29949e866e40b95795203f3ee46f44a197c946e4stevel tt.i = sx | 0x7f000000;
29949e866e40b95795203f3ee46f44a197c946e4stevel return ((long long) tt.f);
29949e866e40b95795203f3ee46f44a197c946e4stevel }
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel /* raise inexact if need be */
29949e866e40b95795203f3ee46f44a197c946e4stevel if (frac) {
29949e866e40b95795203f3ee46f44a197c946e4stevel dummy = 1.0e30F;
29949e866e40b95795203f3ee46f44a197c946e4stevel dummy += 1.0e-30F;
29949e866e40b95795203f3ee46f44a197c946e4stevel }
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel /* negate result if need be */
29949e866e40b95795203f3ee46f44a197c946e4stevel if (sx) {
29949e866e40b95795203f3ee46f44a197c946e4stevel zz.i[0] = ~zz.i[0];
29949e866e40b95795203f3ee46f44a197c946e4stevel zz.i[1] = -zz.i[1];
29949e866e40b95795203f3ee46f44a197c946e4stevel if (zz.i[1] == 0)
29949e866e40b95795203f3ee46f44a197c946e4stevel zz.i[0]++;
29949e866e40b95795203f3ee46f44a197c946e4stevel }
29949e866e40b95795203f3ee46f44a197c946e4stevel return (zz.l);
29949e866e40b95795203f3ee46f44a197c946e4stevel}
29949e866e40b95795203f3ee46f44a197c946e4stevel#elif defined(__x86)
29949e866e40b95795203f3ee46f44a197c946e4stevellong long
29949e866e40b95795203f3ee46f44a197c946e4stevelllrintl(long double x) {
29949e866e40b95795203f3ee46f44a197c946e4stevel /*
29949e866e40b95795203f3ee46f44a197c946e4stevel * Note: The following code works on x86 (in the default rounding
29949e866e40b95795203f3ee46f44a197c946e4stevel * precision mode), but one ought to just use the fistpll instruction
29949e866e40b95795203f3ee46f44a197c946e4stevel * instead.
29949e866e40b95795203f3ee46f44a197c946e4stevel */
29949e866e40b95795203f3ee46f44a197c946e4stevel union {
29949e866e40b95795203f3ee46f44a197c946e4stevel unsigned i[3];
29949e866e40b95795203f3ee46f44a197c946e4stevel long double e;
29949e866e40b95795203f3ee46f44a197c946e4stevel } xx, yy;
29949e866e40b95795203f3ee46f44a197c946e4stevel int ex;
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel xx.e = x;
29949e866e40b95795203f3ee46f44a197c946e4stevel ex = xx.i[2] & 0x7fff;
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel if (ex < 0x403e) { /* |x| < 2^63 */
29949e866e40b95795203f3ee46f44a197c946e4stevel /* add and subtract a power of two to round x to an integer */
29949e866e40b95795203f3ee46f44a197c946e4stevel yy.i[2] = (xx.i[2] & 0x8000) | 0x403e;
29949e866e40b95795203f3ee46f44a197c946e4stevel yy.i[1] = 0x80000000;
29949e866e40b95795203f3ee46f44a197c946e4stevel yy.i[0] = 0;
29949e866e40b95795203f3ee46f44a197c946e4stevel x = (x + yy.e) - yy.e;
29949e866e40b95795203f3ee46f44a197c946e4stevel }
29949e866e40b95795203f3ee46f44a197c946e4stevel
29949e866e40b95795203f3ee46f44a197c946e4stevel /* now x is nan, inf, or integral */
29949e866e40b95795203f3ee46f44a197c946e4stevel return ((long long) x);
29949e866e40b95795203f3ee46f44a197c946e4stevel}
29949e866e40b95795203f3ee46f44a197c946e4stevel#else
29949e866e40b95795203f3ee46f44a197c946e4stevel#error Unknown architecture
29949e866e40b95795203f3ee46f44a197c946e4stevel#endif
29949e866e40b95795203f3ee46f44a197c946e4stevel