common/C/log2.c

	log2.c revision ddc0e0b53c661f6e439e3b7072b3ef353eadb4af
/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */

/*
 * Copyright 2011 Nexenta Systems, Inc.  All rights reserved.
 */
/*
 * Copyright 2006 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
 */

#pragma weak __log2 = log2

/* INDENT OFF */
/*
 * log2(x) = log(x)/log2
 *
 * Base on Table look-up algorithm with product polynomial
 * approximation for log(x).
 *
 * By K.C. Ng, Nov 29, 2004
 *
 * (a). For x in [1-0.125, 1+0.125], from log.c we have
 *  log(x) =  f + ((a1*f^2) *
 *         ((a2 + (a3*f)*(a4+f)) + (f^3)*(a5+f))) *
 *         (((a6 + f*(a7+f)) + (f^3)*(a8+f)) *
 *         ((a9 + (a10*f)*(a11+f)) + (f^3)*(a12+f)))
 *  where f = x - 1.
 *  (i) modify a1 <- a1 / log2
 *  (ii) 1/log2 = 1.4426950408889634...
 *          = 1.5 - 0.057304959... (4 bit shift)
 *       Let lv = 1.5 - 1/log2, then
 *       lv = 0.057304959111036592640075318998107956665325,
 *  (iii) f*1.5 is exact because f has 3 trailing zero.
 *  (iv) Thus, log2(x) = f*1.5 - (lv*f - PPoly)
 *
 * (b). For 0.09375 <= x < 24
 *  Let j = (ix - 0x3fb80000) >> 15. Look up Y[j], 1/Y[j], and log(Y[j])
 *  from _TBL_log.c. Then
 *      log2(x)  = log2(Y[j]) + log2(1 + (x-Y[j])*(1/Y[j]))
 *            = log(Y[j])(1/log2) + log2(1 + s)
 *  where
 *      s = (x-Y[j])*(1/Y[j])
 *  From log.c, we have log(1+s) =
 *                2              2                     2
 *      (b s) (b + b s + s ) [b + b s + s (b + s)] (b + b s + s )
 *        1     2   3          4   5        6        7   8
 *
 *  By setting b1 <- b1/log2, we have
 *      log2(x) = 1.5 * T - (lv * T - POLY(s))
 *
 * (c). Otherwise, get "n", the exponent of x, and then normalize x to
 *  z in [1,2). Then similar to (b) find a Y[i] that matches z to 5.5
 *  significant bits. Then
 *      log2(x) = n + log2(z).
 *
 * Special cases:
 *  log2(x) is NaN with signal if x < 0 (including -INF) ;
 *  log2(+INF) is +INF; log2(0) is -INF with signal;
 *  log2(NaN) is that NaN with no signal.
 *
 * Maximum error observed: less than 0.84 ulp
 *
 * Constants:
 * The hexadecimal values are the intended ones for the following constants.
 * The decimal values may be used, provided that the compiler will convert
 * from decimal to binary accurately enough to produce the hexadecimal values
 * shown.
 */
/* INDENT ON */

#include "libm.h"
#include "libm_protos.h"

extern const double _TBL_log[];

static const double P[] = {
/* ONE   */  1.0,
/* TWO52 */  4503599627370496.0,
/* LN10V */  1.4426950408889634073599246810018920433347,   /* 1/log10 */
/* ZERO  */  0.0,
/* A1    */ -9.6809362455249638217841932228967194640116e-02,
/* A2    */  1.99628461483039965074226529395673424005508422852e+0000,
/* A3    */  2.26812367662950720159642514772713184356689453125e+0000,
/* A4    */ -9.05030639084976384900471657601883634924888610840e-0001,
/* A5    */ -1.48275767132434044270894446526654064655303955078e+0000,
/* A6    */  1.88158320939722756293122074566781520843505859375e+0000,
/* A7    */  1.83309386046986411145098827546462416648864746094e+0000,
/* A8    */  1.24847063988317086291601754055591300129890441895e+0000,
/* A9    */  1.98372421445537705508854742220137268304824829102e+0000,
/* A10   */ -3.94711735767898475035764249696512706577777862549e-0001,
/* A11   */  3.07890395362954372160402272129431366920471191406e+0000,
/* A12   */ -9.60099585275022149311041630426188930869102478027e-0001,
/* B1    */ -1.8039695622547469514898963204616532885451e-01,
/* B2    */  1.87161713283355151891381127914642725337613123482e+0000,
/* B3    */ -1.89082956295731507978530316904652863740921020508e+0000,
/* B4    */ -2.50562891673640253387134180229622870683670043945e+0000,
/* B5    */  1.64822828085258366037635369139024987816810607910e+0000,
/* B6    */ -1.24409107065868340669112512841820716857910156250e+0000,
/* B7    */  1.70534231658220414296067701798165217041969299316e+0000,
/* B8    */  1.99196833784655646937267192697618156671524047852e+0000,
/* LGH   */  1.5,
/* LGL   */  0.057304959111036592640075318998107956665325,
};

#define ONE   P[0]
#define TWO52 P[1]
#define LN10V P[2]
#define ZERO  P[3]
#define A1    P[4]
#define A2    P[5]
#define A3    P[6]
#define A4    P[7]
#define A5    P[8]
#define A6    P[9]
#define A7    P[10]
#define A8    P[11]
#define A9    P[12]
#define A10   P[13]
#define A11   P[14]
#define A12   P[15]
#define B1    P[16]
#define B2    P[17]
#define B3    P[18]
#define B4    P[19]
#define B5    P[20]
#define B6    P[21]
#define B7    P[22]
#define B8    P[23]
#define LGH   P[24]
#define LGL   P[25]

double
log2(double x) {
    int i, hx, ix, n, lx;

    n = 0;
    hx = ((int *) &x)[HIWORD]; ix = hx & 0x7fffffff;
    lx = ((int *) &x)[LOWORD];

    /* subnormal,0,negative,inf,nan */
    if ((hx + 0x100000) < 0x200000) {
#if defined(FPADD_TRAPS_INCOMPLETE_ON_NAN)
        if (ix >= 0x7ff80000)       /* assumes sparc-like QNaN */
            return (x);     /* for Cheetah when x is QNaN */
#endif
        if (((hx << 1) | lx) == 0)  /* log(0.0) = -inf */
            return (A5 / fabs(x));
        if (hx < 0) {   /* x < 0 */
            if (ix >= 0x7ff00000)
                return (x - x); /* x is -inf or NaN */
            else
                return (ZERO / (x - x));
        }
        if (((hx - 0x7ff00000) | lx) == 0)  /* log(inf) = inf */
            return (x);
        if (ix >= 0x7ff00000)       /* log(NaN) = NaN */
            return (x - x);
        x *= TWO52;
        n = -52;
        hx = ((int *) &x)[HIWORD]; ix = hx & 0x7fffffff;
        lx = ((int *) &x)[LOWORD];
    }

    /* 0.09375 (0x3fb80000) <= x < 24 (0x40380000) */
    i = ix >> 19;
    if (i >= 0x7f7 && i <= 0x806) {
        /* 0.875 <= x < 1.125 */
        if (ix >= 0x3fec0000 && ix < 0x3ff20000) {
            double s, z, r, w;
            s = x - ONE; z = s * s; r = (A10 * s) * (A11 + s);
            w = z * s;
            if (((ix << 12) | lx) == 0)
                return (z);
            else
                return (LGH * s - (LGL * s - ((A1 * z) *
                ((A2 + (A3 * s) * (A4 + s)) + w * (A5 + s))) *
                (((A6 + s * (A7 + s)) + w * (A8 + s)) *
                ((A9 + r) + w * (A12 + s)))));
        } else {
            double *tb, s;
            i = (ix - 0x3fb80000) >> 15;
            tb = (double *) _TBL_log + (i + i + i);
            if (((ix << 12) | lx) == 0) /* 2's power */
                return ((double) ((ix >> 20) - 0x3ff));
            s = (x - tb[0]) * tb[1];
            return (LGH * tb[2] - (LGL * tb[2] - ((B1 * s) *
                (B2 + s * (B3 + s))) *
                (((B4 + s * B5) + (s * s) * (B6 + s)) *
                (B7 + s * (B8 + s)))));
        }
    } else {
        double *tb, dn, s;
        dn = (double) (n + ((ix >> 20) - 0x3ff));
        ix <<= 12;
        if ((ix | lx) == 0)
            return (dn);
        i = ((unsigned) ix >> 12) | 0x3ff00000; /* scale x to [1,2) */
        ((int *) &x)[HIWORD] = i;
        i = (i - 0x3fb80000) >> 15;
        tb = (double *) _TBL_log + (i + i + i);
        s = (x - tb[0]) * tb[1];
        return (dn + (tb[2] * LN10V + ((B1 * s) *
            (B2 + s * (B3 + s))) *
            (((B4 + s * B5) + (s * s) * (B6 + s)) *
            (B7 + s * (B8 + s)))));
    }
}