/* exp.c revision 25c28e83beb90e7c80452a7c818c5e6f73a07dc8 */
/*
* CDDL HEADER START
*
* The contents of this file are subject to the terms of the
* Common Development and Distribution License (the "License").
* You may not use this file except in compliance with the License.
*
* You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
* or http://www.opensolaris.org/os/licensing.
* See the License for the specific language governing permissions
* and limitations under the License.
*
* When distributing Covered Code, include this CDDL HEADER in each
* file and include the License file at usr/src/OPENSOLARIS.LICENSE.
* If applicable, add the following below this CDDL HEADER, with the
* fields enclosed by brackets "[]" replaced with your own identifying
* information: Portions Copyright [yyyy] [name of copyright owner]
*
* CDDL HEADER END
*/
/*
* Copyright 2011 Nexenta Systems, Inc. All rights reserved.
*/
/*
* Copyright 2006 Sun Microsystems, Inc. All rights reserved.
* Use is subject to license terms.
*/
#pragma weak exp = __exp
/*
* exp(x)
* Hybrid algorithm of Peter Tang's Table driven method (for large
* arguments) and an accurate table (for small arguments).
* Written by K.C. Ng, November 1988.
* Method (large arguments):
* 1. Argument Reduction: given the input x, find r and integer k
* and j such that
* x = (k+j/32)*(ln2) + r, |r| <= (1/64)*ln2
*
* 2. exp(x) = 2^k * (2^(j/32) + 2^(j/32)*expm1(r))
* a. expm1(r) is approximated by a polynomial:
* expm1(r) ~ r + t1*r^2 + t2*r^3 + ... + t5*r^6
* Here t1 = 1/2 exactly.
* b. 2^(j/32) is represented to twice double precision
* as TBL[2j]+TBL[2j+1].
*
* Note: If divide were fast enough, we could use another approximation
* in 2.a:
* expm1(r) ~ (2r)/(2-R), R = r - r^2*(t1 + t2*r^2)
* (for the same t1 and t2 as above)
*
* Special cases:
* exp(INF) is INF, exp(NaN) is NaN;
* exp(-INF)= 0;
* for finite argument, only exp(0)=1 is exact.
*
* Accuracy:
* According to an error analysis, the error is always less than
* an ulp (unit in the last place). The largest errors observed
* are less than 0.55 ulp for normal results and less than 0.75 ulp
* for subnormal results.
*
* Misc. info.
* For IEEE double
* if x > 7.09782712893383973096e+02 then exp(x) overflow
* if x < -7.45133219101941108420e+02 then exp(x) underflow
*/
#include "libm.h"
/*
* For j = 0, ..., 31, the pair TBL[2*j], TBL[2*j+1] holds 2^(j/32) as a
* leading double plus a small correction term, so that the sum
* TBL[2*j] + TBL[2*j+1] carries more precision than one double can
* (item 2.b of the method description for exp(x)).
*/
static const double TBL[] = {
1.00000000000000000000e+00, 0.00000000000000000000e+00,
1.02189714865411662714e+00, 5.10922502897344389359e-17,
1.04427378242741375480e+00, 8.55188970553796365958e-17,
1.06714040067682369717e+00, -7.89985396684158212226e-17,
1.09050773266525768967e+00, -3.04678207981247114697e-17,
1.11438674259589243221e+00, 1.04102784568455709549e-16,
1.13878863475669156458e+00, 8.91281267602540777782e-17,
1.16372485877757747552e+00, 3.82920483692409349872e-17,
1.18920711500272102690e+00, 3.98201523146564611098e-17,
1.21524735998046895524e+00, -7.71263069268148813091e-17,
1.24185781207348400201e+00, 4.65802759183693679123e-17,
1.26905095719173321989e+00, 2.66793213134218609523e-18,
1.29683955465100964055e+00, 2.53825027948883149593e-17,
1.32523664315974132322e+00, -2.85873121003886075697e-17,
1.35425554693689265129e+00, 7.70094837980298946162e-17,
1.38390988196383202258e+00, -6.77051165879478628716e-17,
1.41421356237309514547e+00, -9.66729331345291345105e-17,
1.44518080697704665027e+00, -3.02375813499398731940e-17,
1.47682614593949934623e+00, -3.48399455689279579579e-17,
1.50916442759342284141e+00, -1.01645532775429503911e-16,
1.54221082540794074411e+00, 7.94983480969762085616e-17,
1.57598084510788649659e+00, -1.01369164712783039808e-17,
1.61049033194925428347e+00, 2.47071925697978878522e-17,
1.64575547815396494578e+00, -1.01256799136747726038e-16,
1.68179283050742900407e+00, 8.19901002058149652013e-17,
1.71861929812247793414e+00, -1.85138041826311098821e-17,
1.75625216037329945351e+00, 2.96014069544887330703e-17,
1.79470907500310716820e+00, 1.82274584279120867698e-17,
1.83400808640934243066e+00, 3.28310722424562658722e-17,
1.87416763411029996256e+00, -6.12276341300414256164e-17,
1.91520656139714740007e+00, -1.06199460561959626376e-16,
1.95714412417540017941e+00, 8.96076779103666776760e-17,
};
/*
* For i = 0, ..., 66,
* TBL2[2*i] is a double precision number near (i+1)*2^-6, and
* TBL2[2*i+1] = exp(TBL2[2*i]) to within a relative error less
* than 2^-60.
*
* For i = 67, ..., 133,
* TBL2[2*i] is a double precision number near -(i-66)*2^-6, and
* TBL2[2*i+1] = exp(TBL2[2*i]) to within a relative error less
* than 2^-60.
*/
static const double TBL2[] = {
/*
* Pairs 0 ... 66 (array elements 0 ... 133): breakpoints near
* +1/64, +2/64, ..., +67/64, each followed by its exponential.
*/
1.56249999999984491572e-02, 1.01574770858668417262e+00,
3.12499999999998716305e-02, 1.03174340749910253834e+00,
4.68750000000011102230e-02, 1.04799100201663386578e+00,
6.24999999999990632493e-02, 1.06449445891785843266e+00,
7.81249999999999444888e-02, 1.08125780744903954300e+00,
9.37500000000013322676e-02, 1.09828514030782731226e+00,
1.09375000000001346145e-01, 1.11558061464248226002e+00,
1.24999999999999417133e-01, 1.13314845306682565607e+00,
1.40624999999995337063e-01, 1.15099294469117108264e+00,
1.56249999999996141975e-01, 1.16911844616949989195e+00,
1.71874999999992894573e-01, 1.18752938276309216725e+00,
1.87500000000000888178e-01, 1.20623024942098178158e+00,
2.03124999999361649516e-01, 1.22522561187652545556e+00,
2.18750000000000416334e-01, 1.24452010776609567344e+00,
2.34375000000003524958e-01, 1.26411844775347081971e+00,
2.50000000000006328271e-01, 1.28402541668774961003e+00,
2.65624999999982791543e-01, 1.30424587476761533189e+00,
2.81249999999993727240e-01, 1.32478475872885725906e+00,
2.96875000000003275158e-01, 1.34564708304941493822e+00,
3.12500000000002886580e-01, 1.36683794117380030819e+00,
3.28124999999993394173e-01, 1.38836250675661765364e+00,
3.43749999999998612221e-01, 1.41022603492570874906e+00,
3.59374999999992450483e-01, 1.43243386356506730017e+00,
3.74999999999991395772e-01, 1.45499141461818881638e+00,
3.90624999999997613020e-01, 1.47790419541173490003e+00,
4.06249999999991895372e-01, 1.50117780000011058483e+00,
4.21874999999996613820e-01, 1.52481791053132154090e+00,
4.37500000000004607426e-01, 1.54883029863414023453e+00,
4.53125000000004274359e-01, 1.57322082682725961078e+00,
4.68750000000008326673e-01, 1.59799544995064657371e+00,
4.84374999999985456078e-01, 1.62316021661928200359e+00,
4.99999999999997335465e-01, 1.64872127070012375327e+00,
5.15625000000000222045e-01, 1.67468485281178436352e+00,
5.31250000000003441691e-01, 1.70105730184840653330e+00,
5.46874999999999111822e-01, 1.72784505652716169344e+00,
5.62499999999999333866e-01, 1.75505465696029738787e+00,
5.78124999999993338662e-01, 1.78269274625180318417e+00,
5.93749999999999666933e-01, 1.81076607211938656050e+00,
6.09375000000003441691e-01, 1.83928148854178719063e+00,
6.24999999999995559108e-01, 1.86824595743221411048e+00,
6.40625000000009103829e-01, 1.89766655033813602671e+00,
6.56249999999993782751e-01, 1.92755045016753268072e+00,
6.71875000000002109424e-01, 1.95790495294292221651e+00,
6.87499999999992450483e-01, 1.98873746958227681780e+00,
7.03125000000004996004e-01, 2.02005552770870666635e+00,
7.18750000000007105427e-01, 2.05186677348799140219e+00,
7.34375000000008770762e-01, 2.08417897349558689513e+00,
7.49999999999983901766e-01, 2.11700001661264058939e+00,
7.65624999999997002398e-01, 2.15033791595229351046e+00,
7.81250000000005884182e-01, 2.18420081081563077774e+00,
7.96874999999991451283e-01, 2.21859696867912603579e+00,
8.12500000000000000000e-01, 2.25353478721320854561e+00,
8.28125000000008215650e-01, 2.28902279633221983346e+00,
8.43749999999997890576e-01, 2.32506966027711614586e+00,
8.59374999999999444888e-01, 2.36168417973090827289e+00,
8.75000000000003219647e-01, 2.39887529396710563745e+00,
8.90625000000013433699e-01, 2.43665208303232461162e+00,
9.06249999999980571097e-01, 2.47502376996297712708e+00,
9.21874999999984456878e-01, 2.51399972303748420188e+00,
9.37500000000001887379e-01, 2.55358945806293169412e+00,
9.53125000000003330669e-01, 2.59380264069854327147e+00,
9.68749999999989119814e-01, 2.63464908881560244680e+00,
9.84374999999997890576e-01, 2.67613877489447116176e+00,
1.00000000000001154632e+00, 2.71828182845907662113e+00,
1.01562499999999333866e+00, 2.76108853855008318234e+00,
1.03124999999995980993e+00, 2.80456935623711389738e+00,
1.04687499999999933387e+00, 2.84873489717039740654e+00,
/*
* Pairs 67 ... 133 (array elements 134 ... 267): breakpoints near
* -1/64, -2/64, ..., -67/64, each followed by its exponential.
* exp() reaches this half by adding 134 to the element index it
* computed from |x|.
*/
-1.56249999999999514277e-02, 9.84496437005408453480e-01,
-3.12499999999955972718e-02, 9.69233234476348348707e-01,
-4.68749999999993824384e-02, 9.54206665969188905230e-01,
-6.24999999999976130205e-02, 9.39413062813478028090e-01,
-7.81249999999989314103e-02, 9.24848813216205822840e-01,
-9.37499999999995975442e-02, 9.10510361380034494161e-01,
-1.09374999999998584466e-01, 8.96394206635151680196e-01,
-1.24999999999998556710e-01, 8.82496902584596676355e-01,
-1.40624999999999361622e-01, 8.68815056262843721235e-01,
-1.56249999999999111822e-01, 8.55345327307423297647e-01,
-1.71874999999924144012e-01, 8.42084427143446223596e-01,
-1.87499999999996752598e-01, 8.29029118180403035154e-01,
-2.03124999999988037347e-01, 8.16176213022349550386e-01,
-2.18749999999995947686e-01, 8.03522573689063990265e-01,
-2.34374999999996419531e-01, 7.91065110850298847112e-01,
-2.49999999999996280753e-01, 7.78800783071407765057e-01,
-2.65624999999999888978e-01, 7.66726596070820165529e-01,
-2.81249999999989397370e-01, 7.54839601989015340777e-01,
-2.96874999999996114219e-01, 7.43136898668761203268e-01,
-3.12499999999999555911e-01, 7.31615628946642115871e-01,
-3.28124999999993782751e-01, 7.20272979955444259126e-01,
-3.43749999999997946087e-01, 7.09106182437399867879e-01,
-3.59374999999994337863e-01, 6.98112510068129799023e-01,
-3.74999999999994615418e-01, 6.87289278790975899369e-01,
-3.90624999999999000799e-01, 6.76633846161729612945e-01,
-4.06249999999947264406e-01, 6.66143610703522903727e-01,
-4.21874999999988453681e-01, 6.55816011271509125002e-01,
-4.37499999999999111822e-01, 6.45648526427892610613e-01,
-4.53124999999999278355e-01, 6.35638673826052436056e-01,
-4.68749999999999278355e-01, 6.25784009604591573428e-01,
-4.84374999999992894573e-01, 6.16082127790682609891e-01,
-4.99999999999998168132e-01, 6.06530659712634534486e-01,
-5.15625000000000000000e-01, 5.97127273421627413619e-01,
-5.31249999999989785948e-01, 5.87869673122352498496e-01,
-5.46874999999972688514e-01, 5.78755598612500032907e-01,
-5.62500000000000000000e-01, 5.69782824730923009859e-01,
-5.78124999999992339461e-01, 5.60949160814475100700e-01,
-5.93749999999948707696e-01, 5.52252450163048691500e-01,
-6.09374999999552580121e-01, 5.43690569513243682209e-01,
-6.24999999999984789945e-01, 5.35261428518998383375e-01,
-6.40624999999983457677e-01, 5.26962969243379708573e-01,
-6.56249999999998334665e-01, 5.18793165653890220312e-01,
-6.71874999999943378626e-01, 5.10750023129039609771e-01,
-6.87499999999997002398e-01, 5.02831577970942467104e-01,
-7.03124999999991118216e-01, 4.95035896926202978463e-01,
-7.18749999999991340260e-01, 4.87361076713623331269e-01,
-7.34374999999985678123e-01, 4.79805243559684402310e-01,
-7.49999999999997335465e-01, 4.72366552741015965911e-01,
-7.65624999999993782751e-01, 4.65043188134059204408e-01,
-7.81249999999863220523e-01, 4.57833361771676883301e-01,
-7.96874999999998112621e-01, 4.50735313406363247157e-01,
-8.12499999999990119015e-01, 4.43747310081084256339e-01,
-8.28124999999996003197e-01, 4.36867645705559026759e-01,
-8.43749999999988120614e-01, 4.30094640640067360504e-01,
-8.59374999999994115818e-01, 4.23426641285265303871e-01,
-8.74999999999977129406e-01, 4.16862019678517936594e-01,
-8.90624999999983346655e-01, 4.10399173096376801428e-01,
-9.06249999999991784350e-01, 4.04036523663345414903e-01,
-9.21874999999994004796e-01, 3.97772517966614058693e-01,
-9.37499999999994337863e-01, 3.91605626676801210628e-01,
-9.53124999999999444888e-01, 3.85534344174578935682e-01,
-9.68749999999986677324e-01, 3.79557188183094640355e-01,
-9.84374999999992339461e-01, 3.73672699406045860648e-01,
-9.99999999999995892175e-01, 3.67879441171443832825e-01,
-1.01562499999994315658e+00, 3.62175999080846300338e-01,
-1.03124999999991096011e+00, 3.56560980663978732697e-01,
-1.04687499999999067413e+00, 3.51033015038813400732e-01,
};
/*
* Scalar constants used by exp(). The code refers to each entry through
* the macro defined for it after the array, never by index.
*/
static const double C[] = {
0.5, /* half; also t1, the r^2 coefficient of expm1(r) */
4.61662413084468283841e+01, /* 32/ln2: 0x40471547, 0x652b82fe */
2.16608493865351192653e-02, /* ln2/32, high part: 0x3f962e42, 0xfee00000 */
5.96317165397058656257e-12, /* ln2/32, low part: 0x3d9a39ef, 0x35793c76 */
1.6666666666526086527e-1, /* t2, close to 1/6: 3fc5555555548f7c */
4.1666666666226079285e-2, /* t3, close to 1/24: 3fa5555555545d4e */
8.3333679843421958056e-3, /* t4, close to 1/120: 3f811115b7aa905e */
1.3888949086377719040e-3, /* t5, close to 1/720: 3f56c1728d739765 */
1.0,
0.0,
/* exp(x) overflows for x above this: */
7.09782712893383973096e+02, /* 0x40862E42, 0xFEFA39EF */
/* exp(x) underflows for -x above this: */
7.45133219101941108420e+02, /* 0x40874910, 0xD52D3051 */
5.55111512312578270212e-17, /* 2^-54: 0x3c900000, 0x00000000 */
};
/* Symbolic names for the entries of C[], in array order. */
#define half C[0]
#define invln2_32 C[1]
#define ln2_32hi C[2]
#define ln2_32lo C[3]
#define t2 C[4]
#define t3 C[5]
#define t4 C[6]
#define t5 C[7]
#define one C[8]
#define zero C[9]
#define threshold1 C[10]
#define threshold2 C[11]
#define twom54 C[12]
/*
 * exp(x) - return e raised to the power x.
 *
 * The argument is classified by the high-order word of |x| (hx) and
 * handled by one of three paths:
 *
 *   |x| < ln2/64
 *	exp(x) = 1 + p(x), where p is the polynomial approximation to
 *	expm1 built from half, t2, ..., t5.  Below 2^-18 a one- or
 *	two-term series is used instead.
 *
 *   ln2/64 <= |x| < 3/2 ln2
 *	Let TBL2[j] be the table breakpoint (a value near a multiple of
 *	2^-6) nearest x and z = x - TBL2[j].  Then
 *	exp(x) = TBL2[j+1] * (1 + p(z)), with TBL2[j+1] = exp(TBL2[j]).
 *
 *   otherwise
 *	Let k = x * 32/ln2 rounded to the nearest integer and
 *	z = x - k * ln2/32.  With k = 32*m + (k & 31),
 *	exp(x) = 2^m * 2^((k & 31)/32) * (1 + p(z)), where the middle
 *	factor is read from TBL as a two-double sum.
 *
 * Special arguments:
 *   -Inf returns zero; +Inf and NaN return x * x.
 *   x > threshold1 returns _SVID_libm_err(x, x, 6) and
 *   -x > threshold2 returns _SVID_libm_err(x, x, 7); per the file's
 *   header notes these are the overflow and underflow ranges.  What
 *   _SVID_libm_err does with those codes is defined elsewhere.
 *
 * Portability notes: the words of a double are read and modified through
 * an int pointer indexed by HIWORD/LOWORD, and k >> 5 is applied to
 * negative k, which requires an arithmetic right shift.
 */
double
exp(double x) {
	double	y, z, t;
	int	hx, ix, k, j, m;

	ix = ((int *)&x)[HIWORD];	/* high word of x, sign included */
	hx = ix & ~0x80000000;		/* high word of |x| */

	if (hx < 0x3ff0a2b2) {	/* |x| < 3/2 ln 2 */
		if (hx < 0x3f862e42) {	/* |x| < 1/64 ln 2 */
			if (hx < 0x3ed00000) {	/* |x| < 2^-18 */
				volatile int dummy;

				dummy = (int)x;	/* raise inexact if x != 0 */
#ifdef lint
				dummy = dummy;
#endif
				if (hx < 0x3e300000)
					return (one + x);
				return (one + x * (one + half * x));
			}
			/* exp(x) = 1 + expm1(x), polynomial in x directly */
			t = x * x;
			y = x + (t * (half + x * t2) +
			    (t * t) * (t3 + x * t4 + t * t5));
			return (one + y);
		}

		/*
		 * find the multiple of 2^-6 nearest x
		 *
		 * The shift leaves j = floor(|x| * 128); (j - 1) & ~1 then
		 * gives the even element index of the TBL2 pair whose
		 * breakpoint is nearest |x|.
		 */
		k = hx >> 20;
		j = (0x00100000 | (hx & 0x000fffff)) >> (0x40c - k);
		j = (j - 1) & ~1;
		if (ix < 0)
			j += 134;	/* negative breakpoints follow */
		z = x - TBL2[j];
		t = z * z;
		y = z + (t * (half + z * t2) +
		    (t * t) * (t3 + z * t4 + t * t5));
		return (TBL2[j+1] + TBL2[j+1] * y);
	}

	if (hx >= 0x40862e42) {	/* x is large, infinite, or nan */
		if (hx >= 0x7ff00000) {
			/* -Inf: sign and exponent bits only, no mantissa */
			if (ix == 0xfff00000 && ((int *)&x)[LOWORD] == 0)
				return (zero);
			return (x * x);	/* +Inf or NaN */
		}
		if (x > threshold1)
			return (_SVID_libm_err(x, x, 6));
		if (-x > threshold2)
			return (_SVID_libm_err(x, x, 7));
	}

	/* k = x * 32/ln2 rounded to nearest; the cast truncates toward 0 */
	t = invln2_32 * x;
	if (ix < 0)
		t -= half;
	else
		t += half;
	k = (int)t;
	j = (k & 0x1f) << 1;	/* element index of the TBL pair */
	m = k >> 5;		/* power of two applied at the end */
	z = (x - k * ln2_32hi) - k * ln2_32lo;

	/* z is now in primary range */
	t = z * z;
	y = z + (t * (half + z * t2) + (t * t) * (t3 + z * t4 + t * t5));
	y = TBL[j] + (TBL[j+1] + TBL[j] * y);

	/*
	 * Scale y by 2^m by adding m to the exponent field of its high
	 * word.  m can be negative, and left-shifting a negative int is
	 * undefined in C, so the offset is formed by multiplying by 2^20
	 * instead; the magnitude stays within the range of a 32-bit int
	 * for every m that reaches this point.
	 */
	if (m < -1021) {
		/*
		 * The result may be subnormal: scale by 2^(m+54) in the
		 * exponent field, then let the multiply by 2^-54 do the
		 * final rounding.
		 */
		((int *)&y)[HIWORD] += (m + 54) * 0x00100000;
		return (twom54 * y);
	}
	((int *)&y)[HIWORD] += m * 0x00100000;
	return (y);
}