Source File
expm1.go
Belonging Package
math
// Copyright 2010 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.
package math
// The original C code, the long comment, and the constants
// below are from FreeBSD's /usr/src/lib/msun/src/s_expm1.c
// and came with this notice. The go code is a simplified
// version of the original C.
//
// ====================================================
// Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
//
// Developed at SunPro, a Sun Microsystems, Inc. business.
// Permission to use, copy, modify, and distribute this
// software is freely granted, provided that this notice
// is preserved.
// ====================================================
//
// expm1(x)
// Returns exp(x)-1, the exponential of x minus 1.
//
// Method
// 1. Argument reduction:
// Given x, find r and integer k such that
//
// x = k*ln2 + r, |r| <= 0.5*ln2 ~ 0.34658
//
// Here a correction term c will be computed to compensate
// the error in r when rounded to a floating-point number.
//
// 2. Approximating expm1(r) by a special rational function on
// the interval [0,0.34658]:
// Since
// r*(exp(r)+1)/(exp(r)-1) = 2+ r**2/6 - r**4/360 + ...
// we define R1(r*r) by
// r*(exp(r)+1)/(exp(r)-1) = 2+ r**2/6 * R1(r*r)
// That is,
// R1(r**2) = 6/r *((exp(r)+1)/(exp(r)-1) - 2/r)
// = 6/r * ( 1 + 2.0*(1/(exp(r)-1) - 1/r))
// = 1 - r**2/60 + r**4/2520 - r**6/100800 + ...
// We use a special Reme algorithm on [0,0.347] to generate
// a polynomial of degree 5 in r*r to approximate R1. The
// maximum error of this polynomial approximation is bounded
// by 2**-61. In other words,
// R1(z) ~ 1.0 + Q1*z + Q2*z**2 + Q3*z**3 + Q4*z**4 + Q5*z**5
// where Q1 = -1.6666666666666567384E-2,
// Q2 = 3.9682539681370365873E-4,
// Q3 = -9.9206344733435987357E-6,
// Q4 = 2.5051361420808517002E-7,
// Q5 = -6.2843505682382617102E-9;
// (where z=r*r, and the values of Q1 to Q5 are listed below)
// with error bounded by
// | 5 | -61
// | 1.0+Q1*z+...+Q5*z - R1(z) | <= 2
// | |
//
// expm1(r) = exp(r)-1 is then computed by the following
// specific way which minimize the accumulation rounding error:
// 2 3
// r r [ 3 - (R1 + R1*r/2) ]
// expm1(r) = r + --- + --- * [--------------------]
// 2 2 [ 6 - r*(3 - R1*r/2) ]
//
// To compensate the error in the argument reduction, we use
// expm1(r+c) = expm1(r) + c + expm1(r)*c
// ~ expm1(r) + c + r*c
// Thus c+r*c will be added in as the correction terms for
// expm1(r+c). Now rearrange the term to avoid optimization
// screw up:
// ( 2 2 )
// ({ ( r [ R1 - (3 - R1*r/2) ] ) } r )
// expm1(r+c)~r - ({r*(--- * [--------------------]-c)-c} - --- )
// ({ ( 2 [ 6 - r*(3 - R1*r/2) ] ) } 2 )
// ( )
//
// = r - E
// 3. Scale back to obtain expm1(x):
// From step 1, we have
// expm1(x) = either 2**k*[expm1(r)+1] - 1
// = or 2**k*[expm1(r) + (1-2**-k)]
// 4. Implementation notes:
// (A). To save one multiplication, we scale the coefficient Qi
// to Qi*2**i, and replace z by (x**2)/2.
// (B). To achieve maximum accuracy, we compute expm1(x) by
// (i) if x < -56*ln2, return -1.0, (raise inexact if x!=inf)
// (ii) if k=0, return r-E
// (iii) if k=-1, return 0.5*(r-E)-0.5
// (iv) if k=1 if r < -0.25, return 2*((r+0.5)- E)
// else return 1.0+2.0*(r-E);
// (v) if (k<-2||k>56) return 2**k(1-(E-r)) - 1 (or exp(x)-1)
// (vi) if k <= 20, return 2**k((1-2**-k)-(E-r)), else
// (vii) return 2**k(1-((E+2**-k)-r))
//
// Special cases:
// expm1(INF) is INF, expm1(NaN) is NaN;
// expm1(-INF) is -1, and
// for finite argument, only expm1(0)=0 is exact.
//
// Accuracy:
// according to an error analysis, the error is always less than
// 1 ulp (unit in the last place).
//
// Misc. info.
// For IEEE double
// if x > 7.09782712893383973096e+02 then expm1(x) overflow
//
// Constants:
// The hexadecimal values are the intended ones for the following
// constants. The decimal values may be used, provided that the
// compiler will convert from decimal to binary accurately enough
// to produce the hexadecimal values shown.
//
// Expm1 returns e**x - 1, the base-e exponential of x minus 1.
// It is more accurate than [Exp](x) - 1 when x is near zero.
//
// Special cases are:
//
// Expm1(+Inf) = +Inf
// Expm1(-Inf) = -1
// Expm1(NaN) = NaN
//
// Very large values overflow to -1 or +Inf.
func ( float64) float64 {
if haveArchExpm1 {
return archExpm1()
}
return expm1()
}
func expm1( float64) float64 {
const (
= 7.09782712893383973096e+02 // 0x40862E42FEFA39EF
= 3.88162421113569373274e+01 // 0x4043687a9f1af2b1
= 1.03972077083991796413e+00 // 0x3ff0a2b23f3bab73
= 3.46573590279972654709e-01 // 0x3fd62e42fefa39ef
= 6.93147180369123816490e-01 // 0x3fe62e42fee00000
= 1.90821492927058770002e-10 // 0x3dea39ef35793c76
= 1.44269504088896338700e+00 // 0x3ff71547652b82fe
= 1.0 / (1 << 54) // 2**-54 = 0x3c90000000000000
// scaled coefficients related to expm1
= -3.33333333333331316428e-02 // 0xBFA11111111110F4
= 1.58730158725481460165e-03 // 0x3F5A01A019FE5585
= -7.93650757867487942473e-05 // 0xBF14CE199EAADBB7
= 4.00821782732936239552e-06 // 0x3ED0CFCA86E65239
= -2.01099218183624371326e-07 // 0xBE8AFDB76E09C32D
)
// special cases
switch {
case IsInf(, 1) || IsNaN():
return
case IsInf(, -1):
return -1
}
:=
:= false
if < 0 {
= -
= true
}
// filter out huge argument
if >= { // if |x| >= 56 * ln2
if {
return -1 // x < -56*ln2, return -1
}
if >= { // if |x| >= 709.78...
return Inf(1)
}
}
// argument reduction
var float64
var int
if > { // if |x| > 0.5 * ln2
var , float64
if < { // and |x| < 1.5 * ln2
if ! {
= -
=
= 1
} else {
= +
= -
= -1
}
} else {
if ! {
= int(* + 0.5)
} else {
= int(* - 0.5)
}
:= float64()
= - * // t * Ln2Hi is exact here
= *
}
= -
= ( - ) -
} else if < { // when |x| < 2**-54, return x
return
} else {
= 0
}
// x is now in primary range
:= 0.5 *
:= *
:= 1 + *(+*(+*(+*(+*))))
:= 3 - *
:= * (( - ) / (6.0 - *))
if == 0 {
return - (* - ) // c is 0
}
= (*(-) - )
-=
switch {
case == -1:
return 0.5*(-) - 0.5
case == 1:
if < -0.25 {
return -2 * ( - ( + 0.5))
}
return 1 + 2*(-)
case <= -2 || > 56: // suffice to return exp(x)-1
:= 1 - ( - )
= Float64frombits(Float64bits() + uint64()<<52) // add k to y's exponent
return - 1
}
if < 20 {
:= Float64frombits(0x3ff0000000000000 - (0x20000000000000 >> uint())) // t=1-2**-k
:= - ( - )
= Float64frombits(Float64bits() + uint64()<<52) // add k to y's exponent
return
}
= Float64frombits(uint64(0x3ff-) << 52) // 2**-k
:= - ( + )
++
= Float64frombits(Float64bits() + uint64()<<52) // add k to y's exponent
return
}
The pages are generated with Golds v0.7.0-preview. (GOOS=linux GOARCH=amd64) Golds is a Go 101 project developed by Tapir Liu. PR and bug reports are welcome and can be submitted to the issue list. Please follow @zigo_101 (reachable from the left QR code) to get the latest news of Golds. |