mirror of https://git.musl-libc.org/git/musl
Browse Source
comments are kept in the double version of the function compared to fdlibm/freebsd we partition the domain into one more part and select different threshold points: now the [log(5/3)/2,log(3)/2] and [log(3)/2,inf] domains should have <1.5ulp error (so only the last bit may be wrong, assuming good exp, expm1) (note that log(3)/2 and log(5/3)/2 are the points where tanh changes resolution: tanh(log(3)/2)=0.5, tanh(log(5/3)/2)=0.25) for some x < log(5/3)/2 (~=0.2554) the error can be >1.5ulp but it should be <2ulp (the freebsd code had some >2ulp errors in [0.255,1]) even with the extra logic the new code produces smaller object filesrs-1.0
3 changed files with 83 additions and 173 deletions
@ -1,73 +1,41 @@ |
|||||
/* origin: FreeBSD /usr/src/lib/msun/src/s_tanh.c */ |
|
||||
/*
|
|
||||
* ==================================================== |
|
||||
* Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved. |
|
||||
* |
|
||||
* Developed at SunPro, a Sun Microsystems, Inc. business. |
|
||||
* Permission to use, copy, modify, and distribute this |
|
||||
* software is freely granted, provided that this notice |
|
||||
* is preserved. |
|
||||
* ==================================================== |
|
||||
*/ |
|
||||
/* Tanh(x)
|
|
||||
* Return the Hyperbolic Tangent of x |
|
||||
* |
|
||||
* Method : |
|
||||
* x -x |
|
||||
* e - e |
|
||||
* 0. tanh(x) is defined to be ----------- |
|
||||
* x -x |
|
||||
* e + e |
|
||||
* 1. reduce x to non-negative by tanh(-x) = -tanh(x). |
|
||||
* 2. 0 <= x < 2**-28 : tanh(x) := x with inexact if x != 0 |
|
||||
* -t |
|
||||
* 2**-28 <= x < 1 : tanh(x) := -----; t = expm1(-2x) |
|
||||
* t + 2 |
|
||||
* 2 |
|
||||
* 1 <= x < 22 : tanh(x) := 1 - -----; t = expm1(2x) |
|
||||
* t + 2 |
|
||||
* 22 <= x <= INF : tanh(x) := 1. |
|
||||
* |
|
||||
* Special cases: |
|
||||
* tanh(NaN) is NaN; |
|
||||
* only tanh(0)=0 is exact for finite argument. |
|
||||
*/ |
|
||||
|
|
||||
#include "libm.h" |
#include "libm.h" |
||||
|
|
||||
static const double tiny = 1.0e-300, huge = 1.0e300; |
/* tanh(x) = (exp(x) - exp(-x))/(exp(x) + exp(-x))
|
||||
|
* = (exp(2*x) - 1)/(exp(2*x) - 1 + 2) |
||||
|
* = (1 - exp(-2*x))/(exp(-2*x) - 1 + 2) |
||||
|
*/ |
||||
double tanh(double x) |
double tanh(double x) |
||||
{ |
{ |
||||
double t,z; |
union {double f; uint64_t i;} u = {.f = x}; |
||||
int32_t jx,ix; |
uint32_t w; |
||||
|
int sign; |
||||
GET_HIGH_WORD(jx, x); |
double t; |
||||
ix = jx & 0x7fffffff; |
|
||||
|
|
||||
/* x is INF or NaN */ |
/* x = |x| */ |
||||
if (ix >= 0x7ff00000) { |
sign = u.i >> 63; |
||||
if (jx >= 0) |
u.i &= (uint64_t)-1/2; |
||||
return 1.0f/x + 1.0f; /* tanh(+-inf)=+-1 */ |
x = u.f; |
||||
else |
w = u.i >> 32; |
||||
return 1.0f/x - 1.0f; /* tanh(NaN) = NaN */ |
|
||||
} |
|
||||
|
|
||||
if (ix < 0x40360000) { /* |x| < 22 */ |
if (w > 0x3fe193ea) { |
||||
if (ix < 0x3e300000) { /* |x| < 2**-28 */ |
/* |x| > log(3)/2 ~= 0.5493 or nan */ |
||||
/* tanh(tiny) = tiny with inexact */ |
if (w > 0x40340000) { |
||||
if (huge+x > 1.0f) |
/* |x| > 20 or nan */ |
||||
return x; |
/* note: this branch avoids raising overflow */ |
||||
} |
/* raise inexact if x!=+-inf and handle nan */ |
||||
if (ix >= 0x3ff00000) { /* |x| >= 1 */ |
t = 1 + 0/(x + 0x1p-120f); |
||||
t = expm1(2.0f*fabs(x)); |
|
||||
z = 1.0f - 2.0f/(t+2.0f); |
|
||||
} else { |
} else { |
||||
t = expm1(-2.0f*fabs(x)); |
t = expm1(2*x); |
||||
z= -t/(t+2.0f); |
t = 1 - 2/(t+2); |
||||
} |
} |
||||
} else { /* |x| >= 22, return +-1 */ |
} else if (w > 0x3fd058ae) { |
||||
z = 1.0f - tiny; /* raise inexact */ |
/* |x| > log(5/3)/2 ~= 0.2554 */ |
||||
|
t = expm1(2*x); |
||||
|
t = t/(t+2); |
||||
|
} else { |
||||
|
/* |x| is small, up to 2ulp error in [0.1,0.2554] */ |
||||
|
t = expm1(-2*x); |
||||
|
t = -t/(t+2); |
||||
} |
} |
||||
return jx >= 0 ? z : -z; |
return sign ? -t : t; |
||||
} |
} |
||||
|
|||||
@ -1,55 +1,35 @@ |
|||||
/* origin: FreeBSD /usr/src/lib/msun/src/s_tanhf.c */ |
|
||||
/*
|
|
||||
* Conversion to float by Ian Lance Taylor, Cygnus Support, ian@cygnus.com. |
|
||||
*/ |
|
||||
/*
|
|
||||
* ==================================================== |
|
||||
* Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved. |
|
||||
* |
|
||||
* Developed at SunPro, a Sun Microsystems, Inc. business. |
|
||||
* Permission to use, copy, modify, and distribute this |
|
||||
* software is freely granted, provided that this notice |
|
||||
* is preserved. |
|
||||
* ==================================================== |
|
||||
*/ |
|
||||
|
|
||||
#include "libm.h" |
#include "libm.h" |
||||
|
|
||||
static const float |
|
||||
tiny = 1.0e-30, |
|
||||
huge = 1.0e30; |
|
||||
|
|
||||
float tanhf(float x) |
float tanhf(float x) |
||||
{ |
{ |
||||
float t,z; |
union {float f; uint32_t i;} u = {.f = x}; |
||||
int32_t jx,ix; |
uint32_t w; |
||||
|
int sign; |
||||
|
float t; |
||||
|
|
||||
GET_FLOAT_WORD(jx, x); |
/* x = |x| */ |
||||
ix = jx & 0x7fffffff; |
sign = u.i >> 31; |
||||
|
u.i &= 0x7fffffff; |
||||
|
x = u.f; |
||||
|
w = u.i; |
||||
|
|
||||
/* x is INF or NaN */ |
if (w > 0x3f0c9f54) { |
||||
if(ix >= 0x7f800000) { |
/* |x| > log(3)/2 ~= 0.5493 or nan */ |
||||
if (jx >= 0) |
if (w > 0x41200000) { |
||||
return 1.0f/x + 1.0f; /* tanh(+-inf)=+-1 */ |
/* |x| > 10 */ |
||||
else |
t = 1 + 0/(x + 0x1p-120f); |
||||
return 1.0f/x - 1.0f; /* tanh(NaN) = NaN */ |
|
||||
} |
|
||||
|
|
||||
if (ix < 0x41100000) { /* |x| < 9 */ |
|
||||
if (ix < 0x39800000) { /* |x| < 2**-12 */ |
|
||||
/* tanh(tiny) = tiny with inexact */ |
|
||||
if (huge+x > 1.0f) |
|
||||
return x; |
|
||||
} |
|
||||
if (ix >= 0x3f800000) { /* |x|>=1 */ |
|
||||
t = expm1f(2.0f*fabsf(x)); |
|
||||
z = 1.0f - 2.0f/(t+2.0f); |
|
||||
} else { |
} else { |
||||
t = expm1f(-2.0f*fabsf(x)); |
t = expm1f(2*x); |
||||
z = -t/(t+2.0f); |
t = 1 - 2/(t+2); |
||||
} |
} |
||||
} else { /* |x| >= 9, return +-1 */ |
} else if (w > 0x3e82c578) { |
||||
z = 1.0f - tiny; /* raise inexact */ |
/* |x| > log(5/3)/2 ~= 0.2554 */ |
||||
|
t = expm1f(2*x); |
||||
|
t = t/(t+2); |
||||
|
} else { |
||||
|
/* |x| is small */ |
||||
|
t = expm1f(-2*x); |
||||
|
t = -t/(t+2); |
||||
} |
} |
||||
return jx >= 0 ? z : -z; |
return sign ? -t : t; |
||||
} |
} |
||||
|
|||||
Loading…
Reference in new issue