Joseph Myers fded7ed684 Fix ldbl-128 / ldbl-128ibm asinl for -Wuninitialized.
The ldbl-128 and ldbl-128ibm implementations of asinl produce
uninitialized variable warnings with -Wuninitialized because the code
for small arguments in fact always returns but the compiler cannot see
this and instead sees that a variable would be uninitialized if the
"if (huge + x > one)" conditional used to force the "inexact"
exception were false.

All the code in libm trying to force "inexact" for functions that are
not exactly defined is suspect and should be removed at some point
given that we now have a clear definition of the accuracy goals for
libm functions which, following C99/C11, does not require anything
about "inexact" for most functions (likewise, the multi-precision code
that tries to give correctly-rounded results, very slowly, for
functions for which the goals clearly do not include correct rounding,
if the faster paths are accurate enough).  However, for now this patch
simply changes the code to use math_force_eval, rather than "if", to
ensure the evaluation of the inexact computation.

Tested for powerpc and mips64.

	* sysdeps/ieee754/ldbl-128/e_asinl.c (__ieee754_asinl): Don't use
	a conditional in forcing "inexact".
	* sysdeps/ieee754/ldbl-128ibm/e_asinl.c (__ieee754_asinl):
	Likewise.
2015-05-22 17:36:52 +00:00

255 lines
7.3 KiB
C

/*
* ====================================================
* Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
*
* Developed at SunPro, a Sun Microsystems, Inc. business.
* Permission to use, copy, modify, and distribute this
* software is freely granted, provided that this notice
* is preserved.
* ====================================================
*/
/*
Long double expansions are
Copyright (C) 2001 Stephen L. Moshier <moshier@na-net.ornl.gov>
and are incorporated herein by permission of the author. The author
reserves the right to distribute this material elsewhere under different
copying permissions. These modifications are distributed here under the
following terms:
This library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.
This library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public
License along with this library; if not, see
<http://www.gnu.org/licenses/>. */
/* __ieee754_asin(x)
* Method :
* Since asin(x) = x + x^3/6 + x^5*3/40 + x^7*15/336 + ...
* we approximate asin(x) on [0,0.5] by
* asin(x) = x + x*x^2*R(x^2)
* Between .5 and .625 the approximation is
* asin(0.5625 + x) = asin(0.5625) + x rS(x) / sS(x)
* For x in [0.625,1]
* asin(x) = pi/2-2*asin(sqrt((1-x)/2))
* Let y = (1-x), z = y/2, s := sqrt(z), and pio2_hi+pio2_lo=pi/2;
* then for x>0.98
* asin(x) = pi/2 - 2*(s+s*z*R(z))
* = pio2_hi - (2*(s+s*z*R(z)) - pio2_lo)
* For x<=0.98, let pio4_hi = pio2_hi/2, then
* f = hi part of s;
* c = sqrt(z) - f = (z-f*f)/(s+f) ...f+c=sqrt(z)
* and
* asin(x) = pi/2 - 2*(s+s*z*R(z))
* = pio4_hi+(pio4-2s)-(2s*z*R(z)-pio2_lo)
* = pio4_hi+(pio4-2f)-(2s*z*R(z)-(pio2_lo+2c))
*
* Special cases:
* if x is NaN, return x itself;
* if |x|>1, return NaN with invalid signal.
*
*/
#include <float.h>
#include <math.h>
#include <math_private.h>
long double sqrtl (long double);
static const long double
one = 1.0L,
huge = 1.0e+300L,
pio2_hi = 1.5707963267948966192313216916397514420986L,
pio2_lo = 4.3359050650618905123985220130216759843812E-35L,
pio4_hi = 7.8539816339744830961566084581987569936977E-1L,
/* coefficient for R(x^2) */
/* asin(x) = x + x^3 pS(x^2) / qS(x^2)
0 <= x <= 0.5
peak relative error 1.9e-35 */
pS0 = -8.358099012470680544198472400254596543711E2L,
pS1 = 3.674973957689619490312782828051860366493E3L,
pS2 = -6.730729094812979665807581609853656623219E3L,
pS3 = 6.643843795209060298375552684423454077633E3L,
pS4 = -3.817341990928606692235481812252049415993E3L,
pS5 = 1.284635388402653715636722822195716476156E3L,
pS6 = -2.410736125231549204856567737329112037867E2L,
pS7 = 2.219191969382402856557594215833622156220E1L,
pS8 = -7.249056260830627156600112195061001036533E-1L,
pS9 = 1.055923570937755300061509030361395604448E-3L,
qS0 = -5.014859407482408326519083440151745519205E3L,
qS1 = 2.430653047950480068881028451580393430537E4L,
qS2 = -4.997904737193653607449250593976069726962E4L,
qS3 = 5.675712336110456923807959930107347511086E4L,
qS4 = -3.881523118339661268482937768522572588022E4L,
qS5 = 1.634202194895541569749717032234510811216E4L,
qS6 = -4.151452662440709301601820849901296953752E3L,
qS7 = 5.956050864057192019085175976175695342168E2L,
qS8 = -4.175375777334867025769346564600396877176E1L,
/* 1.000000000000000000000000000000000000000E0 */
/* asin(0.5625 + x) = asin(0.5625) + x rS(x) / sS(x)
-0.0625 <= x <= 0.0625
peak relative error 3.3e-35 */
rS0 = -5.619049346208901520945464704848780243887E0L,
rS1 = 4.460504162777731472539175700169871920352E1L,
rS2 = -1.317669505315409261479577040530751477488E2L,
rS3 = 1.626532582423661989632442410808596009227E2L,
rS4 = -3.144806644195158614904369445440583873264E1L,
rS5 = -9.806674443470740708765165604769099559553E1L,
rS6 = 5.708468492052010816555762842394927806920E1L,
rS7 = 1.396540499232262112248553357962639431922E1L,
rS8 = -1.126243289311910363001762058295832610344E1L,
rS9 = -4.956179821329901954211277873774472383512E-1L,
rS10 = 3.313227657082367169241333738391762525780E-1L,
sS0 = -4.645814742084009935700221277307007679325E0L,
sS1 = 3.879074822457694323970438316317961918430E1L,
sS2 = -1.221986588013474694623973554726201001066E2L,
sS3 = 1.658821150347718105012079876756201905822E2L,
sS4 = -4.804379630977558197953176474426239748977E1L,
sS5 = -1.004296417397316948114344573811562952793E2L,
sS6 = 7.530281592861320234941101403870010111138E1L,
sS7 = 1.270735595411673647119592092304357226607E1L,
sS8 = -1.815144839646376500705105967064792930282E1L,
sS9 = -7.821597334910963922204235247786840828217E-2L,
/* 1.000000000000000000000000000000000000000E0 */
asinr5625 = 5.9740641664535021430381036628424864397707E-1L;
long double
__ieee754_asinl (long double x)
{
long double a, t, w, p, q, c, r, s;
int flag;
if (__glibc_unlikely (__isnanl (x)))
return x + x;
flag = 0;
a = __builtin_fabsl (x);
if (a == 1.0L) /* |x|>= 1 */
return x * pio2_hi + x * pio2_lo; /* asin(1)=+-pi/2 with inexact */
else if (a >= 1.0L)
return (x - x) / (x - x); /* asin(|x|>1) is NaN */
else if (a < 0.5L)
{
if (a < 6.938893903907228e-18L) /* |x| < 2**-57 */
{
if (fabsl (x) < LDBL_MIN)
{
long double force_underflow = x * x;
math_force_eval (force_underflow);
}
long double force_inexact = huge + x;
math_force_eval (force_inexact);
return x; /* return x with inexact if x!=0 */
}
else
{
t = x * x;
/* Mark to use pS, qS later on. */
flag = 1;
}
}
else if (a < 0.625L)
{
t = a - 0.5625;
p = ((((((((((rS10 * t
+ rS9) * t
+ rS8) * t
+ rS7) * t
+ rS6) * t
+ rS5) * t
+ rS4) * t
+ rS3) * t
+ rS2) * t
+ rS1) * t
+ rS0) * t;
q = ((((((((( t
+ sS9) * t
+ sS8) * t
+ sS7) * t
+ sS6) * t
+ sS5) * t
+ sS4) * t
+ sS3) * t
+ sS2) * t
+ sS1) * t
+ sS0;
t = asinr5625 + p / q;
if (x > 0.0L)
return t;
else
return -t;
}
else
{
/* 1 > |x| >= 0.625 */
w = one - a;
t = w * 0.5;
}
p = (((((((((pS9 * t
+ pS8) * t
+ pS7) * t
+ pS6) * t
+ pS5) * t
+ pS4) * t
+ pS3) * t
+ pS2) * t
+ pS1) * t
+ pS0) * t;
q = (((((((( t
+ qS8) * t
+ qS7) * t
+ qS6) * t
+ qS5) * t
+ qS4) * t
+ qS3) * t
+ qS2) * t
+ qS1) * t
+ qS0;
if (flag) /* 2^-57 < |x| < 0.5 */
{
w = p / q;
return x + x * w;
}
s = __ieee754_sqrtl (t);
if (a > 0.975L)
{
w = p / q;
t = pio2_hi - (2.0 * (s + s * w) - pio2_lo);
}
else
{
w = ldbl_high (s);
c = (t - w * w) / (s + w);
r = p / q;
p = 2.0 * s * r - (pio2_lo - 2.0 * c);
q = pio4_hi - 2.0 * w;
t = pio4_hi - (p - q);
}
if (x > 0.0L)
return t;
else
return -t;
}
strong_alias (__ieee754_asinl, __asinl_finite)