summaryrefslogtreecommitdiff
path: root/src/math/__rem_pio2f.c
diff options
context:
space:
mode:
authorSzabolcs Nagy <nsz@port70.net>2020-01-18 17:55:25 +0000
committerRich Felker <dalias@aerifal.cx>2020-02-21 23:42:05 -0500
commitb3797d3b2e10e6fff2a6b04af917e61e95838b08 (patch)
tree31e7b1858b566167f4303bbeab58d6074549e321 /src/math/__rem_pio2f.c
parent040c1d16b468c50c04fc94edff521f1637708328 (diff)
downloadmusl-b3797d3b2e10e6fff2a6b04af917e61e95838b08.tar.gz
musl-b3797d3b2e10e6fff2a6b04af917e61e95838b08.tar.bz2
musl-b3797d3b2e10e6fff2a6b04af917e61e95838b08.tar.xz
musl-b3797d3b2e10e6fff2a6b04af917e61e95838b08.zip
math: fix __rem_pio2 in non-nearest rounding modes
Handle when after reduction |y| > pi/4+tiny. This happens in directed rounding modes because the fast round to int code does not give the nearest integer. In such cases the reduction may not be symmetric between x and -x so e.g. cos(x)==cos(-x) may not hold (but polynomial evaluation is not symmetric either with directed rounding so fixing that would require more changes with bigger performance impact). The fix only adds two predictable branches in nearest rounding mode, simple ubenchmark does not show relevant performance regression in nearest rounding mode. The code could be improved: e.g reducing the medium size threshold such that two step reduction is enough instead of three, and the single precision case can avoid the issue by doing the round to int differently, but this fix was kept minimal.
Diffstat (limited to 'src/math/__rem_pio2f.c')
-rw-r--r--src/math/__rem_pio2f.c13
1 files changed, 12 insertions, 1 deletions
diff --git a/src/math/__rem_pio2f.c b/src/math/__rem_pio2f.c
index 4473c1c4..e6765643 100644
--- a/src/math/__rem_pio2f.c
+++ b/src/math/__rem_pio2f.c
@@ -35,6 +35,7 @@
*/
static const double
toint = 1.5/EPS,
+pio4 = 0x1.921fb6p-1,
invpio2 = 6.36619772367581382433e-01, /* 0x3FE45F30, 0x6DC9C883 */
pio2_1 = 1.57079631090164184570e+00, /* 0x3FF921FB, 0x50000000 */
pio2_1t = 1.58932547735281966916e-08; /* 0x3E5110b4, 0x611A6263 */
@@ -50,10 +51,20 @@ int __rem_pio2f(float x, double *y)
ix = u.i & 0x7fffffff;
/* 25+53 bit pi is good enough for medium size */
if (ix < 0x4dc90fdb) { /* |x| ~< 2^28*(pi/2), medium size */
- /* Use a specialized rint() to get fn. Assume round-to-nearest. */
+ /* Use a specialized rint() to get fn. */
fn = (double_t)x*invpio2 + toint - toint;
n = (int32_t)fn;
*y = x - fn*pio2_1 - fn*pio2_1t;
+ /* Matters with directed rounding. */
+ if (predict_false(*y < -pio4)) {
+ n--;
+ fn--;
+ *y = x - fn*pio2_1 - fn*pio2_1t;
+ } else if (predict_false(*y > pio4)) {
+ n++;
+ fn++;
+ *y = x - fn*pio2_1 - fn*pio2_1t;
+ }
return n;
}
if(ix>=0x7f800000) { /* x is inf or NaN */