diff options
author | Szabolcs Nagy <nsz@port70.net> | 2020-01-18 17:55:25 +0000 |
---|---|---|
committer | Rich Felker <dalias@aerifal.cx> | 2020-02-21 23:42:05 -0500 |
commit | b3797d3b2e10e6fff2a6b04af917e61e95838b08 (patch) | |
tree | 31e7b1858b566167f4303bbeab58d6074549e321 /src/math/__rem_pio2f.c | |
parent | 040c1d16b468c50c04fc94edff521f1637708328 (diff) | |
download | musl-b3797d3b2e10e6fff2a6b04af917e61e95838b08.tar.gz musl-b3797d3b2e10e6fff2a6b04af917e61e95838b08.tar.bz2 musl-b3797d3b2e10e6fff2a6b04af917e61e95838b08.tar.xz musl-b3797d3b2e10e6fff2a6b04af917e61e95838b08.zip |
math: fix __rem_pio2 in non-nearest rounding modes
Handle when after reduction |y| > pi/4+tiny. This happens in directed
rounding modes because the fast round to int code does not give the
nearest integer. In such cases the reduction may not be symmetric
between x and -x so e.g. cos(x)==cos(-x) may not hold (but polynomial
evaluation is not symmetric either with directed rounding so fixing
that would require more changes with bigger performance impact).
The fix only adds two predictable branches in nearest rounding mode,
simple ubenchmark does not show relevant performance regression in
nearest rounding mode.
The code could be improved: e.g reducing the medium size threshold
such that two step reduction is enough instead of three, and the
single precision case can avoid the issue by doing the round to int
differently, but this fix was kept minimal.
Diffstat (limited to 'src/math/__rem_pio2f.c')
-rw-r--r-- | src/math/__rem_pio2f.c | 13 |
1 files changed, 12 insertions, 1 deletions
diff --git a/src/math/__rem_pio2f.c b/src/math/__rem_pio2f.c index 4473c1c4..e6765643 100644 --- a/src/math/__rem_pio2f.c +++ b/src/math/__rem_pio2f.c @@ -35,6 +35,7 @@ */ static const double toint = 1.5/EPS, +pio4 = 0x1.921fb6p-1, invpio2 = 6.36619772367581382433e-01, /* 0x3FE45F30, 0x6DC9C883 */ pio2_1 = 1.57079631090164184570e+00, /* 0x3FF921FB, 0x50000000 */ pio2_1t = 1.58932547735281966916e-08; /* 0x3E5110b4, 0x611A6263 */ @@ -50,10 +51,20 @@ int __rem_pio2f(float x, double *y) ix = u.i & 0x7fffffff; /* 25+53 bit pi is good enough for medium size */ if (ix < 0x4dc90fdb) { /* |x| ~< 2^28*(pi/2), medium size */ - /* Use a specialized rint() to get fn. Assume round-to-nearest. */ + /* Use a specialized rint() to get fn. */ fn = (double_t)x*invpio2 + toint - toint; n = (int32_t)fn; *y = x - fn*pio2_1 - fn*pio2_1t; + /* Matters with directed rounding. */ + if (predict_false(*y < -pio4)) { + n--; + fn--; + *y = x - fn*pio2_1 - fn*pio2_1t; + } else if (predict_false(*y > pio4)) { + n++; + fn++; + *y = x - fn*pio2_1 - fn*pio2_1t; + } return n; } if(ix>=0x7f800000) { /* x is inf or NaN */ |