aboutsummaryrefslogtreecommitdiffstats
path: root/src
diff options
context:
space:
mode:
authorDavid Robillard <d@drobilla.net>2019-10-06 23:34:36 +0200
committerDavid Robillard <d@drobilla.net>2020-10-27 13:13:59 +0100
commit03e3b6c156f2b5809bfe0d65c52a1ad1df1da4fd (patch)
tree4c94c182d026bc91ba9d0ef4001d59df66c56591 /src
parent78c87ccdda887a4b49373cd2dfb20936e704a44a (diff)
downloadserd-03e3b6c156f2b5809bfe0d65c52a1ad1df1da4fd.tar.gz
serd-03e3b6c156f2b5809bfe0d65c52a1ad1df1da4fd.tar.bz2
serd-03e3b6c156f2b5809bfe0d65c52a1ad1df1da4fd.zip
Add precise floating point parsing
Diffstat (limited to 'src')
-rw-r--r--src/int_math.h1
-rw-r--r--src/string.c185
2 files changed, 182 insertions, 4 deletions
diff --git a/src/int_math.h b/src/int_math.h
index 85305a4a..d36a44d2 100644
--- a/src/int_math.h
+++ b/src/int_math.h
@@ -21,6 +21,7 @@
#define MIN(x, y) ((x) < (y) ? (x) : (y))
#define MAX(x, y) ((x) > (y) ? (x) : (y))
+#define CLAMP(x, l, h) MAX(l, MIN(h, x))
static const uint64_t POW10[] = {1ull,
10ull,
diff --git a/src/string.c b/src/string.c
index 2ef062e7..1f91862f 100644
--- a/src/string.c
+++ b/src/string.c
@@ -14,12 +14,15 @@
OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
*/
+#include "bigint.h"
+#include "ieee_float.h"
#include "int_math.h"
-#include "string_utils.h"
-
#include "serd/serd.h"
+#include "soft_float.h"
+#include "string_utils.h"
#include <assert.h>
+#include <float.h>
#include <math.h>
#include <stdbool.h>
#include <stdint.h>
@@ -212,12 +215,150 @@ serd_parse_double(const char* const str)
return result;
}
+static uint64_t
+normalize(SerdSoftFloat* value, const uint64_t error)
+{
+ const int original_e = value->e;
+
+ *value = soft_float_normalize(*value);
+
+ return error << (original_e - value->e);
+}
+
+/**
+ Return the error added by floating point multiplication.
+
+ Should be l + r + l*r/(2^64) + 0.5, but we short the denominator to 63 due
+ to lack of precision, which effectively rounds up.
+*/
+static inline uint64_t
+product_error(const uint64_t lerror,
+ const uint64_t rerror,
+ const uint64_t half_ulp)
+{
+ return lerror + rerror + ((lerror * rerror) >> 63) + half_ulp;
+}
+
+/**
+ Guess the binary floating point value for decimal input.
+
+ @param significand Significand from the input.
+ @param expt10 Decimal exponent from the input.
+ @param n_digits Number of decimal digits in the significand.
+ @param[out] guess Either the exact number, or its predecessor.
+ @return True if `guess` is correct.
+*/
+static bool
+sftod(const uint64_t significand,
+ const int expt10,
+ const int n_digits,
+ SerdSoftFloat* const guess)
+{
+ assert(expt10 <= max_dec_expt);
+ assert(expt10 >= min_dec_expt);
+
+ /* The general idea here is to try and find a power of 10 that we can
+ multiply by the significand to get the number. We get one from the
+ cache which is possibly too small, then multiply by another power of 10
+ to make up the difference if necessary. For example, with a target
+ power of 10^70, if we get 10^68 from the cache, then we multiply again
+ by 10^2. This, as well as normalization, accumulates error, which is
+ tracked throughout to know if we got the precise number. */
+
+ // Use a common denominator of 2^3 to avoid fractions
+ static const int lg_denom = 3;
+ static const uint64_t denom = 1 << 3;
+ static const uint64_t half_ulp = 4;
+
+ // Start out with just the significand, and no error
+ SerdSoftFloat input = {significand, 0};
+ uint64_t error = normalize(&input, 0);
+
+ // Get a power of 10 that takes us most of the way without overshooting
+ int cached_expt10 = 0;
+ SerdSoftFloat pow10 = soft_float_pow10_under(expt10, &cached_expt10);
+
+ // Get an exact fixup power if necessary
+ const int d_expt10 = expt10 - cached_expt10;
+ if (d_expt10) {
+ input = soft_float_multiply(input, soft_float_exact_pow10(d_expt10));
+ if (d_expt10 > uint64_digits10 - n_digits) {
+ error += half_ulp; // Product does not fit in an integer
+ }
+ }
+
+ // Multiply the significand by the power, normalize, and update the error
+ input = soft_float_multiply(input, pow10);
+ error = normalize(&input, product_error(error, half_ulp, half_ulp));
+
+ // Get the effective number of significant bits from the order of magnitude
+ const int magnitude = 64 + input.e;
+ const int real_magnitude = magnitude - dbl_subnormal_expt;
+ const int n_significant_bits = CLAMP(real_magnitude, 0, DBL_MANT_DIG);
+
+ // Calculate the number of "extra" bits of precision we have
+ int n_extra_bits = 64 - n_significant_bits;
+ if (n_extra_bits + lg_denom >= 64) {
+ // Very small subnormal where extra * denom does not fit in an integer
+ // Shift right (and accumulate some more error) to compensate
+ const int amount = (n_extra_bits + lg_denom) - 63;
+
+ input.f >>= amount;
+ input.e += amount;
+ error = product_error((error >> amount) + 1, half_ulp, half_ulp);
+ n_extra_bits -= amount;
+ }
+
+ // Calculate boundaries for the extra bits (with the common denominator)
+ assert(n_extra_bits < 64);
+ const uint64_t extra_mask = (1ull << n_extra_bits) - 1;
+ const uint64_t extra_bits = (input.f & extra_mask) * denom;
+ const uint64_t middle = (1ull << (n_extra_bits - 1)) * denom;
+ const uint64_t low = middle - error;
+ const uint64_t high = middle + error;
+
+ // Round to nearest representable double
+ guess->f = (input.f >> n_extra_bits) + (extra_bits >= high);
+ guess->e = input.e + n_extra_bits;
+
+ // Too inaccurate if the extra bits are within the error around the middle
+ return extra_bits <= low || extra_bits >= high;
+}
+
+static int
+compare_buffer(const char* buf, const int expt, const SerdSoftFloat upper)
+{
+ SerdBigint buf_bigint;
+ serd_bigint_set_decimal_string(&buf_bigint, buf);
+
+ SerdBigint upper_bigint;
+ serd_bigint_set_u64(&upper_bigint, upper.f);
+
+ if (expt >= 0) {
+ serd_bigint_multiply_pow10(&buf_bigint, (unsigned)expt);
+ } else {
+ serd_bigint_multiply_pow10(&upper_bigint, (unsigned)-expt);
+ }
+
+ if (upper.e > 0) {
+ serd_bigint_shift_left(&upper_bigint, (unsigned)upper.e);
+ } else {
+ serd_bigint_shift_left(&buf_bigint, (unsigned)-upper.e);
+ }
+
+ return serd_bigint_compare(&buf_bigint, &upper_bigint);
+}
double
-serd_strtod(const char* str, size_t* end)
+serd_strtod(const char* const str, size_t* const end)
{
#define SET_END(index) do { if (end) { *end = (size_t)(index); } } while (0)
+ static const int n_exact_pow10 = sizeof(POW10) / sizeof(POW10[0]);
+ static const int max_exact_int_digits = 15; // Digits that fit exactly
+ static const int max_decimal_power = 309; // Max finite power
+ static const int min_decimal_power = -324; // Min non-zero power
+
// Point s at the first non-whitespace character
const char* s = str;
while (is_space(*s)) {
@@ -250,5 +391,41 @@ serd_strtod(const char* str, size_t* end)
return (double)NAN;
}
- return in.sign * ((double)in.frac * pow(10, in.frac_expt));
+ const int expt = in.frac_expt;
+ const int result_power = in.n_digits + expt;
+
+ // Return early for simple exact cases
+ if (result_power > max_decimal_power) {
+ return (double)in.sign * (double)INFINITY;
+ } else if (result_power < min_decimal_power) {
+ return in.sign * 0.0;
+ } else if (in.n_digits < max_exact_int_digits) {
+ if (expt < 0 && -expt < n_exact_pow10) {
+ return in.sign * ((double)in.frac / (double)POW10[-expt]);
+ } else if (expt >= 0 && expt < n_exact_pow10) {
+ return in.sign * ((double)in.frac * (double)POW10[expt]);
+ }
+ }
+
+ // Try to guess the number using only soft floating point (fast path)
+ SerdSoftFloat guess = {0, 0};
+ const bool exact = sftod(in.frac, expt, in.n_digits, &guess);
+ const double g = soft_float_to_double(guess);
+ if (exact) {
+ return (double)in.sign * g;
+ }
+
+ // Not sure, guess is either the number or its predecessor (rare slow path)
+ // Compare it with the buffer using bigints to find out which
+ const SerdSoftFloat upper = {guess.f * 2 + 1, guess.e - 1};
+ const int cmp = compare_buffer(in.digits, in.digits_expt, upper);
+ if (cmp < 0) {
+ return in.sign * g;
+ } else if (cmp > 0) {
+ return in.sign * nextafter(g, (double)INFINITY);
+ } else if ((guess.f & 1) == 0) {
+ return in.sign * g; // Round towards even
+ } else {
+ return in.sign * nextafter(g, (double)INFINITY); // Round odd up
+ }
}