compile-time f32, f64 operations are now correctly lossy

previously we used the bigfloat abstraction to do all
compile-time float math. but runtime code and comptime code
are supposed to get the same result. so now if you add a
f32 to a f32 at compile time it does it with f32 math
instead of the bigfloat. float literals still get the
bigfloat math.

closes #424
This commit is contained in:
Andrew Kelley
2017-08-20 00:33:05 -04:00
parent c73a0c92d0
commit 09bd4a9a86
14 changed files with 808 additions and 110 deletions

View File

@@ -8,19 +8,19 @@
#include "bigfloat.hpp"
#include "bigint.hpp"
#include "buffer.hpp"
#include "quadmath.hpp"
#include <math.h>
#include <errno.h>
extern "C" {
__float128 fmodq(__float128 a, __float128 b);
__float128 ceilq(__float128 a);
__float128 floorq(__float128 a);
__float128 strtoflt128 (const char *s, char **sp);
int quadmath_snprintf (char *s, size_t size, const char *format, ...);
void bigfloat_init_128(BigFloat *dest, __float128 x) {
dest->value = x;
}
void bigfloat_init_32(BigFloat *dest, float x) {
dest->value = x;
}
void bigfloat_init_float(BigFloat *dest, __float128 x) {
void bigfloat_init_64(BigFloat *dest, double x) {
dest->value = x;
}
@@ -104,11 +104,13 @@ void bigfloat_mod(BigFloat *dest, const BigFloat *op1, const BigFloat *op2) {
dest->value = fmodq(fmodq(op1->value, op2->value) + op2->value, op2->value);
}
void bigfloat_write_buf(Buf *buf, const BigFloat *op) {
buf_resize(buf, 256);
int len = quadmath_snprintf(buf_ptr(buf), buf_len(buf), "%Qf", op->value);
void bigfloat_append_buf(Buf *buf, const BigFloat *op) {
const size_t extra_len = 100;
size_t old_len = buf_len(buf);
buf_resize(buf, old_len + extra_len);
int len = quadmath_snprintf(buf_ptr(buf) + old_len, extra_len, "%Qf", op->value);
assert(len > 0);
buf_resize(buf, len);
buf_resize(buf, old_len + len);
}
Cmp bigfloat_cmp(const BigFloat *op1, const BigFloat *op2) {
@@ -121,42 +123,15 @@ Cmp bigfloat_cmp(const BigFloat *op1, const BigFloat *op2) {
}
}
// TODO this is wrong when compiler running on big endian systems. caught by tests
void bigfloat_write_ieee597(const BigFloat *op, uint8_t *buf, size_t bit_count, bool is_big_endian) {
if (bit_count == 32) {
float f32 = op->value;
memcpy(buf, &f32, 4);
} else if (bit_count == 64) {
double f64 = op->value;
memcpy(buf, &f64, 8);
} else if (bit_count == 128) {
__float128 f128 = op->value;
memcpy(buf, &f128, 16);
} else {
zig_unreachable();
}
float bigfloat_to_f32(const BigFloat *bigfloat) {
return (float)bigfloat->value;
}
// TODO this is wrong when compiler running on big endian systems. caught by tests
void bigfloat_read_ieee597(BigFloat *dest, const uint8_t *buf, size_t bit_count, bool is_big_endian) {
if (bit_count == 32) {
float f32;
memcpy(&f32, buf, 4);
dest->value = f32;
} else if (bit_count == 64) {
double f64;
memcpy(&f64, buf, 8);
dest->value = f64;
} else if (bit_count == 128) {
__float128 f128;
memcpy(&f128, buf, 16);
dest->value = f128;
} else {
zig_unreachable();
}
double bigfloat_to_f64(const BigFloat *bigfloat) {
return (double)bigfloat->value;
}
double bigfloat_to_double(const BigFloat *bigfloat) {
__float128 bigfloat_to_f128(const BigFloat *bigfloat) {
return bigfloat->value;
}