branchless fpclassify

2022-08-05 22:47:19 +11:00 · 2022-08-05 22:47:19 +11:00 · bfaa80c628
parent bc443e31c3
commit bfaa80c628
9 changed files with 141 additions and 88 deletions
--- a/bake-test.cmd
+++ b/bake-test.cmd
@ -1 +0,0 @@
-clang test\test_%test%.c utf8.obj -Iinc -g -lciabatta.lib
--- a/inc/math.h
+++ b/inc/math.h
@ -23,11 +23,11 @@ typedef double double_t;
 #define math_errhandling (MATH_ERRNO | MATH_ERREXCEPT)

 // Classification
-#define FP_INFINITE  0
-#define FP_NAN       1
+#define FP_ZERO      0
+#define FP_SUBNORMAL 1
 #define FP_NORMAL    2
-#define FP_SUBNORMAL 3
-#define FP_ZERO      4
+#define FP_INFINITE  4
+#define FP_NAN       5
 int     _fpclassify(double);
 int     _fpclassifyf(float);
 int     _fpclassifyl(long double);
--- a/inc/stdio.h
+++ b/inc/stdio.h
@ -27,7 +27,7 @@
 typedef struct FILE FILE;

 typedef struct {
-    int64_t   offset;
+    unsigned long long offset;
    mbstate_t mbstate;
 } fpos_t;

--- a/src/ciabatta.c
+++ b/src/ciabatta.c
@ -46,7 +46,7 @@
 #include "math/basic.c"
 #include "math/division.c"
 #include "math/gen_math.c"
-#include "math/ieee754.c"
+#include "math/bits.c"
 #include "math/round.c"
 #include "conv/digits.c"
 #include "conv/strpfx.c"
--- a/src/math/bits.c
+++ b/src/math/bits.c
@ -0,0 +1,106 @@
+
+// NOTE: MSVC does not compile this function to branchless code.
+// This is a branchless version of fpclassify.
+// It works by assembling the float class from three bits laid out as follows:
+// bit 2 | bit 1 | bit 0
+//   e       n      m
+// e is 1 for infinities and nan, 0 otherwise
+// n is 1 for normal numbers, 0 otherwise
+// m is 1 for nan and subnormal numbers, 0 otherwise
+// This leaves the following values for classes:
+//  0 - FP_ZERO
+//  1 - FP_SUBNORMAL
+//  2 - FP_NORMAL
+//  4 - FP_INFINITE
+//  5 - FP_NAN
+int _fpclassify(f64 x) {
+    // First, extract bits
+    u64 bits = F64_BITS(x);
+    i64 exp  = F64_BEXP(bits);
+    i64 mant = F64_MANT(bits);
+    // Get the number that's only zero when exp = 0x7ff
+    i64 ee = F64_BEXP_MAX - exp;
+    // Logically negate it to get a number that's 1 iff x is infinity or NaN
+    i64 e = !(ee);
+    // The value (ee*exp) is zero in two cases:
+    //   exp = 0x7ff, (infinities, nan)
+    //   exp = 0 (zero, subnormal)
+    // We logically negate it so that nn is 1 iff the number is not normal
+    // (that is: zero, subnormal, infinity or NaN)
+    i64 nn = !(ee*exp);
+    // Logically negate nn. Now n is 1 iff the number is normal
+    i64 n = !nn;
+    // m is 1 if mantissa is nonzero and the number is not normal
+    i64 m = !!mant & nn;
+    // Construct the float class
+    return (e<<2) | (n<<1) | m;
+}
+
+// Same recipe as above, different constants
+int _fpclassifyf(float x) {
+    u64 bits = F32_BITS(x);
+    i64 exp  = F32_BEXP(bits);
+    i64 mant = F32_MANT(bits);
+    i64 ee = F32_BEXP_MAX - exp;
+    i64 e = !(ee);
+    i64 nn = !(ee*exp);
+    i64 n = !nn;
+    i64 m = !!mant & nn;
+    return (e<<2) | (n<<1) | m;
+}
+
+int _fpclassifyl(fl64 x) {
+    return _fpclassify((f64)x);
+}
+
+
+int _signbit(f64 x) {
+    union {
+        f64 d;
+        uint64_t i;
+    } y = { x };
+    return y.i>>63;
+}
+
+int _signbitf(float x) {
+    union {
+        float f;
+        uint32_t i;
+    } y = { x };
+    return y.i>>31;
+}
+
+int _signbitl(fl64 x) {
+    return _signbit(x);
+}
+
+f64 copysign(f64 x, f64 y) {
+    union {f64 f; uint64_t i;} ux={x}, uy={y};
+    ux.i &= ~(1ULL<<63);
+    ux.i |= uy.i & (1ULL<<63);
+    return ux.f;
+}
+
+float copysignf(float x, float y) {
+    union {float f; uint32_t i;} ux={x}, uy={y};
+    ux.i &= 0x7fffffff;
+    ux.i |= uy.i & 0x80000000;
+    return ux.f;
+}
+
+fl64 copysignl(fl64 x, fl64 y) {
+    return copysign(x, y);
+}
+
+f64 nan(const char *s) {
+    return NAN;
+}
+
+float nanf(const char *s) {
+    return NAN;
+}
+
+fl64 nanl(const char *s) {
+    return NAN;
+}
+
--- a/src/math/ieee754.c
+++ b/src/math/ieee754.c
@ -1,77 +0,0 @@
-
-#include <math.h>
-#include <fenv.h>
-#include <stdint.h>
-#include <float.h>
-
-int _fpclassify(double x) {
-    union {double f; uint64_t i;} u = {x};
-    int e = u.i>>52 & 0x7ff;
-    if (!e) return u.i<<1 ? FP_SUBNORMAL : FP_ZERO;
-    if (e==0x7ff) return u.i<<12 ? FP_NAN : FP_INFINITE;
-    return FP_NORMAL;
-}
-
-int _fpclassifyf(float x) {
-    union {float f; uint32_t i;} u = {x};
-    int e = u.i>>23 & 0xff;
-    if (!e) return u.i<<1 ? FP_SUBNORMAL : FP_ZERO;
-    if (e==0xff) return u.i<<9 ? FP_NAN : FP_INFINITE;
-    return FP_NORMAL;
-}
-
-int _fpclassifyl(long double x) {
-    return _fpclassify(x);
-}
-
-
-int _signbit(double x) {
-    union {
-        double d;
-        uint64_t i;
-    } y = { x };
-    return y.i>>63;
-}
-
-int _signbitf(float x) {
-    union {
-        float f;
-        uint32_t i;
-    } y = { x };
-    return y.i>>31;
-}
-
-int _signbitl(long double x) {
-    return _signbit(x);
-}
-
-double copysign(double x, double y) {
-    union {double f; uint64_t i;} ux={x}, uy={y};
-    ux.i &= ~(1ULL<<63);
-    ux.i |= uy.i & (1ULL<<63);
-    return ux.f;
-}
-
-float copysignf(float x, float y) {
-    union {float f; uint32_t i;} ux={x}, uy={y};
-    ux.i &= 0x7fffffff;
-    ux.i |= uy.i & 0x80000000;
-    return ux.f;
-}
-
-long double copysignl(long double x, long double y) {
-    return copysign(x, y);
-}
-
-double nan(const char *s) {
-    return NAN;
-}
-
-float nanf(const char *s) {
-    return NAN;
-}
-
-long double nanl(const char *s) {
-    return NAN;
-}
-
--- a/src/util.c
+++ b/src/util.c
@ -44,8 +44,30 @@ typedef wchar_t wchar;
 #define STR_(a) #a
 #define STR(a) STR_(a)

-#define DOUBLE_BITS(x) ((union {double f; u64 i;}){x}).i
-#define DOUBLE_CONS(x) ((union {double f; u64 i;}){x}).f
-#define FLOAT_BITS(x)  ((union {float f;  u32 i;}){x}).i
-#define FLOAT_CONS(x)  ((union {float f;  u32 i;}){x}).f
+#define F64_BITS(x) ((union {f64 f; u64 i;}){x}).i
+#define F64_CONS(x) ((union {f64 f; u64 i;}){x}).f
+#define F32_BITS(x) ((union {f32 f; u32 i;}){x}).i
+#define F32_CONS(x) ((union {f32 f; u32 i;}){x}).f

+#define F64_MANT_MASK UINT64_C(0xfffffffffffff)
+#define F64_MANT_MAX  UINT64_C(0xfffffffffffff)
+#define F64_MANT_BITS 52
+#define F64_BEXP_BITS 11
+#define F64_BEXP_MASK 0x7ff
+#define F64_BEXP_MAX  0x7ff
+
+#define F32_MANT_MASK 0x7fffff
+#define F32_MANT_MAX  0x7fffff
+#define F32_MANT_BITS 23
+#define F32_BEXP_BITS 8
+#define F32_BEXP_MASK 0xff
+#define F32_BEXP_MAX  0xff
+
+
+#define F64_SIGN(bits) (bits >> (F64_MANT_BITS + F64_BEXP_BITS))
+#define F64_BEXP(bits) ((bits >> F64_MANT_BITS) & F64_BEXP_MASK)
+#define F64_MANT(bits) ((bits) & F64_MANT_MASK)
+
+#define F32_SIGN(bits) (bits >> (F32_MANT_BITS + F32_BEXP_BITS))
+#define F32_BEXP(bits) ((bits >> F32_MANT_BITS) & F32_BEXP_MASK)
+#define F32_MANT(bits) ((bits) & F32_MANT_MASK)
--- a/test.cmd
+++ b/test.cmd
@ -0,0 +1,2 @@
+
+clang test\%1 utf8.obj -Iinc -g -lciabatta.lib -nostdlib
--- a/test/test_math.c
+++ b/test/test_math.c
@ -5,6 +5,7 @@
 #include <fenv.h>
 #include <inttypes.h>
 #include <errno.h>
+#include <limits.h>

 const char *show_classification(double x) {
    switch(fpclassify(x)) {
				`@ -1 +0,0 @@`
				`clang test\test_%test%.c utf8.obj -Iinc -g -lciabatta.lib`
				`@ -0,0 +1,2 @@`

				`clang test\%1 utf8.obj -Iinc -g -lciabatta.lib -nostdlib`