ciabatta/src/math/bits.c


// This is a branchless version of fpclassify.
// (Note: MSVC does not actually compile it to branchless code.)
// The way it works is by assuming the following structure of float class
// bit 2 | bit 1 | bit 0
//   e       n      m
// e is 1 for infinities and nan, 0 otherwise
// n is 1 for normal numbers, 0 otherwise
// m is 1 for nan and subnormal numbers, 0 otherwise
// This leaves the following values for classes:
//  0 - FP_ZERO
//  1 - FP_SUBNORMAL
//  2 - FP_NORMAL
//  4 - FP_INFINITE
//  5 - FP_NAN
// Classify a double without branching.
//
// The result is assembled from three single-bit flags:
//   bit 2 - exponent field is all ones (infinity or NaN)
//   bit 1 - value is a normal number
//   bit 0 - mantissa is nonzero and the value is not normal
//           (subnormal or NaN)
// which yields 0 for zero, 1 for subnormal, 2 for normal, 4 for infinity
// and 5 for NaN.
int _fpclassify(f64 x) {
    // Pull the raw fields out of the encoding
    u64 raw = F64_BITS(x);
    i64 biased_exp = F64_BEXP(raw);
    i64 fraction = F64_MANT(raw);

    // Distance from the maximum exponent; zero only for infinity/NaN
    i64 exp_gap = F64_BEXP_MAX - biased_exp;
    i64 special_bit = (exp_gap == 0);

    // The product vanishes when the exponent is either all ones
    // (infinity, NaN) or all zeros (zero, subnormal), i.e. exactly when
    // the value is not a normal number
    i64 not_normal = ((exp_gap * biased_exp) == 0);
    i64 normal_bit = not_normal ^ 1;

    // A nonzero mantissa on a non-normal value means subnormal or NaN
    i64 low_bit = (fraction != 0) & not_normal;

    // Pack the three flags into the class code
    return (special_bit << 2) | (normal_bit << 1) | low_bit;
}

// Same recipe as above, different constants
// Classify a float without branching.
//
// The result is assembled from three single-bit flags:
//   bit 2 - exponent field equals F32_BEXP_MAX (infinity or NaN)
//   bit 1 - value is a normal number
//   bit 0 - mantissa is nonzero and the value is not normal
// giving 0 for zero, 1 for subnormal, 2 for normal, 4 for infinity and
// 5 for NaN.
int _fpclassifyf(float x) {
    u64 raw = F32_BITS(x);
    i64 biased_exp = F32_BEXP(raw);
    i64 fraction = F32_MANT(raw);

    // Zero only when the exponent field is at its maximum
    i64 exp_gap = F32_BEXP_MAX - biased_exp;
    i64 special_bit = (exp_gap == 0);

    // Zero product <=> exponent is all ones or all zeros <=> not normal
    i64 not_normal = ((exp_gap * biased_exp) == 0);
    i64 normal_bit = not_normal ^ 1;

    // Nonzero mantissa on a non-normal value: subnormal or NaN
    i64 low_bit = (fraction != 0) & not_normal;

    return (special_bit << 2) | (normal_bit << 1) | low_bit;
}

// Classify an fl64 by converting it to f64 and delegating to _fpclassify.
// NOTE(review): if fl64 is wider than f64 on some target, the conversion
// could change the class of extreme values - confirm.
int _fpclassifyl(fl64 x) {
    f64 narrowed = (f64)x;
    return _fpclassify(narrowed);
}


// Return the top bit (bit 63) of the double's encoding: 1 when the sign
// bit is set, 0 otherwise.
int _signbit(f64 x) {
    u64 raw = F64_BITS(x);
    return (int)(raw >> 63);
}

int _signbitf(float x) {
    return F32_BITS(x)>>31;
}

// Sign bit of an fl64, obtained by converting to f64 and delegating to
// _signbit.
int _signbitl(fl64 x) {
    f64 narrowed = (f64)x;
    return _signbit(narrowed);
}

// Build a double that has the magnitude bits of x and the sign bit of y.
f64 copysign(f64 x, f64 y) {
    const u64 sign_mask = UINT64_C(1) << 63;
    // Everything except the sign comes from x ...
    u64 magnitude = F64_BITS(x) & ~sign_mask;
    // ... and the sign alone comes from y
    u64 sign = F64_BITS(y) & sign_mask;
    u64 combined = magnitude | sign;
    return F64_CONS(combined);
}

// Build a float that has the magnitude bits of x and the sign bit of y.
//
// The result must be reassembled as a 32-bit float. Feeding the 32-bit
// pattern to the 64-bit constructor (F64_CONS) would reinterpret it as a
// double and produce a wrong value, so the bits are punned through a
// float/uint32_t union instead.
float copysignf(float x, float y) {
    union { float f; uint32_t i; } xv = { .f = x };
    union { float f; uint32_t i; } yv = { .f = y };
    const uint32_t sign_mask = UINT32_C(1) << 31;

    // Keep x's exponent and mantissa, take only the sign from y
    xv.i = (xv.i & ~sign_mask) | (yv.i & sign_mask);
    return xv.f;
}

// copysign for fl64: both arguments are converted to f64 and the work is
// delegated to copysign.
fl64 copysignl(fl64 x, fl64 y) {
    f64 magnitude_src = (f64)x;
    f64 sign_src = (f64)y;
    return copysign(magnitude_src, sign_src);
}

// Return a NaN as an f64. The tag string s is ignored.
f64 nan(const char *s) {
    (void)s; // tag is not interpreted
    f64 result = NAN;
    return result;
}

// Return a NaN as a float. The tag string s is ignored.
float nanf(const char *s) {
    (void)s; // tag is not interpreted
    float result = NAN;
    return result;
}

// Return a NaN as an fl64. The tag string s is ignored.
fl64 nanl(const char *s) {
    (void)s; // tag is not interpreted
    fl64 result = NAN;
    return result;
}