basic sqrt implementation

2022-06-10 13:08:45 +11:00 · 2022-06-10 13:08:45 +11:00 · 1a834c303d
parent 5890659112
commit 1a834c303d
7 changed files with 185 additions and 16 deletions
--- a/bake.cmd
+++ b/bake.cmd
@@ -51,4 +51,4 @@ del build\*.obj

 :skip_crt_compilation
 echo Compiling test..
-clang test\test4.c ciabatta.lib -std=c11 -lkernel32 -luser32 -lshell32 -nostdlib %CIABATTA_OPTIONS%
+clang test\test5.c ciabatta.lib -std=c11 -lkernel32 -luser32 -lshell32 -nostdlib %CIABATTA_OPTIONS%
--- a/code/math/ieee754.h
+++ b/code/math/ieee754.h
@@ -11,6 +11,7 @@
 #define f_nbits (1+f_ebits+f_mbits)
 #define f_emax  ((1ULL << (f_ebits-1)) - 1)
 #define f_emin  (1 - f_emax)
+#define f_ebias f_emax

 // Extracting fields from the float
 #define f_eoffs   (f_mbits)
@@ -22,8 +23,12 @@
 #define f_sval(b) (((b) >> f_soffs) & f_smask)
 #define f_mval(b) (((b) >> 0) & f_mmask)
 #define f_abs(b)  ((b) & ~(f_smask << f_soffs))
+#define f_exp(b)  (f_eval(b) - f_ebias)

-#define b_cons(s,e,m) ((s << f_soffs) | (e << f_eoffs) | (m))
+#define f_qexp(b) (f_eval(b) - f_ebias - f_mbits)
+#define f_qman(b) (((b) & f_mmask) | (f_mmask+1))
+
+#define b_cons(s,e,m) (((itype)(s) << f_soffs) | ((itype)(e) << f_eoffs) | (itype)(m)) // builds float bits from sign, exponent, mantissa; each argument is parenthesized so an expression argument is cast as a whole

 // Converting float to integer bits
 static inline itype suffix(f_bits)(ftype f) {
@@ -35,7 +40,7 @@ static inline itype suffix(f_bits)(ftype f) {
    return u.b;
 }

-static inline itype suffix(f_frombits)(itype b) {
+static inline ftype suffix(f_frombits)(itype b) {
    union _u {
        ftype f;
        itype b;
@@ -49,7 +54,7 @@ int suffix(_fpclassify)(ftype f) {
    itype bits = suffix(f_bits)(f);
    itype exp = f_eval(bits);
    itype man = f_mval(bits);
-    if(exp == f_emax) {
+    if(exp == f_emask) {
        if(man == 0) return FP_INFINITE;
        else return FP_NAN;
    }
--- a/code/math/math.c
+++ b/code/math/math.c
@@ -16,6 +16,7 @@ enum Ordering {
 #define f_mbits 23
 #define suffix(n) n ## f
 #include "ieee754.h"
+#include "pow.h"
 #undef suffix
 #undef f_mbits
 #undef f_ebits
@@ -28,6 +29,7 @@ enum Ordering {
 #define f_mbits 52
 #define suffix(n) n
 #include "ieee754.h"
+#include "pow.h"
 #undef suffix
 #undef f_mbits
 #undef f_ebits
@@ -42,7 +44,8 @@ _Static_assert(sizeof(long double) == sizeof(double),
 #define f_ebits 11
 #define f_mbits 52
 #define suffix(n) n ## l
-//#include "ieee754.h"
+#include "ieee754.h"
+#include "pow.h"
 #undef suffix
 #undef f_mbits
 #undef f_ebits
--- a/code/math/pow.h
+++ b/code/math/pow.h
@@ -0,0 +1,95 @@
+
+#include <errno.h>
+
+#if !defined(_isqrt_defined)
+#define _isqrt_defined
+static uint64_t _isqrt(uint64_t num, uint64_t *remp) {
+    // Integer square root, computed one binary digit at a time (long-hand method).
+    // Returns floor(sqrt(num)) and stores the remainder num - result^2 in *remp.
+    if(num == 0) {
+        *remp = 0;
+        return 0;
+    }
+    // Then, starting from the bottom, step through num in 2-bit pairs until
+    // i is the first even offset with nothing set at or above it (at most 64)
+    uint64_t i = 0;
+    while(i != (sizeof(uint64_t)*8) && (num >> i) != 0) {
+        i += 2;
+    }
+    // Then build the root from the top pair down, keeping the invariant
+    // sqrt^2 <= number formed by the bit pairs consumed so far
+    uint64_t sqrt = 0;
+    uint64_t rem = 0;
+    // Repeat until every pair has been consumed (i reaches zero):
+    do {
+        i -= 2;
+        // Bring the next two bits of the number down into our remainder
+        rem = (rem << 2) | ((num >> i) & 0x3);
+        // Find digit d such that d*(4*sqrt + d) <= rem
+        // Since d can only be 0 or 1 we simply check 1, otherwise it's 0
+        uint64_t d = 1;
+        uint64_t t = ((sqrt<<2)|1);
+        if(t <= rem) {
+            rem -= t;
+        }
+        else {
+            d = 0;
+        }
+        // Append the digit to sqrt from the right
+        sqrt = (sqrt<<1)|d;
+    } while(i != 0);
+
+    *remp = rem;
+    return sqrt;
+}
+#endif
+
+// Square root done in integer arithmetic: the float is split into mantissa
+// and exponent, the mantissa goes through _isqrt and the exponent is halved.
+// The result is truncated rather than rounded (the _isqrt remainder is unused).
+ftype suffix(sqrt)(ftype x) {
+    if(x < 0) { // negative input: report a domain error and return NaN
+        #if math_errhandling & MATH_ERRNO
+            errno = EDOM;
+        #endif
+        return NAN;
+    }
+    if(x == 0 || isinf(x)) { // zero and infinity are returned unchanged
+        return x;
+    }
+    if(isnan(x)) {
+        return NAN;
+    }
+    itype bits = suffix(f_bits)(x);
+    itype exp = f_qexp(bits); // unbiased exponent minus f_mbits, so that x = man * 2^exp
+    itype man = f_qman(bits); // NOTE(review): f_qman always sets the implicit leading bit, including for subnormal inputs — confirm
+    // Gain precision by shifting man left until its top bit sits at f_nbits-3
+    // and subtracting the shift from the exponent to compensate
+    itype bit = 0; // index of the highest set bit of man
+    while((man >> (bit+1)) != 0) ++bit;
+    itype prec_shift_n = f_nbits - bit - 3;
+    man <<= prec_shift_n;
+    exp -= prec_shift_n;
+    // Now take the sqrt of 2^exp * man
+    // If exp is odd then sqrt(2^{2k+1} * man) = 2^k * sqrt(2*man)
+    if((2 + (exp % 2)) % 2 != 0) { // NOTE(review): this parity form suggests exp may be negative; itype's signedness is not visible here — confirm
+        man <<= 1;
+    }
+    // Halve the exponent
+    exp >>= 1; // NOTE(review): for a negative exp this relies on how >> treats itype — confirm
+    // Take the integer sqrt of the mantissa
+    uint64_t rem; // remainder written by _isqrt; not read afterwards
+    man = (itype)_isqrt(man, &rem);
+    // Now sqrt(x) ~= 2^exp * man
+    // and we need to normalize it back into exponent/mantissa fields
+    bit = 0; // index of the highest set bit of man
+    while((man >> (bit+1)) != 0) ++bit;
+    exp += bit;
+    man <<= f_nbits-bit; // moves the leading 1 up to bit f_nbits; presumably that drops it off the top of itype — confirm itype is f_nbits wide
+    exp += f_ebias;
+    man >>= f_nbits-f_mbits; // keep the top f_mbits bits as the stored mantissa
+    man &= f_mmask;
+    // Reassemble the bits with sign 0 and convert back to a float
+    bits = b_cons(0, exp, man);
+    return suffix(f_frombits)(bits);
+}
--- a/code/printf.h
+++ b/code/printf.h
@@ -1,3 +1,7 @@
+
+//TODO: verify printf("%d", 0). From the code it looked like it would print
+// an empty string.
+
 // NOTE: this file doesn't exist in a vacuum, it's a template for generating
 // the formatted print, you should define FMT_CHAR_TYPE before including it
 inline static int FMT_FUNC_NAME (void *ctx, OutputFunc out, const FMT_CHAR_TYPE *fmt, va_list args) {
@@ -83,6 +87,9 @@ inline static int FMT_FUNC_NAME (void *ctx, OutputFunc out, const FMT_CHAR_TYPE
        }

        FMT_CHAR_TYPE ch = *fmt++;
+        const char* characters = "0123456789abcdef";
+        if (ch == 'X') characters = "0123456789ABCDEF";
+
        switch (ch) {
            case 'c': {
                const char chr = va_arg(args, int);
@@ -90,6 +97,45 @@ inline static int FMT_FUNC_NAME (void *ctx, OutputFunc out, const FMT_CHAR_TYPE
                full_length ++;
                break;
            }
+            case 'f':
+            case 'L': {
+                double d = va_arg(args, double);
+
+                if(isinf(d)) {
+                    out(ctx, sizeof"inf"-1, "inf");
+                    break;
+                }
+                else if(isnan(d)) {
+                    out(ctx, sizeof"nan"-1, "nan");
+                    break;
+                }
+
+                if(d < 0) { // TODO: negative zero
+                    out(ctx, 1, "-");
+                    d = -d;
+                }
+
+                uint64_t w = (uint64_t)d;
+                d -= w;
+                FMT_CHAR_TYPE buffer[20];
+                size_t len = sizeof(buffer);
+                do {
+                    buffer[--len] = characters[w % 10];
+                    w /= 10;
+                } while(w != 0);
+                out(ctx, sizeof(buffer) - (len * sizeof(FMT_CHAR_TYPE)), buffer + len);
+
+                char dot = '.';
+                out(ctx, 1, &dot);
+
+                for(int i = 0; i != 6; ++i) {
+                    d *= 10;
+                    int dv = (int)d;
+                    d -= dv;
+                    char digit = characters[dv];
+                    out(ctx, 1, &digit);
+                }
+            } break;
            case 's': {
                const FMT_CHAR_TYPE *str = va_arg(args, FMT_CHAR_TYPE*);
                size_t len = FMT_STRLEN_S(str, precision ? precision : SIZE_MAX);
@@ -114,9 +160,6 @@ inline static int FMT_FUNC_NAME (void *ctx, OutputFunc out, const FMT_CHAR_TYPE
                    default:            base = 10; break;
                }

-                const char* characters = "0123456789abcdef";
-                if (ch == 'X') characters = "0123456789ABCDEF";
-
                uintmax_t i;
                if (ch == 'd' || ch == 'i') {
                    intmax_t num = 0;
--- a/code/stdio.c
+++ b/code/stdio.c
@@ -2,6 +2,7 @@
 #include <stdarg.h>
 #include <ctype.h>
 #include <stdbool.h>
+#include <math.h>

 #include <_os.h>

--- a/test/test5.c
+++ b/test/test5.c
@@ -0,0 +1,22 @@
+
+#include <stdio.h>
+#include <math.h>
+
+void test_sqrt(float f) { // prints f next to sqrtf(f) for manual inspection; nothing is asserted
+    float s = sqrtf(f);
+    printf("sqrt of %f is %f\n", f, s); // both floats are promoted to double for %f
+}
+
+int main() { // runs test_sqrt over zero, perfect squares and non-squares
+    test_sqrt(0.0f); // takes the early-return path for zero
+    test_sqrt(1.0f);
+    test_sqrt(2.0f); // not a perfect square
+    test_sqrt(3.0f); // not a perfect square
+    test_sqrt(4.0f);
+    test_sqrt(7.0f); // not a perfect square
+    test_sqrt(9.0f);
+    test_sqrt(16.0f);
+    test_sqrt(256.0f);
+    test_sqrt(257.0f); // just above a perfect square
+    return 0;
+}