Document what the compiler is doing for diffxi

2021-03-25 22:39:00 +01:00
parent 76f5291131
commit a33e1d37ba
2 changed files with 42 additions and 15 deletions
--- a/utils/constmatrix/src/lib.rs
+++ b/utils/constmatrix/src/lib.rs
@@ -123,10 +123,15 @@ impl<const M: usize, const P: usize> Matrix<Float, M, P> {
    ) {
        for i in 0..M {
            for j in 0..P {
-                let mut t = 0.0;
-                for k in 0..N {
+                // Slightly cheaper to compute the first product separately than
+                // to start the accumulator at zero and issue every term as an fma
+                let mut t = if N == 0 {
+                    0.0
+                } else {
+                    lhs[(i, 0)] * rhs[(0, j)]
+                };
+                for k in 1..N {
                    t = Float::mul_add(lhs[(i, k)], rhs[(k, j)], t);
-                    // t = t + lhs[(i, k)] * rhs[(k, j)];
                }
                self[(i, j)] = t;
            }