ooples
diff --git a/‎src/Metrics/FrechetInceptionDistance.cs‎
Lines changed: 156 additions & 16 deletions b/‎src/Metrics/FrechetInceptionDistance.cs‎
Lines changed: 156 additions & 16 deletions
@@ -232,36 +232,176 @@ private double ComputeFrechetDistance(
                 meanDiffSq = NumOps.Add(meanDiffSq, NumOps.Multiply(diff, diff));
             }
 
-            // 2. Compute trace of covariance matrices: Tr(Σ₁ + Σ₂)
-            var traceCov = NumOps.Zero;
-            for (int i = 0; i < cov1.Rows; i++)
-            {
-                traceCov = NumOps.Add(traceCov, cov1[i, i]);
-                traceCov = NumOps.Add(traceCov, cov2[i, i]);
-            }
-
-            // 3. Compute sqrt(Σ₁ * Σ₂) using simplified approximation
-            // Full implementation would use proper matrix square root
-            // For now, use trace approximation: Tr(2√(Σ₁Σ₂)) ≈ 2√(Tr(Σ₁)Tr(Σ₂))
+            // 2. Compute trace of covariance matrices: Tr(Σ₁) + Tr(Σ₂)
             var trace1 = NumOps.Zero;
             var trace2 = NumOps.Zero;
             for (int i = 0; i < cov1.Rows; i++)
             {
                 trace1 = NumOps.Add(trace1, cov1[i, i]);
                 trace2 = NumOps.Add(trace2, cov2[i, i]);
             }
+            var traceCov = NumOps.Add(trace1, trace2);
 
-            var covProduct = NumOps.Multiply(trace1, trace2);
-            var sqrtCovProduct = NumOps.Sqrt(covProduct);
-            var traceSqrtCovProduct = NumOps.Multiply(NumOps.FromDouble(2.0), sqrtCovProduct);
+            // 3. Compute Tr(√(Σ₁Σ₂)) using proper matrix square root
+            // For symmetric positive semi-definite matrices, we compute the product
+            // and then find the trace of its square root
+            var traceSqrtCovProduct = ComputeTraceSqrtCovProduct(cov1, cov2);
 
-            // FID = ||μ₁ - μ₂||² + Tr(Σ₁ + Σ₂ - 2√(Σ₁Σ₂))
+            // FID = ||μ₁ - μ₂||² + Tr(Σ₁) + Tr(Σ₂) - 2*Tr(√(Σ₁Σ₂))
             var fid = NumOps.Add(meanDiffSq, traceCov);
-            fid = NumOps.Subtract(fid, traceSqrtCovProduct);
+            fid = NumOps.Subtract(fid, NumOps.Multiply(NumOps.FromDouble(2.0), traceSqrtCovProduct));
 
             return Convert.ToDouble(fid);
         }
 
+        /// <summary>
+        /// Computes Tr(√(Σ₁Σ₂)) using the coupled Newton-Schulz iteration for the matrix square root.
+        /// </summary>
+        /// <param name="cov1">First covariance matrix Σ₁; its row count sets the dimension n.</param>
+        /// <param name="cov2">Second covariance matrix Σ₂, indexed as an n × n matrix.</param>
+        /// <returns>
+        /// An approximation of the trace of the principal square root of Σ₁Σ₂,
+        /// or zero when the Frobenius norm of Σ₁Σ₂ is below 1e-10.
+        /// </returns>
+        /// <remarks>
+        /// With A = Σ₁Σ₂ the coupled iteration is
+        ///   Y₀ = A / ‖A‖_F,  Z₀ = I,
+        ///   S_k = ½(3I − Z_k Y_k),  Y_{k+1} = Y_k S_k,  Z_{k+1} = S_k Z_k,
+        /// for which Y_k → √(A / ‖A‖_F) and Z_k → (A / ‖A‖_F)^(-1/2), so that
+        /// Tr(√A) = √‖A‖_F · Tr(Y). The single-matrix recurrence Y ← ½·Y(3I − Y²) must not
+        /// be used here: it is the Newton-Schulz iteration for the matrix sign function and
+        /// drives a positive definite iterate towards the identity, not towards √A.
+        /// </remarks>
+        private T ComputeTraceSqrtCovProduct(Matrix<T> cov1, Matrix<T> cov2)
+        {
+            int n = cov1.Rows;
+
+            // A = Σ₁Σ₂. The product is deliberately NOT symmetrized: A shares its eigenvalues
+            // with the PSD matrix Σ₁^(1/2) Σ₂ Σ₁^(1/2), so they are already real and non-negative,
+            // whereas (A + Aᵀ) / 2 has a different spectrum and hence a different Tr(√·).
+            var product = MatrixMultiply(cov1, cov2);
+
+            // ‖A‖_F bounds the spectral radius, so A / ‖A‖_F has its eigenvalues in [0, 1].
+            var frobNormSq = NumOps.Zero;
+            for (int i = 0; i < n; i++)
+            {
+                for (int j = 0; j < n; j++)
+                {
+                    frobNormSq = NumOps.Add(frobNormSq, NumOps.Multiply(product[i, j], product[i, j]));
+                }
+            }
+            var frobNorm = NumOps.Sqrt(frobNormSq);
+
+            // If the product is essentially zero, so is its square root.
+            if (NumOps.LessThan(frobNorm, NumOps.FromDouble(1e-10)))
+            {
+                return NumOps.Zero;
+            }
+
+            // Y₀ = A / ‖A‖_F, Z₀ = I.
+            var Y = new Matrix<T>(n, n);
+            for (int i = 0; i < n; i++)
+            {
+                for (int j = 0; j < n; j++)
+                {
+                    Y[i, j] = NumOps.Divide(product[i, j], frobNorm);
+                }
+            }
+            var Z = Matrix<T>.CreateIdentity(n);
+
+            // Run for a fixed number of iterations.
+            // NOTE(review): the count of 15 is kept from the previous implementation; strongly
+            // ill-conditioned products may need more — confirm against reference FID values.
+            const int maxIterations = 15;
+            var half = NumOps.FromDouble(0.5);
+            var three = NumOps.FromDouble(3.0);
+
+            for (int iter = 0; iter < maxIterations; iter++)
+            {
+                // step = ½(3I − Z·Y)
+                var ZY = MatrixMultiply(Z, Y);
+                var step = new Matrix<T>(n, n);
+                for (int i = 0; i < n; i++)
+                {
+                    for (int j = 0; j < n; j++)
+                    {
+                        var diagonal = i == j ? three : NumOps.Zero;
+                        step[i, j] = NumOps.Multiply(half, NumOps.Subtract(diagonal, ZY[i, j]));
+                    }
+                }
+
+                // Both updates use the same step, computed from the previous Y and Z.
+                Y = MatrixMultiply(Y, step);
+                Z = MatrixMultiply(step, Z);
+            }
+
+            // √A ≈ √‖A‖_F · Y, hence Tr(√A) ≈ √‖A‖_F · Tr(Y).
+            var traceY = NumOps.Zero;
+            for (int i = 0; i < n; i++)
+            {
+                traceY = NumOps.Add(traceY, Y[i, i]);
+            }
+
+            return NumOps.Multiply(NumOps.Sqrt(frobNorm), traceY);
+        }
+
+        /// <summary>
+        /// Returns the product a · b, treating both operands as n × n with n = a.Rows.
+        /// </summary>
+        private Matrix<T> MatrixMultiply(Matrix<T> a, Matrix<T> b)
+        {
+            int size = a.Rows;
+            var product = new Matrix<T>(size, size);
+            for (int row = 0; row < size; row++)
+            {
+                for (int col = 0; col < size; col++)
+                {
+                    var dot = NumOps.Zero;
+                    for (int inner = 0; inner < size; inner++)
+                    {
+                        var term = NumOps.Multiply(a[row, inner], b[inner, col]);
+                        dot = NumOps.Add(dot, term);
+                    }
+                    product[row, col] = dot;
+                }
+            }
+
+            return product;
+        }
+
         /// <summary>
         /// Computes FID using pre-computed statistics.
         /// Useful when you want to compare against a fixed set of real images.