SCIInstitute
diff --git a/‎Libs/Optimize/Function/CorrespondenceFunction.cpp‎
Lines changed: 290 additions & 56 deletions b/‎Libs/Optimize/Function/CorrespondenceFunction.cpp‎
Lines changed: 290 additions & 56 deletions
@@ -1,7 +1,6 @@
 
 #include "CorrespondenceFunction.h"
 
-#include <Libs/Utils/PlatformUtils.h>
 #include <math.h>
 
 #include "Libs/Utils/Utils.h"
@@ -12,7 +11,6 @@
 namespace shapeworks {
 
 void CorrespondenceFunction::ComputeUpdates(const ParticleSystem* c) {
-  TIME_SCOPE("CorrespondenceFunction::ComputeUpdates");
   num_dims = m_ShapeData->rows();
   num_samples = m_ShapeData->cols();
 
@@ -26,6 +24,147 @@ void CorrespondenceFunction::ComputeUpdates(const ParticleSystem* c) {
 
   m_PointsUpdate->fill(0.0);
 
+  // Lazy precomputation: do it on first call when shape data is populated
+  if (m_NeedsPrecomputation && !m_HasPrecomputedFixedDomains && num_samples > 0) {
+    m_NeedsPrecomputation = false;
+    PrecomputeForFixedDomains(c);
+  }
+
+  // =========================================================================
+  // FIXED SHAPE SPACE PATH: Use precomputed data if available
+  // =========================================================================
+  if (m_HasPrecomputedFixedDomains && !m_UseMeanEnergy) {
+    TIME_SCOPE("ComputeUpdates::FixedShapeSpace");
+
+    // Use precomputed mean from fixed shapes
+    m_points_mean = m_FixedMean;
+
+    // For each non-fixed shape, compute its gradient using precomputed data
+    vnl_matrix_type Q(num_dims, num_samples);
+    Q.fill(0.0);
+
+    // Compute centered data for all shapes using fixed mean
+    vnl_matrix_type points_minus_mean(num_dims, num_samples);
+    for (int j = 0; j < num_samples; j++) {
+      for (int i = 0; i < num_dims; i++) {
+        points_minus_mean(i, j) = m_ShapeData->get(i, j) - (*m_FixedMean)(i, 0);
+      }
+    }
+
+    // Create Eigen maps for precomputed matrices (VNL uses row-major storage)
+    Eigen::Map<Eigen::Matrix<double, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>> Y_fixed_map(
+        m_FixedY->data_block(), num_dims, m_PrecomputedNumFixedSamples);
+    Eigen::Map<Eigen::Matrix<double, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>> GradientBasis_map(
+        m_FixedGradientBasis->data_block(), num_dims, m_PrecomputedNumFixedSamples);
+    Eigen::Map<Eigen::Matrix<double, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>> pinvMat_map(
+        m_FixedPinvMat->data_block(), m_PrecomputedNumFixedSamples, m_PrecomputedNumFixedSamples);
+
+    // Regularization denominator
+    const double N = m_PrecomputedNumFixedSamples - 1;
+    const double N_sq = N * N;
+
+    // For each non-fixed shape, compute gradient using Schur complement
+    for (int j = 0; j < num_samples; j++) {
+      // Check if this shape is fixed (skip gradient computation for fixed shapes)
+      bool is_fixed = false;
+      for (int idx : m_FixedDomainIndices) {
+        if (idx == j) {
+          is_fixed = true;
+          break;
+        }
+      }
+
+      if (!is_fixed) {
+        // Extract y_j from points_minus_mean column (VNL is row-major, so column is strided)
+        Eigen::VectorXd y_j(num_dims);
+        for (int i = 0; i < num_dims; i++) {
+          y_j[i] = points_minus_mean(i, j);
+        }
+
+        // proj = Y_fixed^T * y_j  (N_fixed × 1)
+        Eigen::VectorXd proj = Y_fixed_map.transpose() * y_j;
+
+        // grad = GradientBasis * proj  (num_dims × 1)
+        Eigen::VectorXd grad = GradientBasis_map * proj;
+
+        // pinv_proj = pinvMat_fixed * proj  (N_fixed × 1)
+        Eigen::VectorXd pinv_proj = pinvMat_map * proj;
+
+        // Schur complement scalars
+        double y_j_norm_sq = y_j.squaredNorm();
+        double proj_pinv_proj = proj.dot(pinv_proj);
+
+        // s = ||y_j||^2/N + α - proj^T * pinvMat * proj / N^2
+        double s = y_j_norm_sq / N + m_MinimumVariance - proj_pinv_proj / N_sq;
+
+        // Q[:, j] = (y_j - grad / N) / s
+        for (int i = 0; i < num_dims; i++) {
+          Q(i, j) = (y_j[i] - grad[i] / N) / s;
+        }
+      }
+    }
+
+    // Now compute the updates from Q (same as original code)
+    {
+      vnl_matrix_type Jmatrix;
+      vnl_matrix_type v;
+      for (int j = 0; j < num_samples; j++) {
+        int num = 0;
+        int num2 = 0;
+        for (unsigned int d = 0; d < m_DomainsPerShape; d++) {
+          int dom = d + j * m_DomainsPerShape;
+          if (c->GetDomainFlag(dom) == false) {
+            if (d > 0) {
+              num += m_AttributesPerDomain[d - 1] * c->GetNumberOfParticles(d - 1);
+              if (m_UseXYZ[d - 1]) num += 3 * c->GetNumberOfParticles(d - 1);
+              if (m_UseNormals[d - 1]) num += 3 * c->GetNumberOfParticles(d - 1);
+              num2 += VDimension * c->GetNumberOfParticles(d - 1);
+            }
+
+            int num_attr = m_AttributesPerDomain[d];
+            if (m_UseXYZ[d]) num_attr += 3;
+            if (m_UseNormals[d]) num_attr += 3;
+
+            Jmatrix.clear();
+            Jmatrix.set_size(num_attr, VDimension);
+            Jmatrix.fill(0.0);
+            v.clear();
+            v.set_size(num_attr, 1);
+            v.fill(0.0);
+
+            for (unsigned int p = 0; p < c->GetNumberOfParticles(dom); p++) {
+              v = Q.extract(num_attr, 1, num + p * num_attr, j);
+              Jmatrix = m_ShapeGradient->extract(num_attr, 3, num + p * num_attr, 3 * j);
+              vnl_matrix_type dx = Jmatrix.transpose() * v;
+              for (unsigned int vd = 0; vd < VDimension; vd++) {
+                m_PointsUpdate->put(num2 + p * VDimension + vd, j, dx(vd, 0));
+              }
+            }
+          }
+        }
+      }
+    }
+
+    // Compute energy using precomputed eigenvalues
+    m_CurrentEnergy = 0.0;
+    m_MinimumEigenValue = (*m_FixedW)(0, 0);
+    for (int i = 0; i < m_PrecomputedNumFixedSamples; i++) {
+      double w_i = (*m_FixedW)(i, i);
+      double val = w_i * w_i / (m_PrecomputedNumFixedSamples - 1) + m_MinimumVariance;
+      if (val < m_MinimumEigenValue) m_MinimumEigenValue = val;
+      m_CurrentEnergy += log(val);
+    }
+    m_CurrentEnergy /= 2.0;
+
+    return;  // Done with fixed shape space path
+  }
+
+  // =========================================================================
+  // ORIGINAL PATH: Full computation (no precomputed data or using mean energy)
+  // =========================================================================
+  // Use different profiling scopes to distinguish mean energy (init) vs entropy (optimize)
+  TIME_SCOPE(m_UseMeanEnergy ? "ComputeUpdates::MeanEnergy" : "ComputeUpdates::Entropy");
+
   vnl_matrix_type points_minus_mean(num_dims, num_samples, 0.0);
 
   m_points_mean->clear();
@@ -44,7 +183,6 @@ void CorrespondenceFunction::ComputeUpdates(const ParticleSystem* c) {
 
   if (this->m_UseMeanEnergy) {
     pinvMat.set_identity();
-    m_InverseCovMatrix->setZero();
   } else {
     TIME_START("correspondence::gramMat");
 
@@ -75,40 +213,9 @@ void CorrespondenceFunction::ComputeUpdates(const ParticleSystem* c) {
     pinvMat = (UG * invLambda) * UG.transpose();
     TIME_STOP("correspondence::pinvMat");
 
-    TIME_START("correspondence::lhs_rhs");
-
-    // Create Eigen maps for the VNL matrices
-    Eigen::Map<Eigen::Matrix<double, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>> UG_map(UG.data_block(),
-                                                                                              UG.rows(), UG.cols());
-    // Create temporary Eigen matrices for the computations
-    Eigen::MatrixXd projMat_eigen = points_minus_mean_map * UG_map;
-
-    // Convert invLambda diagonal matrix to Eigen
-    // Since invLambda is a vnl_diag_matrix, we'll need to extract the diagonal
-    Eigen::VectorXd invLambda_diag(invLambda.size());
-    for (int i = 0; i < invLambda.size(); i++) {
-      invLambda_diag(i) = invLambda(i, i);
-    }
-    Eigen::DiagonalMatrix<double, Eigen::Dynamic> invLambda_eigen(invLambda_diag);
-
-    // Perform the computations using Eigen
-    const auto lhs = projMat_eigen * invLambda_eigen;
-    const auto rhs = invLambda_eigen * projMat_eigen.transpose();
-    TIME_STOP("correspondence::lhs_rhs");
-
-    // resize the inverse covariance matrix if necessary
-    if (m_InverseCovMatrix->rows() != num_dims || m_InverseCovMatrix->cols() != num_dims) {
-      m_InverseCovMatrix->resize(num_dims, num_dims);
-    }
-
-    TIME_START("correspondence::covariance_multiply");
-    if (PlatformUtils::is_macos()) {
-      // this is about 2x faster on MacOS, but slower on Linux
-      m_InverseCovMatrix->selfadjointView<Eigen::Upper>().rankUpdate(lhs);
-    } else {
-      m_InverseCovMatrix->noalias() = lhs * rhs;
-    }
-    TIME_STOP("correspondence::covariance_multiply");
+    // Note: The full dM × dM inverse covariance matrix is NOT needed.
+    // Per thesis equation 2.35, the gradient is simply: Y × (Y^T Y + αI)^{-1}
+    // which is Y × pinvMat. No covariance_multiply required.
   }
 
   vnl_matrix_type Q = points_minus_mean * pinvMat;
@@ -208,28 +315,15 @@ CorrespondenceFunction::VectorType CorrespondenceFunction::evaluate(unsigned int
     num += num1 * system->GetNumberOfParticles(i);
   }
 
-  vnl_matrix_type tmp1(sz_Yidx, sz_Yidx, 0.0);
-
-  if (this->m_UseMeanEnergy) {
-    tmp1.set_identity();
-  } else {
-    // extract 3x3 submatrix at k,k
-    Eigen::MatrixXd region = m_InverseCovMatrix->block(sz_Yidx, sz_Yidx, 3, 3);
-    // convert to vnl
-    for (unsigned int i = 0; i < 3; i++) {
-      for (unsigned int j = 0; j < 3; j++) {
-        tmp1(i, j) = region(i, j);
-      }
-    }
-  }
-
+  // Per-particle energy: squared Euclidean distance from mean
+  // This is used for line search step-size adaptation.
+  // Note: We always use Euclidean distance (identity matrix) regardless of m_UseMeanEnergy,
+  // because the full inverse covariance matrix is not computed.
   vnl_matrix_type Y_dom_idx(sz_Yidx, 1, 0.0);
-
   Y_dom_idx = m_ShapeData->extract(sz_Yidx, 1, num, sampNum) - m_points_mean->extract(sz_Yidx, 1, num);
 
-  vnl_matrix_type tmp = Y_dom_idx.transpose() * tmp1;
-  tmp *= Y_dom_idx;
-
+  // energy = ||y - mean||^2
+  vnl_matrix_type tmp = Y_dom_idx.transpose() * Y_dom_idx;
   energy = tmp(0, 0);
 
   maxdt = m_MinimumEigenValue;
@@ -246,4 +340,144 @@ CorrespondenceFunction::VectorType CorrespondenceFunction::evaluate(unsigned int
   return system->TransformVector(gradE, system->GetInversePrefixTransform(d) * system->GetInverseTransform(d));
 }
 
+//---------------------------------------------------------------------------
+void CorrespondenceFunction::ClearPrecomputedFixedDomains() {
+  m_HasPrecomputedFixedDomains = false;
+  m_PrecomputedNumFixedSamples = 0;
+  m_PrecomputedNumDims = 0;
+  m_FixedMean.reset();
+  m_FixedY.reset();
+  m_FixedPinvMat.reset();
+  m_FixedGradientBasis.reset();
+  m_FixedU.reset();
+  m_FixedW.reset();
+  m_FixedDomainIndices.clear();
+}
+
+//---------------------------------------------------------------------------
+void CorrespondenceFunction::PrecomputeForFixedDomains(const ParticleSystem* ps) {
+  TIME_SCOPE("CorrespondenceFunction::PrecomputeForFixedDomains");
+
+  // Clear any existing precomputed data
+  ClearPrecomputedFixedDomains();
+
+  // Count fixed and non-fixed shapes
+  int total_shapes = m_ShapeData->cols();
+  int num_fixed = 0;
+  int num_unfixed = 0;
+
+  SW_LOG("PrecomputeForFixedDomains: ShapeData rows={}, cols={}, DomainsPerShape={}, PS domains={}",
+         m_ShapeData->rows(), total_shapes, m_DomainsPerShape, ps->GetNumberOfDomains());
+
+  // Identify which shapes are fixed
+  // A shape is considered fixed if ALL its domains are fixed
+  for (int shape = 0; shape < total_shapes; shape++) {
+    bool shape_is_fixed = true;
+    for (int d = 0; d < m_DomainsPerShape; d++) {
+      int dom = shape * m_DomainsPerShape + d;
+      if (!ps->GetDomainFlag(dom)) {
+        shape_is_fixed = false;
+        break;
+      }
+    }
+    if (shape_is_fixed) {
+      m_FixedDomainIndices.push_back(shape);
+      num_fixed++;
+    } else {
+      num_unfixed++;
+    }
+  }
+
+  // If no fixed shapes or all shapes are fixed, precomputation won't help
+  if (num_fixed == 0 || num_unfixed == 0) {
+    SW_LOG("PrecomputeForFixedDomains: No benefit from precomputation "
+           "(fixed={}, unfixed={})", num_fixed, num_unfixed);
+    return;
+  }
+
+  SW_LOG("PrecomputeForFixedDomains: Precomputing for {} fixed shapes, {} unfixed shapes",
+         num_fixed, num_unfixed);
+
+  int num_dims = m_ShapeData->rows();
+  int num_fixed_samples = num_fixed;
+
+  // Store dimensions for validation later
+  m_PrecomputedNumFixedSamples = num_fixed_samples;
+  m_PrecomputedNumDims = num_dims;
+
+  // Step 1: Extract fixed shape data and compute mean
+  // Build Y_fixed matrix: dM × N_fixed
+  m_FixedY = std::make_shared<vnl_matrix_type>(num_dims, num_fixed_samples);
+  m_FixedMean = std::make_shared<vnl_matrix_type>(num_dims, 1);
+  m_FixedMean->fill(0.0);
+
+  // Copy fixed shape data
+  for (int i = 0; i < num_fixed_samples; i++) {
+    int fixed_shape_idx = m_FixedDomainIndices[i];
+    for (int r = 0; r < num_dims; r++) {
+      double val = m_ShapeData->get(r, fixed_shape_idx);
+      m_FixedY->put(r, i, val);
+      (*m_FixedMean)(r, 0) += val;
+    }
+  }
+
+  // Compute mean
+  for (int r = 0; r < num_dims; r++) {
+    (*m_FixedMean)(r, 0) /= num_fixed_samples;
+  }
+
+  // Center the data: Y_fixed = Y_fixed - mean
+  for (int i = 0; i < num_fixed_samples; i++) {
+    for (int r = 0; r < num_dims; r++) {
+      (*m_FixedY)(r, i) -= (*m_FixedMean)(r, 0);
+    }
+  }
+
+  // Step 2: Compute Gram matrix G = Y_fixed^T * Y_fixed
+  TIME_START("precompute::gramMat");
+  Eigen::Map<Eigen::Matrix<double, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>>
+      Y_fixed_map(m_FixedY->data_block(), num_dims, num_fixed_samples);
+
+  Eigen::MatrixXd gramMat_eigen = Y_fixed_map.transpose() * Y_fixed_map;
+  TIME_STOP("precompute::gramMat");
+
+  // Step 3: SVD of Gram matrix
+  TIME_START("precompute::svd");
+  vnl_matrix_type gramMat(num_fixed_samples, num_fixed_samples);
+  for (int i = 0; i < num_fixed_samples; i++) {
+    for (int j = 0; j < num_fixed_samples; j++) {
+      gramMat(i, j) = gramMat_eigen(i, j);
+    }
+  }
+
+  vnl_svd<double> svd(gramMat);
+  m_FixedU = std::make_shared<vnl_matrix_type>(svd.U());
+  m_FixedW = std::make_shared<vnl_diag_matrix<double>>(svd.W());
+  TIME_STOP("precompute::svd");
+
+  // Step 4: Compute regularized inverse: pinvMat = U * (W/(N-1) + αI)^{-1} * U^T
+  TIME_START("precompute::pinvMat");
+  vnl_diag_matrix<double> invLambda = *m_FixedW;
+  for (int i = 0; i < num_fixed_samples; i++) {
+    double val = invLambda(i, i) / (num_fixed_samples - 1) + m_MinimumVariance;
+    invLambda(i, i) = 1.0 / val;  // Invert
+  }
+
+  m_FixedPinvMat = std::make_shared<vnl_matrix_type>(num_fixed_samples, num_fixed_samples);
+  *m_FixedPinvMat = (*m_FixedU) * invLambda * m_FixedU->transpose();
+  TIME_STOP("precompute::pinvMat");
+
+  // Step 5: Precompute gradient basis: M = Y_fixed * pinvMat
+  // This is dM × N_fixed
+  TIME_START("precompute::gradientBasis");
+  m_FixedGradientBasis = std::make_shared<vnl_matrix_type>(num_dims, num_fixed_samples);
+  *m_FixedGradientBasis = (*m_FixedY) * (*m_FixedPinvMat);
+  TIME_STOP("precompute::gradientBasis");
+
+  m_HasPrecomputedFixedDomains = true;
+
+  SW_LOG("PrecomputeForFixedDomains: Precomputation complete. "
+         "Fixed shapes: {}, Dimensions: {}", num_fixed_samples, num_dims);
+}
+
 }  // namespace shapeworks