add smoothing

geraseva · geraseva · commit 4781517c433c · 2025-12-08T16:06:20.000+03:00
diff --git a/rfdiffusion/inference/model_runners.py b/rfdiffusion/inference/model_runners.py
@@ -216,6 +216,7 @@ def assemble_config_from_chk(self) -> None:
                 print(f'WARNING: You are changing {override.split("=")[0]} from the value this model was trained with. Are you sure you know what you are doing?') 
                 mytype = type(self._conf[override.split(".")[0]][override.split(".")[1].split("=")[0]])
                 self._conf[override.split(".")[0]][override.split(".")[1].split("=")[0]] = mytype(override.split("=")[1])
+                print(override, self._conf[override.split(".")[0]][override.split(".")[1].split("=")[0]])
 
     def load_model(self):
         """Create RosettaFold model from preloaded checkpoint."""
@@ -266,7 +267,7 @@ def sample_init(self, return_forward_trajectory=False):
         ### Parse input pdb ###
         #######################
 
-        self.target_feats = iu.process_target(self.inf_conf.input_pdb, parse_hetatom=True, parse_na=True, center=False)
+        self.target_feats = iu.process_target(self.inf_conf.input_pdb, parse_hetatom=True, parse_na=True, center=True)
 
         ################################
         ### Generate specific contig ###
@@ -428,7 +429,9 @@ def sample_init(self, return_forward_trajectory=False):
                 het_names = np.array([i['name'].strip() for i in self.target_feats['info_het']])
                 xyz_het = self.target_feats['xyz_het'][het_names == self._conf.potentials.substrate]
                 xyz_het = torch.from_numpy(xyz_het)
-                info_het={x: self.target_feats['info_het'][x][het_names == self._conf.potentials.substrate] for x in self.target_feats['info_het']}
+                info_het={x: np.array([y[x] for y in self.target_feats['info_het'] 
+                                       if y['name'] == self._conf.potentials.substrate]) 
+                                       for x in self.target_feats['info_het'][0]}
                 assert xyz_het.shape[0] > 0, f'expected >0 heteroatoms from ligand with name {self._conf.potentials.substrate}'
                 xyz_motif_prealign = xyz_motif_prealign[0,0][self.diffusion_mask.squeeze()]
                 motif_prealign_com = xyz_motif_prealign[:,1].mean(dim=0)
diff --git a/rfdiffusion/inference/utils.py b/rfdiffusion/inference/utils.py
@@ -123,21 +123,77 @@ def get_mu_xt_x0(xt, px0, t, beta_schedule, alphabar_schedule, eps=1e-6):
 
 
 def rigid_rotation_from_grads(Cas, Ca_grads, eps=1e-8):
+
+    """
+    Estimate best-fit infinitesimal rigid motion (translation + rotation)
+    from per-residue gradients Ca_grads (L,3) at positions Cas (L,3); eps is a small diagonal regularizer.
+
+    Intuition
+    ---------
+    We decompose the gradient field on Ca atoms into:
+      - a global translation (mean over residues), and
+      - a small rigid rotation around the geometric center.
+
+    The rotation is solved in the least-squares sense via the 3x3 linear
+    system (I + eps*I3) · omega = tau, where I3 is the 3x3 identity and
+      - I = Σ(||r_i||^2)·I3 - Σ(r_i r_i^T) is an inertia-like matrix of the point set,
+      - tau = Σ(r_i x d_i) is a torque-like vector of centered gradients,
+      - r_i = Cas_i - center, d_i = Ca_grads_i - trans.
+    This returns the angular-velocity vector omega that best explains the
+    rotational component of the gradients.
+
+    Returns:
+        trans (1,3): mean translation component applied to all residues
+        omega (3,): angular velocity vector defining small rotation
+        center (3,): geometric center of Cas
+        rot (L,3): per-residue rotational component omega x (Cas - center)
+    """
+    device, dtype = Cas.device, Cas.dtype
+    L = Cas.shape[0]
+
+    # Guard empty input: with zero rows the means below are undefined, so return zeros in the documented shapes
+    if L == 0:
+        return (
+            torch.zeros(1, 3, device=device, dtype=dtype),
+            torch.zeros(3, device=device, dtype=dtype),
+            torch.zeros(3, device=device, dtype=dtype),
+            torch.zeros(0, 3, device=device, dtype=dtype),
+        )
+
+    # Geometric center and centered positions r_i
     center=Cas.mean(dim=0) # (3,)
     r=Cas-center # (L,3)
 
-    trans=Ca_grads.mean(dim=0, keepdim=True) # (L, 3)
+    # Mean translation across residues (global shift suggested by gradients)
+    trans=Ca_grads.mean(dim=0, keepdim=True) # (1, 3)
+    # Centered gradients remove the pure-translation component
     d=Ca_grads-trans # (L,3)
-    eye=torch.eye(3, device=Cas.device, dtype=Cas.dtype)
+
+    eye=torch.eye(3, device=device, dtype=dtype)
+    # Inertia-like matrix I = Σ(||r_i||^2)·I3 − Σ(r_i r_i^T) ∈ R^{3x3} (well-known identity for Σ [r]_x^T [r]_x)
+    # NOTE(review): the triple-quoted block below is the earlier per-residue form, now a no-op string literal; consider deleting it
+    '''
     r2=(r**2).sum(dim=1) # (L,)
     rrT=r[:,:,None]*r[:,None,:] # (L,3,3)
     I=(r2[:, None, None] * eye[None, :, :] - rrT).sum(dim=0) # (3,3)
+    '''
+    r2_sum = (r * r).sum()  # scalar Σ ||r_i||^2
+    rr_sum = r.T @ r  # (3,3) Σ r_i r_i^T
+    I = r2_sum * eye - rr_sum  # (3,3)
+
+    # Torque-like vector: τ = Σ (r_i × d_i)
+    # Captures the net tendency of gradients to induce rotation about the center.
     tau=torch.cross(r,d, dim=1).sum(dim=0) # (3,)
+        
+    # Solve for small-rotation vector ω from (I + eps·I3)·ω = τ.
+    # eps stabilizes near-singular geometries (e.g., collinear or coplanar points).
     try:
         omega = torch.linalg.solve(I + eps*eye, tau) # (3,)
     except RuntimeError:
+        # Fallback in case of numerical issues (rare): least-squares solution.
         omega = torch.linalg.lstsq(I + eps*eye, tau.unsqueeze(-1)).solution.squeeze(-1)
 
+    # Per-residue rotational component: ω × r_i
     rot = torch.cross(omega.unsqueeze(0).expand_as(r), r, dim=1) #(L,3)
 
     return trans, omega, center, rot
@@ -652,7 +708,7 @@ def parse_pdb_lines(lines, parse_hetatom=False, parse_na=False, ignore_het_h=Tru
                 )
                 xyz_het.append([float(l[30:38]), float(l[38:46]), float(l[46:54])])
 
-        out["xyz_het"] = np.array(xyz_het)
+        out["xyz_het"] = np.array(xyz_het).reshape((len(xyz_het),3))
         out["info_het"] = info_het
     
     # nucleic acids
@@ -671,7 +727,7 @@ def parse_pdb_lines(lines, parse_hetatom=False, parse_na=False, ignore_het_h=Tru
         ]  # chain letter, res num
 
         # 3 BB + up to 20 SC atoms
-        xyz = np.full((len(res), 23, 3), np.nan, dtype=np.float32)
+        xyz = np.full((len(res), 23, 3), np.nan, dtype=np.float64)
         atom_id = np.full((len(res), 23), np.nan, dtype=np.object)
         atom_type = np.full((len(res), 23), np.nan, dtype=np.object)
         for l in lines:
@@ -751,7 +807,7 @@ def process_target(pdb_path, parse_hetatom=False, parse_na=False, center=True):
         "pdb_idx": target_struct["pdb_idx"],
     }
     if parse_hetatom:
-        out["xyz_het"] = target_struct["xyz_het"]
+        out["xyz_het"] = target_struct["xyz_het"] - ca_center
         out["info_het"] = target_struct["info_het"]
     
     if parse_na:
@@ -760,7 +816,7 @@ def process_target(pdb_path, parse_hetatom=False, parse_na=False, center=True):
                         'atom_type':target_struct['na_atom_type'],
                         'seq':target_struct["na_seq"],
                         'pdb_idx':target_struct["na_pdb_idx"]}
-        out["na_xyz"]= target_struct["na_xyz"]
+        out["na_xyz"]= target_struct["na_xyz"] - ca_center
 
     return out
 
diff --git a/rfdiffusion/potentials/potentials.py b/rfdiffusion/potentials/potentials.py
@@ -378,14 +378,17 @@ class substrate_contacts(Potential):
     Implicitly models a ligand with an attractive-repulsive potential.
     '''
 
-    def __init__(self, weight=1, r_0=8, d_0=2, s=1, eps=1e-6, rep_r_0=5, rep_s=2, rep_r_min=1, sidechain=False):
+    def __init__(self, weight=1, r_0=8, d_0=2, s=1, eps=1e-6, rep_r_0=5, rep_s=2, rep_r_min=1, 
+                 sidechain=False, smooth=0, predicted=False):
 
         super().__init__()
         self.r_0       = r_0
         self.weight    = weight
         self.d_0       = d_0
         self.eps       = eps
         self.sidechain=sidechain
+        self.predicted=predicted
+        self.smooth=smooth
         
         # motif frame coordinates
         # NOTE: these probably need to be set after sample_init() call, because the motif sequence position in design must be known
@@ -451,7 +454,7 @@ def compute(self, xyz):
         self.current_substrate_atoms = substrate_atoms.clone().detach()
         energy = sum(all_energies)
         print('SUBSTRATE CONTACT LOSS:',energy.item())
-        return self.weight * energy
+        return - self.weight * energy
 
         #Potential value is the average of both radii of gyration (is avg. the best way to do this?)
         return self.weight * ncontacts.sum()
@@ -544,22 +547,26 @@ def __init__(self, weight=1, r_0=8, d_0=2, s=1, eps=1e-6, rep_r_0=5, rep_s=2, re
     def compute(self, xyz):
         
         if self.xyz_motif==None or self.xyz_motif.shape[0]<3:
-            substrate_atoms=(self.na_atoms-self.na_atoms[:,:11,:].mean(dim=(0,1))[None,None,:]).detach()
+            substrate_atoms=self.na_atoms.clone().detach()
+            #substrate_atoms=(self.na_atoms-self.na_atoms[:,:11,:].mean(dim=(0,1))[None,None,:]).detach()
+            self.current_na_atoms = substrate_atoms.clone().detach()
             
         else:
             self._grab_motif_residues(self.xyz_motif)
         
-            first_distance = torch.sqrt(torch.sqrt(torch.sum(torch.square(self.motif_substrate_atoms[0] - self.motif_frame[0]), dim=-1))) 
+            L, D, _ = self.na_atoms.shape
+            idx=torch.argmin(torch.sum(torch.square(self.na_atoms.view(-1,3) - self.motif_frame[0]), dim=-1))
+            first_distance = torch.sqrt(torch.sqrt(torch.sum(torch.square(self.na_atoms.view(-1,3)[idx] - self.motif_frame[0]), dim=-1))) 
 
             res = torch.tensor([k[0] for k in self.motif_mapping])
             atoms = torch.tensor([k[1] for k in self.motif_mapping])
             new_frame = xyz[self.diffusion_mask][res,atoms,:]
             A, t = self._recover_affine(self.motif_frame, new_frame)
-            substrate_atoms = torch.mm(A, self.motif_substrate_atoms.transpose(0,1)).transpose(0,1) + t
-            second_distance = torch.sqrt(torch.sqrt(torch.sum(torch.square(new_frame[0] - substrate_atoms[0]), dim=-1)))
+            substrate_atoms = torch.mm(A, self.na_atoms.view(-1,3).transpose(0,1)).transpose(0,1) + t
+            second_distance = torch.sqrt(torch.sqrt(torch.sum(torch.square(new_frame[0] - substrate_atoms[idx]), dim=-1)))
             assert abs(first_distance - second_distance) < 0.01, "Alignment seems to be bad" 
+            self.current_na_atoms = substrate_atoms.view(L, D, 3).clone().detach()
 
-        self.current_na_atoms = substrate_atoms.clone().detach()
         substrate_atoms=substrate_atoms.view(-1,3)
         mask=torch.from_numpy(self.na_info['mask']).view(-1)
         substrate_atoms=substrate_atoms[mask,:]
@@ -580,7 +587,7 @@ def compute(self, xyz):
             all_energies.append(energy.sum())
         energy = sum(all_energies)
         print('NA CONTACT LOSS:',energy.item())
-        return self.weight * energy
+        return - self.weight * energy
 
     
 class dmasif_interactions(Potential):
@@ -628,7 +635,7 @@ def compute(self, xyz):
             potential.requires_grad_()
             xyz.grad=torch.zeros_like(xyz)
                    
-        return potential
+        return - potential
 
 # Dictionary of types of potentials indexed by name of potential. Used by PotentialManager.
 # If you implement a new potential you must add it to this dictionary for it to be used by