test(pt_expt): distinct seeds for multi-task heads + RUF059 cleanup

Han Wang · Han Wang · commit d3a57f259497 · 2026-04-29T17:20:16.000+08:00
CodeRabbit flagged that `TestPtExptLoadPtMultiTask` built both heads
with the same `GLOBAL_SEED`, so `test_select_head_matches_single_task_forward`
would still pass if `_load_pt` accidentally loaded the wrong head's
weights. Mirror the spin variant: pass distinct seeds (42/7) to
`_build_model_and_params` for the two heads, and add
`test_distinct_heads_produce_distinct_outputs` as a sanity guard.

Also prefix unused unpacked variables with `_` to satisfy Ruff's RUF059 (unused-unpacked-variable) rule.
diff --git a/source/tests/pt_expt/infer/test_deep_eval_pt_checkpoint.py b/source/tests/pt_expt/infer/test_deep_eval_pt_checkpoint.py
@@ -52,8 +52,14 @@
 )
 
 
-def _build_model_and_params(rcut: float = 4.0) -> tuple[EnergyModel, dict]:
-    """Build a small pt_expt EnergyModel and the matching ``model_params`` dict."""
+def _build_model_and_params(
+    rcut: float = 4.0, seed: int = GLOBAL_SEED
+) -> tuple[EnergyModel, dict]:
+    """Build a small pt_expt EnergyModel and the matching ``model_params`` dict.
+
+    The ``seed`` parameter lets callers build distinguishable models when
+    they need head-selection tests to produce different outputs per head.
+    """
     type_map = ["foo", "bar"]
     sel = [8, 6]
     descriptor_args = {
@@ -64,13 +70,13 @@ def _build_model_and_params(rcut: float = 4.0) -> tuple[EnergyModel, dict]:
         "neuron": [4, 8],
         "axis_neuron": 4,
         "type_one_side": True,
-        "seed": GLOBAL_SEED,
+        "seed": seed,
     }
     fitting_args = {
         "type": "ener",
         "neuron": [8, 8],
         "resnet_dt": True,
-        "seed": GLOBAL_SEED,
+        "seed": seed,
     }
 
     ds = DescrptSeA(
@@ -80,15 +86,15 @@ def _build_model_and_params(rcut: float = 4.0) -> tuple[EnergyModel, dict]:
         neuron=[4, 8],
         axis_neuron=4,
         type_one_side=True,
-        seed=GLOBAL_SEED,
+        seed=seed,
     )
     ft = EnergyFittingNet(
         len(type_map),
         ds.get_dim_out(),
         neuron=[8, 8],
         resnet_dt=True,
         mixed_types=ds.mixed_types(),
-        seed=GLOBAL_SEED,
+        seed=seed,
     )
     model = EnergyModel(ds, ft, type_map=type_map).to(torch.float64).eval()
 
@@ -388,9 +394,11 @@ class TestPtExptLoadPtMultiTask(unittest.TestCase):
     @classmethod
     def setUpClass(cls) -> None:
         # Build two single-task models with the same architecture but
-        # different seeds, then save a multi-task-style checkpoint.
-        cls.model_a, params_a = _build_model_and_params(rcut=4.0)
-        cls.model_b, params_b = _build_model_and_params(rcut=4.0)
+        # different seeds. Distinct seeds matter so that a head-routing
+        # bug (loading head_b's weights when head_a is requested, or
+        # vice versa) actually shows up as an assertion failure.
+        cls.model_a, params_a = _build_model_and_params(rcut=4.0, seed=42)
+        cls.model_b, params_b = _build_model_and_params(rcut=4.0, seed=7)
         cls.models = {"head_a": cls.model_a, "head_b": cls.model_b}
         cls.model_params = {"model_dict": {"head_a": params_a, "head_b": params_b}}
 
@@ -423,7 +431,7 @@ def test_select_head_matches_single_task_forward(self) -> None:
             # Build a DeepPot wrapping this DeepEval for end-to-end eval.
             dp = DeepPot(self.pt_path, head=head)
             de = dp.deep_eval
-            e, f, v = dp.eval(coords, cells, atom_types, atomic=False)
+            e, f, _v = dp.eval(coords, cells, atom_types, atomic=False)
 
             coord_t = torch.tensor(
                 coords, dtype=torch.float64, device=DEVICE
@@ -450,6 +458,25 @@ def test_select_head_matches_single_task_forward(self) -> None:
             )
             self.assertEqual(de.get_type_map(), src.get_type_map())
 
+    def test_distinct_heads_produce_distinct_outputs(self) -> None:
+        """Sanity check that head_a and head_b really resolve to different weights."""
+        rng = np.random.default_rng(GLOBAL_SEED + 2)
+        natoms = 4
+        coords = rng.random((1, natoms, 3)) * 8.0
+        cells = np.eye(3).reshape(1, 9) * 10.0
+        atom_types = np.array([i % 2 for i in range(natoms)], dtype=np.int32)
+        e_a = DeepPot(self.pt_path, head="head_a").eval(
+            coords, cells, atom_types, atomic=False
+        )[0]
+        e_b = DeepPot(self.pt_path, head="head_b").eval(
+            coords, cells, atom_types, atomic=False
+        )[0]
+        self.assertFalse(
+            np.allclose(e_a, e_b),
+            "head_a and head_b produced identical outputs — head selection "
+            "may be loading the wrong weights",
+        )
+
     def test_missing_head_raises(self) -> None:
         with self.assertRaisesRegex(ValueError, "Head 'no_such_head' not found"):
             DeepPot(self.pt_path, head="no_such_head")
@@ -469,7 +496,7 @@ def test_select_head_compiled_layout_matches(self) -> None:
 
         for head, src in (("head_a", self.model_a), ("head_b", self.model_b)):
             dp = DeepPot(self.pt_path_compiled, head=head)
-            e, f, v = dp.eval(coords, cells, atom_types, atomic=False)
+            e, f, _v = dp.eval(coords, cells, atom_types, atomic=False)
 
             coord_t = torch.tensor(
                 coords, dtype=torch.float64, device=DEVICE
@@ -610,7 +637,7 @@ def test_metadata_flags_spin(self) -> None:
 
     def test_eval_pbc_atomic_matches_reference(self) -> None:
         dp = DeepPot(self.files[".pt"])
-        e, f, v, ae, av, fm, mm = dp.eval(
+        e, f, v, ae, _av, fm, _mm = dp.eval(
             self.COORD, self.BOX, self.ATYPE, atomic=True, spin=self.SPIN
         )
         np.testing.assert_allclose(
@@ -915,7 +942,7 @@ def test_each_head_matches_its_eager_reference(self) -> None:
             self.assertEqual(dp.use_spin, [True, False], msg=f"head={head}")
 
             ref = self._eager_ref(src)
-            e, f, v, ae, av, fm, mm = dp.eval(
+            e, f, v, _ae, _av, fm, _mm = dp.eval(
                 self.COORD, self.BOX, self.ATYPE, atomic=True, spin=self.SPIN
             )
             np.testing.assert_allclose(