change where dtype is found in checkpoint export

pstjohn · pstjohn · commit f08bbee4070b · 2025-07-18T12:46:54.000-07:00
Signed-off-by: Peter St. John &lt;pstjohn@nvidia.com&gt;
diff --git a/sub-packages/bionemo-esm2/src/bionemo/esm2/model/convert.py b/sub-packages/bionemo-esm2/src/bionemo/esm2/model/convert.py
@@ -134,7 +134,7 @@ def apply(self, output_path: Path) -> Path:
         )
         source, _ = self.nemo_load(self, trainer=trainer, cpu=cpu)
 
-        dtype = torch.bfloat16 if source.config.bf16 else torch.float32
+        dtype = source.dtype
 
         # Not sure why we need to do this, for some reason lm_head stays as fp32
         source.module.lm_head.to(dtype)
diff --git a/sub-packages/bionemo-esm2/tests/bionemo/esm2/model/test_convert.py b/sub-packages/bionemo-esm2/tests/bionemo/esm2/model/test_convert.py
@@ -104,6 +104,14 @@ def test_nemo2_conversion_equivalent_650m(tmp_path):
         assert_esm2_equivalence(tmp_path / "nemo_checkpoint", model_tag, atol=1e-4, rtol=1e-4)
 
 
+@pytest.mark.slow
+def test_nemo2_export_equivalent_650m(tmp_path):
+    ckpt_path = load("esm2/nv_650m:2.1")
+    output_path = io.export_ckpt(ckpt_path, "hf", tmp_path / "hf_checkpoint")
+    with megatron_parallel_state_utils.distributed_model_parallel_state():
+        assert_esm2_equivalence(ckpt_path, output_path, precision="bf16")
+
+
 def test_cli_nemo2_conversion_equivalent_8m(tmp_path):
     """Test that the CLI conversion functions maintain model equivalence."""
     model_tag = "facebook/esm2_t6_8M_UR50D"

Original file line number	Diff line number	Diff line change
`@@ -134,7 +134,7 @@ def apply(self, output_path: Path) -> Path:`
`134`	`134`	`)`
`135`	`135`	`source, _ = self.nemo_load(self, trainer=trainer, cpu=cpu)`
`136`	`136`
`137`		`- dtype = torch.bfloat16 if source.config.bf16 else torch.float32`
	`137`	`+ dtype = source.dtype`
`138`	`138`
`139`	`139`	`# Not sure why we need to do this, for some reason lm_head stays as fp32`
`140`	`140`	`source.module.lm_head.to(dtype)`