feat: support resuming SAE training from pretrained checkpoints

Hzfinfdu · Hzfinfdu · commit 95281ac7ea40 · 2026-05-11T12:32:58.000+08:00
diff --git a/pyproject.toml b/pyproject.toml
@@ -25,6 +25,8 @@ dependencies = [
     "more-itertools>=10.7.0",
     "json-repair>=0.44.1",
     "cattrs>=26.1.0",
+    "jupyter>=1.1.1",
+    "ipykernel>=7.2.0",
 ]
 requires-python = ">=3.11,<3.13"
 readme = "README.md"
diff --git a/src/llamascopium/initializer.py b/src/llamascopium/initializer.py
@@ -183,6 +183,9 @@ def initialize_sae_from_config(
             device_mesh=device_mesh,
         )
 
+        if cfg.sae_pretrained_name_or_path is not None:
+            return sae
+
         sae = self.initialize_parameters(sae)
         if sae.cfg.norm_activation == "dataset-wise":
             if activation_norm is None:
diff --git a/src/llamascopium/models/sparse_dictionary.py b/src/llamascopium/models/sparse_dictionary.py
@@ -132,6 +132,12 @@ class SparseDictionaryConfig(BaseModelConfig, ABC):
     top_k: int = 50
     """The k value to use for the topk family of activation functions. For vanilla TopK, the L0 norm of the feature activations will be exactly equal to `top_k`."""
 
+    sae_pretrained_name_or_path: str | None = None
+    """Optional pretrained SAE path or identifier used to restore model weights."""
+
+    strict_loading: bool = True
+    """Whether to strictly enforce an exact state_dict key match when loading pretrained weights."""
+
     use_triton_kernel: bool = False
     """Whether to use the Triton SpMM kernel for the sparse matrix multiplication. Currently only supported for vanilla SAE."""
 
@@ -148,7 +154,7 @@ def d_sae(self) -> int:
         return d_sae
 
     @classmethod
-    def from_pretrained(cls, pretrained_name_or_path: str, **kwargs):
+    def from_pretrained(cls, pretrained_name_or_path: str, strict_loading: bool = True, **kwargs):
         """Load the config of the sparse dictionary from a pretrained name or path. Config is read from <pretrained_name_or_path>/config.json (for local storage) or <repo_id>/<name>/config.json (for HuggingFace Hub).
 
         Args:
@@ -171,6 +177,9 @@ def from_pretrained(cls, pretrained_name_or_path: str, **kwargs):
         with open(path, "r") as f:
             sae_config = json.load(f)
 
+        sae_config["sae_pretrained_name_or_path"] = pretrained_name_or_path
+        sae_config["strict_loading"] = strict_loading
+
         if cls is SparseDictionaryConfig:
             cls = SAE_TYPE_TO_CONFIG_CLASS[sae_config["sae_type"]]
 
@@ -179,6 +188,9 @@ def from_pretrained(cls, pretrained_name_or_path: str, **kwargs):
     def save_hyperparameters(self, sae_path: str | Path, remove_loading_info: bool = True):
         assert os.path.exists(sae_path), f"{sae_path} does not exist. Unable to save hyperparameters."
         d = self.model_dump()
+        if remove_loading_info:
+            d.pop("sae_pretrained_name_or_path", None)
+            d.pop("strict_loading", None)
 
         with open(os.path.join(sae_path, "config.json"), "w") as f:
             json.dump(d, f, indent=4)
@@ -517,6 +529,16 @@ def from_config(cls, cfg: SparseDictionaryConfig, device_mesh: DeviceMesh | None
         if cls is SparseDictionary:
             cls = SAE_TYPE_TO_MODEL_CLASS[cfg.sae_type]
 
+        if cfg.sae_pretrained_name_or_path is not None:
+            return cls.from_pretrained(
+                cfg.sae_pretrained_name_or_path,
+                device_mesh=device_mesh,
+                fold_activation_scale=False,
+                strict_loading=cfg.strict_loading,
+                device=cfg.device,
+                dtype=cfg.dtype,
+            )
+
         model = cls(cfg, device_mesh)
         total_params = sum(param.numel() for param in model.parameters()) / 1e9
         logger.info(f"Initializing {cfg.sae_type} with {total_params:.2f} B parameters")
@@ -534,7 +556,8 @@ def from_local(
     ):
         """Load a pretrained sparse dictionary from a local directory."""
 
-        cfg = SparseDictionaryConfig.from_pretrained(path, **kwargs)
+        cfg = SparseDictionaryConfig.from_pretrained(path, strict_loading=strict_loading, **kwargs)
+        cfg.sae_pretrained_name_or_path = None
         model = cls.from_config(cfg, device_mesh=device_mesh)
 
         if path.endswith(".pt") or path.endswith(".safetensors") or path.endswith(".dcp"):
diff --git a/uv.lock b/uv.lock

Original file line number	Diff line number	Diff line change
`@@ -25,6 +25,8 @@ dependencies = [`
`25`	`25`	`"more-itertools>=10.7.0",`
`26`	`26`	`"json-repair>=0.44.1",`
`27`	`27`	`"cattrs>=26.1.0",`
	`28`	`+ "jupyter>=1.1.1",`
	`29`	`+ "ipykernel>=7.2.0",`
`28`	`30`	`]`
`29`	`31`	`requires-python = ">=3.11,<3.13"`
`30`	`32`	`readme = "README.md"`
Original file line number	Diff line number	Diff line change
`@@ -183,6 +183,9 @@ def initialize_sae_from_config(`
`183`	`183`	`device_mesh=device_mesh,`
`184`	`184`	`)`
`185`	`185`
	`186`	`+ if cfg.sae_pretrained_name_or_path is not None:`
	`187`	`+ return sae`
	`188`	`+`
`186`	`189`	`sae = self.initialize_parameters(sae)`
`187`	`190`	`if sae.cfg.norm_activation == "dataset-wise":`
`188`	`191`	`if activation_norm is None:`