Skip to content

Commit ac71e0e

Browse files
authored
Merge pull request #62 from KempnerInstitute/train-state-ownership-check
Gate train_state.pt load behind an ownership check
2 parents 499adcf + 8b94a05 commit ac71e0e

2 files changed

Lines changed: 244 additions & 1 deletion

File tree

kempnerforge/checkpoint/manager.py

Lines changed: 45 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,9 @@
1111

1212
import json
1313
import logging
14+
import os
1415
import shutil
16+
import stat
1517
from pathlib import Path
1618
from typing import Any
1719

@@ -30,6 +32,44 @@
3032
_METADATA_FILE = "metadata.json"
3133

3234

35+
def _load_train_state(path: Path) -> dict[str, Any]:
36+
"""Load ``train_state.pt`` under an explicit trust boundary.
37+
38+
``train_state.pt`` carries scheduler state, dataloader state, and a
39+
caller-supplied ``extra`` dict, so it is loaded with ``weights_only=False``
40+
(i.e. full pickle). Any object in the file whose class defines
41+
``__reduce__`` runs arbitrary Python during ``torch.load``. On shared
42+
filesystems this is a real attack surface: anyone who can write into
43+
another user's checkpoint directory gets code execution in that user's
44+
training process on next resume.
45+
46+
Refuses to load files not owned by the current UID and warns when the
47+
file is group- or world-writable. This does not defend against a
48+
same-UID compromise — if the attacker can write as you, they already
49+
win — but it closes the common "group-writable shared checkpoint dir"
50+
foot-gun and makes the trust boundary visible.
51+
52+
Checkpoints imported from outside the lab (HuggingFace Hub, colleague
53+
transfers, etc.) will fail this check and must be either chown'd to the
54+
current user after inspection or converted to a weights-only-safe form.
55+
"""
56+
st = path.stat()
57+
uid = os.getuid()
58+
if st.st_uid != uid:
59+
raise PermissionError(
60+
f"Refusing to load {path}: owned by uid={st.st_uid}, current uid={uid}. "
61+
f"train_state.pt is a pickle and loading it executes arbitrary Python. "
62+
f"If you trust this checkpoint, chown it to the current user after inspection."
63+
)
64+
if st.st_mode & (stat.S_IWGRP | stat.S_IWOTH):
65+
logger.warning(
66+
f"{path} is group/world-writable (mode={oct(st.st_mode & 0o777)}); "
67+
f"train_state.pt is a pickle and any writer can inject arbitrary code "
68+
f"at load time. Consider chmod g-w,o-w on the checkpoint directory."
69+
)
70+
return torch.load(path, map_location="cpu", weights_only=False)
71+
72+
3373
class CheckpointManager:
3474
"""Manages save/load/cleanup of distributed checkpoints.
3575
@@ -203,8 +243,12 @@ def load(
203243
train_state_exists = train_state_path.exists()
204244

205245
if train_state_exists:
246+
# Rank-0-authoritative: only rank 0 reads the file. The
247+
# ownership check inside ``_load_train_state`` runs there and
248+
# the resulting state is broadcast to all ranks below. Other
249+
# ranks pass ``None`` into the broadcast.
206250
train_state = (
207-
torch.load(train_state_path, map_location="cpu", weights_only=False)
251+
_load_train_state(train_state_path)
208252
if self._rank == 0 or not dist.is_initialized()
209253
else None
210254
)
Lines changed: 199 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,199 @@
1+
"""Tests for the train_state.pt trust boundary.
2+
3+
``train_state.pt`` is loaded with ``weights_only=False`` (full pickle),
4+
because it carries scheduler state and an arbitrary caller-supplied
5+
``extra`` dict. That means any ``__reduce__`` in the file runs at load
6+
time. Shared-FS clusters (HolyLFS, Kempner lab storage) and imported
7+
"pretrained" checkpoints both make the write side of that file
8+
attacker-reachable, so the loader MUST at minimum refuse to execute
9+
pickles planted by a different UID.
10+
"""
11+
12+
from __future__ import annotations
13+
14+
import os
15+
import stat
16+
from pathlib import Path
17+
from unittest.mock import MagicMock
18+
19+
import pytest
20+
import torch
21+
22+
import kempnerforge.checkpoint.manager as manager_mod
23+
from kempnerforge.checkpoint.manager import CheckpointManager, _load_train_state
24+
from kempnerforge.config.schema import CheckpointConfig
25+
26+
27+
class _Payload:
28+
"""Pickle-time side effect. If ``__reduce__`` runs, the marker file appears."""
29+
30+
def __init__(self, marker: Path) -> None:
31+
self._marker = marker
32+
33+
def __reduce__(self):
34+
# Tells pickle: on load, call os.system(cmd). os.system is a stand-in
35+
# for any arbitrary command the attacker chooses.
36+
return (os.system, (f"touch {self._marker}",))
37+
38+
39+
def _write_malicious_train_state(path: Path, marker: Path) -> None:
    """Write a torch-format file that fires a side effect on load.

    ``torch.save`` wraps pickle, so a ``__reduce__`` on any object inside
    still runs when the file is opened with ``torch.load(weights_only=False)``.
    """
    state = dict(step=42, tokens_seen=1000, rng={}, payload=_Payload(marker))
    torch.save(state, path)
52+
53+
54+
def _write_benign_train_state(path: Path, step: int = 7, tokens_seen: int = 128) -> None:
55+
torch.save({"step": step, "tokens_seen": tokens_seen, "rng": {}}, path)
56+
57+
58+
def _fake_ckpt_dir(tmp_path: Path, marker: Path) -> Path:
    """Build a ``step_42`` checkpoint dir with a malicious train_state.pt
    and point ``latest`` at it so ``_resolve_load_path`` picks it up."""
    step_dir = tmp_path / "step_42"
    step_dir.mkdir()
    _write_malicious_train_state(step_dir / "train_state.pt", marker)
    latest = tmp_path / "latest"
    latest.symlink_to("step_42")
    return step_dir
66+
67+
68+
def _make_manager(tmp_path: Path) -> CheckpointManager:
    """Construct a CheckpointManager over ``tmp_path`` with mock model/optimizer."""
    cfg = CheckpointConfig(dir=str(tmp_path))
    mock_model = MagicMock()
    mock_model.state_dict.return_value = {}
    mock_optimizer = MagicMock()
    mock_optimizer.state_dict.return_value = {}
    return CheckpointManager(config=cfg, model=mock_model, optimizer=mock_optimizer)
75+
76+
77+
class TestLoadTrainStateOwnershipGate:
    @staticmethod
    def _load_with_warning_capture(path: Path) -> list:
        """Run ``_load_train_state`` while capturing WARNING records emitted by
        the manager's logger; return the captured records.

        Asserting via a direct logger handler rather than pytest's caplog keeps
        the tests robust to other tests mutating logger propagation. Shared by
        the group-writable and private-mode tests, which differ only in the
        file mode they set up and the assertion they make on the records.
        """
        import logging

        records: list[logging.LogRecord] = []

        class _Capture(logging.Handler):
            def emit(self, record: logging.LogRecord) -> None:
                records.append(record)

        handler = _Capture(level=logging.WARNING)
        logger = logging.getLogger("kempnerforge.checkpoint.manager")
        prior_level = logger.level
        logger.setLevel(logging.WARNING)
        logger.addHandler(handler)
        try:
            _load_train_state(path)
        finally:
            logger.removeHandler(handler)
            logger.setLevel(prior_level)
        return records

    def test_rejects_foreign_owned_file(self, tmp_path: Path) -> None:
        """_load_train_state refuses when st_uid != current uid."""
        from unittest.mock import patch

        marker = tmp_path / "rce_marker"
        path = tmp_path / "train_state.pt"
        _write_malicious_train_state(path, marker)

        # patch.object restores getuid even if the assertion machinery raises.
        # NOTE: ``manager_mod.os`` is the shared ``os`` module object, so this
        # patches ``os.getuid`` process-wide for the duration of the context —
        # same effect as the manual assignment it replaces, but exception-safe.
        with patch.object(manager_mod.os, "getuid", return_value=os.getuid() + 12345):
            with pytest.raises(PermissionError, match="Refusing to load"):
                _load_train_state(path)

        assert not marker.exists(), (
            "payload fired despite ownership gate — torch.load was reached before the check"
        )

    def test_accepts_own_file(self, tmp_path: Path) -> None:
        """_load_train_state loads when st_uid matches current uid."""
        path = tmp_path / "train_state.pt"
        _write_benign_train_state(path)

        loaded = _load_train_state(path)
        assert loaded["step"] == 7
        assert loaded["tokens_seen"] == 128

    def test_warns_on_group_writable(self, tmp_path: Path) -> None:
        """_load_train_state warns (but still loads) on group-writable files.

        Same-UID group-writable is the footgun this case addresses: a
        colleague in your lab group can plant the file. We warn instead of
        refusing because the same-UID assumption typically holds on HPC
        shared FS and the user deserves a heads-up, not a hard block.
        """
        path = tmp_path / "train_state.pt"
        _write_benign_train_state(path, step=1, tokens_seen=1)
        path.chmod(path.stat().st_mode | stat.S_IWGRP)

        records = self._load_with_warning_capture(path)

        assert any("group/world-writable" in r.getMessage() for r in records), (
            "expected a warning about group/world-writable train_state.pt"
        )

    def test_no_warning_on_private_mode(self, tmp_path: Path) -> None:
        """Files with a tight mode (600/640 without group write) don't warn."""
        path = tmp_path / "train_state.pt"
        _write_benign_train_state(path, step=1, tokens_seen=1)
        path.chmod(0o600)

        records = self._load_with_warning_capture(path)

        assert not any("group/world-writable" in r.getMessage() for r in records)
170+
171+
172+
class TestManagerLoadRejectsForeignCheckpoint:
    def test_load_raises_before_executing_pickle(self, tmp_path: Path) -> None:
        """CheckpointManager.load() blocks a foreign-owned pickle before it fires.

        Pre-fix, the pickle ran through ``torch.load(..., weights_only=False)``
        with no provenance check. Post-fix, ``_load_train_state`` raises
        ``PermissionError`` before ``torch.load`` is reached, so the
        ``__reduce__`` side effect never executes.

        ``exclude_keys`` skips the DCP model/optimizer load so we don't need
        a real checkpoint to reach the train_state.pt branch.
        """
        from unittest.mock import patch

        marker = tmp_path / "rce_marker_2"
        _fake_ckpt_dir(tmp_path, marker)
        mgr = _make_manager(tmp_path)

        # patch.object restores getuid even if load() raises something other
        # than the expected PermissionError. ``manager_mod.os`` is the shared
        # ``os`` module object, so this is a process-wide patch for the
        # duration of the context — same effect as the manual assignment it
        # replaces, but exception-safe.
        with patch.object(manager_mod.os, "getuid", return_value=os.getuid() + 12345):
            with pytest.raises(PermissionError, match="Refusing to load"):
                mgr.load(exclude_keys=["model", "optimizer"])

        assert not marker.exists(), (
            "ownership gate did not block the load — payload fired despite the check"
        )

0 commit comments

Comments
 (0)