docs: update output structure with complete checkpoint details

Harahan · Harahan · commit d10da7d5b0f9 · 2026-02-11T10:22:37.000+08:00
- Add optimizer_0/ directory for optimizer states
- Add pytorch_model_fsdp_0/ for FSDP sharded model states
- Add random_states_*.pkl for reproducibility (per-rank random states)
- Add transformer/ directory contents: adapter_config.json and adapter_model.safetensors (if LoRA), plus README.md (model card)
- Clarify EMA states are optional (if enabled)
diff --git a/README.md b/README.md
@@ -388,8 +388,15 @@ logs/
     └── <run_name>_<timestamp>/
         ├── 📁 checkpoints/                    # Periodic checkpoints
         │   └── checkpoint-{step}/
-        │       ├── ema/                        # EMA states
-        │       ├── unwrapped_model/transformer/ # Model weights
+        │       ├── ema/                        # EMA states (if enabled)
+        │       ├── unwrapped_model/            # Model weights
+        │       │   └── transformer/
+        │       │       ├── adapter_config.json         # LoRA config (if LoRA)
+        │       │       ├── adapter_model.safetensors   # LoRA weights (if LoRA)
+        │       │       └── README.md                   # Model card
+        │       ├── optimizer_0/                # Optimizer states (for resuming)
+        │       ├── pytorch_model_fsdp_0/       # FSDP sharded model states
+        │       ├── random_states_*.pkl         # Random states for each rank (for reproducibility)
         │       └── metadata.json               # Step & config metadata
         ├── 📁 final_model/                    # Final trained model
         │   └── transformer/