nv-auto-deploy
diff --git a/examples/auto_deploy/model_registry/configs/glm_5.yaml b/examples/auto_deploy/model_registry/configs/glm_5.yaml
Lines changed: 6 additions & 0 deletions
diff --git a/examples/auto_deploy/model_registry/models.yaml b/examples/auto_deploy/model_registry/models.yaml
Lines changed: 2 additions & 2 deletions
diff --git a/tensorrt_llm/_torch/auto_deploy/models/custom/__init__.py b/tensorrt_llm/_torch/auto_deploy/models/custom/__init__.py
Lines changed: 2 additions & 0 deletions
@@ -0,0 +1,6 @@
+# Configuration for GLM-5 (zai-org/GLM-5)
+# Workaround: extra_special_tokens is a list in the GLM-5 tokenizer config but
+# transformers 4.57.x expects a dict in _set_model_specific_special_tokens.
+# Passing extra_special_tokens={} overrides the problematic list with an empty dict.
+tokenizer_kwargs:
+  extra_special_tokens: {}
@@ -224,9 +224,9 @@ models:
   yaml_extra: ['qwen3.5_moe_400b.yaml']
 # --- GLM-5 (Feb 2026) ---
 - name: zai-org/GLM-5
-  yaml_extra: ['dashboard_default.yaml', 'world_size_8.yaml']
+  yaml_extra: ['dashboard_default.yaml', 'world_size_8.yaml', 'glm_5.yaml', 'num_hidden_layers_5.yaml']
 - name: zai-org/GLM-5-FP8
-  yaml_extra: ['dashboard_default.yaml', 'world_size_8.yaml']
+  yaml_extra: ['dashboard_default.yaml', 'world_size_8.yaml', 'glm_5.yaml', 'num_hidden_layers_5.yaml']
 # --- MiniMax-M2.5 (Feb 2026) ---
 - name: MiniMaxAI/MiniMax-M2.5
   yaml_extra: ['dashboard_default.yaml', 'world_size_8.yaml', 'minimax_m2.yaml']
 
@@ -7,6 +7,7 @@
 from .modeling_gemma2 import Gemma2ForCausalLM
 from .modeling_glm4_moe import Glm4MoeForCausalLM
 from .modeling_glm4_moe_lite import Glm4MoeLiteForCausalLM
+from .modeling_glm_moe_dsa import GlmMoeDsaForCausalLM
 from .modeling_granite import GraniteForCausalLM
 from .modeling_granite_moe_hybrid import GraniteMoeHybridForCausalLM
 from .modeling_hunyuan_dense import HunYuanDenseForCausalLM
@@ -39,6 +40,7 @@
     "Gemma2ForCausalLM",
     "Glm4MoeForCausalLM",
     "Glm4MoeLiteForCausalLM",
+    "GlmMoeDsaForCausalLM",
     "GraniteForCausalLM",
     "GraniteMoeHybridForCausalLM",
     "HunYuanDenseForCausalLM",