Skip to content

Commit 582affb

Browse files
committed
Address review
Signed-off-by: Hollow Man <hollowman@opensuse.org>
1 parent c506693 commit 582affb

3 files changed

Lines changed: 14 additions & 17 deletions

File tree

src/megatron/bridge/perf_recipes/glm_moe_dsa/common.py

Lines changed: 0 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -21,8 +21,6 @@
2121
from megatron.bridge.training.config import ConfigContainer
2222

2323

24-
GLM51_MODEL_ID = "zai-org/GLM-5.1"
25-
GLM52_MODEL_ID = "zai-org/GLM-5.2"
2624
GLM5_LONG_CONTEXT = 131072
2725

2826

src/megatron/bridge/perf_recipes/glm_moe_dsa/gb200/glm5.py

Lines changed: 2 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -14,8 +14,6 @@
1414
"""GB200 performance recipes for GLM-5.1 and GLM-5.2 SFT."""
1515

1616
from megatron.bridge.perf_recipes.glm_moe_dsa.common import (
17-
GLM51_MODEL_ID,
18-
GLM52_MODEL_ID,
1917
ConfigContainer,
2018
_glm5_cudnn_sft_base,
2119
)
@@ -41,9 +39,9 @@ def _glm5_gb200_cudnn_sft_config(model_id: str) -> ConfigContainer:
4139

4240
def glm51_sft_192gpu_gb200_bf16_config() -> ConfigContainer:
4341
"""GLM-5.1 SFT: 192× GB200, BF16, 128K packed THD, CP=32, cuDNN DSA."""
44-
return _glm5_gb200_cudnn_sft_config(GLM51_MODEL_ID)
42+
return _glm5_gb200_cudnn_sft_config("zai-org/GLM-5.1")
4543

4644

4745
def glm52_sft_192gpu_gb200_bf16_config() -> ConfigContainer:
4846
"""GLM-5.2 SFT: 192× GB200, BF16, 128K packed THD, CP=32, cuDNN DSA."""
49-
return _glm5_gb200_cudnn_sft_config(GLM52_MODEL_ID)
47+
return _glm5_gb200_cudnn_sft_config("zai-org/GLM-5.2")

src/megatron/bridge/perf_recipes/glm_moe_dsa/h100/glm5.py

Lines changed: 12 additions & 11 deletions
Original file line number | Diff line number | Diff line change
@@ -14,8 +14,6 @@
1414
"""H100 performance recipes for GLM-5.1 and GLM-5.2 SFT."""
1515

1616
from megatron.bridge.perf_recipes.glm_moe_dsa.common import (
17-
GLM51_MODEL_ID,
18-
GLM52_MODEL_ID,
1917
ConfigContainer,
2018
_glm5_cudnn_sft_base,
2119
)
@@ -28,10 +26,10 @@
2826
_GLM5_H100_GBS = 520
2927

3028

31-
def _glm5_h100_cudnn_sft_config(model_id: str) -> ConfigContainer:
32-
"""Return the 52-node H100 GLM5 cuDNN SFT benchmark shape."""
29+
def glm51_sft_416gpu_h100_bf16_config() -> ConfigContainer:
30+
"""GLM-5.1 SFT: 416x H100, BF16, 128K packed THD, CP=4, cuDNN DSA."""
3331
return _glm5_cudnn_sft_base(
34-
model_id,
32+
"zai-org/GLM-5.1",
3533
tensor_model_parallel_size=_GLM5_H100_TP,
3634
pipeline_model_parallel_size=_GLM5_H100_PP,
3735
context_parallel_size=_GLM5_H100_CP,
@@ -41,11 +39,14 @@ def _glm5_h100_cudnn_sft_config(model_id: str) -> ConfigContainer:
4139
)
4240

4341

44-
def glm51_sft_416gpu_h100_bf16_config() -> ConfigContainer:
45-
"""GLM-5.1 SFT: 416x H100, BF16, 128K packed THD, CP=4, cuDNN DSA."""
46-
return _glm5_h100_cudnn_sft_config(GLM51_MODEL_ID)
47-
48-
4942
def glm52_sft_416gpu_h100_bf16_config() -> ConfigContainer:
5043
"""GLM-5.2 SFT: 416x H100, BF16, 128K packed THD, CP=4, cuDNN DSA."""
51-
return _glm5_h100_cudnn_sft_config(GLM52_MODEL_ID)
44+
return _glm5_cudnn_sft_base(
45+
"zai-org/GLM-5.2",
46+
tensor_model_parallel_size=_GLM5_H100_TP,
47+
pipeline_model_parallel_size=_GLM5_H100_PP,
48+
context_parallel_size=_GLM5_H100_CP,
49+
expert_model_parallel_size=_GLM5_H100_EP,
50+
global_batch_size=_GLM5_H100_GBS,
51+
sequence_parallel=True,
52+
)

0 commit comments

Comments
 (0)