Skip to content

Commit 5506165

Browse files
committed
Amend
1 parent 348355c commit 5506165

2 files changed

Lines changed: 3 additions & 0 deletions

File tree

src/maxtext/checkpoint_conversion/utils/hf_shape.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -930,6 +930,7 @@ def MIXTRAL_HF_WEIGHTS_TO_SHAPE(config):
930930
"qwen3-14b": QWEN_HF_WEIGHTS_TO_SHAPE,
931931
"qwen3-32b": QWEN_HF_WEIGHTS_TO_SHAPE,
932932
"llama3.1-8b": LLAMA31_HF_WEIGHTS_TO_SHAPE,
933+
"llama3.1-8b-Instruct": LLAMA31_HF_WEIGHTS_TO_SHAPE,
933934
"llama3.1-70b": LLAMA31_HF_WEIGHTS_TO_SHAPE,
934935
"llama3.1-405b": LLAMA31_HF_WEIGHTS_TO_SHAPE,
935936
"qwen3-30b-a3b": QWEN_HF_WEIGHTS_TO_SHAPE,

src/maxtext/checkpoint_conversion/utils/param_mapping.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -2930,6 +2930,7 @@ def pad_hf_embedding_layer(input_tensor, target_shape):
29302930
"qwen3-14b-base": QWEN_MAXTEXT_TO_HF_PARAM_MAPPING,
29312931
"qwen3-32b": QWEN_MAXTEXT_TO_HF_PARAM_MAPPING,
29322932
"llama3.1-8b": LLAMA31_MAXTEXT_TO_HF_PARAM_MAPPING,
2933+
"llama3.1-8b-Instruct": LLAMA31_MAXTEXT_TO_HF_PARAM_MAPPING,
29332934
"llama3.1-70b": LLAMA31_MAXTEXT_TO_HF_PARAM_MAPPING,
29342935
"llama3.1-405b": LLAMA31_MAXTEXT_TO_HF_PARAM_MAPPING,
29352936
"qwen3-30b-a3b": QWEN_MAXTEXT_TO_HF_PARAM_MAPPING,
@@ -2975,6 +2976,7 @@ def pad_hf_embedding_layer(input_tensor, target_shape):
29752976
"qwen3-14b-base": QWEN_MAXTEXT_TO_HF_PARAM_HOOK_FN,
29762977
"qwen3-32b": QWEN_MAXTEXT_TO_HF_PARAM_HOOK_FN,
29772978
"llama3.1-8b": LLAMA31_MAXTEXT_TO_HF_PARAM_HOOK_FN,
2979+
"llama3.1-8b-Instruct": LLAMA31_MAXTEXT_TO_HF_PARAM_HOOK_FN,
29782980
"llama3.1-70b": LLAMA31_MAXTEXT_TO_HF_PARAM_HOOK_FN,
29792981
"llama3.1-405b": LLAMA31_MAXTEXT_TO_HF_PARAM_HOOK_FN,
29802982
"qwen3-30b-a3b": QWEN_MAXTEXT_TO_HF_PARAM_HOOK_FN,

0 commit comments

Comments
 (0)