2727 description : " DeepSeek-R1-0528-MXFP4 FP4 TP8 EP8"
2828 type : boolean
2929 default : false
30+ qwen3-5-397b-a17b-fp8-tp4 :
31+ description : " Qwen3.5-397B-A17B-FP8 TP4"
32+ type : boolean
33+ default : false
34+ qwen3-5-397b-a17b-fp8-tp8 :
35+ description : " Qwen3.5-397B-A17B-FP8 TP8"
36+ type : boolean
37+ default : false
3038 sglang_image :
3139 description : " Optional SGLang benchmark image override. Leave empty to use sglang-latest on main or rebuild from the selected non-main branch."
3240 type : string
@@ -217,6 +225,8 @@ jobs:
217225 ENABLE_DEEPSEEK_R1_FP4_TP8 : ${{ inputs.deepseek-r1-fp4-tp8 }}
218226 ENABLE_DEEPSEEK_R1_FP4_TP4 : ${{ inputs.deepseek-r1-fp4-tp4 }}
219227 ENABLE_DEEPSEEK_R1_FP4_TP8_EP8 : ${{ inputs.deepseek-r1-fp4-tp8-ep8 }}
228+ ENABLE_QWEN3_5_397B_A17B_FP8_TP4 : ${{ inputs.qwen3-5-397b-a17b-fp8-tp4 }}
229+ ENABLE_QWEN3_5_397B_A17B_FP8_TP8 : ${{ inputs.qwen3-5-397b-a17b-fp8-tp8 }}
220230 run : |
221231 MODELS_JSON="$(jq -c '
222232 map(select(
@@ -225,6 +235,8 @@ jobs:
225235 or (.prefix == "deepseek-r1-fp4-tp8" and env.ENABLE_DEEPSEEK_R1_FP4_TP8 == "true")
226236 or (.prefix == "deepseek-r1-fp4-tp4" and env.ENABLE_DEEPSEEK_R1_FP4_TP4 == "true")
227237 or (.prefix == "deepseek-r1-fp4-tp8-ep8" and env.ENABLE_DEEPSEEK_R1_FP4_TP8_EP8 == "true")
238+ or (.prefix == "qwen3-5-397b-a17b-fp8-tp4" and env.ENABLE_QWEN3_5_397B_A17B_FP8_TP4 == "true")
239+ or (.prefix == "qwen3-5-397b-a17b-fp8-tp8" and env.ENABLE_QWEN3_5_397B_A17B_FP8_TP8 == "true")
228240 ))
229241 ' .github/benchmark/sglang_benchmark_models.json)"
230242 echo "models_json=${MODELS_JSON}" >> "$GITHUB_OUTPUT"
@@ -475,6 +487,8 @@ jobs:
475487 deepseek-r1-fp4-tp8) echo "enabled=${{ inputs.deepseek-r1-fp4-tp8 }}" >> "$GITHUB_OUTPUT" ;;
476488 deepseek-r1-fp4-tp4) echo "enabled=${{ inputs.deepseek-r1-fp4-tp4 }}" >> "$GITHUB_OUTPUT" ;;
477489 deepseek-r1-fp4-tp8-ep8) echo "enabled=${{ inputs.deepseek-r1-fp4-tp8-ep8 }}" >> "$GITHUB_OUTPUT" ;;
490+ qwen3-5-397b-a17b-fp8-tp4) echo "enabled=${{ inputs.qwen3-5-397b-a17b-fp8-tp4 }}" >> "$GITHUB_OUTPUT" ;;
491+ qwen3-5-397b-a17b-fp8-tp8) echo "enabled=${{ inputs.qwen3-5-397b-a17b-fp8-tp8 }}" >> "$GITHUB_OUTPUT" ;;
478492 *) echo "enabled=true" >> "$GITHUB_OUTPUT" ;;
479493 esac
480494
0 commit comments