|
| 1 | +# arch: key into MODEL_CLASS_MAPPING; required when the model has get_model_defaults. Include it when adding new entries. |
| 2 | +- model: Qwen/Qwen3-Next-80B-A3B-Thinking |
| 3 | + arch: Qwen3NextForCausalLM |
| 4 | + config_path: examples/configs/curated/qwen3-next.yaml |
| 5 | +- model: Qwen/Qwen3-30B-A3B |
| 6 | + arch: Qwen3MoeForCausalLM |
| 7 | + config_path: examples/configs/curated/qwen3.yaml |
| 8 | +- model: Qwen/Qwen3-30B-A3B |
| 9 | + arch: Qwen3MoeForCausalLM |
| 10 | + config_path: examples/configs/curated/qwen3-disagg-prefill.yaml |
| 11 | +- model: deepseek-ai/DeepSeek-R1-0528 |
| 12 | + arch: DeepseekV3ForCausalLM |
| 13 | + config_path: examples/configs/curated/deepseek-r1-latency.yaml |
| 14 | +- model: deepseek-ai/DeepSeek-R1-0528 |
| 15 | + arch: DeepseekV3ForCausalLM |
| 16 | + config_path: examples/configs/curated/deepseek-r1-throughput.yaml |
| 17 | +- model: deepseek-ai/DeepSeek-R1-0528 |
| 18 | + arch: DeepseekV3ForCausalLM |
| 19 | + config_path: examples/configs/curated/deepseek-r1-deepgemm.yaml |
| 20 | +- model: openai/gpt-oss-120b |
| 21 | + arch: GptOssForCausalLM |
| 22 | + config_path: examples/configs/curated/gpt-oss-120b-latency.yaml |
| 23 | +- model: openai/gpt-oss-120b |
| 24 | + arch: GptOssForCausalLM |
| 25 | + config_path: examples/configs/curated/gpt-oss-120b-throughput.yaml |
| 26 | +- model: nvidia/Llama-3.3-70B-Instruct-FP8 |
| 27 | + arch: LlamaForCausalLM |
| 28 | + config_path: examples/configs/curated/llama-3.3-70b.yaml |
| 29 | +- model: nvidia/Llama-4-Scout-17B-16E-Instruct-FP8 |
| 30 | + arch: Llama4ForConditionalGeneration |
| 31 | + config_path: examples/configs/curated/llama-4-scout.yaml |
| 32 | +- model: nvidia/Kimi-K2-Thinking-NVFP4 |
| 33 | + arch: DeepseekV3ForCausalLM |
| 34 | + config_path: examples/configs/curated/kimi-k2-thinking.yaml |
0 commit comments