1+ # Copyright 2023–2025 Google LLC
2+ #
3+ # Licensed under the Apache License, Version 2.0 (the "License");
4+ # you may not use this file except in compliance with the License.
5+ # You may obtain a copy of the License at
6+ #
7+ # https://www.apache.org/licenses/LICENSE-2.0
8+ #
9+ # Unless required by applicable law or agreed to in writing, software
10+ # distributed under the License is distributed on an "AS IS" BASIS,
11+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+ # See the License for the specific language governing permissions and
13+ # limitations under the License.
14+
15+
# Name of the configuration file this one is layered on top of.
# The value must not carry surrounding whitespace: a double-quoted YAML scalar
# preserves it, so " vllm.yml" would name a different (non-existent) file.
# NOTE(review): presumably resolved relative to this file's directory — confirm
# against the config loader.
base_config: "vllm.yml"
17+
# Ordered list of [name, axes] pairs. The second element of each pair is a
# list (or, in two entries, a bare string) drawn from the names 'data',
# 'model', 'expert' and 'attn_dp'; an empty list names no axis at all.
# NOTE(review): presumably these map logical axis names to mesh axes and are
# matched in order — entry order is therefore kept exactly as written; confirm
# against the consumer of this key.
logical_axis_rules: [
  # ---- names prefixed "activation_" ----
  # NOTE(review): [''] is a list holding one empty string, not an empty list —
  # confirm whether [] (or a real axis name) was intended.
  ['activation_batch', ['']],
  ['activation_batch_no_exp', []],
  ['activation_embed_and_logits_batch', ['expert']],
  ['activation_embed_and_logits_batch_sequence', ['expert']],
  ['activation_heads', ['model']],
  ['activation_kv_heads', ['model']],
  ['activation_attn_length', ['expert']],
  ['activation_attn_length_no_exp', []],
  ['activation_length', ['data', 'expert']],
  # Bare string rather than a one-element list; kept as written.
  ['activation_length_no_exp', 'data'],
  ['activation_q_length', ['expert']],
  # Bare string rather than a one-element list; kept as written.
  ['activation_attn_embed', 'model'],
  ['activation_embed', ['model', 'attn_dp']],
  ['activation_mlp', ['model', 'attn_dp', 'expert']],
  ['activation_kv', ['model']],
  ['activation_prefill_kv_batch', ['expert']],
  # NOTE(review): same single-empty-string list as 'activation_batch' — confirm.
  ['activation_kv_batch', ['']],
  ['activation_kv_batch_no_exp', []],
  ['activation_kv_head_dim', ['model', 'attn_dp', 'expert']],
  ['activation_vocab', ['model', 'attn_dp']],
  ['activation_norm_length', []],
  ['activation_exp', ['expert']],

  # ---- names prefixed "decode_" ----
  ['decode_batch', ['expert']],
  ['decode_length', []],

  # ---- remaining names ----
  ['mlp_no_fsdp', ['model', 'attn_dp', 'expert']],
  ['vocab', ['model', 'attn_dp', 'expert']],
  ['heads', ['expert', 'attn_dp', 'model']],
  ['q_heads', []],
  ['kv_heads', []],
  ['kv_head_dim', ['model', 'attn_dp', 'expert']],
  # NOTE(review): 'kv' is listed twice (a three-axis entry, then an empty one).
  # Both are kept in their original order — confirm the second is an intended
  # fallback and not a leftover.
  ['kv', ['model', 'attn_dp', 'expert']],
  ['kv', []],
  ['embed', []],
  ['mlp', ['model', 'attn_dp', 'expert']],
  ['moe_mlp', []],
  ['embed_tensor_transpose', ['attn_dp', 'model']],
  ['embed_no_exp', []],
  ['q_lora', []],
  ['kv_lora', []],
  ['norm', []],
  ['cache_heads', ['model']],
  ['exp', ['expert', 'attn_dp', 'model']],
  ['paged_kv_heads', ['model']],
  ['cache_batch_prefill', []],
  ['cache_batch', []],
  ['cache_sequence', []],
  ['cache_heads_none', []],
  ['cache_kv', []],
  ['kv_lora_up_proj', ['expert', 'attn_dp', 'model']],
  ['q_lora_up_proj', ['expert', 'attn_dp', 'model']],
]
0 commit comments