Skip to content

Commit b866178

Browse files
committed
adding testing workflows
1 parent 3994996 commit b866178

5 files changed

Lines changed: 2036 additions & 1540 deletions

File tree

.github/workflows/benchmark-tmpl.yml

Lines changed: 8 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -41,6 +41,12 @@ on:
4141
conc:
4242
required: true
4343
type: string
44+
spec-decoding:
45+
required: true
46+
type: string
47+
disagg:
48+
required: true
49+
type: string
4450
random-range-ratio:
4551
required: false
4652
type: string
@@ -62,6 +68,8 @@ env:
6268
EP_SIZE: ${{ inputs.ep }}
6369
DP_ATTENTION: ${{ inputs.dp-attn }}
6470
CONC: ${{ inputs.conc }}
71+
SPEC_DECODING: ${{ inputs.spec-decoding }}
72+
DISAGG: ${{ inputs.disagg }}
6573

6674
permissions:
6775
contents: read

utils/matrix-logic/generate_sweep_configs.py

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -156,6 +156,7 @@ def generate_full_sweep(args, all_config_data, runner_data):
156156
conc_end = bmk[Fields.CONC_END.value]
157157
ep = bmk.get(Fields.EP.value)
158158
dp_attn = bmk.get(Fields.DP_ATTN.value)
159+
spec_decoding = bmk.get(Fields.SPEC_DECODING.value, "none")
159160

160161
# Apply max-tp filter if specified
161162
if args.max_tp and tp > args.max_tp:
@@ -187,6 +188,7 @@ def generate_full_sweep(args, all_config_data, runner_data):
187188
Fields.MAX_MODEL_LEN.value: isl + osl + 200,
188189
Fields.EP.value: 1, # Default
189190
Fields.DP_ATTN.value: False, # Default
191+
Fields.SPEC_DECODING.value: spec_decoding,
190192
Fields.EXP_NAME.value: f"{model_code}_{seq_len_str}",
191193
Fields.DISAGG.value: disagg,
192194
}
@@ -217,7 +219,7 @@ def generate_runner_model_sweep_config(args, all_config_data, runner_data):
217219

218220
if not runner_nodes:
219221
raise ValueError(
220-
f"Runner '{args.runner_type}' does not exist in runner config '{args.runner_config}'. Must choose from existing runner types: '{', '.join(runner_config.keys())}'.")
222+
f"Runner '{args.runner_type}' does not exist in runner config '{args.runner_config}'. Must choose from existing runner types: '{', '.join(runner_data.keys())}'.")
221223

222224
# Filter runner nodes if filter is specified
223225
if args.runner_node_filter:
@@ -269,6 +271,7 @@ def generate_runner_model_sweep_config(args, all_config_data, runner_data):
269271
Fields.TP.value: highest_tp,
270272
Fields.EP.value: 1, # Default,
271273
Fields.DP_ATTN.value: False, # Default
274+
Fields.SPEC_DECODING.value: "none", # Default
272275
Fields.CONC.value: lowest_conc,
273276
Fields.MAX_MODEL_LEN.value: 2048,
274277
Fields.EXP_NAME.value: f"{model_code}_test",

0 commit comments

Comments
 (0)