Skip to content

Commit 5d7f415

Browse files
committed
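fix gpt-oss args: set model-format=mxfp4 in throughput_test (benchmark_utils.py) instead of get_func_config_list (config_utils.py); reflow SERVE_ONLY_PARAMS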
1 parent 92fba62 commit 5d7f415

2 files changed

Lines changed: 6 additions & 4 deletions

File tree

autotest/utils/benchmark_utils.py

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,10 @@
88
from utils.config_utils import get_case_str_by_config, get_cli_common_param, get_cuda_prefix_by_workerid, get_workerid
99
from utils.run_restful_chat import health_check, start_openai_service, terminate_restful_api
1010

11-
SERVE_ONLY_PARAMS = {'max-batch-size', 'max-prefill-token-num', 'server-name', 'enable-prefix-caching', 'session-len'} # yapf: disable
11+
SERVE_ONLY_PARAMS = { # yapf: disable
12+
'max-batch-size', 'max-prefill-token-num', 'server-name',
13+
'enable-prefix-caching', 'session-len',
14+
}
1215

1316

1417
def throughput_test(config, run_config, worker_id: str = '', is_smoke: bool = False):
@@ -34,6 +37,8 @@ def throughput_test(config, run_config, worker_id: str = '', is_smoke: bool = Fa
3437
k: v
3538
for k, v in bench_config.get('extra_params', {}).items() if k not in SERVE_ONLY_PARAMS
3639
}
40+
if 'openai/gpt-oss' in run_config.get('model', ''):
41+
bench_config['extra_params']['model-format'] = 'mxfp4'
3742
command = f'{cuda_prefix} python3 benchmark/profile_throughput.py {dataset_path} {model_path} {get_cli_common_param(bench_config)}' # noqa
3843

3944
if is_smoke:

autotest/utils/config_utils.py

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -135,9 +135,6 @@ def get_func_config_list(backend: str,
135135
run_config['extra_params']['max-prefill-token-num'] = 1024
136136
run_config['extra_params']['max-batch-size'] = 128
137137

138-
if 'openai/gpt-oss' in run_config['model']:
139-
run_config['extra_params']['model-format'] = 'mxfp4'
140-
141138
return run_configs
142139

143140

0 commit comments

Comments
 (0)