Skip to content

Commit ef11755

Browse files
committed
fix(profile): capture eight Flash vLLM decode steps
1 parent 39f3b7c commit ef11755

1 file changed

Lines changed: 1 addition & 1 deletion

File tree

benchmarks/single_node/dsv4_fp4_b300_vllm_mtp.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -48,7 +48,7 @@ PROFILE_ARGS=()
48 | 48 |   if [[ "${PROFILE:-}" == "1" ]]; then
49 | 49 |   PROFILER_CONFIG="{\"profiler\":\"torch\",\"torch_profiler_dir\":\"${VLLM_TORCH_PROFILER_DIR:-/workspace/}\"}"
50 | 50 |   if [[ "$MODEL" == "deepseek-ai/DeepSeek-V4-Flash" ]]; then
51 |    | - PROFILER_CONFIG="{\"profiler\":\"torch\",\"torch_profiler_dir\":\"${VLLM_TORCH_PROFILER_DIR:-/workspace/}\",\"ignore_frontend\":true,\"delay_iterations\":1,\"max_iterations\":3,\"active_iterations\":3,\"torch_profiler_with_stack\":false}"
   | 51 | + PROFILER_CONFIG="{\"profiler\":\"torch\",\"torch_profiler_dir\":\"${VLLM_TORCH_PROFILER_DIR:-/workspace/}\",\"ignore_frontend\":true,\"delay_iterations\":1,\"max_iterations\":8,\"active_iterations\":8,\"torch_profiler_with_stack\":false}"
52 | 52 |   fi
53 | 53 |   PROFILE_ARGS=(
54 | 54 |   --profiler-config

0 commit comments

Comments (0)