Skip to content

Commit 5eb4b65

Browse files
committed
fix(profile): capture three Flash vLLM decode steps
1 parent fc21e40 commit 5eb4b65

1 file changed

Lines changed: 1 addition & 1 deletion

File tree

benchmarks/single_node/dsv4_fp4_b300_vllm_mtp.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -48,7 +48,7 @@ PROFILE_ARGS=()
48 48
if [[ "${PROFILE:-}" == "1" ]]; then
49 49
PROFILER_CONFIG="{\"profiler\":\"torch\",\"torch_profiler_dir\":\"${VLLM_TORCH_PROFILER_DIR:-/workspace/}\"}"
50 50
if [[ "$MODEL" == "deepseek-ai/DeepSeek-V4-Flash" ]]; then
51-
PROFILER_CONFIG="{\"profiler\":\"torch\",\"torch_profiler_dir\":\"${VLLM_TORCH_PROFILER_DIR:-/workspace/}\",\"ignore_frontend\":true,\"delay_iterations\":1,\"max_iterations\":2,\"active_iterations\":2,\"torch_profiler_with_stack\":false}"
51+
PROFILER_CONFIG="{\"profiler\":\"torch\",\"torch_profiler_dir\":\"${VLLM_TORCH_PROFILER_DIR:-/workspace/}\",\"ignore_frontend\":true,\"delay_iterations\":1,\"max_iterations\":3,\"active_iterations\":3,\"torch_profiler_with_stack\":false}"
52 52
fi
53 53
PROFILE_ARGS=(
54 54
--profiler-config

0 commit comments

Comments
 (0)