@@ -951,13 +951,12 @@ install_agentic_deps() {
951951build_replay_cmd () {
952952 # aiperf invocation for the inferencex-agentx-mvp scenario.
953953 #
954- # Live-assistant mode is the default
955- # (AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES=1): the loader emits
956- # user-only deltas and the worker threads the server's live assistant
957- # response back into the session. Set
958- # AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES=0 explicitly to compare
959- # against pre-canned assistant replay, where the server response is
960- # discarded for future prompt construction.
954+ # Pre-canned assistant replay is the default: recorded assistant responses
955+ # are used for future prompt construction, and live server responses are
956+ # discarded. Set AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES=1 explicitly
957+ # to use live-assistant mode, where the loader emits user-only deltas and
958+ # the worker threads the server's live assistant response back into the
959+ # session.
961960 #
962961 # The scenario plugin locks: --cache-bust first_turn_prefix and
963962 # --trace-idle-gap-cap-seconds 60 (per-trace idle-gap compression
@@ -968,7 +967,7 @@ build_replay_cmd() {
968967 local result_dir=" $1 "
969968 local duration=" ${DURATION:- 1800} "
970969
971- export AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES=" ${AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES:- 1 } "
970+ export AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES=" ${AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES:- 0 } "
972971 # Dataset configuration (load + reconstruct + inputs.json + mmap)
973972 # routinely takes 4-5 min for the 949-trace weka corpus on fast /tmp
974973 # (B300) but can stretch to 14 min on slower /tmp + parallel contention
0 commit comments