@@ -904,14 +904,14 @@ ensure_hf_cli() {
904904}
905905
906906resolve_trace_source () {
907- local dataset=" semianalysisai/cc-traces-weka-with-subagents-051926 "
907+ local dataset=" semianalysisai/cc-traces-weka-with-subagents-052726 "
908908 # aiperf reads the corpus via its public-dataset registry. The
909909 # inferencex-agentx-mvp scenario hard-requires loader=one of
910910 # ['semianalysis_cc_traces_weka_with_subagents', 'weka_trace'] (see
911911 # aiperf src/aiperf/common/scenario/inferencex_agentx_mvp.py's
912912 # `require_loader`). The with-subagents corpus captures the parent +
913913 # Task-tool sub-agent fan-out structure of real Claude Code sessions
914- # (219 traces, v5-only, CC >= 2.1.139, classifier-call OSL spike
914+ # (472 traces, v5-only, CC >= 2.1.139, classifier-call OSL spike
915915 # filtered).
916916 TRACE_SOURCE_FLAG=" --public-dataset semianalysis_cc_traces_weka_with_subagents"
917917 echo " Loading traces via aiperf public-dataset: semianalysis_cc_traces_weka_with_subagents ($dataset )"
@@ -969,7 +969,7 @@ build_replay_cmd() {
969969
970970 export AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES=" ${AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES:- 0} "
971971 # Dataset configuration (load + reconstruct + inputs.json + mmap)
972- # routinely takes 4-5 min for the 949-trace weka corpus on fast /tmp
972+ # routinely takes 4-5 min for the Weka corpus on fast /tmp
973973 # (B300) but can stretch to 14 min on slower /tmp + parallel contention
974974 # (observed on H200 where all 14 R3 jobs hit aiperf's 900s Configure
975975 # Profiling timeout simultaneously). Bump to 1800s to absorb 3x
@@ -1019,11 +1019,11 @@ build_replay_cmd() {
10191019 if [ -n " ${MAX_MODEL_LEN:- } " ] && [ " $MAX_MODEL_LEN " != " 0" ]; then
10201020 REPLAY_CMD+=" --max-context-length $MAX_MODEL_LEN "
10211021 fi
1022- # Default --num-dataset-entries is 100; the with-subagents weka corpus
1023- # has 219 . Cap at 219 so all unique traces are loaded (the loader treats
1022+ # Default --num-dataset-entries is 100; the with-subagents Weka corpus
1023+ # has 472 . Cap at 472 so all unique traces are loaded (the loader treats
10241024 # this as a ``min(cap, available)`` ceiling, not a target — see
10251025 # semianalysis_cc_traces_weka.py).
1026- REPLAY_CMD+=" --num-dataset-entries 219 "
1026+ REPLAY_CMD+=" --num-dataset-entries 472 "
10271027 # 1-second timeslices on the server-metrics scrape so the post-run
10281028 # plotter has per-window time series (KV usage, cache hit rate,
10291029 # throughput, etc.). Matches kv-cache-tester's poll_interval=1.0
0 commit comments