Skip to content

Commit 711cb85

Browse files
committed
chore: update agentx weka dataset
1 parent 049a873 commit 711cb85

2 files changed

Lines changed: 7 additions & 7 deletions

File tree

benchmarks/benchmark_lib.sh

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -904,14 +904,14 @@ ensure_hf_cli() {
904904
}
905905

906906
resolve_trace_source() {
907-
local dataset="semianalysisai/cc-traces-weka-with-subagents-051926"
907+
local dataset="semianalysisai/cc-traces-weka-with-subagents-052726"
908908
# aiperf reads the corpus via its public-dataset registry. The
909909
# inferencex-agentx-mvp scenario hard-requires loader=one of
910910
# ['semianalysis_cc_traces_weka_with_subagents', 'weka_trace'] (see
911911
# aiperf src/aiperf/common/scenario/inferencex_agentx_mvp.py's
912912
# `require_loader`). The with-subagents corpus captures the parent +
913913
# Task-tool sub-agent fan-out structure of real Claude Code sessions
914-
# (219 traces, v5-only, CC >= 2.1.139, classifier-call OSL spike
914+
# (472 traces, v5-only, CC >= 2.1.139, classifier-call OSL spike
915915
# filtered).
916916
TRACE_SOURCE_FLAG="--public-dataset semianalysis_cc_traces_weka_with_subagents"
917917
echo "Loading traces via aiperf public-dataset: semianalysis_cc_traces_weka_with_subagents ($dataset)"
@@ -969,7 +969,7 @@ build_replay_cmd() {
969969

970970
export AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES="${AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES:-0}"
971971
# Dataset configuration (load + reconstruct + inputs.json + mmap)
972-
# routinely takes 4-5 min for the 949-trace weka corpus on fast /tmp
972+
# routinely takes 4-5 min for the Weka corpus on fast /tmp
973973
# (B300) but can stretch to 14 min on slower /tmp + parallel contention
974974
# (observed on H200 where all 14 R3 jobs hit aiperf's 900s Configure
975975
# Profiling timeout simultaneously). Bump to 1800s to absorb 3x
@@ -1019,11 +1019,11 @@ build_replay_cmd() {
10191019
if [ -n "${MAX_MODEL_LEN:-}" ] && [ "$MAX_MODEL_LEN" != "0" ]; then
10201020
REPLAY_CMD+=" --max-context-length $MAX_MODEL_LEN"
10211021
fi
1022-
# Default --num-dataset-entries is 100; the with-subagents weka corpus
1023-
# has 219. Cap at 219 so all unique traces are loaded (the loader treats
1022+
# Default --num-dataset-entries is 100; the with-subagents Weka corpus
1023+
# has 472. Cap at 472 so all unique traces are loaded (the loader treats
10241024
# this as a ``min(cap, available)`` ceiling, not a target — see
10251025
# semianalysis_cc_traces_weka.py).
1026-
REPLAY_CMD+=" --num-dataset-entries 219"
1026+
REPLAY_CMD+=" --num-dataset-entries 472"
10271027
# 1-second timeslices on the server-metrics scrape so the post-run
10281028
# plotter has per-window time series (KV usage, cache hit rate,
10291029
# throughput, etc.). Matches kv-cache-tester's poll_interval=1.0

0 commit comments

Comments
 (0)