Skip to content

Commit 4be3ef0

Browse files
committed
fix(agentx): re-enable weka live assistant replay
1 parent 967c50c commit 4be3ef0

2 files changed

Lines changed: 9 additions & 9 deletions

File tree

benchmarks/benchmark_lib.sh

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -949,13 +949,13 @@ install_agentic_deps() {
949949
build_replay_cmd() {
950950
# aiperf invocation for the inferencex-agentx-mvp scenario.
951951
#
952-
# Weka pre-canned assistant mode is the default
953-
# (AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES=0): the loader emits
954-
# reconstructed assistant segments from the trace and AIPerf discards
955-
# the server's live response for future prompt construction. This keeps
956-
# reset_context payloads self-contained and preserves hash-id fidelity.
957-
# Set AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES=1 explicitly to test
958-
# live-response threading.
952+
# Live-assistant mode is the default
953+
# (AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES=1): the loader emits
954+
# user-only deltas and the worker threads the server's live assistant
955+
# response back into the session. Set
956+
# AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES=0 explicitly to compare
957+
# against pre-canned assistant replay, where the server response is
958+
# discarded for future prompt construction.
959959
#
960960
# The scenario plugin locks: --cache-bust first_turn_prefix and
961961
# --trace-idle-gap-cap-seconds 60 (per-trace idle-gap compression
@@ -966,7 +966,7 @@ build_replay_cmd() {
966966
local result_dir="$1"
967967
local duration="${DURATION:-1800}"
968968

969-
export AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES="${AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES:-0}"
969+
export AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES="${AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES:-1}"
970970
# Dataset configuration (load + reconstruct + inputs.json + mmap)
971971
# routinely takes 4-5 min for the 949-trace weka corpus on fast /tmp
972972
# (B300) but can stretch to 14 min on slower /tmp + parallel contention

0 commit comments

Comments
 (0)