@@ -949,13 +949,13 @@ install_agentic_deps() {
949949build_replay_cmd () {
950950 # aiperf invocation for the inferencex-agentx-mvp scenario.
951951 #
952- # Weka pre-canned assistant mode is the default
953- # (AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES=0): the loader emits
954- # reconstructed assistant segments from the trace and AIPerf discards
955- # the server's live response for future prompt construction. This keeps
956- # reset_context payloads self-contained and preserves hash-id fidelity.
957- # Set AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES=1 explicitly to test
958- # live-response threading.
952+ # Live-assistant mode is the default
953+ # (AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES=1): the loader emits
954+ # user-only deltas and the worker threads the server's live assistant
955+ # response back into the session. Set
956+ # AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES=0 explicitly to compare
957+ # against pre-canned assistant replay, where the server response is
958+ # discarded for future prompt construction.
959959 #
960960 # The scenario plugin locks: --cache-bust first_turn_prefix and
961961 # --trace-idle-gap-cap-seconds 60 (per-trace idle-gap compression
@@ -966,7 +966,7 @@ build_replay_cmd() {
966966 local result_dir=" $1 "
967967 local duration=" ${DURATION:- 1800} "
968968
969- export AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES=" ${AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES:- 0 } "
969+ export AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES=" ${AIPERF_DATASET_WEKA_LIVE_ASSISTANT_RESPONSES:- 1 } "
970970 # Dataset configuration (load + reconstruct + inputs.json + mmap)
971971 # routinely takes 4-5 min for the 949-trace weka corpus on fast /tmp
972972 # (B300) but can stretch to 14 min on slower /tmp + parallel contention
0 commit comments