File tree Expand file tree Collapse file tree 4 files changed +50
-19
lines changed
Expand file tree Collapse file tree 4 files changed +50
-19
lines changed Original file line number Diff line number Diff line change 22 # -----------------------------------------------------------------
33 # TEST STEPS - Calling wrapper
44 # -----------------------------------------------------------------
5- - label : " Wait for 20 mins"
6- if : build.env("NIGHTLY") == "1"
7- key : " wait_20_minutes"
8- depends_on : " record_verified_commit_hashes"
9- agents :
10- queue : cpu
11- commands :
12- - " echo 'Starting 20 minute delay...'"
13- - " sleep 1200"
14- - " echo 'Delay finished, starting benchmarks.'"
15-
165 - label : " Performance benchmarks for meta-llama/Llama-3.1-8B-Instruct"
176 key : " meta-llama_Llama-3_1-8B-Instruct_Benchmark"
18- if : build.env("NIGHTLY") == "1"
19- depends_on : " wait_20_minutes "
7+ # if: build.env("NIGHTLY") == "1"
8+ depends_on : " record_verified_commit_hashes "
209 agents :
2110 queue : tpu_v6e_queue
2211 env :
3423 .buildkite/scripts/run_with_pypi.sh bash /workspace/tpu_inference/tests/e2e/benchmarking/benchmark.sh
3524
3625 - label : " Performance benchmarks for Qwen/Qwen3-4B"
37- if : build.env("NIGHTLY") == "1"
26+ # if: build.env("NIGHTLY") == "1"
3827 key : " Qwen_Qwen3-4B_Benchmark"
39- depends_on : " wait_20_minutes "
28+ depends_on : " record_verified_commit_hashes "
4029 agents :
4130 queue : tpu_v6e_queue
4231 env :
Original file line number Diff line number Diff line change @@ -24,11 +24,11 @@ upload_pipeline() {
2424 VLLM_COMMIT_HASH=$( git ls-remote https://github.com/vllm-project/vllm.git HEAD | awk ' { print $1}' )
2525 buildkite-agent meta-data set " VLLM_COMMIT_HASH" " ${VLLM_COMMIT_HASH} "
2626 echo " Using vllm commit hash: $( buildkite-agent meta-data get " VLLM_COMMIT_HASH" ) "
27- buildkite-agent pipeline upload .buildkite/pipeline_jax.yml
28- buildkite-agent pipeline upload .buildkite/pipeline_jax_tpu7x.yml
27+ # buildkite-agent pipeline upload .buildkite/pipeline_jax.yml
28+ # buildkite-agent pipeline upload .buildkite/pipeline_jax_tpu7x.yml
2929 # buildkite-agent pipeline upload .buildkite/pipeline_torch.yml
3030 buildkite-agent pipeline upload .buildkite/main.yml
31- buildkite-agent pipeline upload .buildkite/nightly_releases.yml
31+ # buildkite-agent pipeline upload .buildkite/nightly_releases.yml
3232 buildkite-agent pipeline upload .buildkite/pipeline_pypi.yml
3333}
3434
Original file line number Diff line number Diff line change 22# Exit on error, exit on unset variable, fail on pipe errors.
33set -euo pipefail
44
5+ # Get the nightly TPU_INFERENCE_VERSION based on the latest stable tag and current date.
6+ LATEST_STABLE_TAG=$( git tag --sort=-v:refname | grep -E ' ^v[0-9]+\.[0-9]+\.[0-9]+$' | head -n 1)
7+ BASE_VERSION=${LATEST_STABLE_TAG# v}
8+ # TODO: Temporary logic for testing. Remove 'yesterday' before merging.
9+ DATETIME_STR=$( date -d ' yesterday' +%Y%m%d)
10+ TPU_INFERENCE_VERSION=" ${BASE_VERSION} .dev${DATETIME_STR} "
11+
12+ echo " Target Nightly Version: ${TPU_INFERENCE_VERSION} "
13+
14+ # Configuration
15+ PACKAGE_NAME=" tpu-inference"
16+ MAX_RETRIES=20
17+ SLEEP_SEC=60
18+ FOUND_VERSION=false
19+
20+ echo " Checking PyPI for ${PACKAGE_NAME} == ${TPU_INFERENCE_VERSION} ..."
21+
22+ # Retry logic to check if the version is available on PyPI
23+ for (( i= 1 ; i<= MAX_RETRIES; i++ )) ; do
24+ if pip index versions " ${PACKAGE_NAME} " --pre 2> /dev/null | grep -q " ${TPU_INFERENCE_VERSION} " ; then
25+ echo " Success! Found version ${TPU_INFERENCE_VERSION} on PyPI."
26+ FOUND_VERSION=true
27+ break
28+ fi
29+
30+ echo " [Attempt $i /$MAX_RETRIES ] Version not found yet. Waiting ${SLEEP_SEC} seconds..."
31+ if [ " $i " -lt " $MAX_RETRIES " ]; then
32+ sleep " $SLEEP_SEC "
33+ fi
34+ done
35+
36+ if [ " $FOUND_VERSION " = " false" ]; then
37+ echo " The version ${TPU_INFERENCE_VERSION} was not found on PyPI."
38+ exit 1
39+ fi
40+
541# Build vllm-tpu with nightly tpu-inference from PyPI (using docker/Dockerfile.pypi instead of docker/Dockerfile).
642export RUN_WITH_PYPI=" true"
743SCRIPT_DIR=$( cd -- " $( dirname -- " ${BASH_SOURCE[0]} " ) " & > /dev/null && pwd)
Original file line number Diff line number Diff line change @@ -5,6 +5,8 @@ ARG VLLM_COMMIT_HASH=""
55
66FROM $BASE_IMAGE
77
8+ ARG IS_FOR_V7X="false"
9+
810# Remove existing versions of dependencies
911RUN pip uninstall -y torch torch_xla torchvision
1012
@@ -17,7 +19,11 @@ RUN apt-get update && apt-get install -y \
1719WORKDIR /workspace/tpu_inference
1820COPY requirements_benchmarking.txt .
1921# These are needed for the E2E benchmarking tests (i.e. tests/e2e/benchmarking/mlperf.sh)
20- RUN pip install -r requirements_benchmarking.txt --retries 3
22+ RUN --mount=type=cache,target=/root/.cache/pip pip install -r requirements_benchmarking.txt --retries 3
23+ COPY requirements_v7x.txt .
24+ RUN --mount=type=cache,target=/root/.cache/pip if [ "$IS_FOR_V7X" = "true" ]; then \
25+ pip install -r requirements_v7x.txt; \
26+ fi
2127COPY . .
2228
2329# Build vllm-tpu wheel
You can’t perform that action at this time.
0 commit comments