Skip to content

Commit 3c1e18f

Browse files
author
Ylang Tsou
committed
benchmark.sh with 2 repo
Signed-off-by: Ylang Tsou <ylangt@google.com>
1 parent c3dc998 commit 3c1e18f

File tree

2 files changed

+4
-17
lines changed

2 files changed

+4
-17
lines changed

.buildkite/pipeline_test_pypi.yml

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,6 @@ steps:
44
# -----------------------------------------------------------------
55
- label: "Performance benchmarks for meta-llama/Llama-3.1-8B-Instruct"
66
key: "meta-llama_Llama-3_1-8B-Instruct_Benchmark"
7-
soft_fail: true
87
agents:
98
queue: tpu_v6e_queue
109
env:
@@ -19,7 +18,7 @@ steps:
1918
MAX_NUM_BATCHED_TOKENS: 1024
2019
commands:
2120
- |
22-
.buildkite/scripts/run_with_pypi.sh bash /usr/local/lib/python3.12/site-packages/tpu_inference/tests/e2e/benchmarking/benchmark.sh
21+
.buildkite/scripts/run_with_pypi.sh bash /workspace/tpu_inference/tests/e2e/benchmarking/benchmark.sh
2322
2423
- label: "Performance benchmarks for Qwen/Qwen3-4B"
2524
key: "Qwen_Qwen3-4B_Benchmark"
@@ -37,4 +36,4 @@ steps:
3736
MAX_NUM_BATCHED_TOKENS: 4096
3837
commands:
3938
- |
40-
.buildkite/scripts/run_with_pypi.sh bash /usr/local/lib/python3.12/site-packages/tpu_inference/tests/e2e/benchmarking/benchmark.sh
39+
.buildkite/scripts/run_with_pypi.sh bash /workspace/tpu_inference/tests/e2e/benchmarking/benchmark.sh

docker/Dockerfile.pypi

Lines changed: 2 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -17,26 +17,14 @@ COPY . .
1717
RUN export TPU_INFERENCE_VERSION=$(pip index versions tpu-inference --pre 2>/dev/null | grep -oE "[0-9]+\.[0-9]+\.[0-9]+\.dev[0-9]+" | head -n 1) && \
1818
echo -n "${TPU_INFERENCE_VERSION}" > /tmp/tpu_inference_version
1919

20-
# Clone vLLM
20+
# Build vllm-tpu wheel
2121
WORKDIR /workspace
2222
RUN export VLLM_TPU_VERSION=$(cat /tmp/tpu_inference_version) && \
2323
bash tpu_inference/.buildkite/scripts/build_vllm_tpu.sh ${VLLM_TPU_VERSION} ${VLLM_TPU_VERSION}
2424

25-
# Install vllm-tpu from whl
25+
# Install vllm-tpu wheel
2626
WORKDIR /workspace/vllm
2727
RUN pip install --no-cache-dir dist/*.whl
2828

29-
# Install test dependencies
30-
RUN python3 -m pip install tests/vllm_test_utils
31-
RUN python3 -m pip install --no-cache-dir \
32-
git+https://github.com/thuml/depyf.git \
33-
pytest-asyncio \
34-
git+https://github.com/EleutherAI/lm-evaluation-harness.git@206b7722158f58c35b7ffcd53b035fdbdda5126d#egg=lm-eval[api] \
35-
pytest-cov \
36-
tblib
37-
38-
# Remove repository
39-
WORKDIR /workspace
40-
RUN rm -rf /workspace/vllm /workspace/tpu_inference
4129

4230
CMD ["/bin/bash"]

0 commit comments

Comments
 (0)