File tree Expand file tree Collapse file tree 2 files changed +4
-17
lines changed
Expand file tree Collapse file tree 2 files changed +4
-17
lines changed Original file line number Diff line number Diff line change 44 # -----------------------------------------------------------------
55 - label : "Performance benchmarks for meta-llama/Llama-3.1-8B-Instruct"
66 key : "meta-llama_Llama-3_1-8B-Instruct_Benchmark"
7- soft_fail : true
87 agents :
98 queue : tpu_v6e_queue
109 env :
1918 MAX_NUM_BATCHED_TOKENS : 1024
2019 commands :
2120 - |
22- .buildkite/scripts/run_with_pypi.sh bash /usr/local/lib/python3.12/site-packages/tpu_inference/tests/e2e/benchmarking/benchmark.sh
21+ .buildkite/scripts/run_with_pypi.sh bash /workspace/tpu_inference/tests/e2e/benchmarking/benchmark.sh
2322
2423 - label : "Performance benchmarks for Qwen/Qwen3-4B"
2524 key : "Qwen_Qwen3-4B_Benchmark"
3736 MAX_NUM_BATCHED_TOKENS : 4096
3837 commands :
3938 - |
40- .buildkite/scripts/run_with_pypi.sh bash /usr/local/lib/python3.12/site-packages/tpu_inference/tests/e2e/benchmarking/benchmark.sh
39+ .buildkite/scripts/run_with_pypi.sh bash /workspace/tpu_inference/tests/e2e/benchmarking/benchmark.sh
Original file line number Diff line number Diff line change @@ -17,26 +17,14 @@ COPY . .
1717RUN export TPU_INFERENCE_VERSION=$(pip index versions tpu-inference --pre 2>/dev/null | grep -oE "[0-9]+\.[0-9]+\.[0-9]+\.dev[0-9]+" | head -n 1) && \
1818 echo -n "${TPU_INFERENCE_VERSION}" > /tmp/tpu_inference_version
1919
20- # Clone vLLM
20+ # Build vllm-tpu wheel
2121WORKDIR /workspace
2222RUN export VLLM_TPU_VERSION=$(cat /tmp/tpu_inference_version) && \
2323 bash tpu_inference/.buildkite/scripts/build_vllm_tpu.sh ${VLLM_TPU_VERSION} ${VLLM_TPU_VERSION}
2424
25- # Install vllm-tpu from whl
25+ # Install vllm-tpu wheel
2626WORKDIR /workspace/vllm
2727RUN pip install --no-cache-dir dist/*.whl
2828
29- # Install test dependencies
30- RUN python3 -m pip install tests/vllm_test_utils
31- RUN python3 -m pip install --no-cache-dir \
32- git+https://github.com/thuml/depyf.git \
33- pytest-asyncio \
34- git+https://github.com/EleutherAI/lm-evaluation-harness.git@206b7722158f58c35b7ffcd53b035fdbdda5126d#egg=lm-eval[api] \
35- pytest-cov \
36- tblib
37-
38- # Remove repository
39- WORKDIR /workspace
40- RUN rm -rf /workspace/vllm /workspace/tpu_inference
4129
4230CMD ["/bin/bash"]
You can’t perform that action at this time.
0 commit comments