Skip to content

Commit e538dad

Browse files
committed
Add some CUDA fixes on devgpu
1 parent 5ac18e3 commit e538dad

File tree

2 files changed: 4 additions (+4) and 2 deletions (-2).

Diff for: vllm-benchmarks/cron.sh

+1
Unified diff (original and new line numbers are given by the hunk header):
@@ -73,6 +73,7 @@ fi

 while :
 do
+/usr/local/bin/fixmyserver || true
 pull_vllm
 run_benchmarks
 sleep 300

Diff for: vllm-benchmarks/run.sh

+3 -2
Unified diff (original and new line numbers are given by the hunk headers):
@@ -42,7 +42,8 @@ build_vllm() {
 # Build and install vLLM
 if command -v nvidia-smi; then
 pip install -r requirements/build.txt
-pip install --editable .
+# TODO (huydhn): https://github.com/vllm-project/vllm/issues/15435
+TORCH_CUDA_ARCH_LIST=8.0 pip install --editable .
 elif command -v amd-smi; then
 pip install -r requirements/rocm.txt
 pip install -r requirements/rocm-build.txt
@@ -61,7 +62,7 @@ run_benchmark() {
 export no_proxy=".fbcdn.net,.facebook.com,.thefacebook.com,.tfbnw.net,.fb.com,.fb,localhost,127.0.0.1"
 fi

-ENGINE_VERSION=v1 SAVE_TO_PYTORCH_BENCHMARK_FORMAT=1 \
+ENGINE_VERSION=v1 SAVE_TO_PYTORCH_BENCHMARK_FORMAT=1 CUDA_VISIBLE_DEVICES=4,5,6,7 \
 bash .buildkite/nightly-benchmarks/scripts/run-performance-benchmarks.sh > benchmarks.log 2>&1
 popd
 }

0 commit comments

Comments
 (0)