diff --git a/.github/workflows/scripts/build.sh b/.github/workflows/scripts/build.sh
index 2578d448436d2..ed200fe724d3e 100644
--- a/.github/workflows/scripts/build.sh
+++ b/.github/workflows/scripts/build.sh
@@ -15,6 +15,7 @@ $python_executable -m pip install -r requirements.txt
 export MAX_JOBS=1
 # Make sure punica is built for the release (for LoRA)
 export VLLM_INSTALL_PUNICA_KERNELS=1
-
+# Make sure release wheels are built for the following architectures
+export TORCH_CUDA_ARCH_LIST="7.0 7.5 8.0 8.6 8.9 9.0+PTX"
 # Build
 $python_executable setup.py bdist_wheel --dist-dir=dist