Upgrade to CUDA 12 (#1527)

Co-authored-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>

Upgrade to CUDA 12 (#1527)
Co-authored-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
06458a0b · Zhuohan Li · GitHub · 1a2bbc93 · 06458a0b · 06458a0b
Unverified commit 06458a0b, authored Nov 08, 2023 by Zhuohan Li; committed by GitHub on Nov 08, 2023
5 changed files
--- a/.github/workflows/publish.yml
+++ b/.github/workflows/publish.yml
@@ -49,8 +49,8 @@ jobs:
      matrix:
          os: ['ubuntu-20.04']
          python-version: ['3.8', '3.9', '3.10', '3.11']
-          pytorch-version: ['2.0.1']
+          pytorch-version: ['2.1.0']
-          cuda-version: ['11.8'] # Github runner can't build anything older than 11.8
+          cuda-version: ['12.1']
    steps:
      - name: Checkout

--- a/.github/workflows/scripts/build.sh
+++ b/.github/workflows/scripts/build.sh
@@ -11,5 +11,8 @@ LD_LIBRARY_PATH=${cuda_home}/lib64:$LD_LIBRARY_PATH
 $python_executable -m pip install wheel packaging
 $python_executable -m pip install -r requirements.txt
+# Limit the number of parallel jobs to avoid OOM
+export MAX_JOBS=1
 # Build
 $python_executable setup.py bdist_wheel --dist-dir=dist
--- a/.github/workflows/scripts/cuda-install.sh
+++ b/.github/workflows/scripts/cuda-install.sh
@@ -16,3 +16,8 @@ sudo apt clean
 # Test nvcc
 PATH=/usr/local/cuda-$1/bin:${PATH}
 nvcc --version
+# Log gcc, g++, c++ versions
+gcc --version
+g++ --version
+c++ --version
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -3,7 +3,7 @@ requires = [
    "ninja",
    "packaging",
    "setuptools",
-    "torch == 2.0.1",
+    "torch >= 2.1.0",
    "wheel",
 ]
 build-backend = "setuptools.build_meta"
--- a/requirements.txt
+++ b/requirements.txt
@@ -5,9 +5,9 @@ pandas  # Required for Ray data.
 pyarrow  # Required for Ray data.
 sentencepiece  # Required for LLaMA tokenizer.
 numpy
-torch == 2.0.1
+torch >= 2.1.0
 transformers >= 4.34.0  # Required for Mistral.
-xformers == 0.0.22  # Required for Mistral.
+xformers >= 0.0.22.post7  # Required for CUDA 12.1.
 fastapi
 uvicorn[standard]
 pydantic == 1.10.13  # Required for OpenAI server.