Unverified commit 06458a0b, authored by Zhuohan Li and committed by GitHub
Browse files

Upgrade to CUDA 12 (#1527)


Co-authored-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
parent 1a2bbc93
...@@ -49,8 +49,8 @@ jobs: ...@@ -49,8 +49,8 @@ jobs:
matrix: matrix:
os: ['ubuntu-20.04'] os: ['ubuntu-20.04']
python-version: ['3.8', '3.9', '3.10', '3.11'] python-version: ['3.8', '3.9', '3.10', '3.11']
pytorch-version: ['2.0.1'] pytorch-version: ['2.1.0']
cuda-version: ['11.8'] # Github runner can't build anything older than 11.8 cuda-version: ['12.1']
steps: steps:
- name: Checkout - name: Checkout
......
...@@ -11,5 +11,8 @@ LD_LIBRARY_PATH=${cuda_home}/lib64:$LD_LIBRARY_PATH ...@@ -11,5 +11,8 @@ LD_LIBRARY_PATH=${cuda_home}/lib64:$LD_LIBRARY_PATH
$python_executable -m pip install wheel packaging $python_executable -m pip install wheel packaging
$python_executable -m pip install -r requirements.txt $python_executable -m pip install -r requirements.txt
# Limit the number of parallel jobs to avoid OOM
export MAX_JOBS=1
# Build # Build
$python_executable setup.py bdist_wheel --dist-dir=dist $python_executable setup.py bdist_wheel --dist-dir=dist
...@@ -16,3 +16,8 @@ sudo apt clean ...@@ -16,3 +16,8 @@ sudo apt clean
# Test nvcc # Test nvcc
PATH=/usr/local/cuda-$1/bin:${PATH} PATH=/usr/local/cuda-$1/bin:${PATH}
nvcc --version nvcc --version
# Log gcc, g++, c++ versions
gcc --version
g++ --version
c++ --version
...@@ -3,7 +3,7 @@ requires = [ ...@@ -3,7 +3,7 @@ requires = [
"ninja", "ninja",
"packaging", "packaging",
"setuptools", "setuptools",
"torch == 2.0.1", "torch >= 2.1.0",
"wheel", "wheel",
] ]
build-backend = "setuptools.build_meta" build-backend = "setuptools.build_meta"
...@@ -5,9 +5,9 @@ pandas # Required for Ray data. ...@@ -5,9 +5,9 @@ pandas # Required for Ray data.
pyarrow # Required for Ray data. pyarrow # Required for Ray data.
sentencepiece # Required for LLaMA tokenizer. sentencepiece # Required for LLaMA tokenizer.
numpy numpy
torch == 2.0.1 torch >= 2.1.0
transformers >= 4.34.0 # Required for Mistral. transformers >= 4.34.0 # Required for Mistral.
xformers == 0.0.22 # Required for Mistral. xformers >= 0.0.22.post7 # Required for CUDA 12.1.
fastapi fastapi
uvicorn[standard] uvicorn[standard]
pydantic == 1.10.13 # Required for OpenAI server. pydantic == 1.10.13 # Required for OpenAI server.
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment