Upgrade to CUDA 12 (#1527)

Co-authored-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
This commit is contained in:
Zhuohan Li 2023-11-08 14:17:49 -08:00 committed by GitHub
parent 1a2bbc9301
commit 06458a0b42
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
5 changed files with 15 additions and 7 deletions

View File

@@ -49,8 +49,8 @@ jobs:
 matrix:
 os: ['ubuntu-20.04']
 python-version: ['3.8', '3.9', '3.10', '3.11']
-pytorch-version: ['2.0.1']
-cuda-version: ['11.8'] # Github runner can't build anything older than 11.8
+pytorch-version: ['2.1.0']
+cuda-version: ['12.1']
 steps:
 - name: Checkout

View File

@@ -11,5 +11,8 @@ LD_LIBRARY_PATH=${cuda_home}/lib64:$LD_LIBRARY_PATH
 $python_executable -m pip install wheel packaging
 $python_executable -m pip install -r requirements.txt
+# Limit the number of parallel jobs to avoid OOM
+export MAX_JOBS=1
 # Build
 $python_executable setup.py bdist_wheel --dist-dir=dist

View File

@@ -16,3 +16,8 @@ sudo apt clean
 # Test nvcc
 PATH=/usr/local/cuda-$1/bin:${PATH}
 nvcc --version
+# Log gcc, g++, c++ versions
+gcc --version
+g++ --version
+c++ --version

View File

@@ -3,7 +3,7 @@ requires = [
 "ninja",
 "packaging",
 "setuptools",
-"torch == 2.0.1",
+"torch >= 2.1.0",
 "wheel",
 ]
 build-backend = "setuptools.build_meta"

View File

@@ -5,9 +5,9 @@ pandas # Required for Ray data.
 pyarrow # Required for Ray data.
 sentencepiece # Required for LLaMA tokenizer.
 numpy
-torch == 2.0.1
+torch >= 2.1.0
 transformers >= 4.34.0 # Required for Mistral.
-xformers == 0.0.22 # Required for Mistral.
+xformers >= 0.0.22.post7 # Required for CUDA 12.1.
 fastapi
 uvicorn[standard]
 pydantic == 1.10.13 # Required for OpenAI server.