Upgrade to CUDA 12 (#1527)
Co-authored-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
This commit is contained in:
parent
1a2bbc9301
commit
06458a0b42
8
.github/workflows/publish.yml
vendored
8
.github/workflows/publish.yml
vendored
@@ -43,14 +43,14 @@ jobs:
|
|||||||
name: Build Wheel
|
name: Build Wheel
|
||||||
runs-on: ${{ matrix.os }}
|
runs-on: ${{ matrix.os }}
|
||||||
needs: release
|
needs: release
|
||||||
|
|
||||||
strategy:
|
strategy:
|
||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
os: ['ubuntu-20.04']
|
os: ['ubuntu-20.04']
|
||||||
python-version: ['3.8', '3.9', '3.10', '3.11']
|
python-version: ['3.8', '3.9', '3.10', '3.11']
|
||||||
pytorch-version: ['2.0.1']
|
pytorch-version: ['2.1.0']
|
||||||
cuda-version: ['11.8'] # Github runner can't build anything older than 11.8
|
cuda-version: ['12.1']
|
||||||
|
|
||||||
steps:
|
steps:
|
||||||
- name: Checkout
|
- name: Checkout
|
||||||
@@ -82,7 +82,7 @@ jobs:
|
|||||||
asset_name=${wheel_name//"linux"/"manylinux1"}
|
asset_name=${wheel_name//"linux"/"manylinux1"}
|
||||||
echo "wheel_name=${wheel_name}" >> $GITHUB_ENV
|
echo "wheel_name=${wheel_name}" >> $GITHUB_ENV
|
||||||
echo "asset_name=${asset_name}" >> $GITHUB_ENV
|
echo "asset_name=${asset_name}" >> $GITHUB_ENV
|
||||||
|
|
||||||
- name: Upload Release Asset
|
- name: Upload Release Asset
|
||||||
uses: actions/upload-release-asset@v1
|
uses: actions/upload-release-asset@v1
|
||||||
env:
|
env:
|
||||||
|
|||||||
3
.github/workflows/scripts/build.sh
vendored
3
.github/workflows/scripts/build.sh
vendored
@@ -11,5 +11,8 @@ LD_LIBRARY_PATH=${cuda_home}/lib64:$LD_LIBRARY_PATH
|
|||||||
$python_executable -m pip install wheel packaging
|
$python_executable -m pip install wheel packaging
|
||||||
$python_executable -m pip install -r requirements.txt
|
$python_executable -m pip install -r requirements.txt
|
||||||
|
|
||||||
|
# Limit the number of parallel jobs to avoid OOM
|
||||||
|
export MAX_JOBS=1
|
||||||
|
|
||||||
# Build
|
# Build
|
||||||
$python_executable setup.py bdist_wheel --dist-dir=dist
|
$python_executable setup.py bdist_wheel --dist-dir=dist
|
||||||
|
|||||||
5
.github/workflows/scripts/cuda-install.sh
vendored
5
.github/workflows/scripts/cuda-install.sh
vendored
@@ -16,3 +16,8 @@ sudo apt clean
|
|||||||
# Test nvcc
|
# Test nvcc
|
||||||
PATH=/usr/local/cuda-$1/bin:${PATH}
|
PATH=/usr/local/cuda-$1/bin:${PATH}
|
||||||
nvcc --version
|
nvcc --version
|
||||||
|
|
||||||
|
# Log gcc, g++, c++ versions
|
||||||
|
gcc --version
|
||||||
|
g++ --version
|
||||||
|
c++ --version
|
||||||
|
|||||||
@@ -3,7 +3,7 @@ requires = [
|
|||||||
"ninja",
|
"ninja",
|
||||||
"packaging",
|
"packaging",
|
||||||
"setuptools",
|
"setuptools",
|
||||||
"torch == 2.0.1",
|
"torch >= 2.1.0",
|
||||||
"wheel",
|
"wheel",
|
||||||
]
|
]
|
||||||
build-backend = "setuptools.build_meta"
|
build-backend = "setuptools.build_meta"
|
||||||
|
|||||||
@@ -5,9 +5,9 @@ pandas # Required for Ray data.
|
|||||||
pyarrow # Required for Ray data.
|
pyarrow # Required for Ray data.
|
||||||
sentencepiece # Required for LLaMA tokenizer.
|
sentencepiece # Required for LLaMA tokenizer.
|
||||||
numpy
|
numpy
|
||||||
torch == 2.0.1
|
torch >= 2.1.0
|
||||||
transformers >= 4.34.0 # Required for Mistral.
|
transformers >= 4.34.0 # Required for Mistral.
|
||||||
xformers == 0.0.22 # Required for Mistral.
|
xformers >= 0.0.22.post7 # Required for CUDA 12.1.
|
||||||
fastapi
|
fastapi
|
||||||
uvicorn[standard]
|
uvicorn[standard]
|
||||||
pydantic == 1.10.13 # Required for OpenAI server.
|
pydantic == 1.10.13 # Required for OpenAI server.
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user