Upgrade the release wheel build to PyTorch 2.1.0 / CUDA 12.1.

* publish.yml: build wheels against PyTorch 2.1.0 and CUDA 12.1.
* build.sh: export MAX_JOBS=1 before building to avoid OOM on the runner.
* cuda-install.sh: log the gcc, g++ and c++ versions after installing CUDA.
* pyproject.toml, requirements.txt: require torch 2.1.0 and xformers
  0.0.22.post7. Both are pinned with "==" (not ">=") so the torch used at
  build time and at install time is the version the wheel matrix in
  publish.yml compiles against.

NOTE(review): this patch was recovered from a copy whose line breaks and
indentation had been collapsed. The leading whitespace of context lines is
reconstructed and should be confirmed against the target files.

diff --git a/.github/workflows/publish.yml b/.github/workflows/publish.yml
index e4210734..aeba1ee5 100644
--- a/.github/workflows/publish.yml
+++ b/.github/workflows/publish.yml
@@ -43,14 +43,14 @@ jobs:
     name: Build Wheel
     runs-on: ${{ matrix.os }}
     needs: release
-    
+
     strategy:
       fail-fast: false
       matrix:
           os: ['ubuntu-20.04']
           python-version: ['3.8', '3.9', '3.10', '3.11']
-          pytorch-version: ['2.0.1']
-          cuda-version: ['11.8'] # Github runner can't build anything older than 11.8
+          pytorch-version: ['2.1.0']
+          cuda-version: ['12.1']
 
     steps:
       - name: Checkout
@@ -82,7 +82,7 @@ jobs:
           asset_name=${wheel_name//"linux"/"manylinux1"}
           echo "wheel_name=${wheel_name}" >> $GITHUB_ENV
           echo "asset_name=${asset_name}" >> $GITHUB_ENV
-        
+
       - name: Upload Release Asset
         uses: actions/upload-release-asset@v1
         env:
diff --git a/.github/workflows/scripts/build.sh b/.github/workflows/scripts/build.sh
index f8dead41..cf3bc118 100644
--- a/.github/workflows/scripts/build.sh
+++ b/.github/workflows/scripts/build.sh
@@ -11,5 +11,8 @@ LD_LIBRARY_PATH=${cuda_home}/lib64:$LD_LIBRARY_PATH
 $python_executable -m pip install wheel packaging
 $python_executable -m pip install -r requirements.txt
 
+# Limit the number of parallel jobs to avoid OOM
+export MAX_JOBS=1
+
 # Build
 $python_executable setup.py bdist_wheel --dist-dir=dist
diff --git a/.github/workflows/scripts/cuda-install.sh b/.github/workflows/scripts/cuda-install.sh
index 674bc8c9..312c6e82 100644
--- a/.github/workflows/scripts/cuda-install.sh
+++ b/.github/workflows/scripts/cuda-install.sh
@@ -16,3 +16,8 @@ sudo apt clean
 # Test nvcc
 PATH=/usr/local/cuda-$1/bin:${PATH}
 nvcc --version
+
+# Log gcc, g++, c++ versions
+gcc --version
+g++ --version
+c++ --version
diff --git a/pyproject.toml b/pyproject.toml
index 360e023a..27285bb6 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -3,7 +3,7 @@ requires = [
     "ninja",
     "packaging",
     "setuptools",
-    "torch == 2.0.1",
+    "torch == 2.1.0",
     "wheel",
 ]
 build-backend = "setuptools.build_meta"
diff --git a/requirements.txt b/requirements.txt
index d8597b3e..fa9eb638 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -5,9 +5,9 @@ pandas  # Required for Ray data.
 pyarrow  # Required for Ray data.
 sentencepiece  # Required for LLaMA tokenizer.
 numpy
-torch == 2.0.1
+torch == 2.1.0
 transformers >= 4.34.0  # Required for Mistral.
-xformers == 0.0.22  # Required for Mistral.
+xformers == 0.0.22.post7  # Required for CUDA 12.1.
 fastapi
 uvicorn[standard]
 pydantic == 1.10.13  # Required for OpenAI server.