diff --git a/.github/workflows/release.yaml b/.github/workflows/release.yaml
index 6c66138ca333..00e27c271695 100644
--- a/.github/workflows/release.yaml
+++ b/.github/workflows/release.yaml
@@ -20,6 +20,10 @@ jobs:
             defines: '-DLLAMA_AVX2=OFF'
           - build: 'avx512'
             defines: '-DLLAMA_AVX512=ON'
+          - build: 'cuda12'
+            defines: ''
+          # - build: 'cuda11'
+          #   defines: ''
     runs-on: ubuntu-latest
     steps:
       - name: Clone
@@ -33,7 +37,14 @@ jobs:
         run: |
           sudo apt-get update
           sudo apt-get install build-essential ffmpeg
-
+      - name: Install CUDA Dependencies
+        if: ${{ matrix.build == 'cuda12' || matrix.build == 'cuda11' }}
+        run: |
+          # Package operations need sudo here, as in the other install steps of this job.
+          curl -O https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/x86_64/cuda-keyring_1.1-1_all.deb
+          sudo dpkg -i cuda-keyring_1.1-1_all.deb
+          sudo apt-get update
+          sudo apt-get install -y cuda-nvcc-12-3 libcublas-dev-12-3
       - name: Cache grpc
         id: cache-grpc
         uses: actions/cache@v3
@@ -50,14 +61,21 @@ jobs:
       - name: Install gRPC
         run: |
           cd grpc && cd cmake/build && sudo make -j12 install
-
       - name: Build
         id: build
         env:
           CMAKE_ARGS: "${{ matrix.defines }}"
           BUILD_ID: "${{ matrix.build }}"
         run: |
-          STATIC=true make dist
+          # CUDA variants build with BUILD_TYPE=cublas and the CUDA toolkit's bin
+          # directory on PATH; every other variant is built with STATIC=true.
+          if [ "${{ matrix.build }}" == "cuda12" ] || [ "${{ matrix.build }}" == "cuda11" ]; then
+            export BUILD_TYPE=cublas
+            export PATH=/usr/local/cuda/bin:$PATH
+            BUILD_GRPC_FOR_BACKEND_LLAMA=ON make dist
+          else
+            STATIC=true make dist
+          fi
       - uses: actions/upload-artifact@v3
         with:
           name: ${{ matrix.build }}