|
| 1 | +name: Build Wheels (CUDA) |
| 2 | + |
| 3 | +on: workflow_dispatch |
| 4 | + |
| 5 | +permissions: |
| 6 | + contents: write |
| 7 | + |
| 8 | +jobs: |
| 9 | + define_matrix: |
| 10 | + name: Define Build Matrix |
| 11 | + runs-on: ubuntu-latest |
| 12 | + outputs: |
| 13 | + matrix: ${{ steps.set-matrix.outputs.matrix }} |
| 14 | + defaults: |
| 15 | + run: |
| 16 | + shell: pwsh |
| 17 | + |
| 18 | + steps: |
| 19 | + - name: Define Job Output |
| 20 | + id: set-matrix |
| 21 | + run: | |
| 22 | + $matrix = @{ |
| 23 | + 'os' = @('ubuntu-latest', 'windows-2019') |
| 24 | + 'pyver' = @("3.9", "3.10", "3.11", "3.12") |
| 25 | + 'cuda' = @("12.1.1", "12.2.2", "12.3.2", "12.4.1") #, "12.5.1", "12.6.1") |
| 26 | + 'releasetag' = @("basic") |
| 27 | + } |
| 28 | +
|
| 29 | + $matrixOut = ConvertTo-Json $matrix -Compress |
| 30 | + Write-Output ('matrix=' + $matrixOut) >> $env:GITHUB_OUTPUT |
| 31 | +
|
| 32 | + build_wheels: |
| 33 | + name: Build Wheel ${{ matrix.os }} ${{ matrix.pyver }} ${{ matrix.cuda }} ${{ matrix.releasetag == 'wheels' && 'AVX2' || matrix.releasetag }} |
| 34 | + needs: define_matrix |
| 35 | + runs-on: ${{ matrix.os }} |
| 36 | + strategy: |
| 37 | + matrix: ${{ fromJSON(needs.define_matrix.outputs.matrix) }} |
| 38 | + defaults: |
| 39 | + run: |
| 40 | + shell: pwsh |
| 41 | + env: |
| 42 | + CUDAVER: ${{ matrix.cuda }} |
| 43 | + AVXVER: ${{ matrix.releasetag }} |
| 44 | + |
| 45 | + steps: |
| 46 | + - name: Add MSBuild to PATH |
| 47 | + if: runner.os == 'Windows' |
| 48 | + uses: microsoft/setup-msbuild@v2 |
| 49 | + with: |
| 50 | + vs-version: '[16.11,16.12)' |
| 51 | + |
| 52 | + - uses: actions/checkout@v4 |
| 53 | + with: |
| 54 | + submodules: "recursive" |
| 55 | + |
| 56 | + - uses: actions/setup-python@v5 |
| 57 | + with: |
| 58 | + python-version: ${{ matrix.pyver }} |
| 59 | + cache: 'pip' |
| 60 | + |
| 61 | + - name: Setup Mamba |
| 62 | + uses: conda-incubator/setup-miniconda@v3.1.0 |
| 63 | + with: |
| 64 | + activate-environment: "build" |
| 65 | + python-version: ${{ matrix.pyver }} |
| 66 | + miniforge-variant: Mambaforge |
| 67 | + miniforge-version: latest |
| 68 | + use-mamba: true |
| 69 | + add-pip-as-python-dependency: true |
| 70 | + auto-activate-base: false |
| 71 | + |
| 72 | + - name: VS Integration Cache |
| 73 | + id: vs-integration-cache |
| 74 | + if: runner.os == 'Windows' |
| 75 | + uses: actions/cache@v4 |
| 76 | + with: |
| 77 | + path: ./MSBuildExtensions |
| 78 | + key: cuda-${{ matrix.cuda }}-vs-integration |
| 79 | + |
| 80 | + - name: Get Visual Studio Integration |
| 81 | + if: runner.os == 'Windows' && steps.vs-integration-cache.outputs.cache-hit != 'true' |
| 82 | + run: | |
| 83 | + if ($env:CUDAVER -eq '12.1.1') {$x = '12.1.0'} else {$x = $env:CUDAVER} |
| 84 | + $links = (Invoke-RestMethod 'https://raw.githubusercontent.com/Jimver/cuda-toolkit/master/src/links/windows-links.ts').Trim().split().where({$_ -ne ''}) |
| 85 | + for ($i=$q=0;$i -lt $links.count -and $q -lt 2;$i++) {if ($links[$i] -eq "'$x',") {$q++}} |
| 86 | + Invoke-RestMethod $links[$i].Trim("'") -OutFile 'cudainstaller.zip' |
| 87 | + & 'C:\Program Files\7-Zip\7z.exe' e cudainstaller.zip -oMSBuildExtensions -r *\MSBuildExtensions\* > $null |
| 88 | + Remove-Item 'cudainstaller.zip' |
| 89 | +
|
| 90 | + - name: Install Visual Studio Integration |
| 91 | + if: runner.os == 'Windows' |
| 92 | + run: | |
| 93 | + $y = (gi '.\MSBuildExtensions').fullname + '\*' |
| 94 | + (gi 'C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise\MSBuild\Microsoft\VC\*\BuildCustomizations').fullname.foreach({cp $y $_}) |
| 95 | + $cupath = 'CUDA_PATH_V' + $env:CUDAVER.Remove($env:CUDAVER.LastIndexOf('.')).Replace('.','_') |
| 96 | + echo "$cupath=$env:CONDA_PREFIX" >> $env:GITHUB_ENV |
| 97 | +
|
| 98 | + - name: Install Dependencies |
| 99 | + env: |
| 100 | + MAMBA_DOWNLOAD_FAILFAST: "0" |
| 101 | + MAMBA_NO_LOW_SPEED_LIMIT: "1" |
| 102 | + run: | |
| 103 | + $cudaVersion = $env:CUDAVER |
| 104 | + mamba install -y 'cuda' -c nvidia/label/cuda-$cudaVersion |
| 105 | + python -m pip install build wheel |
| 106 | +
|
| 107 | + - name: Build Wheel |
| 108 | + run: | |
| 109 | + $cudaVersion = $env:CUDAVER.Remove($env:CUDAVER.LastIndexOf('.')).Replace('.','') |
| 110 | + $env:CUDA_PATH = $env:CONDA_PREFIX |
| 111 | + $env:CUDA_HOME = $env:CONDA_PREFIX |
| 112 | + $env:CUDA_TOOLKIT_ROOT_DIR = $env:CONDA_PREFIX |
| 113 | + if ($IsLinux) { |
| 114 | + $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:LD_LIBRARY_PATH |
| 115 | + } |
| 116 | + $env:VERBOSE = '1' |
| 117 | + $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' |
| 118 | + $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" |
| 119 | + # if ($env:AVXVER -eq 'AVX') { |
| 120 | + $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off' |
| 121 | + # } |
| 122 | + # if ($env:AVXVER -eq 'AVX512') { |
| 123 | + # $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX512=on' |
| 124 | + # } |
| 125 | + # if ($env:AVXVER -eq 'basic') { |
| 126 | + # $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX=off -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off' |
| 127 | + # } |
| 128 | + python -m build --wheel |
| 129 | + # write the build tag to the output |
| 130 | + Write-Output "CUDA_VERSION=$cudaVersion" >> $env:GITHUB_ENV |
| 131 | +
|
| 132 | + - uses: softprops/action-gh-release@v2 |
| 133 | + with: |
| 134 | + files: dist/* |
| 135 | + # Set tag_name to <tag>-cu<cuda_version> |
| 136 | + tag_name: ${{ github.ref_name }}-cu${{ env.CUDA_VERSION }} |
| 137 | + env: |
| 138 | + GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} |
0 commit comments