From e64ccdabd136057aae00f3d838834789e390107f Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 31 Aug 2025 14:26:16 +0700 Subject: [PATCH 001/221] Create manual_wheel_cuda.yml --- .github/workflows/manual_wheel_cuda.yml | 136 ++++++++++++++++++++++++ 1 file changed, 136 insertions(+) create mode 100644 .github/workflows/manual_wheel_cuda.yml diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml new file mode 100644 index 0000000000..0870bcf10e --- /dev/null +++ b/.github/workflows/manual_wheel_cuda.yml @@ -0,0 +1,136 @@ +name: Build Wheels (CUDA) + +on: workflow_dispatch + +permissions: + contents: write + +jobs: + define_matrix: + name: Define Build Matrix + runs-on: ubuntu-22.04 + outputs: + matrix: ${{ steps.set-matrix.outputs.matrix }} + defaults: + run: + shell: pwsh + + steps: + - name: Define Job Output + id: set-matrix + run: | + $matrix = @{ + 'os' = @('ubuntu-22.04') #, 'windows-2022') + 'pyver' = @("3.9", "3.10", "3.11", "3.12") + 'cuda' = @("12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.1", "12.8.0", "12.9.2") + 'releasetag' = @("basic") + } + + $matrixOut = ConvertTo-Json $matrix -Compress + Write-Output ('matrix=' + $matrixOut) >> $env:GITHUB_OUTPUT + + build_wheels: + name: Build Wheel ${{ matrix.os }} ${{ matrix.pyver }} ${{ matrix.cuda }} ${{ matrix.releasetag == 'wheels' && 'AVX2' || matrix.releasetag }} + needs: define_matrix + runs-on: ${{ matrix.os }} + strategy: + matrix: ${{ fromJSON(needs.define_matrix.outputs.matrix) }} + defaults: + run: + shell: pwsh + env: + CUDAVER: ${{ matrix.cuda }} + AVXVER: ${{ matrix.releasetag }} + + steps: + - name: Add MSBuild to PATH + if: runner.os == 'Windows' + uses: microsoft/setup-msbuild@v2 + with: + vs-version: '[16.11,16.12)' + + - uses: actions/checkout@v4 + with: + submodules: "recursive" + + - uses: actions/setup-python@v5 + with: + python-version: ${{ matrix.pyver }} + cache: 'pip' + + - name: Setup Mamba + uses: conda-incubator/setup-miniconda@v3.1.0 + with: + activate-environment: "llamacpp" + python-version: ${{ matrix.pyver }} + miniforge-version: latest + add-pip-as-python-dependency: true + auto-activate-base: false + + - name: VS Integration Cache + id: vs-integration-cache + if: runner.os == 'Windows' + uses: actions/cache@v4 + with: + path: ./MSBuildExtensions + key: cuda-${{ matrix.cuda }}-vs-integration + + - name: Get Visual Studio Integration + if: runner.os == 'Windows' && steps.vs-integration-cache.outputs.cache-hit != 'true' + run: | + if ($env:CUDAVER -eq '12.1.1') {$x = '12.1.0'} else {$x = $env:CUDAVER} + $links = (Invoke-RestMethod 'https://raw.githubusercontent.com/Jimver/cuda-toolkit/master/src/links/windows-links.ts').Trim().split().where({$_ -ne ''}) + for ($i=$q=0;$i -lt $links.count -and $q -lt 2;$i++) {if ($links[$i] -eq "'$x',") {$q++}} + Invoke-RestMethod $links[$i].Trim("'") -OutFile 'cudainstaller.zip' + & 'C:\Program Files\7-Zip\7z.exe' e cudainstaller.zip -oMSBuildExtensions -r *\MSBuildExtensions\* > $null + Remove-Item 'cudainstaller.zip' + + - name: Install Visual Studio Integration + if: runner.os == 'Windows' + run: | + $y = (gi '.\MSBuildExtensions').fullname + '\*' + (gi 'C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise\MSBuild\Microsoft\VC\*\BuildCustomizations').fullname.foreach({cp $y $_}) + $cupath = 'CUDA_PATH_V' + $env:CUDAVER.Remove($env:CUDAVER.LastIndexOf('.')).Replace('.','_') + echo "$cupath=$env:CONDA_PREFIX" >> $env:GITHUB_ENV + + - name: Install Dependencies + env: + MAMBA_DOWNLOAD_FAILFAST: "0" + MAMBA_NO_LOW_SPEED_LIMIT: "1" + run: | + $cudaVersion = $env:CUDAVER + mamba install -y 'cuda' -c nvidia/label/cuda-$cudaVersion + python -m pip install build wheel + + - name: Build Wheel + run: | + $cudaVersion = $env:CUDAVER.Remove($env:CUDAVER.LastIndexOf('.')).Replace('.','') + $env:CUDA_PATH = $env:CONDA_PREFIX + $env:CUDA_HOME = $env:CONDA_PREFIX + $env:CUDA_TOOLKIT_ROOT_DIR = $env:CONDA_PREFIX + if ($IsLinux) { + $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:LD_LIBRARY_PATH + } + $env:VERBOSE = '1' + $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' + $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" + # if ($env:AVXVER -eq 'AVX') { + $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off' + # } + # if ($env:AVXVER -eq 'AVX512') { + # $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX512=on' + # } + # if ($env:AVXVER -eq 'basic') { + # $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX=off -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off' + # } + python -m build --wheel + # write the build tag to the output + Write-Output "CUDA_VERSION=$cudaVersion" >> $env:GITHUB_ENV + + - uses: softprops/action-gh-release@v2 + with: + files: dist/* + # Set tag_name to -cu + tag_name: ${{ github.ref_name }}-cu${{ env.CUDA_VERSION }} + env: + GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} From cb2687265e5fd335bf9b8890c19a34d995f41861 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 31 Aug 2025 14:52:10 +0700 Subject: [PATCH 002/221] Try with ubuntu-latest --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 0870bcf10e..1553c71a33 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -8,7 +8,7 @@ permissions: jobs: define_matrix: name: Define Build Matrix - runs-on: ubuntu-22.04 + runs-on: ubuntu-latest outputs: matrix: ${{ steps.set-matrix.outputs.matrix }} defaults: From 6320995a8b3bc74f96e6ae094109bef325b1b8f5 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 31 Aug 2025 19:26:16 +0700 Subject: [PATCH 003/221] Removing old python and cuda --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 1553c71a33..883f04ff9f 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -21,8 +21,8 @@ jobs: run: | $matrix = @{ 'os' = @('ubuntu-22.04') #, 'windows-2022') - 'pyver' = @("3.9", "3.10", "3.11", "3.12") - 'cuda' = @("12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.1", "12.8.0", "12.9.2") + 'pyver' = @("3.10", "3.11", "3.12") #"3.9", + 'cuda' = @("12.4.1", "12.5.1", "12.6.1", "12.8.0", "12.9.2") #"12.1.1", "12.2.2", "12.3.2", 'releasetag' = @("basic") } From 8cbb8b432c3ad07334d184009fd3b3e1094aaba6 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 1 Sep 2025 12:36:35 +0700 Subject: [PATCH 004/221] Try with only cuda 12.9 pytorch 3.12 --- .github/workflows/manual_wheel_cuda.yml | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 883f04ff9f..dffaf0b8fc 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -21,8 +21,8 @@ jobs: run: | $matrix = @{ 'os' = @('ubuntu-22.04') #, 'windows-2022') - 'pyver' = @("3.10", "3.11", "3.12") #"3.9", - 'cuda' = @("12.4.1", "12.5.1", "12.6.1", "12.8.0", "12.9.2") #"12.1.1", "12.2.2", "12.3.2", + 'pyver' = @("3.12") #"3.9", "3.10", "3.11", + 'cuda' = @("12.9.2") #"12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.1", "12.8.0", 'releasetag' = @("basic") } @@ -111,6 +111,7 @@ jobs: if ($IsLinux) { $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:LD_LIBRARY_PATH } + $env:MAX_JOBS = '4' $env:VERBOSE = '1' $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" From f2d886b1a4df3ac1199c3cef52454b407de3e623 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 1 Sep 2025 12:53:39 +0700 Subject: [PATCH 005/221] limit to 4 jobs at a time --- .github/workflows/manual_wheel_cuda.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index dffaf0b8fc..d0d85eea7c 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -111,8 +111,9 @@ jobs: if ($IsLinux) { $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:LD_LIBRARY_PATH } - $env:MAX_JOBS = '4' $env:VERBOSE = '1' + $env:MAX_JOBS=4 + $env:CMAKE_BUILD_PARALLEL_LEVEL=4 $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" # if ($env:AVXVER -eq 'AVX') { From 99126d99164cc9af99203c904b25a50383477845 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 1 Sep 2025 17:27:31 +0700 Subject: [PATCH 006/221] Try with 2 cuda and 2 pytorch version --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index d0d85eea7c..c97e91ff2a 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -21,8 +21,8 @@ jobs: run: | $matrix = @{ 'os' = @('ubuntu-22.04') #, 'windows-2022') - 'pyver' = @("3.12") #"3.9", "3.10", "3.11", - 'cuda' = @("12.9.2") #"12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.1", "12.8.0", + 'pyver' = @("3.11", "3.12") #"3.9", "3.10", "3.11", + 'cuda' = @("12.8.1", "12.9.2") #"12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.1", "12.8.0", 'releasetag' = @("basic") } From a8ea4731d2c53f08c8009c4b2977857c878ade41 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 2 Sep 2025 02:20:19 +0700 Subject: [PATCH 007/221] Try with python 3.10 and cuda 12.6.3 too --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index c97e91ff2a..502ce52e92 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -21,8 +21,8 @@ jobs: run: | $matrix = @{ 'os' = @('ubuntu-22.04') #, 'windows-2022') - 'pyver' = @("3.11", "3.12") #"3.9", "3.10", "3.11", - 'cuda' = @("12.8.1", "12.9.2") #"12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.1", "12.8.0", + 'pyver' = @("3.10", "3.11", "3.12") #"3.9", "3.10", "3.11", + 'cuda' = @("12.6.3", "12.8.1", "12.9.2") #"12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", 'releasetag' = @("basic") } From b4ed25cc5254e83a2028d7423b4ab95cf9e915cb Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 2 Sep 2025 12:55:59 +0700 Subject: [PATCH 008/221] Try with more python and cuda versions --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 502ce52e92..f65fdb40df 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -21,8 +21,8 @@ jobs: run: | $matrix = @{ 'os' = @('ubuntu-22.04') #, 'windows-2022') - 'pyver' = @("3.10", "3.11", "3.12") #"3.9", "3.10", "3.11", - 'cuda' = @("12.6.3", "12.8.1", "12.9.2") #"12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", + 'pyver' = @("3.9", "3.10", "3.11", "3.12") #"3.9", "3.10", "3.11", + 'cuda' = @("12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2") #"12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", 'releasetag' = @("basic") } From d729f9a2008c07c53dac3c1cd16171050dfd124f Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 2 Sep 2025 17:40:32 +0700 Subject: [PATCH 009/221] Enable for CUDA 12.5 to 12.9 too --- .github/workflows/generate-index-from-release.yaml | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/.github/workflows/generate-index-from-release.yaml b/.github/workflows/generate-index-from-release.yaml index 255ee67d6f..296b317a4a 100644 --- a/.github/workflows/generate-index-from-release.yaml +++ b/.github/workflows/generate-index-from-release.yaml @@ -44,8 +44,10 @@ jobs: ./scripts/releases-to-pep-503.sh index/whl/cu122 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu122$' ./scripts/releases-to-pep-503.sh index/whl/cu123 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu123$' ./scripts/releases-to-pep-503.sh index/whl/cu124 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu124$' - # ./scripts/releases-to-pep-503.sh index/whl/cu125 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu124$' - # ./scripts/releases-to-pep-503.sh index/whl/cu126 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu124$' + ./scripts/releases-to-pep-503.sh index/whl/cu125 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu125$' + ./scripts/releases-to-pep-503.sh index/whl/cu126 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu126$' + ./scripts/releases-to-pep-503.sh index/whl/cu128 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu128$' + ./scripts/releases-to-pep-503.sh index/whl/cu129 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu129$' ./scripts/releases-to-pep-503.sh index/whl/metal '^[v]?[0-9]+\.[0-9]+\.[0-9]+-metal$' - name: Upload artifact uses: actions/upload-pages-artifact@v3 From b8faf74096506cb0e6a6123886739b1e443fe9ea Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 2 Sep 2025 17:51:09 +0700 Subject: [PATCH 010/221] Try with Windows and more CUDA version --- .github/workflows/manual_wheel_cuda.yml | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index f65fdb40df..2b41007f5c 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -8,7 +8,7 @@ permissions: jobs: define_matrix: name: Define Build Matrix - runs-on: ubuntu-latest + runs-on: 'ubuntu-22.04' outputs: matrix: ${{ steps.set-matrix.outputs.matrix }} defaults: @@ -20,9 +20,9 @@ jobs: id: set-matrix run: | $matrix = @{ - 'os' = @('ubuntu-22.04') #, 'windows-2022') - 'pyver' = @("3.9", "3.10", "3.11", "3.12") #"3.9", "3.10", "3.11", - 'cuda' = @("12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2") #"12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", + 'os' = @('ubuntu-22.04', 'windows-2022') + 'pyver' = @("3.9", "3.10", "3.11", "3.12") + 'cuda' = @("12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2") #"12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", 'releasetag' = @("basic") } From f888093098ef9321b9205bbda0534f38ab3dfd19 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 2 Sep 2025 17:57:04 +0700 Subject: [PATCH 011/221] Try Disable for Windows --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 2b41007f5c..2603fb41f7 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -8,7 +8,7 @@ permissions: jobs: define_matrix: name: Define Build Matrix - runs-on: 'ubuntu-22.04' + runs-on: ubuntu-22.04 outputs: matrix: ${{ steps.set-matrix.outputs.matrix }} defaults: @@ -20,7 +20,7 @@ jobs: id: set-matrix run: | $matrix = @{ - 'os' = @('ubuntu-22.04', 'windows-2022') + 'os' = @('ubuntu-22.04') #, 'windows-2022') 'pyver' = @("3.9", "3.10", "3.11", "3.12") 'cuda' = @("12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2") #"12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", 'releasetag' = @("basic") From 7e12829a357b30515d967bc918d882263e486e74 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 00:59:10 +0700 Subject: [PATCH 012/221] use max-parallel = 4 --- .github/workflows/manual_wheel_cuda.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 2603fb41f7..214f00b658 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -24,6 +24,7 @@ jobs: 'pyver' = @("3.9", "3.10", "3.11", "3.12") 'cuda' = @("12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2") #"12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", 'releasetag' = @("basic") + 'max-parallel' = @(4) } $matrixOut = ConvertTo-Json $matrix -Compress From bb127ab85e59b7f574f7508caf0719a68b17da0a Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 01:05:36 +0700 Subject: [PATCH 013/221] oops --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 214f00b658..288e436a3f 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -24,7 +24,6 @@ jobs: 'pyver' = @("3.9", "3.10", "3.11", "3.12") 'cuda' = @("12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2") #"12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", 'releasetag' = @("basic") - 'max-parallel' = @(4) } $matrixOut = ConvertTo-Json $matrix -Compress @@ -35,6 +34,7 @@ jobs: needs: define_matrix runs-on: ${{ matrix.os }} strategy: + max-parallel: 5 matrix: ${{ fromJSON(needs.define_matrix.outputs.matrix) }} defaults: run: From 7e1cd86cd95940c9205b0ee572ea06b2d3997405 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 04:48:11 +0700 Subject: [PATCH 014/221] use max-parallel 13 --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 288e436a3f..6e4dd93ae0 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -34,7 +34,7 @@ jobs: needs: define_matrix runs-on: ${{ matrix.os }} strategy: - max-parallel: 5 + max-parallel: 13 matrix: ${{ fromJSON(needs.define_matrix.outputs.matrix) }} defaults: run: From 35a7359cac70a192c6162cb8138f79bdf73f75e0 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 09:30:56 +0700 Subject: [PATCH 015/221] Update URL on get-releases.sh --- scripts/get-releases.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/scripts/get-releases.sh b/scripts/get-releases.sh index 4c904da78c..9a2fe11458 100755 --- a/scripts/get-releases.sh +++ b/scripts/get-releases.sh @@ -15,7 +15,7 @@ get_all_releases() { while true; do response=$(curl -s "${headers[@]}" \ - "https://api.github.com/repos/abetlen/llama-cpp-python/releases?page=$page&per_page=$per_page") + "https://api.github.com/repos/anr2me/llama-cpp-python/releases?page=$page&per_page=$per_page") # Check if the response is valid JSON if ! echo "$response" | jq empty > /dev/null 2>&1; then From 10911bef2ac770c9f74da3a3e09b29fcacea5fc7 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 09:32:14 +0700 Subject: [PATCH 016/221] Update URL on releases-to-pep-503.sh --- scripts/releases-to-pep-503.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/scripts/releases-to-pep-503.sh b/scripts/releases-to-pep-503.sh index 71910efcbf..fbabc19746 100755 --- a/scripts/releases-to-pep-503.sh +++ b/scripts/releases-to-pep-503.sh @@ -68,7 +68,7 @@ headers+=('--header' 'content-type: application/json') for release in $releases; do log_info "Processing release: $release" response=$(curl -s "${headers[@]}" \ - "https://api.github.com/repos/abetlen/llama-cpp-python/releases/tags/$release") + "https://api.github.com/repos/anr2me/llama-cpp-python/releases/tags/$release") if [ -z "$response" ]; then log_error "Empty response from GitHub API for release $release" From b841b9e20fe424f8fae86da70e6a53bd29b41525 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 09:35:20 +0700 Subject: [PATCH 017/221] Try with Windows again --- .github/workflows/manual_wheel_cuda.yml | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 6e4dd93ae0..4dcec1a976 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -20,9 +20,9 @@ jobs: id: set-matrix run: | $matrix = @{ - 'os' = @('ubuntu-22.04') #, 'windows-2022') + 'os' = @('ubuntu-22.04', 'windows-2022') 'pyver' = @("3.9", "3.10", "3.11", "3.12") - 'cuda' = @("12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2") #"12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", + 'cuda' = @("12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2") 'releasetag' = @("basic") } @@ -113,8 +113,8 @@ jobs: $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:LD_LIBRARY_PATH } $env:VERBOSE = '1' - $env:MAX_JOBS=4 - $env:CMAKE_BUILD_PARALLEL_LEVEL=4 + #$env:MAX_JOBS=4 + #$env:CMAKE_BUILD_PARALLEL_LEVEL=4 $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" # if ($env:AVXVER -eq 'AVX') { From 2b5676e5134bc2eacffb9a7373618d5bd06b5456 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 12:57:16 +0700 Subject: [PATCH 018/221] Try with Windows only --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 4dcec1a976..63609f7ed5 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -20,7 +20,7 @@ jobs: id: set-matrix run: | $matrix = @{ - 'os' = @('ubuntu-22.04', 'windows-2022') + 'os' = @('windows-2022') #'ubuntu-22.04', 'pyver' = @("3.9", "3.10", "3.11", "3.12") 'cuda' = @("12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2") 'releasetag' = @("basic") @@ -48,7 +48,7 @@ jobs: if: runner.os == 'Windows' uses: microsoft/setup-msbuild@v2 with: - vs-version: '[16.11,16.12)' + vs-version: '[16.11,16.12,17.14)' - uses: actions/checkout@v4 with: From d8db35ed33767a676d6e5f850f5fce1437878d8c Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 12:59:05 +0700 Subject: [PATCH 019/221] oops --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 63609f7ed5..ad1a746278 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -48,7 +48,7 @@ jobs: if: runner.os == 'Windows' uses: microsoft/setup-msbuild@v2 with: - vs-version: '[16.11,16.12,17.14)' + vs-version: '[16.11,17.14)' - uses: actions/checkout@v4 with: From e367f09fc7f609398dee8f9b2b53d6ebe8f8ce2c Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 13:13:51 +0700 Subject: [PATCH 020/221] Shouldn't set the vs-version as adviced in msbuild-setup action. --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index ad1a746278..612cf46ce5 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -47,8 +47,8 @@ jobs: - name: Add MSBuild to PATH if: runner.os == 'Windows' uses: microsoft/setup-msbuild@v2 - with: - vs-version: '[16.11,17.14)' + #with: + # vs-version: '[16.11,17.14)' - uses: actions/checkout@v4 with: From f4e2ea2dcee8536e38eb3e7959b90c4389684965 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 13:46:29 +0700 Subject: [PATCH 021/221] Use asterisks instead of specific string --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 612cf46ce5..fc63e316dc 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -90,7 +90,7 @@ jobs: if: runner.os == 'Windows' run: | $y = (gi '.\MSBuildExtensions').fullname + '\*' - (gi 'C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise\MSBuild\Microsoft\VC\*\BuildCustomizations').fullname.foreach({cp $y $_}) + (gi 'C:\Program Files*\Microsoft Visual Studio\20*\Enterprise\MSBuild\Microsoft\VC\*\BuildCustomizations').fullname.foreach({cp $y $_}) $cupath = 'CUDA_PATH_V' + $env:CUDAVER.Remove($env:CUDAVER.LastIndexOf('.')).Replace('.','_') echo "$cupath=$env:CONDA_PREFIX" >> $env:GITHUB_ENV From 35998cf3f5b4adc31038fe7b153edef1af65a728 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 14:24:25 +0700 Subject: [PATCH 022/221] set CUDAToolkit_ROOT env var --- .github/workflows/manual_wheel_cuda.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index fc63e316dc..c4975fb788 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -109,6 +109,7 @@ jobs: $env:CUDA_PATH = $env:CONDA_PREFIX $env:CUDA_HOME = $env:CONDA_PREFIX $env:CUDA_TOOLKIT_ROOT_DIR = $env:CONDA_PREFIX + $env:CUDAToolkit_ROOT = $env:CONDA_PREFIX if ($IsLinux) { $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:LD_LIBRARY_PATH } From 404131d1d9c7a2cc93150dab9456c5a2eae1a7df Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 14:42:10 +0700 Subject: [PATCH 023/221] Replace cuda 12.9.2 with 12.9.1 on Windows --- .github/workflows/manual_wheel_cuda.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index c4975fb788..261277f103 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -80,6 +80,7 @@ jobs: if: runner.os == 'Windows' && steps.vs-integration-cache.outputs.cache-hit != 'true' run: | if ($env:CUDAVER -eq '12.1.1') {$x = '12.1.0'} else {$x = $env:CUDAVER} + if ($env:CUDAVER -eq '12.9.2') {$x = '12.9.1'} else {$x = $env:CUDAVER} $links = (Invoke-RestMethod 'https://raw.githubusercontent.com/Jimver/cuda-toolkit/master/src/links/windows-links.ts').Trim().split().where({$_ -ne ''}) for ($i=$q=0;$i -lt $links.count -and $q -lt 2;$i++) {if ($links[$i] -eq "'$x',") {$q++}} Invoke-RestMethod $links[$i].Trim("'") -OutFile 'cudainstaller.zip' From c5a465be910578b076e0a8535d5815bd9f9ffe73 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 18:18:58 +0700 Subject: [PATCH 024/221] Try with Windows 2019, since 2022 need cuda 12.4+ --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 261277f103..59168b8649 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -20,7 +20,7 @@ jobs: id: set-matrix run: | $matrix = @{ - 'os' = @('windows-2022') #'ubuntu-22.04', + 'os' = @('windows-2019') #'ubuntu-22.04', 'pyver' = @("3.9", "3.10", "3.11", "3.12") 'cuda' = @("12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2") 'releasetag' = @("basic") From 113ef6c6becc1c7b7cac8b2295fdc0b8da2a7d4b Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 18:31:37 +0700 Subject: [PATCH 025/221] oops windows 2019 have been removed, so we use cuda 12.4+ --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 59168b8649..7a89daa71e 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -20,9 +20,9 @@ jobs: id: set-matrix run: | $matrix = @{ - 'os' = @('windows-2019') #'ubuntu-22.04', + 'os' = @('windows-2022') #'ubuntu-22.04', 'pyver' = @("3.9", "3.10", "3.11", "3.12") - 'cuda' = @("12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2") + 'cuda' = @("12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2") # "12.1.1", "12.2.2", "12.3.2", 'releasetag' = @("basic") } From 1467609371454667051210571b017321cad69dc5 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 19:36:11 +0700 Subject: [PATCH 026/221] Disabling windows again, not sure what was the "AlwaysCreate" issue was. --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 7a89daa71e..77192e6e31 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -20,7 +20,7 @@ jobs: id: set-matrix run: | $matrix = @{ - 'os' = @('windows-2022') #'ubuntu-22.04', + 'os' = @('ubuntu-22.04') #,'windows-2022') 'pyver' = @("3.9", "3.10", "3.11", "3.12") 'cuda' = @("12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2") # "12.1.1", "12.2.2", "12.3.2", 'releasetag' = @("basic") From bee01ad84d6c8df70cacc032d45481a8cba4cc15 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 23:14:56 +0700 Subject: [PATCH 027/221] continue-on-error --- .github/workflows/generate-index-from-release.yaml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/generate-index-from-release.yaml b/.github/workflows/generate-index-from-release.yaml index 296b317a4a..907122aab6 100644 --- a/.github/workflows/generate-index-from-release.yaml +++ b/.github/workflows/generate-index-from-release.yaml @@ -35,6 +35,7 @@ jobs: - name: Setup Pages uses: actions/configure-pages@v5 - name: Build + continue-on-error: true env: GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} run: | From 11011e49efa6d62183765c79db5f9a89613aa3e5 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 23:25:04 +0700 Subject: [PATCH 028/221] testing --- scripts/releases-to-pep-503.sh | 1 + 1 file changed, 1 insertion(+) diff --git a/scripts/releases-to-pep-503.sh b/scripts/releases-to-pep-503.sh index fbabc19746..a802d514c4 100755 --- a/scripts/releases-to-pep-503.sh +++ b/scripts/releases-to-pep-503.sh @@ -12,6 +12,7 @@ log_info() { echo "INFO: $1" } +log_info($1) # Get output directory or default to index/whl/cpu output_dir=${1:-"index/whl/cpu"} From 2a90d04f573d1aff4198a199cdfbb23933cada93 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 23:27:41 +0700 Subject: [PATCH 029/221] oops --- scripts/releases-to-pep-503.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/scripts/releases-to-pep-503.sh b/scripts/releases-to-pep-503.sh index a802d514c4..8d1e9cdc4d 100755 --- a/scripts/releases-to-pep-503.sh +++ b/scripts/releases-to-pep-503.sh @@ -12,7 +12,7 @@ log_info() { echo "INFO: $1" } -log_info($1) +log_info "$1" # Get output directory or default to index/whl/cpu output_dir=${1:-"index/whl/cpu"} From 26a1207e2d8c0e1d182c4fde797d070db6ce1fb6 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 23:30:32 +0700 Subject: [PATCH 030/221] disable exit on error --- scripts/releases-to-pep-503.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/scripts/releases-to-pep-503.sh b/scripts/releases-to-pep-503.sh index 8d1e9cdc4d..cc2ef96555 100755 --- a/scripts/releases-to-pep-503.sh +++ b/scripts/releases-to-pep-503.sh @@ -1,7 +1,7 @@ #!/bin/bash # Enable exit on error -set -e +#set -e # Function for logging log_error() { From a8166aa71ce4f25a5e48904455d13574e4ed9f27 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 23:37:11 +0700 Subject: [PATCH 031/221] oops bad idea --- scripts/releases-to-pep-503.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/scripts/releases-to-pep-503.sh b/scripts/releases-to-pep-503.sh index cc2ef96555..8d1e9cdc4d 100755 --- a/scripts/releases-to-pep-503.sh +++ b/scripts/releases-to-pep-503.sh @@ -1,7 +1,7 @@ #!/bin/bash # Enable exit on error -#set -e +set -e # Function for logging log_error() { From 65d014997f9e32a31c0264b092ef2646e1f63b19 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 3 Sep 2025 23:39:04 +0700 Subject: [PATCH 032/221] disable cu121-123 --- .github/workflows/generate-index-from-release.yaml | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/.github/workflows/generate-index-from-release.yaml b/.github/workflows/generate-index-from-release.yaml index 907122aab6..a2c17c1444 100644 --- a/.github/workflows/generate-index-from-release.yaml +++ b/.github/workflows/generate-index-from-release.yaml @@ -35,15 +35,15 @@ jobs: - name: Setup Pages uses: actions/configure-pages@v5 - name: Build - continue-on-error: true + #continue-on-error: true env: GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} run: | ./scripts/get-releases.sh - ./scripts/releases-to-pep-503.sh index/whl/cpu '^[v]?[0-9]+\.[0-9]+\.[0-9]+$' - ./scripts/releases-to-pep-503.sh index/whl/cu121 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu121$' - ./scripts/releases-to-pep-503.sh index/whl/cu122 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu122$' - ./scripts/releases-to-pep-503.sh index/whl/cu123 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu123$' + #./scripts/releases-to-pep-503.sh index/whl/cpu '^[v]?[0-9]+\.[0-9]+\.[0-9]+$' + #./scripts/releases-to-pep-503.sh index/whl/cu121 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu121$' + #./scripts/releases-to-pep-503.sh index/whl/cu122 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu122$' + #./scripts/releases-to-pep-503.sh index/whl/cu123 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu123$' ./scripts/releases-to-pep-503.sh index/whl/cu124 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu124$' ./scripts/releases-to-pep-503.sh index/whl/cu125 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu125$' ./scripts/releases-to-pep-503.sh index/whl/cu126 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu126$' From 0a50b3531baa3b47abb889be894782385b635991 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sat, 10 Jan 2026 20:45:52 +0700 Subject: [PATCH 033/221] try with cuda 13.1 --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 77192e6e31..b7a412af3a 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -21,8 +21,8 @@ jobs: run: | $matrix = @{ 'os' = @('ubuntu-22.04') #,'windows-2022') - 'pyver' = @("3.9", "3.10", "3.11", "3.12") - 'cuda' = @("12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2") # "12.1.1", "12.2.2", "12.3.2", + 'pyver' = @("3.9", "3.10", "3.11", "3.12") # ,"3.13", "3.14" + 'cuda' = @("12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2", "13.1.0") # "12.1.1", "12.2.2", "12.3.2", 'releasetag' = @("basic") } From d1dccc1340963bad19e8cbff88159e8af015e5fe Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 11 Jan 2026 02:36:22 +0700 Subject: [PATCH 034/221] this too --- .github/workflows/generate-index-from-release.yaml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/generate-index-from-release.yaml b/.github/workflows/generate-index-from-release.yaml index a2c17c1444..7edf663020 100644 --- a/.github/workflows/generate-index-from-release.yaml +++ b/.github/workflows/generate-index-from-release.yaml @@ -49,6 +49,7 @@ jobs: ./scripts/releases-to-pep-503.sh index/whl/cu126 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu126$' ./scripts/releases-to-pep-503.sh index/whl/cu128 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu128$' ./scripts/releases-to-pep-503.sh index/whl/cu129 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu129$' + ./scripts/releases-to-pep-503.sh index/whl/cu130 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu130$' ./scripts/releases-to-pep-503.sh index/whl/metal '^[v]?[0-9]+\.[0-9]+\.[0-9]+-metal$' - name: Upload artifact uses: actions/upload-pages-artifact@v3 From 3a55a5fc00c2141602c7b91e7717c8e27267b5e4 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 11 Jan 2026 02:39:48 +0700 Subject: [PATCH 035/221] oops --- .github/workflows/generate-index-from-release.yaml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/generate-index-from-release.yaml b/.github/workflows/generate-index-from-release.yaml index 7edf663020..eb6842c4a9 100644 --- a/.github/workflows/generate-index-from-release.yaml +++ b/.github/workflows/generate-index-from-release.yaml @@ -50,6 +50,7 @@ jobs: ./scripts/releases-to-pep-503.sh index/whl/cu128 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu128$' ./scripts/releases-to-pep-503.sh index/whl/cu129 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu129$' ./scripts/releases-to-pep-503.sh index/whl/cu130 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu130$' + ./scripts/releases-to-pep-503.sh index/whl/cu131 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu131$' ./scripts/releases-to-pep-503.sh index/whl/metal '^[v]?[0-9]+\.[0-9]+\.[0-9]+-metal$' - name: Upload artifact uses: actions/upload-pages-artifact@v3 From 346ad7fdf28529aa617e523bd293a4c759faa6d0 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 11 Jan 2026 02:43:34 +0700 Subject: [PATCH 036/221] oops 2 --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index b7a412af3a..ccc4e2c8df 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -22,7 +22,7 @@ jobs: $matrix = @{ 'os' = @('ubuntu-22.04') #,'windows-2022') 'pyver' = @("3.9", "3.10", "3.11", "3.12") # ,"3.13", "3.14" - 'cuda' = @("12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2", "13.1.0") # "12.1.1", "12.2.2", "12.3.2", + 'cuda' = @("12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2", "13.0.2", "13.1.0") # "12.1.1", "12.2.2", "12.3.2", 'releasetag' = @("basic") } From 36e0dca8cb1de00bd5b474c84e814c29bf128b13 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 18 Jan 2026 06:25:26 +0700 Subject: [PATCH 037/221] install cuda-toolkit instead of cuda to avoid building wheel using the latest cuda compiler --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index ccc4e2c8df..6782dfce74 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -101,7 +101,7 @@ jobs: MAMBA_NO_LOW_SPEED_LIMIT: "1" run: | $cudaVersion = $env:CUDAVER - mamba install -y 'cuda' -c nvidia/label/cuda-$cudaVersion + mamba install -y 'cuda-toolkit' -c "nvidia/label/cuda-$cudaVersion" python -m pip install build wheel - name: Build Wheel From 3d35a645a0d879579dace14198a32baa5eee58c4 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 18 Jan 2026 06:46:04 +0700 Subject: [PATCH 038/221] lets use the exact version too --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 6782dfce74..875262cab6 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -101,7 +101,7 @@ jobs: MAMBA_NO_LOW_SPEED_LIMIT: "1" run: | $cudaVersion = $env:CUDAVER - mamba install -y 'cuda-toolkit' -c "nvidia/label/cuda-$cudaVersion" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" python -m pip install build wheel - name: Build Wheel From e48e990dcd52af230b9f2bbe1981928c208cd433 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 18 Jan 2026 08:17:00 +0700 Subject: [PATCH 039/221] anaconda doesn't have cuda 12.9.2 --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 875262cab6..61240c1569 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -22,7 +22,7 @@ jobs: $matrix = @{ 'os' = @('ubuntu-22.04') #,'windows-2022') 'pyver' = @("3.9", "3.10", "3.11", "3.12") # ,"3.13", "3.14" - 'cuda' = @("12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.2", "13.0.2", "13.1.0") # "12.1.1", "12.2.2", "12.3.2", + 'cuda' = @("12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.1", "13.0.2", "13.1.0") # "12.1.1", "12.2.2", "12.3.2", 'releasetag' = @("basic") } From ffc54bb5d1da7df6399909c46c8115da724f39aa Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 18 Jan 2026 08:58:20 +0700 Subject: [PATCH 040/221] can't build wheel for cuda 12.9 (different number of arguments) --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 61240c1569..898a8d51fb 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -22,7 +22,7 @@ jobs: $matrix = @{ 'os' = @('ubuntu-22.04') #,'windows-2022') 'pyver' = @("3.9", "3.10", "3.11", "3.12") # ,"3.13", "3.14" - 'cuda' = @("12.4.1", "12.5.1", "12.6.3", "12.8.1", "12.9.1", "13.0.2", "13.1.0") # "12.1.1", "12.2.2", "12.3.2", + 'cuda' = @("12.4.1", "12.5.1", "12.6.3", "12.8.1", "13.0.2", "13.1.0") # "12.1.1", "12.2.2", "12.3.2", "12.9.1", 'releasetag' = @("basic") } From 0388be285dd8c682efd6859242aba2a6d3f6ffd2 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 18 Jan 2026 13:00:05 +0700 Subject: [PATCH 041/221] temporarily disable exit on error to get the logs --- scripts/releases-to-pep-503.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/scripts/releases-to-pep-503.sh b/scripts/releases-to-pep-503.sh index 8d1e9cdc4d..cc2ef96555 100755 --- a/scripts/releases-to-pep-503.sh +++ b/scripts/releases-to-pep-503.sh @@ -1,7 +1,7 @@ #!/bin/bash # Enable exit on error -set -e +#set -e # Function for logging log_error() { From 79910821c89cb2534d4373f00c93f76dd8bcc9c4 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 18 Jan 2026 13:38:54 +0700 Subject: [PATCH 042/221] test 1 --- scripts/releases-to-pep-503.sh | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/scripts/releases-to-pep-503.sh b/scripts/releases-to-pep-503.sh index cc2ef96555..6a5e5bd183 100755 --- a/scripts/releases-to-pep-503.sh +++ b/scripts/releases-to-pep-503.sh @@ -57,6 +57,11 @@ EOF # Filter releases by pattern releases=$(grep -E "$pattern" "$current_dir/all_releases.txt") +log_info "Test1" +cat "$current_dir/all_releases.txt" +log_info "Test2" +echo "$releases" +log_info "Test3" # Prepare curl headers headers=('--header' 'Accept: application/vnd.github.v3+json') From 19253146a8ffeef16d93e51bfc16138343ea4e4e Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 18 Jan 2026 13:48:52 +0700 Subject: [PATCH 043/221] test 2 --- scripts/releases-to-pep-503.sh | 3 +++ 1 file changed, 3 insertions(+) diff --git a/scripts/releases-to-pep-503.sh b/scripts/releases-to-pep-503.sh index 6a5e5bd183..7b0ba238ba 100755 --- a/scripts/releases-to-pep-503.sh +++ b/scripts/releases-to-pep-503.sh @@ -62,6 +62,8 @@ cat "$current_dir/all_releases.txt" log_info "Test2" echo "$releases" log_info "Test3" +echo "$pattern" +log_info "Test4" # Prepare curl headers headers=('--header' 'Accept: application/vnd.github.v3+json') @@ -102,6 +104,7 @@ for release in $releases; do echo "
" >> "$output_dir/llama-cpp-python/index.html" done done +log_info "Test5" echo " " >> "$output_dir/llama-cpp-python/index.html" echo "" >> "$output_dir/llama-cpp-python/index.html" From 0320411509973482efc56384cf3e3c23b2b3b797 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 18 Jan 2026 14:17:54 +0700 Subject: [PATCH 044/221] update setup-python and cibuildwheel --- .github/workflows/build-and-release.yaml | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 7eaf017fbc..b8b5f4d986 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -19,7 +19,7 @@ jobs: submodules: "recursive" # Used to host cibuildwheel - - uses: actions/setup-python@v5 + - uses: actions/setup-python@v6 with: python-version: "3.9" @@ -42,7 +42,7 @@ jobs: shell: cmd - name: Build wheels - uses: pypa/cibuildwheel@v2.22.0 + uses: pypa/cibuildwheel@v3.3.1 env: # disable repair CIBW_REPAIR_WHEEL_COMMAND: "" @@ -69,7 +69,7 @@ jobs: platforms: linux/arm64 - name: Build wheels - uses: pypa/cibuildwheel@v2.22.0 + uses: pypa/cibuildwheel@v3.3.1 env: CIBW_SKIP: "*musllinux* pp*" CIBW_REPAIR_WHEEL_COMMAND: "" @@ -94,7 +94,7 @@ jobs: with: submodules: "recursive" - - uses: actions/setup-python@v5 + - uses: actions/setup-python@v6 with: python-version: "3.9" From c674fd7c6b1ecc98cb20e03ca95d21a7d7b85798 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 18 Jan 2026 19:33:36 +0700 Subject: [PATCH 045/221] reenable exit on error --- scripts/releases-to-pep-503.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/scripts/releases-to-pep-503.sh b/scripts/releases-to-pep-503.sh index 7b0ba238ba..b79012dc4a 100755 --- a/scripts/releases-to-pep-503.sh +++ b/scripts/releases-to-pep-503.sh @@ -1,7 +1,7 @@ #!/bin/bash # Enable exit on error -#set -e +set -e # Function for logging log_error() { From 6e7a9bc89324dce426483a64b72af05b4d410031 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 18 Jan 2026 19:38:07 +0700 Subject: [PATCH 046/221] updated setup-python and cibuildwheel on metal too --- .github/workflows/build-wheels-metal.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/build-wheels-metal.yaml b/.github/workflows/build-wheels-metal.yaml index 98f511e4a6..2194696681 100644 --- a/.github/workflows/build-wheels-metal.yaml +++ b/.github/workflows/build-wheels-metal.yaml @@ -19,7 +19,7 @@ jobs: submodules: "recursive" # Used to host cibuildwheel - - uses: actions/setup-python@v5 + - uses: actions/setup-python@v6 with: python-version: "3.12" cache: 'pip' @@ -32,7 +32,7 @@ jobs: shell: bash - name: Build wheels - uses: pypa/cibuildwheel@v2.22.0 + uses: pypa/cibuildwheel@v3.3.1 env: # disable repair CIBW_REPAIR_WHEEL_COMMAND: "" From 0f9e124d1d6edd7d3b52bfd0429175a58e42752f Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 18 Jan 2026 19:54:10 +0700 Subject: [PATCH 047/221] updated setup-python, macos image, and replace huggingface-cli with hf --- .github/workflows/test.yaml | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/.github/workflows/test.yaml b/.github/workflows/test.yaml index 95f6e5a272..138503c415 100644 --- a/.github/workflows/test.yaml +++ b/.github/workflows/test.yaml @@ -16,13 +16,13 @@ jobs: runs-on: ubuntu-latest steps: - name: Set up Python - uses: actions/setup-python@v5 + uses: actions/setup-python@v6 with: python-version: "3.9" - name: Install huggingface-hub run: pip install huggingface-hub - name: Download model - run: huggingface-cli download ${{ env.REPO_ID }} ${{ env.MODEL_FILE }} + run: hf download ${{ env.REPO_ID }} ${{ env.MODEL_FILE }} - name: Cache model uses: actions/cache@v4 with: @@ -41,7 +41,7 @@ jobs: submodules: "recursive" - name: Set up Python ${{ matrix.python-version }} - uses: actions/setup-python@v5 + uses: actions/setup-python@v6 with: python-version: ${{ matrix.python-version }} cache: 'pip' @@ -72,7 +72,7 @@ jobs: submodules: "recursive" - name: Set up Python ${{ matrix.python-version }} - uses: actions/setup-python@v5 + uses: actions/setup-python@v6 with: python-version: ${{ matrix.python-version }} cache: 'pip' @@ -96,7 +96,7 @@ jobs: build-macos: needs: download-model - runs-on: macos-13 + runs-on: macos-14 strategy: matrix: python-version: ["3.9", "3.10", "3.11", "3.12"] @@ -106,7 +106,7 @@ jobs: submodules: "recursive" - name: Set up Python ${{ matrix.python-version }} - uses: actions/setup-python@v5 + uses: actions/setup-python@v6 with: python-version: ${{ matrix.python-version }} cache: 'pip' @@ -137,14 +137,14 @@ jobs: build-macos-metal: needs: download-model - runs-on: macos-13 + runs-on: macos-14 steps: - uses: actions/checkout@v4 with: submodules: "recursive" - name: Set up Python 3.9 - uses: actions/setup-python@v5 + uses: actions/setup-python@v6 with: python-version: "3.9" From bf871cd96bb8702fc6c7add3c89d1c28aa350769 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 18 Jan 2026 20:04:29 +0700 Subject: [PATCH 048/221] replace macos-14 image with macos-latest --- .github/workflows/test.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/test.yaml b/.github/workflows/test.yaml index 138503c415..ca87dea080 100644 --- a/.github/workflows/test.yaml +++ b/.github/workflows/test.yaml @@ -96,7 +96,7 @@ jobs: build-macos: needs: download-model - runs-on: macos-14 + runs-on: macos-latest strategy: matrix: python-version: ["3.9", "3.10", "3.11", "3.12"] @@ -137,7 +137,7 @@ jobs: build-macos-metal: needs: download-model - runs-on: macos-14 + runs-on: macos-latest steps: - uses: actions/checkout@v4 with: From 046dcbce2e9c0cbfe12edaf025c097a0b79d210c Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 18 Jan 2026 20:18:09 +0700 Subject: [PATCH 049/221] can't build on macos-15/latest, reverting to macos-14 --- .github/workflows/test.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/test.yaml b/.github/workflows/test.yaml index ca87dea080..138503c415 100644 --- a/.github/workflows/test.yaml +++ b/.github/workflows/test.yaml @@ -96,7 +96,7 @@ jobs: build-macos: needs: download-model - runs-on: macos-latest + runs-on: macos-14 strategy: matrix: python-version: ["3.9", "3.10", "3.11", "3.12"] @@ -137,7 +137,7 @@ jobs: build-macos-metal: needs: download-model - runs-on: macos-latest + runs-on: macos-14 steps: - uses: actions/checkout@v4 with: From f0eec3bafc796daa7c4de7231b7fe76dd0436c87 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 18 Jan 2026 20:37:35 +0700 Subject: [PATCH 050/221] can't build on macos-15 --- .github/workflows/build-wheels-metal.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/build-wheels-metal.yaml b/.github/workflows/build-wheels-metal.yaml index 2194696681..1cfe6166f8 100644 --- a/.github/workflows/build-wheels-metal.yaml +++ b/.github/workflows/build-wheels-metal.yaml @@ -11,7 +11,7 @@ jobs: runs-on: ${{ matrix.os }} strategy: matrix: - os: [macos-14, macos-15] + os: [macos-14] # , macos-15 steps: - uses: actions/checkout@v4 From 75a84103217f8443f52fd40dd43a1b723ad5c9a7 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 18 Jan 2026 21:10:44 +0700 Subject: [PATCH 051/221] can't build on macos-15 --- .github/workflows/build-and-release.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index b8b5f4d986..5abf9f07e2 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -11,7 +11,7 @@ jobs: runs-on: ${{ matrix.os }} strategy: matrix: - os: [ubuntu-22.04, windows-2022, macos-14, macos-15] + os: [ubuntu-22.04, windows-2022, macos-14] # , macos-15 steps: - uses: actions/checkout@v4 From ac30b961c2a136217df97fbf0dbb36c8d409f91d Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 19 Jan 2026 03:37:02 +0700 Subject: [PATCH 052/221] temporarily disable cu129 until it can be build with cuda toolkit 12.9 instead of 13 Comment out the script for cu129 to prevent errors. --- .github/workflows/generate-index-from-release.yaml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/generate-index-from-release.yaml b/.github/workflows/generate-index-from-release.yaml index eb6842c4a9..86fb41c57c 100644 --- a/.github/workflows/generate-index-from-release.yaml +++ b/.github/workflows/generate-index-from-release.yaml @@ -40,6 +40,7 @@ jobs: GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} run: | ./scripts/get-releases.sh + # Non-existing file could cause am error at the script #./scripts/releases-to-pep-503.sh index/whl/cpu '^[v]?[0-9]+\.[0-9]+\.[0-9]+$' #./scripts/releases-to-pep-503.sh index/whl/cu121 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu121$' #./scripts/releases-to-pep-503.sh index/whl/cu122 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu122$' @@ -48,7 +49,7 @@ jobs: ./scripts/releases-to-pep-503.sh index/whl/cu125 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu125$' ./scripts/releases-to-pep-503.sh index/whl/cu126 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu126$' ./scripts/releases-to-pep-503.sh index/whl/cu128 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu128$' - ./scripts/releases-to-pep-503.sh index/whl/cu129 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu129$' + #./scripts/releases-to-pep-503.sh index/whl/cu129 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu129$' ./scripts/releases-to-pep-503.sh index/whl/cu130 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu130$' ./scripts/releases-to-pep-503.sh index/whl/cu131 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu131$' ./scripts/releases-to-pep-503.sh index/whl/metal '^[v]?[0-9]+\.[0-9]+\.[0-9]+-metal$' From 3a5818c0df166bfdf261be1563017b9e14c03f6c Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 19 Jan 2026 14:39:50 +0700 Subject: [PATCH 053/221] exclude python 3.8 --- .github/workflows/build-and-release.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 5abf9f07e2..c9476360b3 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -75,7 +75,7 @@ jobs: CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ARCHS: "aarch64" CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON" - CIBW_BUILD: "cp38-* cp39-* cp310-* cp311-* cp312-*" + CIBW_BUILD: "cp39-* cp310-* cp311-* cp312-*" with: output-dir: wheelhouse From f0131aab3d2031b062acaec8aa241618b4b6b9f3 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 02:51:20 +0700 Subject: [PATCH 054/221] try with Windows --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 898a8d51fb..a2b71c3798 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -20,7 +20,7 @@ jobs: id: set-matrix run: | $matrix = @{ - 'os' = @('ubuntu-22.04') #,'windows-2022') + 'os' = @('ubuntu-22.04','windows-2022') 'pyver' = @("3.9", "3.10", "3.11", "3.12") # ,"3.13", "3.14" 'cuda' = @("12.4.1", "12.5.1", "12.6.3", "12.8.1", "13.0.2", "13.1.0") # "12.1.1", "12.2.2", "12.3.2", "12.9.1", 'releasetag' = @("basic") From 5ce7d1e89dcaa267da161f9fae072417ac2e7b7c Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 12:43:22 +0700 Subject: [PATCH 055/221] use a matching cuda-nvcc instead of the latest version. --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index a2b71c3798..360c7d1af9 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -101,7 +101,7 @@ jobs: MAMBA_NO_LOW_SPEED_LIMIT: "1" run: | $cudaVersion = $env:CUDAVER - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" I "nvidia::cuda-nvcc==$cudaVersion" python -m pip install build wheel - name: Build Wheel From 232ea00150b5ffa8e279f94bdc19f9dd206866f7 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 13:11:43 +0700 Subject: [PATCH 056/221] oops --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 360c7d1af9..bfe4420e7c 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -60,7 +60,7 @@ jobs: cache: 'pip' - name: Setup Mamba - uses: conda-incubator/setup-miniconda@v3.1.0 + uses: conda-incubator/setup-miniconda@v3.3.0 with: activate-environment: "llamacpp" python-version: ${{ matrix.pyver }} @@ -101,7 +101,7 @@ jobs: MAMBA_NO_LOW_SPEED_LIMIT: "1" run: | $cudaVersion = $env:CUDAVER - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" I "nvidia::cuda-nvcc==$cudaVersion" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" I "nvidia::cuda-nvcc==${ split($cudaVersion, '.')[0] }.*" python -m pip install build wheel - name: Build Wheel From c03266561113a730b6ae20c4812295af795ab884 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 13:32:58 +0700 Subject: [PATCH 057/221] oops 2 --- .github/workflows/manual_wheel_cuda.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index bfe4420e7c..66be80d70b 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -101,7 +101,8 @@ jobs: MAMBA_NO_LOW_SPEED_LIMIT: "1" run: | $cudaVersion = $env:CUDAVER - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" I "nvidia::cuda-nvcc==${ split($cudaVersion, '.')[0] }.*" + $cudaMajor = $cudaVersion.Split('.')[0] + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-nvcc==$cudaMajor.*" python -m pip install build wheel - name: Build Wheel From 10fcbec3336d813404da454b9e74b55a4f343f14 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 13:59:57 +0700 Subject: [PATCH 058/221] testing cuda-version --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 66be80d70b..9785dc9a92 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -102,7 +102,7 @@ jobs: run: | $cudaVersion = $env:CUDAVER $cudaMajor = $cudaVersion.Split('.')[0] - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-nvcc==$cudaMajor.*" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-nvcc==$cudaMajor.*" "nvidia::cuda-version==$cudaVersion" python -m pip install build wheel - name: Build Wheel From d59aabaa91d51bf2e50891e47349c99e2d97d72e Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 14:08:39 +0700 Subject: [PATCH 059/221] testing cuda majorminor --- .github/workflows/manual_wheel_cuda.yml | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 9785dc9a92..d74d331785 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -102,7 +102,9 @@ jobs: run: | $cudaVersion = $env:CUDAVER $cudaMajor = $cudaVersion.Split('.')[0] - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-nvcc==$cudaMajor.*" "nvidia::cuda-version==$cudaVersion" + $cudaParts = $cudaVersion -split '\.' + $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-nvcc==$cudaMajorMinor.*" "nvidia::cuda-version==$cudaMajorMinor.*" python -m pip install build wheel - name: Build Wheel From 361ada289bb4137ce4710890ca8b2026abee0574 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 14:15:10 +0700 Subject: [PATCH 060/221] testing newer cccl --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index d74d331785..65e456efcf 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -104,7 +104,7 @@ jobs: $cudaMajor = $cudaVersion.Split('.')[0] $cudaParts = $cudaVersion -split '\.' $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-nvcc==$cudaMajorMinor.*" "nvidia::cuda-version==$cudaMajorMinor.*" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-nvcc==$cudaMajorMinor.*" "conda-forge::cccl" python -m pip install build wheel - name: Build Wheel From 234f13925a160069bf1a4b05dc0e844b6c07c56c Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 14:25:50 +0700 Subject: [PATCH 061/221] the latest cccl causing upgrade to cuda version 13 --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 65e456efcf..aa4fef7320 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -104,7 +104,7 @@ jobs: $cudaMajor = $cudaVersion.Split('.')[0] $cudaParts = $cudaVersion -split '\.' $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-nvcc==$cudaMajorMinor.*" "conda-forge::cccl" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-nvcc==$cudaMajorMinor.*" python -m pip install build wheel - name: Build Wheel From d18c2a874a986dcf6babf8b0d69472d333d44d23 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 14:35:23 +0700 Subject: [PATCH 062/221] testing cuda-version --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index aa4fef7320..7790b4c031 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -104,7 +104,7 @@ jobs: $cudaMajor = $cudaVersion.Split('.')[0] $cudaParts = $cudaVersion -split '\.' $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-nvcc==$cudaMajorMinor.*" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-nvcc==$cudaMajorMinor.*" "conda-forge::cuda-version==$cudaMajorMinor.*" python -m pip install build wheel - name: Build Wheel From f8da86ccb6e3bbbd2335e5e978973c125916f6a7 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 14:51:44 +0700 Subject: [PATCH 063/221] testing without explicit cuda-nvcc installation --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 7790b4c031..4047aa919b 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -104,7 +104,7 @@ jobs: $cudaMajor = $cudaVersion.Split('.')[0] $cudaParts = $cudaVersion -split '\.' $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-nvcc==$cudaMajorMinor.*" "conda-forge::cuda-version==$cudaMajorMinor.*" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" "conda-forge::cuda-version==$cudaMajorMinor.*" python -m pip install build wheel - name: Build Wheel @@ -120,7 +120,7 @@ jobs: $env:VERBOSE = '1' #$env:MAX_JOBS=4 #$env:CMAKE_BUILD_PARALLEL_LEVEL=4 - $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' + $env:CMAKE_ARGS = '-DGGML_CUDA=on -DLLAMA_CUBLAS=on -DCMAKE_CUDA_ARCHITECTURES=all' $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" # if ($env:AVXVER -eq 'AVX') { $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off' From e9f0e4f1a85d19657ad755c13a20fb5fdfc2ee99 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 15:01:09 +0700 Subject: [PATCH 064/221] oops --- .github/workflows/manual_wheel_cuda.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 4047aa919b..8c250a53f4 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -118,9 +118,10 @@ jobs: $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:LD_LIBRARY_PATH } $env:VERBOSE = '1' + $env:FORCE_CMAKE=1 #$env:MAX_JOBS=4 #$env:CMAKE_BUILD_PARALLEL_LEVEL=4 - $env:CMAKE_ARGS = '-DGGML_CUDA=on -DLLAMA_CUBLAS=on -DCMAKE_CUDA_ARCHITECTURES=all' + $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" # if ($env:AVXVER -eq 'AVX') { $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off' From b5a6d2a9b6c272d3718d07243872206ea5150205 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 15:14:51 +0700 Subject: [PATCH 065/221] install cuda too --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 8c250a53f4..90d81d71ff 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -104,7 +104,7 @@ jobs: $cudaMajor = $cudaVersion.Split('.')[0] $cudaParts = $cudaVersion -split '\.' $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-toolkit==$cudaVersion" "conda-forge::cuda-version==$cudaMajorMinor.*" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "conda-forge::cuda-version==$cudaMajorMinor.*" python -m pip install build wheel - name: Build Wheel From 4605b78c6cd5049c5d7bc5b5c3079945421eef4c Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 15:38:16 +0700 Subject: [PATCH 066/221] set CPATH too --- .github/workflows/manual_wheel_cuda.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 90d81d71ff..01eb0e8677 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -116,9 +116,10 @@ jobs: $env:CUDAToolkit_ROOT = $env:CONDA_PREFIX if ($IsLinux) { $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:LD_LIBRARY_PATH + $env:CPATH = $env:CONDA_PREFIX + '/include:' + $env:CPATH } $env:VERBOSE = '1' - $env:FORCE_CMAKE=1 + #$env:FORCE_CMAKE=1 #$env:MAX_JOBS=4 #$env:CMAKE_BUILD_PARALLEL_LEVEL=4 $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' From f0335c0fabb827eb64df23868fe7b4722294656f Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 15:49:32 +0700 Subject: [PATCH 067/221] test finding cuda_runtime.h --- .github/workflows/manual_wheel_cuda.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 01eb0e8677..bfa8938470 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -118,6 +118,7 @@ jobs: $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:LD_LIBRARY_PATH $env:CPATH = $env:CONDA_PREFIX + '/include:' + $env:CPATH } + Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue $env:VERBOSE = '1' #$env:FORCE_CMAKE=1 #$env:MAX_JOBS=4 From 3c55d94bbe369865b391a46459b63006db0d2b22 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 16:01:31 +0700 Subject: [PATCH 068/221] update lib and include path Update environment variables for CUDA paths on Linux. --- .github/workflows/manual_wheel_cuda.yml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index bfa8938470..be04b983c7 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -115,10 +115,10 @@ jobs: $env:CUDA_TOOLKIT_ROOT_DIR = $env:CONDA_PREFIX $env:CUDAToolkit_ROOT = $env:CONDA_PREFIX if ($IsLinux) { - $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:LD_LIBRARY_PATH - $env:CPATH = $env:CONDA_PREFIX + '/include:' + $env:CPATH + $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/lib:' + $env:LD_LIBRARY_PATH + $env:CPATH = $env:CONDA_PREFIX + '/include:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/include:' + $env:CPATH } - Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue + #Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue $env:VERBOSE = '1' #$env:FORCE_CMAKE=1 #$env:MAX_JOBS=4 From d2889e0364cc25bb863e80d9c1d9a27485ffc9b2 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 16:53:38 +0700 Subject: [PATCH 069/221] allow unsupported compiler (ie. gcc 14 or newer) --- .github/workflows/manual_wheel_cuda.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index be04b983c7..cff40f6774 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -120,11 +120,12 @@ jobs: } #Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue $env:VERBOSE = '1' + $env:NVCCFLAGS="-allow-unsupported-compiler" #$env:FORCE_CMAKE=1 #$env:MAX_JOBS=4 #$env:CMAKE_BUILD_PARALLEL_LEVEL=4 $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' - $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" + $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" # -DCMAKE_CUDA_FLAGS='-allow-unsupported-compiler' # if ($env:AVXVER -eq 'AVX') { $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off' # } From 9fcb6f08980d75196cb6f07af39071ea20fc15ab Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 17:02:15 +0700 Subject: [PATCH 070/221] oops --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index cff40f6774..6763102762 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -125,7 +125,7 @@ jobs: #$env:MAX_JOBS=4 #$env:CMAKE_BUILD_PARALLEL_LEVEL=4 $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' - $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" # -DCMAKE_CUDA_FLAGS='-allow-unsupported-compiler' + $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON -DCMAKE_CUDA_FLAGS='-allow-unsupported-compiler' $env:CMAKE_ARGS" # if ($env:AVXVER -eq 'AVX') { $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off' # } From 8dd59a0350d4370011652dd23d6d1e147f156a7b Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 17:12:35 +0700 Subject: [PATCH 071/221] use gcc 13 --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 6763102762..13f164f411 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -104,7 +104,7 @@ jobs: $cudaMajor = $cudaVersion.Split('.')[0] $cudaParts = $cudaVersion -split '\.' $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "conda-forge::cuda-version==$cudaMajorMinor.*" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "conda-forge::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel - name: Build Wheel From e4e2cc453188fb59a64596bc2cd943542691d2d6 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 17:53:32 +0700 Subject: [PATCH 072/221] oops --- .github/workflows/manual_wheel_cuda.yml | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 13f164f411..1ed35782f9 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -118,14 +118,15 @@ jobs: $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/lib:' + $env:LD_LIBRARY_PATH $env:CPATH = $env:CONDA_PREFIX + '/include:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/include:' + $env:CPATH } - #Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue + Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue $env:VERBOSE = '1' $env:NVCCFLAGS="-allow-unsupported-compiler" #$env:FORCE_CMAKE=1 #$env:MAX_JOBS=4 #$env:CMAKE_BUILD_PARALLEL_LEVEL=4 $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' - $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON -DCMAKE_CUDA_FLAGS='-allow-unsupported-compiler' $env:CMAKE_ARGS" + $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" + $env:CMAKE_ARGS = "-DCMAKE_CUDA_FLAGS='-allow-unsupported-compiler' $env:CMAKE_ARGS" # if ($env:AVXVER -eq 'AVX') { $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off' # } From 061f7a0c6fae0881f7518431eb5624a0e837e2c0 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 18:28:32 +0700 Subject: [PATCH 073/221] testing IncludePath --- .github/workflows/manual_wheel_cuda.yml | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 1ed35782f9..7bd9ab097a 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -117,6 +117,10 @@ jobs: if ($IsLinux) { $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/lib:' + $env:LD_LIBRARY_PATH $env:CPATH = $env:CONDA_PREFIX + '/include:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/include:' + $env:CPATH + } + else { + $env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath + $env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue $env:VERBOSE = '1' From 2ba6bd2a50191e97399bd9386541e67f2ba3d2db Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 10 Feb 2026 18:45:20 +0700 Subject: [PATCH 074/221] more include env vars --- .github/workflows/manual_wheel_cuda.yml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 7bd9ab097a..dee9e2609c 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -120,6 +120,9 @@ jobs: } else { $env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath + $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH + $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH + $env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE $env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue From 37458973ed4607cc522f0d32d3801b4995f3243b Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 01:06:43 +0700 Subject: [PATCH 075/221] try finding nvcc.exe --- .github/workflows/manual_wheel_cuda.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index dee9e2609c..9426096972 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -124,6 +124,7 @@ jobs: $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH $env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE $env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' + Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue $env:VERBOSE = '1' From 47aa856de49ef9d34715010567c36fdc6396aecf Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 01:51:57 +0700 Subject: [PATCH 076/221] update PATH --- .github/workflows/manual_wheel_cuda.yml | 2 ++ 1 file changed, 2 insertions(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 9426096972..265995d9d4 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -114,6 +114,7 @@ jobs: $env:CUDA_HOME = $env:CONDA_PREFIX $env:CUDA_TOOLKIT_ROOT_DIR = $env:CONDA_PREFIX $env:CUDAToolkit_ROOT = $env:CONDA_PREFIX + echo "CONDA_PREFIX = $env:CONDA_PREFIX" if ($IsLinux) { $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/lib:' + $env:LD_LIBRARY_PATH $env:CPATH = $env:CONDA_PREFIX + '/include:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/include:' + $env:CPATH @@ -124,6 +125,7 @@ jobs: $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH $env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE $env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' + $env:PATH = $env:CONDA_PREFIX + '\bin;' + $env:CONDA_PREFIX + '\Library\bin;' + $env:PATH Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue From 90684598185d0d516fb43dc1c01531cef187e911 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 03:35:38 +0700 Subject: [PATCH 077/221] disable allow-unsupported-compiler --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 265995d9d4..8b25002b0f 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -130,13 +130,13 @@ jobs: } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue $env:VERBOSE = '1' - $env:NVCCFLAGS="-allow-unsupported-compiler" + #$env:NVCCFLAGS="-allow-unsupported-compiler" #$env:FORCE_CMAKE=1 #$env:MAX_JOBS=4 #$env:CMAKE_BUILD_PARALLEL_LEVEL=4 $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" - $env:CMAKE_ARGS = "-DCMAKE_CUDA_FLAGS='-allow-unsupported-compiler' $env:CMAKE_ARGS" + #$env:CMAKE_ARGS = "-DCMAKE_CUDA_FLAGS='-allow-unsupported-compiler' $env:CMAKE_ARGS" # if ($env:AVXVER -eq 'AVX') { $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off' # } From 8482156b73b115f337413f55ae71aa3d2650b4e7 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 05:40:07 +0700 Subject: [PATCH 078/221] testing nvcc version --- .github/workflows/manual_wheel_cuda.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 8b25002b0f..0f73d1b17e 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -127,6 +127,7 @@ jobs: $env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' $env:PATH = $env:CONDA_PREFIX + '\bin;' + $env:CONDA_PREFIX + '\Library\bin;' + $env:PATH Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue + & "C:\Users\runneradmin\miniconda3\envs\llamacpp\bin\nvcc.exe" --version } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue $env:VERBOSE = '1' From 19ffabecbe5ab11b014cce38c8edc0325acd0599 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 06:24:46 +0700 Subject: [PATCH 079/221] testing path again --- .github/workflows/manual_wheel_cuda.yml | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 0f73d1b17e..5616d47b0f 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -125,9 +125,11 @@ jobs: $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH $env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE $env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' - $env:PATH = $env:CONDA_PREFIX + '\bin;' + $env:CONDA_PREFIX + '\Library\bin;' + $env:PATH + #$env:PATH = $env:CONDA_PREFIX + '\bin;' + $env:CONDA_PREFIX + '\Library\bin;' + $env:PATH + echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue & "C:\Users\runneradmin\miniconda3\envs\llamacpp\bin\nvcc.exe" --version + Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue $env:VERBOSE = '1' From 246b0d6fd0c950e479c1f7e080096a16bb6c25fb Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 06:32:53 +0700 Subject: [PATCH 080/221] oops --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 5616d47b0f..3fc1e174e6 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -128,7 +128,7 @@ jobs: #$env:PATH = $env:CONDA_PREFIX + '\bin;' + $env:CONDA_PREFIX + '\Library\bin;' + $env:PATH echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue - & "C:\Users\runneradmin\miniconda3\envs\llamacpp\bin\nvcc.exe" --version + nvcc.exe --version Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue From bbae81d245b83869e9790ae197872df400a73416 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 06:45:04 +0700 Subject: [PATCH 081/221] only shows directory --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 3fc1e174e6..07477efdbc 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -129,7 +129,7 @@ jobs: echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue nvcc.exe --version - Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Recurse -ErrorAction SilentlyContinue + Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue $env:VERBOSE = '1' From ad56fe72d9255655f4a28c5335f47120fcd496ac Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 07:31:52 +0700 Subject: [PATCH 082/221] testing cuda_path --- .github/workflows/manual_wheel_cuda.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 07477efdbc..a3efe9fc66 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -120,6 +120,7 @@ jobs: $env:CPATH = $env:CONDA_PREFIX + '/include:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/include:' + $env:CPATH } else { + $env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' $env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH @@ -129,7 +130,7 @@ jobs: echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue nvcc.exe --version - Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue + #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue $env:VERBOSE = '1' From 75cd725cc40eab75e4a1a453a92a04ac1e34c4c2 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 07:55:12 +0700 Subject: [PATCH 083/221] update conda_prefix --- .github/workflows/manual_wheel_cuda.yml | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index a3efe9fc66..12b6756f06 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -110,6 +110,9 @@ jobs: - name: Build Wheel run: | $cudaVersion = $env:CUDAVER.Remove($env:CUDAVER.LastIndexOf('.')).Replace('.','') + if ($env:RUNNER_OS -eq 'Windows') { + $env:CONDA_PREFIX = $env:CONDA_PREFIX + '\\Library' + } $env:CUDA_PATH = $env:CONDA_PREFIX $env:CUDA_HOME = $env:CONDA_PREFIX $env:CUDA_TOOLKIT_ROOT_DIR = $env:CONDA_PREFIX @@ -119,7 +122,7 @@ jobs: $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/lib:' + $env:LD_LIBRARY_PATH $env:CPATH = $env:CONDA_PREFIX + '/include:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/include:' + $env:CPATH } - else { + elseif ($env:RUNNER_OS -eq 'Windows') { $env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' $env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH From c36dcc50009e454188a26f54de871a1edd39e47a Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 08:33:35 +0700 Subject: [PATCH 084/221] testing -DCMAKE_CUDA_COMPILER --- .github/workflows/manual_wheel_cuda.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 12b6756f06..feb1fa13d2 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -111,7 +111,7 @@ jobs: run: | $cudaVersion = $env:CUDAVER.Remove($env:CUDAVER.LastIndexOf('.')).Replace('.','') if ($env:RUNNER_OS -eq 'Windows') { - $env:CONDA_PREFIX = $env:CONDA_PREFIX + '\\Library' + $env:CONDA_PREFIX = $env:CONDA_PREFIX + '\Library' } $env:CUDA_PATH = $env:CONDA_PREFIX $env:CUDA_HOME = $env:CONDA_PREFIX @@ -143,6 +143,7 @@ jobs: #$env:CMAKE_BUILD_PARALLEL_LEVEL=4 $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" + $env:CMAKE_ARGS = "-DCMAKE_CUDA_COMPILER='$env:CONDA_PREFIX\\bin' $env:CMAKE_ARGS" #$env:CMAKE_ARGS = "-DCMAKE_CUDA_FLAGS='-allow-unsupported-compiler' $env:CMAKE_ARGS" # if ($env:AVXVER -eq 'AVX') { $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off' From cd1c207d35b60a3ff6b0b7bbe3a4ed1e3427ab6a Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 08:39:26 +0700 Subject: [PATCH 085/221] oops --- .github/workflows/manual_wheel_cuda.yml | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index feb1fa13d2..25eca01c29 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -143,7 +143,9 @@ jobs: #$env:CMAKE_BUILD_PARALLEL_LEVEL=4 $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" - $env:CMAKE_ARGS = "-DCMAKE_CUDA_COMPILER='$env:CONDA_PREFIX\\bin' $env:CMAKE_ARGS" + if ($env:RUNNER_OS -eq 'Windows') { + $env:CMAKE_ARGS = "-DCMAKE_CUDA_COMPILER='$env:CONDA_PREFIX\\bin' $env:CMAKE_ARGS" + } #$env:CMAKE_ARGS = "-DCMAKE_CUDA_FLAGS='-allow-unsupported-compiler' $env:CMAKE_ARGS" # if ($env:AVXVER -eq 'AVX') { $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off' From 9c6b3bf796c2fdcc284f6af72e6ec1bbf7f71f8f Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 11:26:44 +0700 Subject: [PATCH 086/221] use symlink to nvcc.exe --- .github/workflows/manual_wheel_cuda.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 25eca01c29..a0f536f449 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -133,6 +133,7 @@ jobs: echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue nvcc.exe --version + New-Item -ItemType SymbolicLink -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp\bin\nvcc.exe" -Target "$env:CONDA_PREFIX\\Library\\bin\\nvcc.exe" # -Force #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue From f0b6ef065948870a773cc136487bf4ac20dc666d Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 11:27:52 +0700 Subject: [PATCH 087/221] oops --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index a0f536f449..02e5534d20 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -133,7 +133,7 @@ jobs: echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue nvcc.exe --version - New-Item -ItemType SymbolicLink -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp\bin\nvcc.exe" -Target "$env:CONDA_PREFIX\\Library\\bin\\nvcc.exe" # -Force + New-Item -ItemType SymbolicLink -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp\bin\nvcc.exe" -Target "$env:CONDA_PREFIX\\bin\\nvcc.exe" # -Force #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue From 9e2d98d32544fbb3e02dd0d4b260a6fd2bb91dff Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 11:46:54 +0700 Subject: [PATCH 088/221] oops swapped --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 02e5534d20..df320b06d9 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -133,7 +133,7 @@ jobs: echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue nvcc.exe --version - New-Item -ItemType SymbolicLink -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp\bin\nvcc.exe" -Target "$env:CONDA_PREFIX\\bin\\nvcc.exe" # -Force + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin\\nvcc.exe" -Target "C:\Users\runneradmin\miniconda3\envs\llamacpp\bin\nvcc.exe" # -Force #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue From c3b3b4c4f69183543f9594c24d0dbfa16335029d Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 12:10:51 +0700 Subject: [PATCH 089/221] oops 3 --- .github/workflows/manual_wheel_cuda.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index df320b06d9..c19b7b5751 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -133,7 +133,8 @@ jobs: echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue nvcc.exe --version - New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin\\nvcc.exe" -Target "C:\Users\runneradmin\miniconda3\envs\llamacpp\bin\nvcc.exe" # -Force + New-Item -ItemType Directory -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp\bin" -Force + New-Item -ItemType SymbolicLink -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp\bin\nvcc.exe" -Target "$env:CONDA_PREFIX\\bin\\nvcc.exe" # -Force #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue From b9105cc744c46cba4d1f0561903a6de49ca758ef Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 13:56:36 +0700 Subject: [PATCH 090/221] find cicc.exe --- .github/workflows/manual_wheel_cuda.yml | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index c19b7b5751..4d268fa462 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -104,7 +104,7 @@ jobs: $cudaMajor = $cudaVersion.Split('.')[0] $cudaParts = $cudaVersion -split '\.' $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "conda-forge::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-nvcc" "conda-forge::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel - name: Build Wheel @@ -133,6 +133,8 @@ jobs: echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue nvcc.exe --version + Get-ChildItem -Path ~ -Filter "cicc.exe" -Recurse -ErrorAction SilentlyContinue + cicc.exe --version New-Item -ItemType Directory -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp\bin" -Force New-Item -ItemType SymbolicLink -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp\bin\nvcc.exe" -Target "$env:CONDA_PREFIX\\bin\\nvcc.exe" # -Force #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue From 83f6c617fe81bb38a9b15b9639944d80fedddfb4 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 18:34:56 +0700 Subject: [PATCH 091/221] add nvvm to PATH --- .github/workflows/manual_wheel_cuda.yml | 21 +++++++++++---------- 1 file changed, 11 insertions(+), 10 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 4d268fa462..02c5c5b6dd 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -110,9 +110,9 @@ jobs: - name: Build Wheel run: | $cudaVersion = $env:CUDAVER.Remove($env:CUDAVER.LastIndexOf('.')).Replace('.','') - if ($env:RUNNER_OS -eq 'Windows') { - $env:CONDA_PREFIX = $env:CONDA_PREFIX + '\Library' - } + #if ($env:RUNNER_OS -eq 'Windows') { + # $env:CONDA_PREFIX = $env:CONDA_PREFIX + '\Library' + #} $env:CUDA_PATH = $env:CONDA_PREFIX $env:CUDA_HOME = $env:CONDA_PREFIX $env:CUDA_TOOLKIT_ROOT_DIR = $env:CONDA_PREFIX @@ -123,20 +123,21 @@ jobs: $env:CPATH = $env:CONDA_PREFIX + '/include:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/include:' + $env:CPATH } elseif ($env:RUNNER_OS -eq 'Windows') { - $env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' + #$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' $env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH $env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE $env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' - #$env:PATH = $env:CONDA_PREFIX + '\bin;' + $env:CONDA_PREFIX + '\Library\bin;' + $env:PATH + #echo "$env:CONDA_PREFIX + '\bin;' + $env:CONDA_PREFIX + '\Library\bin;' + $env:CONDA_PREFIX + '\nvvm\bin;'" >> $env:GITHUB_PATH echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append + echo "$env:CONDA_PREFIX\\nvvm\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue nvcc.exe --version Get-ChildItem -Path ~ -Filter "cicc.exe" -Recurse -ErrorAction SilentlyContinue cicc.exe --version - New-Item -ItemType Directory -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp\bin" -Force - New-Item -ItemType SymbolicLink -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp\bin\nvcc.exe" -Target "$env:CONDA_PREFIX\\bin\\nvcc.exe" # -Force + New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\bin" -Force + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin\\nvcc.exe" -Target "$env:CONDA_PREFIX\\Library\\bin\\nvcc.exe" # -Force #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue @@ -147,9 +148,9 @@ jobs: #$env:CMAKE_BUILD_PARALLEL_LEVEL=4 $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" - if ($env:RUNNER_OS -eq 'Windows') { - $env:CMAKE_ARGS = "-DCMAKE_CUDA_COMPILER='$env:CONDA_PREFIX\\bin' $env:CMAKE_ARGS" - } + #if ($env:RUNNER_OS -eq 'Windows') { + # $env:CMAKE_ARGS = "-DCMAKE_CUDA_COMPILER='$env:CONDA_PREFIX\\Library\\bin' $env:CMAKE_ARGS" + #} #$env:CMAKE_ARGS = "-DCMAKE_CUDA_FLAGS='-allow-unsupported-compiler' $env:CMAKE_ARGS" # if ($env:AVXVER -eq 'AVX') { $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off' From 0076d6162fc9a91ae16fc54d1d14d68af86ba9ce Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 11 Feb 2026 22:38:47 +0700 Subject: [PATCH 092/221] try using Path for immediate effect --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 02c5c5b6dd..2a82c42e09 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -129,7 +129,7 @@ jobs: $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH $env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE $env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' - #echo "$env:CONDA_PREFIX + '\bin;' + $env:CONDA_PREFIX + '\Library\bin;' + $env:CONDA_PREFIX + '\nvvm\bin;'" >> $env:GITHUB_PATH + $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin;" + $env:Path echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append echo "$env:CONDA_PREFIX\\nvvm\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue From 0315e9425983f2eaa6af77ea1b175b1f6ef8097a Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 01:03:23 +0700 Subject: [PATCH 093/221] test 1 --- .github/workflows/manual_wheel_cuda.yml | 25 +++++++++++++------------ 1 file changed, 13 insertions(+), 12 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 2a82c42e09..53ef4c6a0e 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -123,21 +123,22 @@ jobs: $env:CPATH = $env:CONDA_PREFIX + '/include:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/include:' + $env:CPATH } elseif ($env:RUNNER_OS -eq 'Windows') { - #$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' - $env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath - $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH - $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH - $env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE - $env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' - $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin;" + $env:Path - echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append - echo "$env:CONDA_PREFIX\\nvvm\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append + ##$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' + #$env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath + #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH + #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH + #$env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE + #$env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' + #$env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin;" + $env:Path + #echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append + #echo "$env:CONDA_PREFIX\\nvvm\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue nvcc.exe --version Get-ChildItem -Path ~ -Filter "cicc.exe" -Recurse -ErrorAction SilentlyContinue - cicc.exe --version - New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\bin" -Force - New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin\\nvcc.exe" -Target "$env:CONDA_PREFIX\\Library\\bin\\nvcc.exe" # -Force + if (-not (Test-Path -Path "$env:CONDA_PREFIX\\bin\\nvcc.exe")) { + #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\bin" -Force + #New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin\\nvcc.exe" -Target "$env:CONDA_PREFIX\\Library\\bin\\nvcc.exe" # -Force + } #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue From 21ccd3110e992acad8005aea78528a9c6f9d83cc Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 01:25:17 +0700 Subject: [PATCH 094/221] try with cuda-cudart --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 53ef4c6a0e..85b4f04cc2 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -104,7 +104,7 @@ jobs: $cudaMajor = $cudaVersion.Split('.')[0] $cudaParts = $cudaVersion -split '\.' $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-nvcc" "conda-forge::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-cudart" "nvidia::cuda-nvcc" "conda-forge::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel - name: Build Wheel From 9aab4fabb333f9e67d1f573927002555b7a859a3 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 01:40:24 +0700 Subject: [PATCH 095/221] try with cuda-libraries-dev --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 85b4f04cc2..16d5058bb8 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -104,7 +104,7 @@ jobs: $cudaMajor = $cudaVersion.Split('.')[0] $cudaParts = $cudaVersion -split '\.' $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-cudart" "nvidia::cuda-nvcc" "conda-forge::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-nvcc" "conda-forge::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel - name: Build Wheel From 514fcace79e174d76eec55aa6948a6b9ae25eb63 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 01:50:03 +0700 Subject: [PATCH 096/221] try with cuda-cudart-dev --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 16d5058bb8..f4a7243697 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -104,7 +104,7 @@ jobs: $cudaMajor = $cudaVersion.Split('.')[0] $cudaParts = $cudaVersion -split '\.' $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-nvcc" "conda-forge::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "conda-forge::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel - name: Build Wheel From 92f21ceb636dac14c42247780c9333d36b5df693 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 02:03:09 +0700 Subject: [PATCH 097/221] try with nvidia::cuda-version --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index f4a7243697..7b3be8330b 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -104,7 +104,7 @@ jobs: $cudaMajor = $cudaVersion.Split('.')[0] $cudaParts = $cudaVersion -split '\.' $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "conda-forge::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel - name: Build Wheel From a2c558ea82be183769efc9a029f9e004761c801e Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 02:20:30 +0700 Subject: [PATCH 098/221] apparently nvidia::cuda-version doesn't have 12.4 --- .github/workflows/manual_wheel_cuda.yml | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 7b3be8330b..a989442987 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -101,8 +101,10 @@ jobs: MAMBA_NO_LOW_SPEED_LIMIT: "1" run: | $cudaVersion = $env:CUDAVER - $cudaMajor = $cudaVersion.Split('.')[0] + #$cudaMajor = $cudaVersion.Split('.')[0] $cudaParts = $cudaVersion -split '\.' + if ("$cudaParts[0].$cudaParts[1]" -eq "12.4") {$cudaParts[1] = '5'} + $cudaMajor = $cudaParts[0] $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From 0a5d372f645e45fe0204daf755f5adeb6d2051c3 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 02:31:53 +0700 Subject: [PATCH 099/221] oops --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index a989442987..68884fe3be 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -103,7 +103,7 @@ jobs: $cudaVersion = $env:CUDAVER #$cudaMajor = $cudaVersion.Split('.')[0] $cudaParts = $cudaVersion -split '\.' - if ("$cudaParts[0].$cudaParts[1]" -eq "12.4") {$cudaParts[1] = '5'} + if ("$($cudaParts[0]).$($cudaParts[1])" -eq "12.4") {$cudaParts[1] = '5'} $cudaMajor = $cudaParts[0] $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" From cf2982401b57b906ad4aec5e0f5069c32c4d6016 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 02:50:32 +0700 Subject: [PATCH 100/221] testing --- .github/workflows/manual_wheel_cuda.yml | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 68884fe3be..e8a2053c07 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -106,7 +106,11 @@ jobs: if ("$($cudaParts[0]).$($cudaParts[1])" -eq "12.4") {$cudaParts[1] = '5'} $cudaMajor = $cudaParts[0] $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" + mamba config --add channels nvidia + mamba config --add channels conda-forge + mamba config --set channel_priority strict + mamba install -y 'cuda' -c nvidia/label/cuda-$cudaVersion + #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel - name: Build Wheel From 6ccfdf9cbaccc38a4ef2dbd534e04f7136ca7aa0 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 03:04:10 +0700 Subject: [PATCH 101/221] testing 2 --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index e8a2053c07..afd99cfce1 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -109,7 +109,7 @@ jobs: mamba config --add channels nvidia mamba config --add channels conda-forge mamba config --set channel_priority strict - mamba install -y 'cuda' -c nvidia/label/cuda-$cudaVersion + mamba install -y -c nvidia/label/cuda-$cudaVersion "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From 0172b3723e106cbfeb4413be10df99ac05076b30 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 03:13:48 +0700 Subject: [PATCH 102/221] testing 3 --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index afd99cfce1..4478fcbe26 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -109,7 +109,7 @@ jobs: mamba config --add channels nvidia mamba config --add channels conda-forge mamba config --set channel_priority strict - mamba install -y -c nvidia/label/cuda-$cudaVersion "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" + mamba install -y -c nvidia/label/cuda-$cudaVersion "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda==$cudaVersion" "conda-forge::gcc==13.*" #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From d19781d4bf2e89a3a325cf35fd5c31e2e2f06f0e Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 03:31:11 +0700 Subject: [PATCH 103/221] test 4 --- .github/workflows/manual_wheel_cuda.yml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 4478fcbe26..def99242eb 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -106,10 +106,10 @@ jobs: if ("$($cudaParts[0]).$($cudaParts[1])" -eq "12.4") {$cudaParts[1] = '5'} $cudaMajor = $cudaParts[0] $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - mamba config --add channels nvidia - mamba config --add channels conda-forge mamba config --set channel_priority strict - mamba install -y -c nvidia/label/cuda-$cudaVersion "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda==$cudaVersion" "conda-forge::gcc==13.*" + mamba config --prepend channels nvidia + mamba config --append channels conda-forge + mamba install -y -c nvidia/label/cuda-$cudaVersion "cuda-version==$cudaMajorMinor.*" "cuda==$cudaVersion" "gcc==13.*" #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From 562ade283c94cad829412383f366215f7f3d3ef4 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 03:41:32 +0700 Subject: [PATCH 104/221] test 5 --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index def99242eb..c159536962 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -109,7 +109,7 @@ jobs: mamba config --set channel_priority strict mamba config --prepend channels nvidia mamba config --append channels conda-forge - mamba install -y -c nvidia/label/cuda-$cudaVersion "cuda-version==$cudaMajorMinor.*" "cuda==$cudaVersion" "gcc==13.*" + mamba install -y -c nvidia/label/cuda-$cudaVersion "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "gcc==13.*" #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From c66273f45980990956019b8b7c0cabbdde1465d3 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 04:03:37 +0700 Subject: [PATCH 105/221] test 6 --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index c159536962..d34c6d8c41 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -109,7 +109,7 @@ jobs: mamba config --set channel_priority strict mamba config --prepend channels nvidia mamba config --append channels conda-forge - mamba install -y -c nvidia/label/cuda-$cudaVersion "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "gcc==13.*" + mamba install -y -c nvidia/label/cuda-$cudaVersion "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From 114f20f9ab97b2301d297fdfead98199ea835568 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 04:32:30 +0700 Subject: [PATCH 106/221] test 7 --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index d34c6d8c41..253c26822a 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -109,7 +109,7 @@ jobs: mamba config --set channel_priority strict mamba config --prepend channels nvidia mamba config --append channels conda-forge - mamba install -y -c nvidia/label/cuda-$cudaVersion "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" + mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From 50d9de50e529c8681e9d4195cbe0347e9376cfff Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 04:43:48 +0700 Subject: [PATCH 107/221] test 8 --- .github/workflows/manual_wheel_cuda.yml | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 253c26822a..c665a3bd34 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -106,9 +106,10 @@ jobs: if ("$($cudaParts[0]).$($cudaParts[1])" -eq "12.4") {$cudaParts[1] = '5'} $cudaMajor = $cudaParts[0] $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - mamba config --set channel_priority strict - mamba config --prepend channels nvidia - mamba config --append channels conda-forge + conda config --set channel_priority strict + conda config --prepend channels nvidia + conda config --append channels conda-forge + conda config --remove channels defaults mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From 8054b1fa94164c23965f843582320c3c07489995 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 06:15:54 +0700 Subject: [PATCH 108/221] need defaults channel --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index c665a3bd34..8f5f4daf79 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -109,7 +109,7 @@ jobs: conda config --set channel_priority strict conda config --prepend channels nvidia conda config --append channels conda-forge - conda config --remove channels defaults + #conda config --remove channels defaults mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From 9a2239c13d8aa734a5dd54f0405445494f3b0d8f Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 06:25:33 +0700 Subject: [PATCH 109/221] use flexible priority to mix versions --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 8f5f4daf79..81ccdefd83 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -106,7 +106,7 @@ jobs: if ("$($cudaParts[0]).$($cudaParts[1])" -eq "12.4") {$cudaParts[1] = '5'} $cudaMajor = $cudaParts[0] $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - conda config --set channel_priority strict + conda config --set channel_priority flexible # strict conda config --prepend channels nvidia conda config --append channels conda-forge #conda config --remove channels defaults From 9ccf9f5458e946db63f766693eb6971e212be505 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 06:38:21 +0700 Subject: [PATCH 110/221] try cudacxx --- .github/workflows/manual_wheel_cuda.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 81ccdefd83..74c1c68b76 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -131,6 +131,7 @@ jobs: } elseif ($env:RUNNER_OS -eq 'Windows') { ##$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' + $env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' #$env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH From 5e3ee03524aacc186f7612bead08fc6ccdfc7323 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 06:50:45 +0700 Subject: [PATCH 111/221] show channel list --- .github/workflows/manual_wheel_cuda.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 74c1c68b76..1257c1a672 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -110,6 +110,7 @@ jobs: conda config --prepend channels nvidia conda config --append channels conda-forge #conda config --remove channels defaults + conda config --show channels mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From 8164e61aebf746bb6cbc7a32baaa18a3154fb292 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 08:26:54 +0700 Subject: [PATCH 112/221] try with libstdcxx-ng --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 1257c1a672..c5f52972d8 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -111,7 +111,7 @@ jobs: conda config --append channels conda-forge #conda config --remove channels defaults conda config --show channels - mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" + mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" "libstdcxx-ng" #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From a646be0be7df4aaf75cc6936321c3447ec43dc1c Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 08:45:49 +0700 Subject: [PATCH 113/221] oops --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index c5f52972d8..617abdc203 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -111,7 +111,7 @@ jobs: conda config --append channels conda-forge #conda config --remove channels defaults conda config --show channels - mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" "libstdcxx-ng" + mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" "conda-forge::libstdcxx-ng" #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From 5b1403ee7aee3adffe8020f98faa82cad3c67a37 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 08:55:07 +0700 Subject: [PATCH 114/221] lets just remove cuda 12.4 --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 617abdc203..f60eb3e90c 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -22,7 +22,7 @@ jobs: $matrix = @{ 'os' = @('ubuntu-22.04','windows-2022') 'pyver' = @("3.9", "3.10", "3.11", "3.12") # ,"3.13", "3.14" - 'cuda' = @("12.4.1", "12.5.1", "12.6.3", "12.8.1", "13.0.2", "13.1.0") # "12.1.1", "12.2.2", "12.3.2", "12.9.1", + 'cuda' = @("12.5.1", "12.6.3", "12.8.1", "13.0.2", "13.1.0") # "12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.9.1", 'releasetag' = @("basic") } @@ -103,7 +103,7 @@ jobs: $cudaVersion = $env:CUDAVER #$cudaMajor = $cudaVersion.Split('.')[0] $cudaParts = $cudaVersion -split '\.' - if ("$($cudaParts[0]).$($cudaParts[1])" -eq "12.4") {$cudaParts[1] = '5'} + #if ("$($cudaParts[0]).$($cudaParts[1])" -eq "12.4") {$cudaParts[1] = '5'} $cudaMajor = $cudaParts[0] $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" conda config --set channel_priority flexible # strict From fc31240f8c8853a2a75c296ece78b0f6764dced6 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 08:55:35 +0700 Subject: [PATCH 115/221] oops --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index f60eb3e90c..0d17807bd3 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -111,7 +111,7 @@ jobs: conda config --append channels conda-forge #conda config --remove channels defaults conda config --show channels - mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" "conda-forge::libstdcxx-ng" + mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" # "conda-forge::libstdcxx-ng" #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From 9ac1dbf238b73b7212af40b368ac9e35977ab050 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 10:41:21 +0700 Subject: [PATCH 116/221] try with strict again --- .github/workflows/manual_wheel_cuda.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 0d17807bd3..de9367f0a4 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -106,7 +106,7 @@ jobs: #if ("$($cudaParts[0]).$($cudaParts[1])" -eq "12.4") {$cudaParts[1] = '5'} $cudaMajor = $cudaParts[0] $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - conda config --set channel_priority flexible # strict + conda config --set channel_priority strict conda config --prepend channels nvidia conda config --append channels conda-forge #conda config --remove channels defaults @@ -129,6 +129,7 @@ jobs: if ($IsLinux) { $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/lib:' + $env:LD_LIBRARY_PATH $env:CPATH = $env:CONDA_PREFIX + '/include:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/include:' + $env:CPATH + Get-ChildItem -Path ~ -Filter "nvcc" -Recurse -ErrorAction SilentlyContinue } elseif ($env:RUNNER_OS -eq 'Windows') { ##$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' From 1151c41a1d5674ab662e895ac3b31afee54cc241 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 10:49:43 +0700 Subject: [PATCH 117/221] use nvidia channel --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index de9367f0a4..bf0c202d79 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -111,7 +111,7 @@ jobs: conda config --append channels conda-forge #conda config --remove channels defaults conda config --show channels - mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" # "conda-forge::libstdcxx-ng" + mamba install -y -c nvidia "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" # "conda-forge::libstdcxx-ng" #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From e86531d204654375e81bac4009a30f32ff48a32f Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 11:12:10 +0700 Subject: [PATCH 118/221] try without conda-forge channel --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index bf0c202d79..85ab3367e1 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -108,10 +108,10 @@ jobs: $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" conda config --set channel_priority strict conda config --prepend channels nvidia - conda config --append channels conda-forge + #conda config --append channels conda-forge #conda config --remove channels defaults conda config --show channels - mamba install -y -c nvidia "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" # "conda-forge::libstdcxx-ng" + mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" # "conda-forge::libstdcxx-ng" #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From 9f7ec45321bd472791cf7521602bc3449c980090 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 12:49:16 +0700 Subject: [PATCH 119/221] remove conda-forge channel --- .github/workflows/manual_wheel_cuda.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 85ab3367e1..e8c2471cee 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -108,6 +108,7 @@ jobs: $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" conda config --set channel_priority strict conda config --prepend channels nvidia + conda config --remove channels conda-forge #conda config --append channels conda-forge #conda config --remove channels defaults conda config --show channels @@ -133,7 +134,7 @@ jobs: } elseif ($env:RUNNER_OS -eq 'Windows') { ##$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' - $env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' + #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' #$env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH From b44dd48121e2a14acc1469d502c2f212fcb05660 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 15:36:14 +0700 Subject: [PATCH 120/221] try explicitly use nvidia channel --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index e8c2471cee..38034271cc 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -112,7 +112,7 @@ jobs: #conda config --append channels conda-forge #conda config --remove channels defaults conda config --show channels - mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit==$cudaVersion" "cuda-nvcc" "cuda-cudart-dev" "gcc==13.*" # "conda-forge::libstdcxx-ng" + mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "gcc==13.*" # "conda-forge::libstdcxx-ng" #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From 43571224900fc03ac7bcd0be41a4b833653cd8d4 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 15:44:08 +0700 Subject: [PATCH 121/221] lets use flexible priority --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 38034271cc..b056040c5c 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -106,13 +106,13 @@ jobs: #if ("$($cudaParts[0]).$($cudaParts[1])" -eq "12.4") {$cudaParts[1] = '5'} $cudaMajor = $cudaParts[0] $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - conda config --set channel_priority strict + conda config --set channel_priority flexible # strict conda config --prepend channels nvidia conda config --remove channels conda-forge #conda config --append channels conda-forge #conda config --remove channels defaults conda config --show channels - mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "gcc==13.*" # "conda-forge::libstdcxx-ng" + mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "gcc==13.*" # "conda-forge::libstdcxx-ng" #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel From ae2ddc0d5daf8eab7ee45141a64ad2f89a148052 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 15:59:34 +0700 Subject: [PATCH 122/221] Test 1 --- .github/workflows/manual_wheel_cuda.yml | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index b056040c5c..df5a8f5413 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -108,12 +108,12 @@ jobs: $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" conda config --set channel_priority flexible # strict conda config --prepend channels nvidia - conda config --remove channels conda-forge - #conda config --append channels conda-forge + #conda config --remove channels conda-forge + conda config --append channels conda-forge #conda config --remove channels defaults conda config --show channels - mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "gcc==13.*" # "conda-forge::libstdcxx-ng" - #mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" + #mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "conda-forge::gcc==13.*" # "conda-forge::libstdcxx-ng" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel - name: Build Wheel From 4ae838feb895159dd5fde9ef6f92d095a319a1b7 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 16:10:18 +0700 Subject: [PATCH 123/221] update Path --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index df5a8f5413..a01b3bf33d 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -140,7 +140,7 @@ jobs: #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH #$env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE #$env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' - #$env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin;" + $env:Path + $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin;" + $env:Path #echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append #echo "$env:CONDA_PREFIX\\nvvm\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue From 84b1fa541d179c12ef9d9671443d0f9d679e7920 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 16:27:07 +0700 Subject: [PATCH 124/221] use symlink to nvcc --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index a01b3bf33d..70c90bb032 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -147,8 +147,8 @@ jobs: nvcc.exe --version Get-ChildItem -Path ~ -Filter "cicc.exe" -Recurse -ErrorAction SilentlyContinue if (-not (Test-Path -Path "$env:CONDA_PREFIX\\bin\\nvcc.exe")) { - #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\bin" -Force - #New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin\\nvcc.exe" -Target "$env:CONDA_PREFIX\\Library\\bin\\nvcc.exe" # -Force + New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\bin" -Force + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin\\nvcc.exe" -Target "$env:CONDA_PREFIX\\Library\\bin\\nvcc.exe" # -Force } #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } From 4d5577d41cba95f5d0e5e7c9f4b05940ede323b2 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 17:27:59 +0700 Subject: [PATCH 125/221] Update include path --- .github/workflows/manual_wheel_cuda.yml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 70c90bb032..3eccac970a 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -135,9 +135,9 @@ jobs: elseif ($env:RUNNER_OS -eq 'Windows') { ##$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' - #$env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath - #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH - #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH + $env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath + $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH + $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH #$env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE #$env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin;" + $env:Path From 7a5597cdbc54009a2deee0a69cce29d2f87a661f Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 17:44:53 +0700 Subject: [PATCH 126/221] update include --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 3eccac970a..52d22ae445 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -138,7 +138,7 @@ jobs: $env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH - #$env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE + $env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE #$env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin;" + $env:Path #echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append From 3d35ea69ea76b9711c025792c16ab620722df8a8 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 18:07:10 +0700 Subject: [PATCH 127/221] update CL env --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 52d22ae445..825061494e 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -139,7 +139,7 @@ jobs: $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH $env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE - #$env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' + $env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin;" + $env:Path #echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append #echo "$env:CONDA_PREFIX\\nvvm\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append From bb97abba66a1f299939b98783282ce4e3a11893f Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 21:27:20 +0700 Subject: [PATCH 128/221] updated root --- .github/workflows/manual_wheel_cuda.yml | 14 ++++++++------ 1 file changed, 8 insertions(+), 6 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 825061494e..c7fa92418f 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -133,13 +133,15 @@ jobs: Get-ChildItem -Path ~ -Filter "nvcc" -Recurse -ErrorAction SilentlyContinue } elseif ($env:RUNNER_OS -eq 'Windows') { - ##$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' + $env:CUDA_TOOLKIT_ROOT_DIR += "\\Library" + $env:CUDAToolkit_ROOT += "\\Library" + #$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' - $env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath - $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH - $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH - $env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE - $env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' + #$env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath + #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH + #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH + #$env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE + #$env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin;" + $env:Path #echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append #echo "$env:CONDA_PREFIX\\nvvm\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append From 7e241b57818bb6ddf40d8d8b24af08a658bf6771 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 12 Feb 2026 21:56:34 +0700 Subject: [PATCH 129/221] Test 2 --- .github/workflows/manual_wheel_cuda.yml | 15 ++++++++------- 1 file changed, 8 insertions(+), 7 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index c7fa92418f..243ffb3f00 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -135,16 +135,17 @@ jobs: elseif ($env:RUNNER_OS -eq 'Windows') { $env:CUDA_TOOLKIT_ROOT_DIR += "\\Library" $env:CUDAToolkit_ROOT += "\\Library" - #$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' + $env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' + $env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' - #$env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath - #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH - #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH - #$env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE + $env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath + $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH + $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH + $env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE #$env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' - $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin;" + $env:Path + $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin; $env:CONDA_PREFIX\\Library\\nvvm\\bin;" + $env:Path #echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append - #echo "$env:CONDA_PREFIX\\nvvm\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append + #echo "$env:CONDA_PREFIX\\Library\\nvvm\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue nvcc.exe --version Get-ChildItem -Path ~ -Filter "cicc.exe" -Recurse -ErrorAction SilentlyContinue From 1ccf7ef2c7b97d8b6158c788a461a52d9954b230 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Fri, 13 Feb 2026 04:04:28 +0700 Subject: [PATCH 130/221] create symlink to cicc.exe --- .github/workflows/manual_wheel_cuda.yml | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 243ffb3f00..fac2b7cfec 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -153,6 +153,10 @@ jobs: New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\bin" -Force New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin\\nvcc.exe" -Target "$env:CONDA_PREFIX\\Library\\bin\\nvcc.exe" # -Force } + if (-not (Test-Path -Path "$env:CONDA_PREFIX\\nvvm\\bin\\cicc.exe")) { + New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\nvvm\\bin" -Force + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\nvvm\\bin\\cicc.exe" -Target "$env:CONDA_PREFIX\\Library\\nvvm\\bin\\cicc.exe" # -Force + } #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue From 02e8c854451e27b6fac35e346268a02443891601 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Fri, 13 Feb 2026 04:18:25 +0700 Subject: [PATCH 131/221] try with cuda-nvvm --- .github/workflows/manual_wheel_cuda.yml | 12 ++++-------- 1 file changed, 4 insertions(+), 8 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index fac2b7cfec..511d7dd4c1 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -113,7 +113,7 @@ jobs: #conda config --remove channels defaults conda config --show channels #mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "conda-forge::gcc==13.*" # "conda-forge::libstdcxx-ng" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-nvvm" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" python -m pip install build wheel - name: Build Wheel @@ -149,13 +149,9 @@ jobs: Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue nvcc.exe --version Get-ChildItem -Path ~ -Filter "cicc.exe" -Recurse -ErrorAction SilentlyContinue - if (-not (Test-Path -Path "$env:CONDA_PREFIX\\bin\\nvcc.exe")) { - New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\bin" -Force - New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin\\nvcc.exe" -Target "$env:CONDA_PREFIX\\Library\\bin\\nvcc.exe" # -Force - } - if (-not (Test-Path -Path "$env:CONDA_PREFIX\\nvvm\\bin\\cicc.exe")) { - New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\nvvm\\bin" -Force - New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\nvvm\\bin\\cicc.exe" -Target "$env:CONDA_PREFIX\\Library\\nvvm\\bin\\cicc.exe" # -Force + if (-not (Test-Path -Path "$env:CONDA_PREFIX\\bin")) { + #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\bin" -Force + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin" -Target "$env:CONDA_PREFIX\\Library\\bin" # -Force } #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } From 0519dcf9e97451f2cda528d6bc62db1d94e0e342 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Fri, 13 Feb 2026 06:32:18 +0700 Subject: [PATCH 132/221] Test 1 --- .github/workflows/manual_wheel_cuda.yml | 12 ++++++++---- 1 file changed, 8 insertions(+), 4 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 511d7dd4c1..b0cd0c7930 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -113,11 +113,12 @@ jobs: #conda config --remove channels defaults conda config --show channels #mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "conda-forge::gcc==13.*" # "conda-forge::libstdcxx-ng" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvcc" "nvidia::cuda-nvvm" "nvidia::cuda-version==$cudaMajorMinor.*" "conda-forge::gcc==13.*" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvvm" "nvidia::cuda-nvcc" "conda-forge::gcc==13.*" python -m pip install build wheel - name: Build Wheel run: | + $cpuArch = $env:PROCESSOR_ARCHITECTURE $cudaVersion = $env:CUDAVER.Remove($env:CUDAVER.LastIndexOf('.')).Replace('.','') #if ($env:RUNNER_OS -eq 'Windows') { # $env:CONDA_PREFIX = $env:CONDA_PREFIX + '\Library' @@ -128,15 +129,18 @@ jobs: $env:CUDAToolkit_ROOT = $env:CONDA_PREFIX echo "CONDA_PREFIX = $env:CONDA_PREFIX" if ($IsLinux) { - $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/lib:' + $env:LD_LIBRARY_PATH - $env:CPATH = $env:CONDA_PREFIX + '/include:' + $env:CONDA_PREFIX + '/targets/x86_64-linux/include:' + $env:CPATH + if ($cpuArch -eq 'AMD64') { $cpuArch = 'x86_64' } + $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:CONDA_PREFIX + "/targets/$cpuArch-linux/lib:" + $env:LD_LIBRARY_PATH + $env:CPATH = $env:CONDA_PREFIX + '/include:' + $env:CONDA_PREFIX + "/targets/$cpuArch-linux/include:" + $env:CPATH Get-ChildItem -Path ~ -Filter "nvcc" -Recurse -ErrorAction SilentlyContinue + Get-ChildItem -Path ~ -Filter "cicc" -Recurse -ErrorAction SilentlyContinue } - elseif ($env:RUNNER_OS -eq 'Windows') { + elseif ($IsWindows) { $env:CUDA_TOOLKIT_ROOT_DIR += "\\Library" $env:CUDAToolkit_ROOT += "\\Library" $env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' $env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' + $env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' $env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH From d05897bdd1d0fdc85dc9b2c9e718feeace17af8d Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Fri, 13 Feb 2026 06:48:17 +0700 Subject: [PATCH 133/221] Test 2 --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index b0cd0c7930..2bcaab85f0 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -156,7 +156,7 @@ jobs: if (-not (Test-Path -Path "$env:CONDA_PREFIX\\bin")) { #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\bin" -Force New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin" -Target "$env:CONDA_PREFIX\\Library\\bin" # -Force - } + } else { echo "Warning: bin directory already existed! Not creating symlink."} #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue From 617c71ad4976dae87dc9c2e9de3b953cde3939d8 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Fri, 13 Feb 2026 10:34:59 +0700 Subject: [PATCH 134/221] create symlink to nvvm directory --- .github/workflows/manual_wheel_cuda.yml | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 2bcaab85f0..94d5464b6b 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -157,6 +157,10 @@ jobs: #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\bin" -Force New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin" -Target "$env:CONDA_PREFIX\\Library\\bin" # -Force } else { echo "Warning: bin directory already existed! Not creating symlink."} + if (-not (Test-Path -Path "$env:CONDA_PREFIX\\nvvm")) { + #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\nvvm" -Force + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\nvvm" -Target "$env:CONDA_PREFIX\\Library\\nvvm" # -Force + } else { echo "Warning: nvvm directory already existed! Not creating symlink."} #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue From d88a1220066938ee2e28738a5a794f0cea31a431 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Fri, 13 Feb 2026 10:52:39 +0700 Subject: [PATCH 135/221] create symlink to lib directory --- .github/workflows/manual_wheel_cuda.yml | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 94d5464b6b..0b5ec39bf0 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -142,6 +142,7 @@ jobs: $env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' $env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' + $env:LIB = $env:CONDA_PREFIX + '\lib;' + $env:CONDA_PREFIX + '\Library\lib;' + $env:LIB $env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH @@ -161,6 +162,10 @@ jobs: #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\nvvm" -Force New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\nvvm" -Target "$env:CONDA_PREFIX\\Library\\nvvm" # -Force } else { echo "Warning: nvvm directory already existed! Not creating symlink."} + if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib")) { + #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\lib" -Force + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force + } else { echo "Warning: lib directory already existed! Not creating symlink."} #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue From 7d13ac7bccadcb2b193c5ed046cd928518523f1a Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Fri, 13 Feb 2026 11:06:08 +0700 Subject: [PATCH 136/221] find cudart_static.lib --- .github/workflows/manual_wheel_cuda.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 0b5ec39bf0..431e2efb06 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -154,6 +154,7 @@ jobs: Get-ChildItem -Path ~ -Filter "nvcc.exe" -Recurse -ErrorAction SilentlyContinue nvcc.exe --version Get-ChildItem -Path ~ -Filter "cicc.exe" -Recurse -ErrorAction SilentlyContinue + Get-ChildItem -Path ~ -Filter "cudart_static.lib" -Recurse -ErrorAction SilentlyContinue if (-not (Test-Path -Path "$env:CONDA_PREFIX\\bin")) { #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\bin" -Force New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin" -Target "$env:CONDA_PREFIX\\Library\\bin" # -Force From 2085481fc3d7cf586c0b1e0d9745f6a3b6e29d62 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Fri, 13 Feb 2026 13:40:37 +0700 Subject: [PATCH 137/221] try with LIBPATH --- .github/workflows/manual_wheel_cuda.yml | 13 +++++++------ 1 file changed, 7 insertions(+), 6 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 431e2efb06..9c2163ffac 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -142,12 +142,13 @@ jobs: $env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' $env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' - $env:LIB = $env:CONDA_PREFIX + '\lib;' + $env:CONDA_PREFIX + '\Library\lib;' + $env:LIB - $env:IncludePath = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:IncludePath - $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:C_INCLUDE_PATH - $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:CPLUS_INCLUDE_PATH - $env:INCLUDE = $env:CONDA_PREFIX + '\include;' + $env:CONDA_PREFIX + '\Library\include;' + $env:INCLUDE - #$env:CL='/I\' + $env:CONDA_PREFIX + '\Library\include' + $env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:LIB + $env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:LIBPATH + $env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath + $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH + $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH + $env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE + #$env:CL='/I\' + $env:CONDA_PREFIX + '\\Library\\include' $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin; $env:CONDA_PREFIX\\Library\\nvvm\\bin;" + $env:Path #echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append #echo "$env:CONDA_PREFIX\\Library\\nvvm\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append From 19f8cb2349bae4c582b1fb88c6af06beb7984d4c Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Fri, 13 Feb 2026 13:51:09 +0700 Subject: [PATCH 138/221] create symlink to lib64 --- .github/workflows/manual_wheel_cuda.yml | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 9c2163ffac..e7df5b6d0e 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -168,6 +168,10 @@ jobs: #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\lib" -Force New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force } else { echo "Warning: lib directory already existed! Not creating symlink."} + if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib64")) { + #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\lib64" -Force + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib64" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force + } else { echo "Warning: lib64 directory already existed! Not creating symlink."} #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue From 5733e9993987714154c051992c75c8a940100d47 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Fri, 13 Feb 2026 14:09:24 +0700 Subject: [PATCH 139/221] create symlink to include directory --- .github/workflows/manual_wheel_cuda.yml | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index e7df5b6d0e..914e8c5c79 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -172,6 +172,10 @@ jobs: #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\lib64" -Force New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib64" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force } else { echo "Warning: lib64 directory already existed! Not creating symlink."} + if (-not (Test-Path -Path "$env:CONDA_PREFIX\\include")) { + #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\include" -Force + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\include" -Target "$env:CONDA_PREFIX\\Library\\include" # -Force + } else { echo "Warning: include directory already existed! Not creating symlink."} #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue From 540876938376e619cbd90b4b2c822c34b45f8e28 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Fri, 13 Feb 2026 14:29:46 +0700 Subject: [PATCH 140/221] try cuda-cccl --- .github/workflows/manual_wheel_cuda.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 914e8c5c79..63aaef8bc0 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -113,7 +113,7 @@ jobs: #conda config --remove channels defaults conda config --show channels #mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "conda-forge::gcc==13.*" # "conda-forge::libstdcxx-ng" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-nvvm" "nvidia::cuda-nvcc" "conda-forge::gcc==13.*" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-cccl" "nvidia::cuda-nvvm" "nvidia::cuda-nvcc" "conda-forge::gcc==13.*" python -m pip install build wheel - name: Build Wheel @@ -127,6 +127,7 @@ jobs: $env:CUDA_HOME = $env:CONDA_PREFIX $env:CUDA_TOOLKIT_ROOT_DIR = $env:CONDA_PREFIX $env:CUDAToolkit_ROOT = $env:CONDA_PREFIX + $env:CUDATOOLKITDIR = $env:CONDA_PREFIX echo "CONDA_PREFIX = $env:CONDA_PREFIX" if ($IsLinux) { if ($cpuArch -eq 'AMD64') { $cpuArch = 'x86_64' } From a7a34a7be51596fb4607edc2fe11742e6bdd95e7 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sat, 14 Feb 2026 03:03:51 +0700 Subject: [PATCH 141/221] try with strict priority --- .github/workflows/manual_wheel_cuda.yml | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 63aaef8bc0..956ad782b9 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -106,14 +106,13 @@ jobs: #if ("$($cudaParts[0]).$($cudaParts[1])" -eq "12.4") {$cudaParts[1] = '5'} $cudaMajor = $cudaParts[0] $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - conda config --set channel_priority flexible # strict + conda config --set channel_priority strict # flexible conda config --prepend channels nvidia - #conda config --remove channels conda-forge conda config --append channels conda-forge #conda config --remove channels defaults conda config --show channels #mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "conda-forge::gcc==13.*" # "conda-forge::libstdcxx-ng" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit==$cudaVersion" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-cccl" "nvidia::cuda-nvvm" "nvidia::cuda-nvcc" "conda-forge::gcc==13.*" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-cccl" "nvidia::cuda-nvvm" "nvidia::cuda-nvcc" "conda-forge::gcc==13.*" python -m pip install build wheel - name: Build Wheel From e023174269922ab00a2df69008ac6b48c80d62ea Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sat, 14 Feb 2026 03:08:20 +0700 Subject: [PATCH 142/221] excluding cu124 index --- .github/workflows/generate-index-from-release.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/generate-index-from-release.yaml b/.github/workflows/generate-index-from-release.yaml index 86fb41c57c..f68cf0b1a9 100644 --- a/.github/workflows/generate-index-from-release.yaml +++ b/.github/workflows/generate-index-from-release.yaml @@ -45,7 +45,7 @@ jobs: #./scripts/releases-to-pep-503.sh index/whl/cu121 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu121$' #./scripts/releases-to-pep-503.sh index/whl/cu122 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu122$' #./scripts/releases-to-pep-503.sh index/whl/cu123 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu123$' - ./scripts/releases-to-pep-503.sh index/whl/cu124 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu124$' + #./scripts/releases-to-pep-503.sh index/whl/cu124 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu124$' ./scripts/releases-to-pep-503.sh index/whl/cu125 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu125$' ./scripts/releases-to-pep-503.sh index/whl/cu126 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu126$' ./scripts/releases-to-pep-503.sh index/whl/cu128 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu128$' From 2cd916fb4caa78cd95f807878f41d498a45bb47a Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sat, 14 Feb 2026 03:12:19 +0700 Subject: [PATCH 143/221] try with flexible again but without version --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 956ad782b9..cb37760126 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -106,13 +106,13 @@ jobs: #if ("$($cudaParts[0]).$($cudaParts[1])" -eq "12.4") {$cudaParts[1] = '5'} $cudaMajor = $cudaParts[0] $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - conda config --set channel_priority strict # flexible + conda config --set channel_priority flexible # strict conda config --prepend channels nvidia conda config --append channels conda-forge #conda config --remove channels defaults conda config --show channels #mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "conda-forge::gcc==13.*" # "conda-forge::libstdcxx-ng" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-cccl" "nvidia::cuda-nvvm" "nvidia::cuda-nvcc" "conda-forge::gcc==13.*" + mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-version" "nvidia::cuda-toolkit" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-cccl" "nvidia::cuda-nvvm" "nvidia::cuda-nvcc" "conda-forge::gcc==13.*" python -m pip install build wheel - name: Build Wheel From b0ec4e9430a887025a853ce1c7a85024397b42b4 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sat, 14 Feb 2026 03:39:00 +0700 Subject: [PATCH 144/221] use version but without explicit nvidia --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index cb37760126..b2d769dc9d 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -112,7 +112,7 @@ jobs: #conda config --remove channels defaults conda config --show channels #mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "conda-forge::gcc==13.*" # "conda-forge::libstdcxx-ng" - mamba install -y -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-version" "nvidia::cuda-toolkit" "nvidia::cuda-libraries-dev" "nvidia::cuda-cudart-dev" "nvidia::cuda-cccl" "nvidia::cuda-nvvm" "nvidia::cuda-nvcc" "conda-forge::gcc==13.*" + mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit" "cuda-libraries-dev" "cuda-cudart-dev" "cuda-cccl" "cuda-nvvm" "cuda-nvcc" "conda-forge::gcc==13.*" # -c "nvidia/label/cuda-$cudaVersion" python -m pip install build wheel - name: Build Wheel From 04693e272ca91abe9bc671cf08d41640273f35bf Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sat, 14 Feb 2026 05:50:26 +0700 Subject: [PATCH 145/221] update LIBPATH to lib\x64 --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index b2d769dc9d..e7065260b4 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -142,8 +142,8 @@ jobs: $env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' $env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' - $env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:LIB - $env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:LIBPATH + $env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB + $env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH $env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH From 7c05b626e797aa6556818efb1b48219ab4399c96 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sat, 14 Feb 2026 06:06:40 +0700 Subject: [PATCH 146/221] create x64 symlink if lib directory already exist --- .github/workflows/manual_wheel_cuda.yml | 8 +++++++- 1 file changed, 7 insertions(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index e7065260b4..0580ad036b 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -167,7 +167,13 @@ jobs: if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib")) { #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\lib" -Force New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force - } else { echo "Warning: lib directory already existed! Not creating symlink."} + } else { + echo "Warning: lib directory already existed! Not creating symlink." + if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib\\x64")) { + #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\lib\\x64" -Force + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\x64" -Target "$env:CONDA_PREFIX\\Library\\lib\\x64" # -Force + } else { echo "Warning: lib\x64 directory already existed! Not creating symlink."} + } if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib64")) { #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\lib64" -Force New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib64" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force From 479955e24515b0aa4c8cfe5bf8351909563e93f9 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sat, 14 Feb 2026 07:52:38 +0700 Subject: [PATCH 147/221] oops --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 0580ad036b..a4a30b959b 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -171,7 +171,7 @@ jobs: echo "Warning: lib directory already existed! Not creating symlink." if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib\\x64")) { #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\lib\\x64" -Force - New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\x64" -Target "$env:CONDA_PREFIX\\Library\\lib\\x64" # -Force + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\x64" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force } else { echo "Warning: lib\x64 directory already existed! Not creating symlink."} } if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib64")) { From 790940d5b2314e2acea0147bdb96b4b0ef4097dd Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sat, 14 Feb 2026 16:47:32 +0700 Subject: [PATCH 148/221] add more symlink conditions --- .github/workflows/manual_wheel_cuda.yml | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index a4a30b959b..67a84bb5d2 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -170,8 +170,11 @@ jobs: } else { echo "Warning: lib directory already existed! Not creating symlink." if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib\\x64")) { - #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\lib\\x64" -Force - New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\x64" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force + if (-not (Test-Path -Path "$env:CONDA_PREFIX\\Library\\lib\x64")) { + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\x64" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force + } else { + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\x64" -Target "$env:CONDA_PREFIX\\Library\\lib\\x64" # -Force + } } else { echo "Warning: lib\x64 directory already existed! Not creating symlink."} } if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib64")) { From 708b48dad48f01a96da21358f62feadfb63c49a4 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 15 Feb 2026 11:51:53 +0700 Subject: [PATCH 149/221] use linker flags on cmake --- .github/workflows/manual_wheel_cuda.yml | 12 ++++-------- 1 file changed, 4 insertions(+), 8 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 67a84bb5d2..7b9eb88a85 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -157,15 +157,12 @@ jobs: Get-ChildItem -Path ~ -Filter "cicc.exe" -Recurse -ErrorAction SilentlyContinue Get-ChildItem -Path ~ -Filter "cudart_static.lib" -Recurse -ErrorAction SilentlyContinue if (-not (Test-Path -Path "$env:CONDA_PREFIX\\bin")) { - #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\bin" -Force New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin" -Target "$env:CONDA_PREFIX\\Library\\bin" # -Force } else { echo "Warning: bin directory already existed! Not creating symlink."} if (-not (Test-Path -Path "$env:CONDA_PREFIX\\nvvm")) { - #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\nvvm" -Force New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\nvvm" -Target "$env:CONDA_PREFIX\\Library\\nvvm" # -Force } else { echo "Warning: nvvm directory already existed! Not creating symlink."} if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib")) { - #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\lib" -Force New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force } else { echo "Warning: lib directory already existed! Not creating symlink." @@ -178,11 +175,9 @@ jobs: } else { echo "Warning: lib\x64 directory already existed! Not creating symlink."} } if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib64")) { - #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\lib64" -Force New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib64" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force } else { echo "Warning: lib64 directory already existed! Not creating symlink."} if (-not (Test-Path -Path "$env:CONDA_PREFIX\\include")) { - #New-Item -ItemType Directory -Path "$env:CONDA_PREFIX\\include" -Force New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\include" -Target "$env:CONDA_PREFIX\\Library\\include" # -Force } else { echo "Warning: include directory already existed! Not creating symlink."} #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue @@ -195,9 +190,10 @@ jobs: #$env:CMAKE_BUILD_PARALLEL_LEVEL=4 $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" - #if ($env:RUNNER_OS -eq 'Windows') { - # $env:CMAKE_ARGS = "-DCMAKE_CUDA_COMPILER='$env:CONDA_PREFIX\\Library\\bin' $env:CMAKE_ARGS" - #} + if ($env:RUNNER_OS -eq 'Windows') { + #$env:CMAKE_ARGS = "-DCMAKE_CUDA_COMPILER='$env:CONDA_PREFIX\\Library\\bin' $env:CMAKE_ARGS" + $env:CMAKE_ARGS = "-DCMAKE_LINKER_FLAGS='/LIBPATH:$env:CONDA_PREFIX\\Library\\lib' $env:CMAKE_ARGS" + } #$env:CMAKE_ARGS = "-DCMAKE_CUDA_FLAGS='-allow-unsupported-compiler' $env:CMAKE_ARGS" # if ($env:AVXVER -eq 'AVX') { $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off' From 1c533b2c0c9936d8b95faf64f086f85b9dd589b8 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 15 Feb 2026 12:23:42 +0700 Subject: [PATCH 150/221] symlink lib\x64 to Library\lib --- .github/workflows/manual_wheel_cuda.yml | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 7b9eb88a85..15a982f0d0 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -167,11 +167,11 @@ jobs: } else { echo "Warning: lib directory already existed! Not creating symlink." if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib\\x64")) { - if (-not (Test-Path -Path "$env:CONDA_PREFIX\\Library\\lib\x64")) { + #if (-not (Test-Path -Path "$env:CONDA_PREFIX\\Library\\lib\\x64")) { New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\x64" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force - } else { - New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\x64" -Target "$env:CONDA_PREFIX\\Library\\lib\\x64" # -Force - } + #} else { + #New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\x64" -Target "$env:CONDA_PREFIX\\Library\\lib\\x64" # -Force + #} } else { echo "Warning: lib\x64 directory already existed! Not creating symlink."} } if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib64")) { From caf2fa5125af17882e01ccebc7cfd2feb357342f Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 15 Feb 2026 16:00:11 +0700 Subject: [PATCH 151/221] update symlink condition for cuda 13+ --- .github/workflows/manual_wheel_cuda.yml | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 15a982f0d0..02d2c9092e 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -157,28 +157,28 @@ jobs: Get-ChildItem -Path ~ -Filter "cicc.exe" -Recurse -ErrorAction SilentlyContinue Get-ChildItem -Path ~ -Filter "cudart_static.lib" -Recurse -ErrorAction SilentlyContinue if (-not (Test-Path -Path "$env:CONDA_PREFIX\\bin")) { - New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin" -Target "$env:CONDA_PREFIX\\Library\\bin" # -Force + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin" -Target "$env:CONDA_PREFIX\\Library\\bin" } else { echo "Warning: bin directory already existed! Not creating symlink."} if (-not (Test-Path -Path "$env:CONDA_PREFIX\\nvvm")) { - New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\nvvm" -Target "$env:CONDA_PREFIX\\Library\\nvvm" # -Force + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\nvvm" -Target "$env:CONDA_PREFIX\\Library\\nvvm" } else { echo "Warning: nvvm directory already existed! Not creating symlink."} if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib")) { New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force } else { echo "Warning: lib directory already existed! Not creating symlink." if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib\\x64")) { - #if (-not (Test-Path -Path "$env:CONDA_PREFIX\\Library\\lib\\x64")) { - New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\x64" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force - #} else { - #New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\x64" -Target "$env:CONDA_PREFIX\\Library\\lib\\x64" # -Force - #} + if ([int]$cudaMajor -ge 13) { + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\x64" -Target "$env:CONDA_PREFIX\\Library\\lib\\x64" + } else { + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\x64" -Target "$env:CONDA_PREFIX\\Library\\lib" + } } else { echo "Warning: lib\x64 directory already existed! Not creating symlink."} } if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib64")) { New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib64" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force } else { echo "Warning: lib64 directory already existed! Not creating symlink."} if (-not (Test-Path -Path "$env:CONDA_PREFIX\\include")) { - New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\include" -Target "$env:CONDA_PREFIX\\Library\\include" # -Force + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\include" -Target "$env:CONDA_PREFIX\\Library\\include" } else { echo "Warning: include directory already existed! Not creating symlink."} #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } From 20eaa31398ee88e0cb16297a5f6015f484ff6d24 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 16 Feb 2026 02:21:39 +0700 Subject: [PATCH 152/221] oops $cudaMajor doesn't exist yet --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 02d2c9092e..73a2b684b0 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -101,7 +101,6 @@ jobs: MAMBA_NO_LOW_SPEED_LIMIT: "1" run: | $cudaVersion = $env:CUDAVER - #$cudaMajor = $cudaVersion.Split('.')[0] $cudaParts = $cudaVersion -split '\.' #if ("$($cudaParts[0]).$($cudaParts[1])" -eq "12.4") {$cudaParts[1] = '5'} $cudaMajor = $cudaParts[0] @@ -119,6 +118,7 @@ jobs: run: | $cpuArch = $env:PROCESSOR_ARCHITECTURE $cudaVersion = $env:CUDAVER.Remove($env:CUDAVER.LastIndexOf('.')).Replace('.','') + $cudaMajor = $cudaVersion.Split('.')[0] #if ($env:RUNNER_OS -eq 'Windows') { # $env:CONDA_PREFIX = $env:CONDA_PREFIX + '\Library' #} From 98b4efdd091436415f078ece26d09df1a2c92796 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 16 Feb 2026 02:31:54 +0700 Subject: [PATCH 153/221] oops --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 73a2b684b0..107b4b90e1 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -118,7 +118,7 @@ jobs: run: | $cpuArch = $env:PROCESSOR_ARCHITECTURE $cudaVersion = $env:CUDAVER.Remove($env:CUDAVER.LastIndexOf('.')).Replace('.','') - $cudaMajor = $cudaVersion.Split('.')[0] + $cudaMajor = $env:CUDAVER.Split('.')[0] #if ($env:RUNNER_OS -eq 'Windows') { # $env:CONDA_PREFIX = $env:CONDA_PREFIX + '\Library' #} From 444e631cfffb122cacaaac9bb1679a5a9523b641 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 16 Feb 2026 04:49:38 +0700 Subject: [PATCH 154/221] try with cuda-thrust --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 107b4b90e1..d21e616164 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -111,7 +111,7 @@ jobs: #conda config --remove channels defaults conda config --show channels #mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "conda-forge::gcc==13.*" # "conda-forge::libstdcxx-ng" - mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit" "cuda-libraries-dev" "cuda-cudart-dev" "cuda-cccl" "cuda-nvvm" "cuda-nvcc" "conda-forge::gcc==13.*" # -c "nvidia/label/cuda-$cudaVersion" + mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit" "cuda-libraries-dev" "cuda-thrust" "cuda-cudart-dev" "cuda-cccl" "cuda-nvvm" "cuda-nvcc" "conda-forge::gcc==13.*" # -c "nvidia/label/cuda-$cudaVersion" python -m pip install build wheel - name: Build Wheel From 0a9931bd71e894b8fcb58ef8d138f4c73c45338b Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 16 Feb 2026 05:16:29 +0700 Subject: [PATCH 155/221] try with cccl --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index d21e616164..399328f221 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -111,7 +111,7 @@ jobs: #conda config --remove channels defaults conda config --show channels #mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "conda-forge::gcc==13.*" # "conda-forge::libstdcxx-ng" - mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit" "cuda-libraries-dev" "cuda-thrust" "cuda-cudart-dev" "cuda-cccl" "cuda-nvvm" "cuda-nvcc" "conda-forge::gcc==13.*" # -c "nvidia/label/cuda-$cudaVersion" + mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit" "cuda-libraries-dev" "cuda-cudart-dev" "cuda-cccl" cccl "cuda-nvvm" "cuda-nvcc" "conda-forge::gcc==13.*" # -c "nvidia/label/cuda-$cudaVersion" "cuda-thrust" python -m pip install build wheel - name: Build Wheel From 0e5224e8f6dbc3c0ad6d70d4610ddd98256d4885 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 16 Feb 2026 05:29:35 +0700 Subject: [PATCH 156/221] prioritize conda-forge --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 399328f221..b0499a06cc 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -106,7 +106,7 @@ jobs: $cudaMajor = $cudaParts[0] $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" conda config --set channel_priority flexible # strict - conda config --prepend channels nvidia + #conda config --prepend channels nvidia conda config --append channels conda-forge #conda config --remove channels defaults conda config --show channels From 29fedd60cf17ddc3887853dcc8e7a444de798013 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 16 Feb 2026 11:48:09 +0700 Subject: [PATCH 157/221] try more dependencies --- .github/workflows/manual_wheel_cuda.yml | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index b0499a06cc..1e0ee8d4ee 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -111,7 +111,7 @@ jobs: #conda config --remove channels defaults conda config --show channels #mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "conda-forge::gcc==13.*" # "conda-forge::libstdcxx-ng" - mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit" "cuda-libraries-dev" "cuda-cudart-dev" "cuda-cccl" cccl "cuda-nvvm" "cuda-nvcc" "conda-forge::gcc==13.*" # -c "nvidia/label/cuda-$cudaVersion" "cuda-thrust" + mamba install -y "cuda-version==$cudaMajorMinor.*" cuda cuda-runtime "cuda-toolkit" "cuda-libraries-dev" "cuda-cudart-dev" "cuda-cccl" cccl "cuda-thrust" "cuda-nvvm" "cuda-nvcc" "conda-forge::gcc==13.*" # -c "nvidia/label/cuda-$cudaVersion" python -m pip install build wheel - name: Build Wheel @@ -141,7 +141,7 @@ jobs: $env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' $env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' $env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' - #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' + $env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' $env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB $env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH $env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath @@ -188,10 +188,11 @@ jobs: #$env:FORCE_CMAKE=1 #$env:MAX_JOBS=4 #$env:CMAKE_BUILD_PARALLEL_LEVEL=4 + $env:CMAKE_GENERATOR_TOOLSET = $env:CUDA_HOME $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" if ($env:RUNNER_OS -eq 'Windows') { - #$env:CMAKE_ARGS = "-DCMAKE_CUDA_COMPILER='$env:CONDA_PREFIX\\Library\\bin' $env:CMAKE_ARGS" + $env:CMAKE_ARGS = "-DCMAKE_CUDA_COMPILER='$env:CONDA_PREFIX\\Library\\bin' $env:CMAKE_ARGS" $env:CMAKE_ARGS = "-DCMAKE_LINKER_FLAGS='/LIBPATH:$env:CONDA_PREFIX\\Library\\lib' $env:CMAKE_ARGS" } #$env:CMAKE_ARGS = "-DCMAKE_CUDA_FLAGS='-allow-unsupported-compiler' $env:CMAKE_ARGS" From b645d368f22c044e5c74b0b6f91a30fd46c76a7e Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 16 Feb 2026 12:02:57 +0700 Subject: [PATCH 158/221] oops doesn't support toolset --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 1e0ee8d4ee..7527579423 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -188,7 +188,7 @@ jobs: #$env:FORCE_CMAKE=1 #$env:MAX_JOBS=4 #$env:CMAKE_BUILD_PARALLEL_LEVEL=4 - $env:CMAKE_GENERATOR_TOOLSET = $env:CUDA_HOME + #$env:CMAKE_GENERATOR_TOOLSET = $env:CUDA_HOME $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" if ($env:RUNNER_OS -eq 'Windows') { From 5ceb7382234a2b0f6a448346e95dee7b8b12fe77 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 16 Feb 2026 12:08:26 +0700 Subject: [PATCH 159/221] oops cuda-thrust doesn't available on conda-forge --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 7527579423..8e41263129 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -111,7 +111,7 @@ jobs: #conda config --remove channels defaults conda config --show channels #mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "conda-forge::gcc==13.*" # "conda-forge::libstdcxx-ng" - mamba install -y "cuda-version==$cudaMajorMinor.*" cuda cuda-runtime "cuda-toolkit" "cuda-libraries-dev" "cuda-cudart-dev" "cuda-cccl" cccl "cuda-thrust" "cuda-nvvm" "cuda-nvcc" "conda-forge::gcc==13.*" # -c "nvidia/label/cuda-$cudaVersion" + mamba install -y "cuda-version==$cudaMajorMinor.*" cuda cuda-runtime "cuda-toolkit" "cuda-libraries-dev" "cuda-cudart-dev" "cuda-cccl" cccl "nvidia::cuda-thrust" "cuda-nvvm" "cuda-nvcc" "conda-forge::gcc==13.*" # -c "nvidia/label/cuda-$cudaVersion" python -m pip install build wheel - name: Build Wheel From 6d2d99a0ab1795007f5736a99adb3061543ce730 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 16 Feb 2026 13:08:14 +0700 Subject: [PATCH 160/221] excluding cuda 13.1 --- .github/workflows/manual_wheel_cuda.yml | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 8e41263129..5b9c1c2f39 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -22,7 +22,7 @@ jobs: $matrix = @{ 'os' = @('ubuntu-22.04','windows-2022') 'pyver' = @("3.9", "3.10", "3.11", "3.12") # ,"3.13", "3.14" - 'cuda' = @("12.5.1", "12.6.3", "12.8.1", "13.0.2", "13.1.0") # "12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.9.1", + 'cuda' = @("12.5.1", "12.6.3", "12.8.1", "13.0.2") # "12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.9.1", "13.1.0" 'releasetag' = @("basic") } @@ -111,7 +111,7 @@ jobs: #conda config --remove channels defaults conda config --show channels #mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "conda-forge::gcc==13.*" # "conda-forge::libstdcxx-ng" - mamba install -y "cuda-version==$cudaMajorMinor.*" cuda cuda-runtime "cuda-toolkit" "cuda-libraries-dev" "cuda-cudart-dev" "cuda-cccl" cccl "nvidia::cuda-thrust" "cuda-nvvm" "cuda-nvcc" "conda-forge::gcc==13.*" # -c "nvidia/label/cuda-$cudaVersion" + mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit" "cuda-libraries-dev" "cuda-cudart-dev" "cuda-cccl" "cuda-nvvm" "cuda-nvcc" "conda-forge::gcc==13.*" # -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-thrust" python -m pip install build wheel - name: Build Wheel @@ -141,7 +141,7 @@ jobs: $env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' $env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' $env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' - $env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' + #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' $env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB $env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH $env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath @@ -183,7 +183,7 @@ jobs: #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue - $env:VERBOSE = '1' + #$env:VERBOSE = '1' #$env:NVCCFLAGS="-allow-unsupported-compiler" #$env:FORCE_CMAKE=1 #$env:MAX_JOBS=4 @@ -192,7 +192,7 @@ jobs: $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" if ($env:RUNNER_OS -eq 'Windows') { - $env:CMAKE_ARGS = "-DCMAKE_CUDA_COMPILER='$env:CONDA_PREFIX\\Library\\bin' $env:CMAKE_ARGS" + #$env:CMAKE_ARGS = "-DCMAKE_CUDA_COMPILER='$env:CONDA_PREFIX\\Library\\bin' $env:CMAKE_ARGS" $env:CMAKE_ARGS = "-DCMAKE_LINKER_FLAGS='/LIBPATH:$env:CONDA_PREFIX\\Library\\lib' $env:CMAKE_ARGS" } #$env:CMAKE_ARGS = "-DCMAKE_CUDA_FLAGS='-allow-unsupported-compiler' $env:CMAKE_ARGS" From c0dfb540fc583db37a4b35e52cc3a30d10705696 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 16 Feb 2026 23:32:43 +0700 Subject: [PATCH 161/221] Test 1 --- .github/workflows/manual_wheel_cuda.yml | 28 ++++++++++++------------- 1 file changed, 14 insertions(+), 14 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 5b9c1c2f39..a14b22db5d 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -105,13 +105,13 @@ jobs: #if ("$($cudaParts[0]).$($cudaParts[1])" -eq "12.4") {$cudaParts[1] = '5'} $cudaMajor = $cudaParts[0] $cudaMajorMinor = "$($cudaParts[0]).$($cudaParts[1])" - conda config --set channel_priority flexible # strict + #conda config --set channel_priority flexible # strict #conda config --prepend channels nvidia - conda config --append channels conda-forge + #conda config --append channels conda-forge #conda config --remove channels defaults conda config --show channels #mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "conda-forge::gcc==13.*" # "conda-forge::libstdcxx-ng" - mamba install -y "cuda-version==$cudaMajorMinor.*" "cuda-toolkit" "cuda-libraries-dev" "cuda-cudart-dev" "cuda-cccl" "cuda-nvvm" "cuda-nvcc" "conda-forge::gcc==13.*" # -c "nvidia/label/cuda-$cudaVersion" "nvidia::cuda-thrust" + mamba install -y -c conda-forge "cuda-version==$cudaMajorMinor.*" "cuda-toolkit" "cuda-cudart-dev" "cuda-cccl" "cuda-nvvm" "cuda-nvcc" "conda-forge::gcc==13.*" # -c "nvidia/label/cuda-$cudaVersion" "cuda-libraries-dev" "nvidia::cuda-thrust" python -m pip install build wheel - name: Build Wheel @@ -136,18 +136,18 @@ jobs: Get-ChildItem -Path ~ -Filter "cicc" -Recurse -ErrorAction SilentlyContinue } elseif ($IsWindows) { - $env:CUDA_TOOLKIT_ROOT_DIR += "\\Library" - $env:CUDAToolkit_ROOT += "\\Library" - $env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' - $env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' - $env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' + #$env:CUDA_TOOLKIT_ROOT_DIR += "\\Library" + #$env:CUDAToolkit_ROOT += "\\Library" + #$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' + #$env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' + #$env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' - $env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB - $env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH - $env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath - $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH - $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH - $env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE + #$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB + #$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH + #$env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath + #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH + #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH + #$env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE #$env:CL='/I\' + $env:CONDA_PREFIX + '\\Library\\include' $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin; $env:CONDA_PREFIX\\Library\\nvvm\\bin;" + $env:Path #echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append From decde2eb8d945d96d9d79b7ad52b84835a35f22f Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 17 Feb 2026 01:03:39 +0700 Subject: [PATCH 162/221] Test 2 --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index a14b22db5d..4bf3292fd4 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -144,7 +144,7 @@ jobs: #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' #$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB #$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH - #$env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath + $env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH #$env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE From a18f90eba57ec2735c5a75be7a1ee5e24a9a6565 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 17 Feb 2026 01:11:29 +0700 Subject: [PATCH 163/221] Test 3 --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 4bf3292fd4..1ac528f6dc 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -144,8 +144,8 @@ jobs: #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' #$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB #$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH - $env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath - #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH + #$env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath + $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH #$env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE #$env:CL='/I\' + $env:CONDA_PREFIX + '\\Library\\include' From 80a4ec83e33aa69e2ee02cdf651a9296ca824e60 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 17 Feb 2026 02:46:48 +0700 Subject: [PATCH 164/221] Test 4 --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 1ac528f6dc..f753c9b34d 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -146,8 +146,8 @@ jobs: #$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH #$env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH - #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH - #$env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE + $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH + $env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE #$env:CL='/I\' + $env:CONDA_PREFIX + '\\Library\\include' $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin; $env:CONDA_PREFIX\\Library\\nvvm\\bin;" + $env:Path #echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append From 1038e5d059628e251865d8a9ddbef596f17a9de7 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 17 Feb 2026 04:18:16 +0700 Subject: [PATCH 165/221] Test 6 --- .github/workflows/manual_wheel_cuda.yml | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index f753c9b34d..68371a0675 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -139,15 +139,15 @@ jobs: #$env:CUDA_TOOLKIT_ROOT_DIR += "\\Library" #$env:CUDAToolkit_ROOT += "\\Library" #$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' - #$env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' + $env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' #$env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' #$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB #$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH #$env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath - $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH - $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH - $env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE + #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH + #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH + #$env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE #$env:CL='/I\' + $env:CONDA_PREFIX + '\\Library\\include' $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin; $env:CONDA_PREFIX\\Library\\nvvm\\bin;" + $env:Path #echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append From f484816666be9e887bf0e658e668a018812f7160 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 17 Feb 2026 05:54:23 +0700 Subject: [PATCH 166/221] Test 7 --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 68371a0675..0b7522b245 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -146,8 +146,8 @@ jobs: #$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH #$env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH - #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH - #$env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE + $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH + $env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE #$env:CL='/I\' + $env:CONDA_PREFIX + '\\Library\\include' $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin; $env:CONDA_PREFIX\\Library\\nvvm\\bin;" + $env:Path #echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append From c7cb2a294ad234e27e462b2324133814a87a14ea Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 17 Feb 2026 06:27:45 +0700 Subject: [PATCH 167/221] Test 8 --- .github/workflows/manual_wheel_cuda.yml | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 0b7522b245..227a48d09f 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -136,18 +136,18 @@ jobs: Get-ChildItem -Path ~ -Filter "cicc" -Recurse -ErrorAction SilentlyContinue } elseif ($IsWindows) { - #$env:CUDA_TOOLKIT_ROOT_DIR += "\\Library" - #$env:CUDAToolkit_ROOT += "\\Library" + $env:CUDA_TOOLKIT_ROOT_DIR += "\\Library" + $env:CUDAToolkit_ROOT += "\\Library" #$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' - $env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' + #$env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' #$env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' #$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB #$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH #$env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH - $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH - $env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE + #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH + #$env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE #$env:CL='/I\' + $env:CONDA_PREFIX + '\\Library\\include' $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin; $env:CONDA_PREFIX\\Library\\nvvm\\bin;" + $env:Path #echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append From f8e21f0d45031cc793b5a67459d46ab19fc9dbf0 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 17 Feb 2026 06:38:21 +0700 Subject: [PATCH 168/221] Test 9 --- .github/workflows/manual_wheel_cuda.yml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 227a48d09f..b99344d088 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -138,9 +138,9 @@ jobs: elseif ($IsWindows) { $env:CUDA_TOOLKIT_ROOT_DIR += "\\Library" $env:CUDAToolkit_ROOT += "\\Library" - #$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' - #$env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' - #$env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' + $env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' + $env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' + $env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' #$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB #$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH From 0d8fbaa9e52bfef6a7158a58444829a5435f8cf6 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 17 Feb 2026 06:45:55 +0700 Subject: [PATCH 169/221] Test 10 --- .github/workflows/manual_wheel_cuda.yml | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index b99344d088..377b9f06f9 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -142,12 +142,12 @@ jobs: $env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' $env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' - #$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB - #$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH - #$env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath - #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH - #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH - #$env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE + $env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB + $env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH + $env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath + $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH + $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH + $env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE #$env:CL='/I\' + $env:CONDA_PREFIX + '\\Library\\include' $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin; $env:CONDA_PREFIX\\Library\\nvvm\\bin;" + $env:Path #echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append From 46b368a46c92b87b5024afe356ea80ca7634ffd7 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 17 Feb 2026 13:45:19 +0700 Subject: [PATCH 170/221] try the latest gcc --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 377b9f06f9..1cc8d16d2c 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -111,7 +111,7 @@ jobs: #conda config --remove channels defaults conda config --show channels #mamba install -y "nvidia::cuda-version==$cudaMajorMinor.*" "nvidia::cuda-toolkit" "nvidia::cuda-nvcc" "nvidia::cuda-cudart-dev" "conda-forge::gcc==13.*" # "conda-forge::libstdcxx-ng" - mamba install -y -c conda-forge "cuda-version==$cudaMajorMinor.*" "cuda-toolkit" "cuda-cudart-dev" "cuda-cccl" "cuda-nvvm" "cuda-nvcc" "conda-forge::gcc==13.*" # -c "nvidia/label/cuda-$cudaVersion" "cuda-libraries-dev" "nvidia::cuda-thrust" + mamba install -y -c conda-forge "cuda-version==$cudaMajorMinor.*" "cuda-toolkit" "cuda-cudart-dev" "cuda-cccl" "cuda-nvvm" "cuda-nvcc" # "conda-forge::gcc==13.*" # -c "nvidia/label/cuda-$cudaVersion" "cuda-libraries-dev" "nvidia::cuda-thrust" python -m pip install build wheel - name: Build Wheel From 718df85f867d431eb974a20b7ed881e678204451 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 18 Feb 2026 06:38:16 +0700 Subject: [PATCH 171/221] test 1 --- .github/workflows/manual_wheel_cuda.yml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 1cc8d16d2c..535c2e080f 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -140,10 +140,10 @@ jobs: $env:CUDAToolkit_ROOT += "\\Library" $env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' $env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' - $env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' + #$env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' - $env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB - $env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH + #$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB + #$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH $env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH From bcfa357296f4f7550a517ef0909877785aaccbfa Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 18 Feb 2026 18:01:13 +0700 Subject: [PATCH 172/221] test 2 --- .github/workflows/manual_wheel_cuda.yml | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 535c2e080f..803a5421ed 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -20,7 +20,7 @@ jobs: id: set-matrix run: | $matrix = @{ - 'os' = @('ubuntu-22.04','windows-2022') + 'os' = @('windows-2022') # 'ubuntu-22.04', 'pyver' = @("3.9", "3.10", "3.11", "3.12") # ,"3.13", "3.14" 'cuda' = @("12.5.1", "12.6.3", "12.8.1", "13.0.2") # "12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.9.1", "13.1.0" 'releasetag' = @("basic") @@ -138,17 +138,17 @@ jobs: elseif ($IsWindows) { $env:CUDA_TOOLKIT_ROOT_DIR += "\\Library" $env:CUDAToolkit_ROOT += "\\Library" - $env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' - $env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' - #$env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' - #$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' - #$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB - #$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH + #$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' + #$env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' + ##$env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' + ##$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' + ##$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB + ##$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH $env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH $env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE - #$env:CL='/I\' + $env:CONDA_PREFIX + '\\Library\\include' + ##$env:CL='/I\' + $env:CONDA_PREFIX + '\\Library\\include' $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin; $env:CONDA_PREFIX\\Library\\nvvm\\bin;" + $env:Path #echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append #echo "$env:CONDA_PREFIX\\Library\\nvvm\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append From 7b36c2b79f4cb689d2e3e2b734210ec839ec0533 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 19 Feb 2026 05:03:54 +0700 Subject: [PATCH 173/221] test 3 --- .github/workflows/manual_wheel_cuda.yml | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 803a5421ed..f4c4bc0a5a 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -138,15 +138,15 @@ jobs: elseif ($IsWindows) { $env:CUDA_TOOLKIT_ROOT_DIR += "\\Library" $env:CUDAToolkit_ROOT += "\\Library" - #$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' - #$env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' + ##$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' + ##$env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' ##$env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' ##$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' ##$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB ##$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH - $env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath - $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH - $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH + #$env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath + #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH + #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH $env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE ##$env:CL='/I\' + $env:CONDA_PREFIX + '\\Library\\include' $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin; $env:CONDA_PREFIX\\Library\\nvvm\\bin;" + $env:Path From e3235401cf058466d2e836691872251a37eabcf4 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 19 Feb 2026 06:09:56 +0700 Subject: [PATCH 174/221] test 4 --- .github/workflows/manual_wheel_cuda.yml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index f4c4bc0a5a..1ded49f833 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -145,9 +145,9 @@ jobs: ##$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB ##$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH #$env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath - #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH - #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH - $env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE + $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH + $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH + #$env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE ##$env:CL='/I\' + $env:CONDA_PREFIX + '\\Library\\include' $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin; $env:CONDA_PREFIX\\Library\\nvvm\\bin;" + $env:Path #echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append From a98eaabe7ddba4143e0b3ac1aa7dcb09fed16ec7 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 19 Feb 2026 06:17:41 +0700 Subject: [PATCH 175/221] test 5 --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 1ded49f833..d2b1ce6534 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -144,7 +144,7 @@ jobs: ##$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' ##$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB ##$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH - #$env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath + $env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH #$env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE From 7b50e96f1876bc54593e08efef7d32555394d02b Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 19 Feb 2026 16:31:55 +0700 Subject: [PATCH 176/221] test 6 --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index d2b1ce6534..3a8e17ce10 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -34,7 +34,7 @@ jobs: needs: define_matrix runs-on: ${{ matrix.os }} strategy: - max-parallel: 13 + max-parallel: 12 matrix: ${{ fromJSON(needs.define_matrix.outputs.matrix) }} defaults: run: @@ -145,7 +145,7 @@ jobs: ##$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB ##$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH $env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath - $env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH + #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH #$env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE ##$env:CL='/I\' + $env:CONDA_PREFIX + '\\Library\\include' From 09f8be29265f40485ca494b94d055ebf2bda13da Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Fri, 20 Feb 2026 00:45:47 +0700 Subject: [PATCH 177/221] test 7 --- .github/workflows/manual_wheel_cuda.yml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 3a8e17ce10..d16bcfab21 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -145,9 +145,9 @@ jobs: ##$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB ##$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH $env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath - #$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH - $env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH - #$env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE + ##$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH + #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH + ##$env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE ##$env:CL='/I\' + $env:CONDA_PREFIX + '\\Library\\include' $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin; $env:CONDA_PREFIX\\Library\\nvvm\\bin;" + $env:Path #echo "$env:CONDA_PREFIX\\Library\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append From c45575a0e814eff9c4f6a551fae3eec6d36018d0 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Fri, 20 Feb 2026 08:59:36 +0700 Subject: [PATCH 178/221] test 8 --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index d16bcfab21..f95619e8d8 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -144,9 +144,9 @@ jobs: ##$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' ##$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB ##$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH - $env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath + #$env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath ##$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH - #$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH + ##$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH ##$env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE ##$env:CL='/I\' + $env:CONDA_PREFIX + '\\Library\\include' $env:Path = "$env:CONDA_PREFIX\\bin; $env:CONDA_PREFIX\\Library\\bin; $env:CONDA_PREFIX\\nvvm\\bin; $env:CONDA_PREFIX\\Library\\nvvm\\bin;" + $env:Path From c219a4db0bd759687c80e8ccc7d4e208fb076e68 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Fri, 20 Feb 2026 09:05:44 +0700 Subject: [PATCH 179/221] test 9 --- .github/workflows/manual_wheel_cuda.yml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index f95619e8d8..fa726e7ec6 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -136,15 +136,15 @@ jobs: Get-ChildItem -Path ~ -Filter "cicc" -Recurse -ErrorAction SilentlyContinue } elseif ($IsWindows) { - $env:CUDA_TOOLKIT_ROOT_DIR += "\\Library" - $env:CUDAToolkit_ROOT += "\\Library" + #$env:CUDA_TOOLKIT_ROOT_DIR += "\\Library" + #$env:CUDAToolkit_ROOT += "\\Library" ##$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' ##$env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' ##$env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' ##$env:CUDACXX = $env:CONDA_PREFIX + '\\Library\\bin\\nvcc.exe' ##$env:LIB = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIB ##$env:LIBPATH = $env:CONDA_PREFIX + '\\lib;' + $env:CONDA_PREFIX + '\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib;' + $env:CONDA_PREFIX + '\\Library\\lib64;' + $env:CONDA_PREFIX + '\\Library\\lib\\x64;' + $env:LIBPATH - #$env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath + $env:IncludePath = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:IncludePath ##$env:C_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:C_INCLUDE_PATH ##$env:CPLUS_INCLUDE_PATH = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:CPLUS_INCLUDE_PATH ##$env:INCLUDE = $env:CONDA_PREFIX + '\\include;' + $env:CONDA_PREFIX + '\\Library\\include;' + $env:INCLUDE From 9f2a312b83c4dc9d7e25020be5fa83eacfb40c3a Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Fri, 20 Feb 2026 09:27:33 +0700 Subject: [PATCH 180/221] test 9 --- .github/workflows/manual_wheel_cuda.yml | 23 ++++++++++++----------- 1 file changed, 12 insertions(+), 11 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index fa726e7ec6..feb796c513 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -136,8 +136,9 @@ jobs: Get-ChildItem -Path ~ -Filter "cicc" -Recurse -ErrorAction SilentlyContinue } elseif ($IsWindows) { - #$env:CUDA_TOOLKIT_ROOT_DIR += "\\Library" - #$env:CUDAToolkit_ROOT += "\\Library" + if ($cpuArch -eq 'AMD64') { $cpuArch = 'x64' } + $env:CUDA_TOOLKIT_ROOT_DIR += "\\Library" + $env:CUDAToolkit_ROOT += "\\Library" ##$env:CUDA_PATH = $env:CONDA_PREFIX + '\\Library\\bin' ##$env:CUDA_INC_PATH = $env:CONDA_PREFIX + '\\Library\\include' ##$env:CUDA_LIB_PATH = $env:CONDA_PREFIX + '\\Library\\lib' @@ -156,6 +157,9 @@ jobs: nvcc.exe --version Get-ChildItem -Path ~ -Filter "cicc.exe" -Recurse -ErrorAction SilentlyContinue Get-ChildItem -Path ~ -Filter "cudart_static.lib" -Recurse -ErrorAction SilentlyContinue + if (-not (Test-Path -Path "$env:CONDA_PREFIX\\include")) { + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\include" -Target "$env:CONDA_PREFIX\\Library\\include" + } else { echo "Warning: include directory already existed! Not creating symlink."} if (-not (Test-Path -Path "$env:CONDA_PREFIX\\bin")) { New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\bin" -Target "$env:CONDA_PREFIX\\Library\\bin" } else { echo "Warning: bin directory already existed! Not creating symlink."} @@ -166,20 +170,17 @@ jobs: New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force } else { echo "Warning: lib directory already existed! Not creating symlink." - if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib\\x64")) { + if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib\\$cpuArch")) { if ([int]$cudaMajor -ge 13) { - New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\x64" -Target "$env:CONDA_PREFIX\\Library\\lib\\x64" + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\$cpuArch" -Target "$env:CONDA_PREFIX\\Library\\lib\\$cpuArch" } else { - New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\x64" -Target "$env:CONDA_PREFIX\\Library\\lib" + New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib\\cpuArch" -Target "$env:CONDA_PREFIX\\Library\\lib" } - } else { echo "Warning: lib\x64 directory already existed! Not creating symlink."} + } else { echo "Warning: lib\$cpuArch directory already existed! Not creating symlink."} } if (-not (Test-Path -Path "$env:CONDA_PREFIX\\lib64")) { New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\lib64" -Target "$env:CONDA_PREFIX\\Library\\lib" # -Force } else { echo "Warning: lib64 directory already existed! Not creating symlink."} - if (-not (Test-Path -Path "$env:CONDA_PREFIX\\include")) { - New-Item -ItemType SymbolicLink -Path "$env:CONDA_PREFIX\\include" -Target "$env:CONDA_PREFIX\\Library\\include" - } else { echo "Warning: include directory already existed! Not creating symlink."} #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue @@ -192,8 +193,8 @@ jobs: $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" if ($env:RUNNER_OS -eq 'Windows') { - #$env:CMAKE_ARGS = "-DCMAKE_CUDA_COMPILER='$env:CONDA_PREFIX\\Library\\bin' $env:CMAKE_ARGS" - $env:CMAKE_ARGS = "-DCMAKE_LINKER_FLAGS='/LIBPATH:$env:CONDA_PREFIX\\Library\\lib' $env:CMAKE_ARGS" + ##$env:CMAKE_ARGS = "-DCMAKE_CUDA_COMPILER='$env:CONDA_PREFIX\\Library\\bin' $env:CMAKE_ARGS" + #$env:CMAKE_ARGS = "-DCMAKE_LINKER_FLAGS='/LIBPATH:$env:CONDA_PREFIX\\Library\\lib' $env:CMAKE_ARGS" } #$env:CMAKE_ARGS = "-DCMAKE_CUDA_FLAGS='-allow-unsupported-compiler' $env:CMAKE_ARGS" # if ($env:AVXVER -eq 'AVX') { From 4bfbc3000f3de1f1f889f0a8f36666c8488da698 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sat, 21 Feb 2026 00:09:44 +0700 Subject: [PATCH 181/221] last test --- .github/workflows/manual_wheel_cuda.yml | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index feb796c513..03b50c098a 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -20,7 +20,7 @@ jobs: id: set-matrix run: | $matrix = @{ - 'os' = @('windows-2022') # 'ubuntu-22.04', + 'os' = @('ubuntu-22.04', 'windows-2022') # 'pyver' = @("3.9", "3.10", "3.11", "3.12") # ,"3.13", "3.14" 'cuda' = @("12.5.1", "12.6.3", "12.8.1", "13.0.2") # "12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.9.1", "13.1.0" 'releasetag' = @("basic") @@ -192,10 +192,10 @@ jobs: #$env:CMAKE_GENERATOR_TOOLSET = $env:CUDA_HOME $env:CMAKE_ARGS = '-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all' $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON $env:CMAKE_ARGS" - if ($env:RUNNER_OS -eq 'Windows') { + #if ($env:RUNNER_OS -eq 'Windows') { ##$env:CMAKE_ARGS = "-DCMAKE_CUDA_COMPILER='$env:CONDA_PREFIX\\Library\\bin' $env:CMAKE_ARGS" - #$env:CMAKE_ARGS = "-DCMAKE_LINKER_FLAGS='/LIBPATH:$env:CONDA_PREFIX\\Library\\lib' $env:CMAKE_ARGS" - } + ##$env:CMAKE_ARGS = "-DCMAKE_LINKER_FLAGS='/LIBPATH:$env:CONDA_PREFIX\\Library\\lib' $env:CMAKE_ARGS" + #} #$env:CMAKE_ARGS = "-DCMAKE_CUDA_FLAGS='-allow-unsupported-compiler' $env:CMAKE_ARGS" # if ($env:AVXVER -eq 'AVX') { $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off' From 48eecd8b0e1fcee0268b888af046cae44ab97303 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 22 Feb 2026 05:02:03 +0700 Subject: [PATCH 182/221] testing cuda 12.9 --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 03b50c098a..96861aee9f 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -22,7 +22,7 @@ jobs: $matrix = @{ 'os' = @('ubuntu-22.04', 'windows-2022') # 'pyver' = @("3.9", "3.10", "3.11", "3.12") # ,"3.13", "3.14" - 'cuda' = @("12.5.1", "12.6.3", "12.8.1", "13.0.2") # "12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.9.1", "13.1.0" + 'cuda' = @("12.5.1", "12.6.3", "12.8.1", "12.9.1", "13.0.2") # "12.1.1", "12.2.2", "12.3.2", "12.4.1", "13.1.0" 'releasetag' = @("basic") } From 3f8005e672e3c4f42314d4d44a2d840fd8015bd9 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Sun, 22 Feb 2026 07:20:58 +0700 Subject: [PATCH 183/221] testing python 3.13 and 3.14, also remove cuda 12.9 again --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 96861aee9f..215fe8a0b0 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -21,8 +21,8 @@ jobs: run: | $matrix = @{ 'os' = @('ubuntu-22.04', 'windows-2022') # - 'pyver' = @("3.9", "3.10", "3.11", "3.12") # ,"3.13", "3.14" - 'cuda' = @("12.5.1", "12.6.3", "12.8.1", "12.9.1", "13.0.2") # "12.1.1", "12.2.2", "12.3.2", "12.4.1", "13.1.0" + 'pyver' = @("3.9", "3.10", "3.11", "3.12", "3.13", "3.14") # + 'cuda' = @("12.5.1", "12.6.3", "12.8.1", "13.0.2") # "12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.9.1", "13.1.0" 'releasetag' = @("basic") } From c2db396bd53ea830d6a6c870a2f464b48ee0214a Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 23 Feb 2026 05:30:08 +0700 Subject: [PATCH 184/221] add cp13 and cp14 on metal --- .github/workflows/build-wheels-metal.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/build-wheels-metal.yaml b/.github/workflows/build-wheels-metal.yaml index 1cfe6166f8..40d011b3fa 100644 --- a/.github/workflows/build-wheels-metal.yaml +++ b/.github/workflows/build-wheels-metal.yaml @@ -38,7 +38,7 @@ jobs: CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ARCHS: "arm64" CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DGGML_METAL=on -DCMAKE_CROSSCOMPILING=ON" - CIBW_BUILD: "cp39-* cp310-* cp311-* cp312-*" + CIBW_BUILD: "cp39-* cp310-* cp311-* cp312-* cp313-* cp314-*" with: package-dir: . output-dir: wheelhouse2 From fc4d8d41e687f40dbc9dc622acece74eefef5ed2 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 23 Feb 2026 05:43:02 +0700 Subject: [PATCH 185/221] disable indexing wheel for cu131 --- .github/workflows/generate-index-from-release.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/generate-index-from-release.yaml b/.github/workflows/generate-index-from-release.yaml index f68cf0b1a9..8036285dbf 100644 --- a/.github/workflows/generate-index-from-release.yaml +++ b/.github/workflows/generate-index-from-release.yaml @@ -40,7 +40,7 @@ jobs: GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} run: | ./scripts/get-releases.sh - # Non-existing file could cause am error at the script + # Non-existing file could cause an error at the script #./scripts/releases-to-pep-503.sh index/whl/cpu '^[v]?[0-9]+\.[0-9]+\.[0-9]+$' #./scripts/releases-to-pep-503.sh index/whl/cu121 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu121$' #./scripts/releases-to-pep-503.sh index/whl/cu122 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu122$' @@ -51,7 +51,7 @@ jobs: ./scripts/releases-to-pep-503.sh index/whl/cu128 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu128$' #./scripts/releases-to-pep-503.sh index/whl/cu129 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu129$' ./scripts/releases-to-pep-503.sh index/whl/cu130 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu130$' - ./scripts/releases-to-pep-503.sh index/whl/cu131 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu131$' + #./scripts/releases-to-pep-503.sh index/whl/cu131 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu131$' ./scripts/releases-to-pep-503.sh index/whl/metal '^[v]?[0-9]+\.[0-9]+\.[0-9]+-metal$' - name: Upload artifact uses: actions/upload-pages-artifact@v3 From a9af00bf808447dbc4b9aadb661ac8c4ffe274b4 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Mon, 23 Feb 2026 05:47:16 +0700 Subject: [PATCH 186/221] add python 3.13 and 3.14 to the test --- .github/workflows/test.yaml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/test.yaml b/.github/workflows/test.yaml index 138503c415..26b88873f5 100644 --- a/.github/workflows/test.yaml +++ b/.github/workflows/test.yaml @@ -34,7 +34,7 @@ jobs: runs-on: ubuntu-latest strategy: matrix: - python-version: ["3.9", "3.10", "3.11", "3.12"] + python-version: ["3.9", "3.10", "3.11", "3.12", "3.13", "3.14"] steps: - uses: actions/checkout@v4 with: @@ -65,7 +65,7 @@ jobs: runs-on: windows-latest strategy: matrix: - python-version: ["3.9", "3.10", "3.11", "3.12"] + python-version: ["3.9", "3.10", "3.11", "3.12", "3.13", "3.14"] steps: - uses: actions/checkout@v4 with: @@ -99,7 +99,7 @@ jobs: runs-on: macos-14 strategy: matrix: - python-version: ["3.9", "3.10", "3.11", "3.12"] + python-version: ["3.9", "3.10", "3.11", "3.12", "3.13", "3.14"] steps: - uses: actions/checkout@v4 with: From 5b9fbd9e00791d0d6a7093ee0a7c773bdbd766eb Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 24 Feb 2026 12:19:11 +0700 Subject: [PATCH 187/221] testing linux arm --- .github/workflows/manual_wheel_cuda.yml | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 215fe8a0b0..c140108c8a 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -20,7 +20,7 @@ jobs: id: set-matrix run: | $matrix = @{ - 'os' = @('ubuntu-22.04', 'windows-2022') # + 'os' = @('ubuntu-22.04-arm') # , 'ubuntu-22.04-arm', 'windows-2022' 'pyver' = @("3.9", "3.10", "3.11", "3.12", "3.13", "3.14") # 'cuda' = @("12.5.1", "12.6.3", "12.8.1", "13.0.2") # "12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.9.1", "13.1.0" 'releasetag' = @("basic") @@ -129,7 +129,8 @@ jobs: $env:CUDATOOLKITDIR = $env:CONDA_PREFIX echo "CONDA_PREFIX = $env:CONDA_PREFIX" if ($IsLinux) { - if ($cpuArch -eq 'AMD64') { $cpuArch = 'x86_64' } + #if ($cpuArch -eq 'AMD64') { $cpuArch = 'x86_64' } + $cpuArch = uname -m $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:CONDA_PREFIX + "/targets/$cpuArch-linux/lib:" + $env:LD_LIBRARY_PATH $env:CPATH = $env:CONDA_PREFIX + '/include:' + $env:CONDA_PREFIX + "/targets/$cpuArch-linux/include:" + $env:CPATH Get-ChildItem -Path ~ -Filter "nvcc" -Recurse -ErrorAction SilentlyContinue From 50765f32d474a89c5f5e6d97ed80cf9b5a7b1e9f Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 24 Feb 2026 14:48:39 +0700 Subject: [PATCH 188/221] try with sbsa --- .github/workflows/manual_wheel_cuda.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index c140108c8a..bd746d2ece 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -129,8 +129,8 @@ jobs: $env:CUDATOOLKITDIR = $env:CONDA_PREFIX echo "CONDA_PREFIX = $env:CONDA_PREFIX" if ($IsLinux) { - #if ($cpuArch -eq 'AMD64') { $cpuArch = 'x86_64' } - $cpuArch = uname -m + if ($cpuArch -eq 'AMD64') { $cpuArch = 'x86_64' } else { $cpuArch = 'sbsa' } + #$cpuArch = uname -m $env:LD_LIBRARY_PATH = $env:CONDA_PREFIX + '/lib:' + $env:CONDA_PREFIX + "/targets/$cpuArch-linux/lib:" + $env:LD_LIBRARY_PATH $env:CPATH = $env:CONDA_PREFIX + '/include:' + $env:CONDA_PREFIX + "/targets/$cpuArch-linux/include:" + $env:CPATH Get-ChildItem -Path ~ -Filter "nvcc" -Recurse -ErrorAction SilentlyContinue From 2bba46bc532569cb08c696e61b15e60d3f53f477 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Tue, 24 Feb 2026 20:07:00 +0700 Subject: [PATCH 189/221] Done testing linux arm --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index bd746d2ece..339b8787d5 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -20,7 +20,7 @@ jobs: id: set-matrix run: | $matrix = @{ - 'os' = @('ubuntu-22.04-arm') # , 'ubuntu-22.04-arm', 'windows-2022' + 'os' = @('ubuntu-22.04-arm', 'ubuntu-22.04', 'windows-2022') # 'pyver' = @("3.9", "3.10", "3.11", "3.12", "3.13", "3.14") # 'cuda' = @("12.5.1", "12.6.3", "12.8.1", "13.0.2") # "12.1.1", "12.2.2", "12.3.2", "12.4.1", "12.9.1", "13.1.0" 'releasetag' = @("basic") From 6c0295c9304c1fa506eadbd90ba71799cc1a9b43 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 25 Feb 2026 04:52:52 +0700 Subject: [PATCH 190/221] Test to apply patch from PR --- .github/workflows/manual_wheel_cuda.yml | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index 339b8787d5..aa4a1107bc 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -185,6 +185,11 @@ jobs: #Get-ChildItem -Path "C:\Users\runneradmin\miniconda3\envs\llamacpp" -Directory -Recurse -ErrorAction SilentlyContinue } Get-ChildItem -Path ~ -Filter "cuda_runtime.h" -Recurse -ErrorAction SilentlyContinue + + # Applying Windows CUDA DLL Patch from PR 2083 + curl -L -O https://github.com/abetlen/llama-cpp-python/pull/2083.patch + git am 2083.patch + #$env:VERBOSE = '1' #$env:NVCCFLAGS="-allow-unsupported-compiler" #$env:FORCE_CMAKE=1 From 69e99cae991e02bdc8ce252f609dbd644b7db490 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 25 Feb 2026 05:05:57 +0700 Subject: [PATCH 191/221] test on linux-arm too --- .github/workflows/test.yaml | 31 +++++++++++++++++++++++++++++++ 1 file changed, 31 insertions(+) diff --git a/.github/workflows/test.yaml b/.github/workflows/test.yaml index 26b88873f5..5feb7f3702 100644 --- a/.github/workflows/test.yaml +++ b/.github/workflows/test.yaml @@ -60,6 +60,37 @@ jobs: run: | python -m pytest + build-linux-arm: + needs: download-model + runs-on: ubuntu-24.04-arm + strategy: + matrix: + python-version: ["3.9", "3.10", "3.11", "3.12", "3.13", "3.14"] + steps: + - uses: actions/checkout@v4 + with: + submodules: "recursive" + + - name: Set up Python ${{ matrix.python-version }} + uses: actions/setup-python@v6 + with: + python-version: ${{ matrix.python-version }} + cache: 'pip' + - name: Restore model cache + uses: actions/cache@v4 + with: + path: ~/.cache/huggingface/hub + key: ${{ runner.os }}-model-${{ env.REPO_ID }}-${{ env.MODEL_FILE }} + - name: Install dependencies (Linux/MacOS) + run: | + python -m pip install --upgrade pip + python -m pip install uv + python -m uv pip install -e .[all] --verbose + shell: bash + - name: Test with pytest + run: | + python -m pytest + build-windows: needs: download-model runs-on: windows-latest From 317f58f51de02a7b11f0e4f0d6241f79722a3a04 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 25 Feb 2026 05:13:44 +0700 Subject: [PATCH 192/221] add ubuntu arm runner, and cp13 & cp14 --- .github/workflows/build-and-release.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index c9476360b3..0a0015b7ea 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -11,7 +11,7 @@ jobs: runs-on: ${{ matrix.os }} strategy: matrix: - os: [ubuntu-22.04, windows-2022, macos-14] # , macos-15 + os: [ubuntu-22.04-arm, ubuntu-22.04, windows-2022, macos-14] # , macos-15 steps: - uses: actions/checkout@v4 @@ -75,7 +75,7 @@ jobs: CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ARCHS: "aarch64" CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON" - CIBW_BUILD: "cp39-* cp310-* cp311-* cp312-*" + CIBW_BUILD: "cp39-* cp310-* cp311-* cp312-* cp313-* cp314-*" with: output-dir: wheelhouse From b2ae79f218bc47638be66db3bde3c8a36683c403 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 25 Feb 2026 05:36:43 +0700 Subject: [PATCH 193/221] test indexing cpu wheel --- .github/workflows/generate-index-from-release.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/generate-index-from-release.yaml b/.github/workflows/generate-index-from-release.yaml index 8036285dbf..5307f3042a 100644 --- a/.github/workflows/generate-index-from-release.yaml +++ b/.github/workflows/generate-index-from-release.yaml @@ -41,7 +41,7 @@ jobs: run: | ./scripts/get-releases.sh # Non-existing file could cause an error at the script - #./scripts/releases-to-pep-503.sh index/whl/cpu '^[v]?[0-9]+\.[0-9]+\.[0-9]+$' + ./scripts/releases-to-pep-503.sh index/whl/cpu '^[v]?[0-9]+\.[0-9]+\.[0-9]+$' #./scripts/releases-to-pep-503.sh index/whl/cu121 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu121$' #./scripts/releases-to-pep-503.sh index/whl/cu122 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu122$' #./scripts/releases-to-pep-503.sh index/whl/cu123 '^[v]?[0-9]+\.[0-9]+\.[0-9]+-cu123$' From 8301737f865f7999446561bca01503f06704c459 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 25 Feb 2026 06:16:34 +0700 Subject: [PATCH 194/221] try to enable gcc-toolset-14 --- .github/workflows/build-and-release.yaml | 2 ++ 1 file changed, 2 insertions(+) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 0a0015b7ea..3c7110cb47 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -26,6 +26,7 @@ jobs: - name: Install dependencies (Linux/MacOS) if: runner.os != 'Windows' run: | + source /opt/rh/gcc-toolset-14/enable python -m pip install --upgrade pip python -m pip install uv RUST_LOG=trace python -m uv pip install -e .[all] --verbose @@ -101,6 +102,7 @@ jobs: - name: Install dependencies (Linux/MacOS) if: runner.os != 'Windows' run: | + source /opt/rh/gcc-toolset-14/enable python -m pip install --upgrade pip python -m pip install uv RUST_LOG=trace python -m uv pip install -e .[all] --verbose From 82f829cf2188cd6bb4286d5b2bb01218632610c4 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 25 Feb 2026 06:34:33 +0700 Subject: [PATCH 195/221] oops --- .github/workflows/build-and-release.yaml | 8 ++++++-- 1 file changed, 6 insertions(+), 2 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 3c7110cb47..57f76c35e1 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -26,7 +26,9 @@ jobs: - name: Install dependencies (Linux/MacOS) if: runner.os != 'Windows' run: | - source /opt/rh/gcc-toolset-14/enable + if [ "$RUNNER_OS" == "Linux" ]; then + source /opt/rh/gcc-toolset-14/enable + fi python -m pip install --upgrade pip python -m pip install uv RUST_LOG=trace python -m uv pip install -e .[all] --verbose @@ -102,7 +104,9 @@ jobs: - name: Install dependencies (Linux/MacOS) if: runner.os != 'Windows' run: | - source /opt/rh/gcc-toolset-14/enable + if [ "$RUNNER_OS" == "Linux" ]; then + source /opt/rh/gcc-toolset-14/enable + fi python -m pip install --upgrade pip python -m pip install uv RUST_LOG=trace python -m uv pip install -e .[all] --verbose From a863b40f440f53efcb6e654e2ad2aa53e3edae45 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 25 Feb 2026 06:44:30 +0700 Subject: [PATCH 196/221] wrong distro --- .github/workflows/build-and-release.yaml | 14 ++++++++++++-- 1 file changed, 12 insertions(+), 2 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 57f76c35e1..87e4d23663 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -27,7 +27,12 @@ jobs: if: runner.os != 'Windows' run: | if [ "$RUNNER_OS" == "Linux" ]; then - source /opt/rh/gcc-toolset-14/enable + sudo add-apt-repository -y ppa:ubuntu-toolchain-r/test + sudo apt-get update + sudo apt-get install -y gcc-14 g++-14 + sudo update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-14 100 + sudo update-alternatives --install /usr/bin/g++ g++ /usr/bin/g++-14 100 + gcc --version fi python -m pip install --upgrade pip python -m pip install uv @@ -105,7 +110,12 @@ jobs: if: runner.os != 'Windows' run: | if [ "$RUNNER_OS" == "Linux" ]; then - source /opt/rh/gcc-toolset-14/enable + sudo add-apt-repository -y ppa:ubuntu-toolchain-r/test + sudo apt-get update + sudo apt-get install -y gcc-14 g++-14 + sudo update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-14 100 + sudo update-alternatives --install /usr/bin/g++ g++ /usr/bin/g++-14 100 + gcc --version fi python -m pip install --upgrade pip python -m pip install uv From 464fbfe25a9f33050692b859d38d4f741cb81d4a Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 25 Feb 2026 07:29:17 +0700 Subject: [PATCH 197/221] try with CMAKE_ARGS --- .github/workflows/build-and-release.yaml | 22 ++++++++++++++-------- 1 file changed, 14 insertions(+), 8 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 87e4d23663..61fe8f6bad 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -25,13 +25,15 @@ jobs: - name: Install dependencies (Linux/MacOS) if: runner.os != 'Windows' + env: + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" run: | if [ "$RUNNER_OS" == "Linux" ]; then sudo add-apt-repository -y ppa:ubuntu-toolchain-r/test sudo apt-get update - sudo apt-get install -y gcc-14 g++-14 - sudo update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-14 100 - sudo update-alternatives --install /usr/bin/g++ g++ /usr/bin/g++-14 100 + #sudo apt-get install -y gcc-14 g++-14 + #sudo update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-14 100 + #sudo update-alternatives --install /usr/bin/g++ g++ /usr/bin/g++-14 100 gcc --version fi python -m pip install --upgrade pip @@ -42,7 +44,8 @@ jobs: - name: Install dependencies (Windows) if: runner.os == 'Windows' env: - RUST_LOG: trace + RUST_LOG: trace + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" run: | python -m pip install --upgrade pip python -m pip install uv @@ -108,13 +111,15 @@ jobs: - name: Install dependencies (Linux/MacOS) if: runner.os != 'Windows' + env: + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" run: | if [ "$RUNNER_OS" == "Linux" ]; then sudo add-apt-repository -y ppa:ubuntu-toolchain-r/test sudo apt-get update - sudo apt-get install -y gcc-14 g++-14 - sudo update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-14 100 - sudo update-alternatives --install /usr/bin/g++ g++ /usr/bin/g++-14 100 + #sudo apt-get install -y gcc-14 g++-14 + #sudo update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-14 100 + #sudo update-alternatives --install /usr/bin/g++ g++ /usr/bin/g++-14 100 gcc --version fi python -m pip install --upgrade pip @@ -126,7 +131,8 @@ jobs: - name: Install dependencies (Windows) if: runner.os == 'Windows' env: - RUST_LOG: trace + RUST_LOG: trace + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" run: | python -m pip install --upgrade pip python -m pip install uv From e4431026488ce84f70b4c18ff785bbb663a74668 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 25 Feb 2026 07:46:07 +0700 Subject: [PATCH 198/221] oops --- .github/workflows/build-and-release.yaml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 61fe8f6bad..7fb95f091a 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -57,6 +57,7 @@ jobs: env: # disable repair CIBW_REPAIR_WHEEL_COMMAND: "" + CIBW_ENVIRONMENT: CMAKE_ARGS="-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" with: package-dir: . output-dir: wheelhouse @@ -85,7 +86,7 @@ jobs: CIBW_SKIP: "*musllinux* pp*" CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ARCHS: "aarch64" - CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON" + CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" CIBW_BUILD: "cp39-* cp310-* cp311-* cp312-* cp313-* cp314-*" with: output-dir: wheelhouse From 6c2a6788a7f55e8d66acb7ce35d20ce2ae463b24 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 25 Feb 2026 09:30:34 +0700 Subject: [PATCH 199/221] remove unneeded lines --- .github/workflows/build-and-release.yaml | 16 ---------------- 1 file changed, 16 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 7fb95f091a..627bd79f87 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -28,14 +28,6 @@ jobs: env: CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" run: | - if [ "$RUNNER_OS" == "Linux" ]; then - sudo add-apt-repository -y ppa:ubuntu-toolchain-r/test - sudo apt-get update - #sudo apt-get install -y gcc-14 g++-14 - #sudo update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-14 100 - #sudo update-alternatives --install /usr/bin/g++ g++ /usr/bin/g++-14 100 - gcc --version - fi python -m pip install --upgrade pip python -m pip install uv RUST_LOG=trace python -m uv pip install -e .[all] --verbose @@ -115,14 +107,6 @@ jobs: env: CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" run: | - if [ "$RUNNER_OS" == "Linux" ]; then - sudo add-apt-repository -y ppa:ubuntu-toolchain-r/test - sudo apt-get update - #sudo apt-get install -y gcc-14 g++-14 - #sudo update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-14 100 - #sudo update-alternatives --install /usr/bin/g++ g++ /usr/bin/g++-14 100 - gcc --version - fi python -m pip install --upgrade pip python -m pip install uv RUST_LOG=trace python -m uv pip install -e .[all] --verbose From a90f14b87bb49a5dcb274a6b4e3d14f337a378ce Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 25 Feb 2026 13:01:29 +0700 Subject: [PATCH 200/221] use git apply --- .github/workflows/manual_wheel_cuda.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/manual_wheel_cuda.yml b/.github/workflows/manual_wheel_cuda.yml index aa4a1107bc..a3e9b76830 100644 --- a/.github/workflows/manual_wheel_cuda.yml +++ b/.github/workflows/manual_wheel_cuda.yml @@ -188,7 +188,7 @@ jobs: # Applying Windows CUDA DLL Patch from PR 2083 curl -L -O https://github.com/abetlen/llama-cpp-python/pull/2083.patch - git am 2083.patch + git apply 2083.patch # git am #$env:VERBOSE = '1' #$env:NVCCFLAGS="-allow-unsupported-compiler" From 7ef0dc25dba27c4ea0c22750e26de0ca6f871b7a Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 25 Feb 2026 15:01:19 +0700 Subject: [PATCH 201/221] optimize cpu wheel with OpenBLAS --- .github/workflows/build-and-release.yaml | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 627bd79f87..02f7488293 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -26,7 +26,7 @@ jobs: - name: Install dependencies (Linux/MacOS) if: runner.os != 'Windows' env: - CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" run: | python -m pip install --upgrade pip python -m pip install uv @@ -37,7 +37,7 @@ jobs: if: runner.os == 'Windows' env: RUST_LOG: trace - CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" run: | python -m pip install --upgrade pip python -m pip install uv @@ -49,7 +49,7 @@ jobs: env: # disable repair CIBW_REPAIR_WHEEL_COMMAND: "" - CIBW_ENVIRONMENT: CMAKE_ARGS="-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" + CIBW_ENVIRONMENT: CMAKE_ARGS="-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" with: package-dir: . output-dir: wheelhouse @@ -78,7 +78,7 @@ jobs: CIBW_SKIP: "*musllinux* pp*" CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ARCHS: "aarch64" - CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" + CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" CIBW_BUILD: "cp39-* cp310-* cp311-* cp312-* cp313-* cp314-*" with: output-dir: wheelhouse @@ -105,7 +105,7 @@ jobs: - name: Install dependencies (Linux/MacOS) if: runner.os != 'Windows' env: - CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" run: | python -m pip install --upgrade pip python -m pip install uv @@ -117,7 +117,7 @@ jobs: if: runner.os == 'Windows' env: RUST_LOG: trace - CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" run: | python -m pip install --upgrade pip python -m pip install uv From fac94f353b1e21e1db6a5a5dd0a9dd2a57e4396b Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 25 Feb 2026 18:06:43 +0700 Subject: [PATCH 202/221] install openblas dev package --- .github/workflows/build-and-release.yaml | 16 ++++++++++++++++ 1 file changed, 16 insertions(+) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 02f7488293..ed433b8438 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -28,6 +28,12 @@ jobs: env: CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" run: | + if [ "$RUNNER_OS" == "Linux" ]; then + sudo apt-get update + sudo apt-get install -y libopenblas-dev + else + sudo port -N install OpenBLAS-devel + fi python -m pip install --upgrade pip python -m pip install uv RUST_LOG=trace python -m uv pip install -e .[all] --verbose @@ -39,6 +45,7 @@ jobs: RUST_LOG: trace CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" run: | + vcpkg install openblas python -m pip install --upgrade pip python -m pip install uv python -m uv pip install -e .[all] --verbose @@ -50,6 +57,7 @@ jobs: # disable repair CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ENVIRONMENT: CMAKE_ARGS="-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" with: package-dir: . output-dir: wheelhouse @@ -79,6 +87,7 @@ jobs: CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ARCHS: "aarch64" CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" CIBW_BUILD: "cp39-* cp310-* cp311-* cp312-* cp313-* cp314-*" with: output-dir: wheelhouse @@ -107,6 +116,12 @@ jobs: env: CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" run: | + if [ "$RUNNER_OS" == "Linux" ]; then + sudo apt-get update + sudo apt-get install -y libopenblas-dev + else + sudo port -N install OpenBLAS-devel + fi python -m pip install --upgrade pip python -m pip install uv RUST_LOG=trace python -m uv pip install -e .[all] --verbose @@ -119,6 +134,7 @@ jobs: RUST_LOG: trace CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" run: | + vcpkg install openblas python -m pip install --upgrade pip python -m pip install uv python -m uv pip install -e .[all] --verbose From f72104bd675c419d046764cd98ab54247774d9b8 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Wed, 25 Feb 2026 18:38:27 +0700 Subject: [PATCH 203/221] use default blas vendor --- .github/workflows/build-and-release.yaml | 16 ++++++---------- 1 file changed, 6 insertions(+), 10 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index ed433b8438..f614e3a2c4 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -26,13 +26,11 @@ jobs: - name: Install dependencies (Linux/MacOS) if: runner.os != 'Windows' env: - CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON" run: | if [ "$RUNNER_OS" == "Linux" ]; then sudo apt-get update sudo apt-get install -y libopenblas-dev - else - sudo port -N install OpenBLAS-devel fi python -m pip install --upgrade pip python -m pip install uv @@ -43,7 +41,7 @@ jobs: if: runner.os == 'Windows' env: RUST_LOG: trace - CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON" run: | vcpkg install openblas python -m pip install --upgrade pip @@ -56,7 +54,7 @@ jobs: env: # disable repair CIBW_REPAIR_WHEEL_COMMAND: "" - CIBW_ENVIRONMENT: CMAKE_ARGS="-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + CIBW_ENVIRONMENT: CMAKE_ARGS="-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON" CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" with: package-dir: . @@ -86,7 +84,7 @@ jobs: CIBW_SKIP: "*musllinux* pp*" CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ARCHS: "aarch64" - CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON" CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" CIBW_BUILD: "cp39-* cp310-* cp311-* cp312-* cp313-* cp314-*" with: @@ -114,13 +112,11 @@ jobs: - name: Install dependencies (Linux/MacOS) if: runner.os != 'Windows' env: - CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON" run: | if [ "$RUNNER_OS" == "Linux" ]; then sudo apt-get update sudo apt-get install -y libopenblas-dev - else - sudo port -N install OpenBLAS-devel fi python -m pip install --upgrade pip python -m pip install uv @@ -132,7 +128,7 @@ jobs: if: runner.os == 'Windows' env: RUST_LOG: trace - CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON" run: | vcpkg install openblas python -m pip install --upgrade pip From 3d0d9ba4b84690ed2400f0b05ca66f0a566dcc34 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 01:58:42 +0700 Subject: [PATCH 204/221] explicitly set blas vendor to OpenBLAS on non-macos --- .github/workflows/build-and-release.yaml | 8 +++++--- 1 file changed, 5 insertions(+), 3 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index f614e3a2c4..1b1e424cf9 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -31,6 +31,7 @@ jobs: if [ "$RUNNER_OS" == "Linux" ]; then sudo apt-get update sudo apt-get install -y libopenblas-dev + CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS_VENDOR=OpenBLAS" fi python -m pip install --upgrade pip python -m pip install uv @@ -41,7 +42,7 @@ jobs: if: runner.os == 'Windows' env: RUST_LOG: trace - CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON" + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" run: | vcpkg install openblas python -m pip install --upgrade pip @@ -54,7 +55,7 @@ jobs: env: # disable repair CIBW_REPAIR_WHEEL_COMMAND: "" - CIBW_ENVIRONMENT: CMAKE_ARGS="-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON" + CIBW_ENVIRONMENT: CMAKE_ARGS="-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" with: package-dir: . @@ -117,6 +118,7 @@ jobs: if [ "$RUNNER_OS" == "Linux" ]; then sudo apt-get update sudo apt-get install -y libopenblas-dev + CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS_VENDOR=OpenBLAS" fi python -m pip install --upgrade pip python -m pip install uv @@ -128,7 +130,7 @@ jobs: if: runner.os == 'Windows' env: RUST_LOG: trace - CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON" + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" run: | vcpkg install openblas python -m pip install --upgrade pip From 9f134345b12658098a990c7c8248cd7ad812cbb0 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 02:20:23 +0700 Subject: [PATCH 205/221] use Accelerate blas vendor on macos --- .github/workflows/build-and-release.yaml | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 1b1e424cf9..9324d90ed2 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -32,6 +32,8 @@ jobs: sudo apt-get update sudo apt-get install -y libopenblas-dev CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS_VENDOR=OpenBLAS" + else + CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS_VENDOR=Accelerate" fi python -m pip install --upgrade pip python -m pip install uv @@ -85,7 +87,7 @@ jobs: CIBW_SKIP: "*musllinux* pp*" CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ARCHS: "aarch64" - CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON" + CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=Accelerate" CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" CIBW_BUILD: "cp39-* cp310-* cp311-* cp312-* cp313-* cp314-*" with: @@ -119,6 +121,8 @@ jobs: sudo apt-get update sudo apt-get install -y libopenblas-dev CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS_VENDOR=OpenBLAS" + else + CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS_VENDOR=Accelerate" fi python -m pip install --upgrade pip python -m pip install uv From 8ae8240532ab7ab92ace25f53f40ce038c96d90a Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 03:17:21 +0700 Subject: [PATCH 206/221] not explicitly set BLAS to ON on macos --- .github/workflows/build-and-release.yaml | 18 ++++++++---------- 1 file changed, 8 insertions(+), 10 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 9324d90ed2..b765fca079 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -26,14 +26,13 @@ jobs: - name: Install dependencies (Linux/MacOS) if: runner.os != 'Windows' env: - CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON" + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" run: | if [ "$RUNNER_OS" == "Linux" ]; then sudo apt-get update sudo apt-get install -y libopenblas-dev - CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS_VENDOR=OpenBLAS" - else - CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS_VENDOR=Accelerate" + CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV fi python -m pip install --upgrade pip python -m pip install uv @@ -57,7 +56,7 @@ jobs: env: # disable repair CIBW_REPAIR_WHEEL_COMMAND: "" - CIBW_ENVIRONMENT: CMAKE_ARGS="-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + CIBW_ENVIRONMENT: CMAKE_ARGS="$CMAKE_ARGS" #"-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" with: package-dir: . @@ -87,7 +86,7 @@ jobs: CIBW_SKIP: "*musllinux* pp*" CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ARCHS: "aarch64" - CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=Accelerate" + CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" CIBW_BUILD: "cp39-* cp310-* cp311-* cp312-* cp313-* cp314-*" with: @@ -115,14 +114,13 @@ jobs: - name: Install dependencies (Linux/MacOS) if: runner.os != 'Windows' env: - CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON" + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" run: | if [ "$RUNNER_OS" == "Linux" ]; then sudo apt-get update sudo apt-get install -y libopenblas-dev - CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS_VENDOR=OpenBLAS" - else - CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS_VENDOR=Accelerate" + CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV fi python -m pip install --upgrade pip python -m pip install uv From 47a40aa48204d6f3b42e7f1ba097cf4acfea222d Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 03:21:56 +0700 Subject: [PATCH 207/221] oops --- .github/workflows/build-and-release.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index b765fca079..2b5d272e0c 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -56,7 +56,7 @@ jobs: env: # disable repair CIBW_REPAIR_WHEEL_COMMAND: "" - CIBW_ENVIRONMENT: CMAKE_ARGS="$CMAKE_ARGS" #"-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + CIBW_ENVIRONMENT: CMAKE_ARGS="${{ env.CMAKE_ARGS }}" #"-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" with: package-dir: . From cc8805cffd1b5a7d32d8e5d7adac3233543363b1 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 03:53:20 +0700 Subject: [PATCH 208/221] oops 2 --- .github/workflows/build-and-release.yaml | 10 +++++++--- 1 file changed, 7 insertions(+), 3 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 2b5d272e0c..2f608bcc96 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -32,8 +32,8 @@ jobs: sudo apt-get update sudo apt-get install -y libopenblas-dev CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" - echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV fi + echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV python -m pip install --upgrade pip python -m pip install uv RUST_LOG=trace python -m uv pip install -e .[all] --verbose @@ -45,6 +45,7 @@ jobs: RUST_LOG: trace CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" run: | + echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV vcpkg install openblas python -m pip install --upgrade pip python -m pip install uv @@ -86,8 +87,10 @@ jobs: CIBW_SKIP: "*musllinux* pp*" CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ARCHS: "aarch64" - CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" + CIBW_BEFORE_ALL_MACOS: "brew install openblas" + CIBW_BEFORE_ALL_WINDOWS: "vcpkg install openblas" CIBW_BUILD: "cp39-* cp310-* cp311-* cp312-* cp313-* cp314-*" with: output-dir: wheelhouse @@ -120,8 +123,8 @@ jobs: sudo apt-get update sudo apt-get install -y libopenblas-dev CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" - echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV fi + echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV python -m pip install --upgrade pip python -m pip install uv RUST_LOG=trace python -m uv pip install -e .[all] --verbose @@ -134,6 +137,7 @@ jobs: RUST_LOG: trace CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" run: | + echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV vcpkg install openblas python -m pip install --upgrade pip python -m pip install uv From 2e6bce1a0c41b150453f03b1db648842f1d8e50d Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 04:46:13 +0700 Subject: [PATCH 209/221] disable trace logging to prevent flooding the logs --- .github/workflows/build-and-release.yaml | 10 ++++++---- 1 file changed, 6 insertions(+), 4 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 2f608bcc96..bccaaae160 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -26,6 +26,7 @@ jobs: - name: Install dependencies (Linux/MacOS) if: runner.os != 'Windows' env: + #RUST_LOG: trace CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" run: | if [ "$RUNNER_OS" == "Linux" ]; then @@ -36,13 +37,13 @@ jobs: echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV python -m pip install --upgrade pip python -m pip install uv - RUST_LOG=trace python -m uv pip install -e .[all] --verbose + python -m uv pip install -e .[all] --verbose shell: bash - name: Install dependencies (Windows) if: runner.os == 'Windows' env: - RUST_LOG: trace + #RUST_LOG: trace CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" run: | echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV @@ -117,6 +118,7 @@ jobs: - name: Install dependencies (Linux/MacOS) if: runner.os != 'Windows' env: + #RUST_LOG: trace CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" run: | if [ "$RUNNER_OS" == "Linux" ]; then @@ -127,14 +129,14 @@ jobs: echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV python -m pip install --upgrade pip python -m pip install uv - RUST_LOG=trace python -m uv pip install -e .[all] --verbose + python -m uv pip install -e .[all] --verbose python -m uv pip install build shell: bash - name: Install dependencies (Windows) if: runner.os == 'Windows' env: - RUST_LOG: trace + #RUST_LOG: trace CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" run: | echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV From 8639b2b0a0475c46ef703bf51e7f360c848689d6 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 07:54:09 +0700 Subject: [PATCH 210/221] set -DCMAKE_TOOLCHAIN_FILE on Windows --- .github/workflows/build-and-release.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index bccaaae160..c0770ca1fe 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -44,7 +44,7 @@ jobs: if: runner.os == 'Windows' env: #RUST_LOG: trace - CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_TOOLCHAIN_FILE=C:/vcpkg/scripts/buildsystems/vcpkg.cmake" run: | echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV vcpkg install openblas @@ -137,7 +137,7 @@ jobs: if: runner.os == 'Windows' env: #RUST_LOG: trace - CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_TOOLCHAIN_FILE=C:/vcpkg/scripts/buildsystems/vcpkg.cmake" run: | echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV vcpkg install openblas From 9ef0efc98ba67aa3b50fe2e62893863bfc74e573 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 08:18:53 +0700 Subject: [PATCH 211/221] try with openblas again on macos --- .github/workflows/build-and-release.yaml | 13 ++++++++++++- 1 file changed, 12 insertions(+), 1 deletion(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index c0770ca1fe..efa357d1bd 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -33,6 +33,9 @@ jobs: sudo apt-get update sudo apt-get install -y libopenblas-dev CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + else + brew install openblas + CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" fi echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV python -m pip install --upgrade pip @@ -59,7 +62,9 @@ jobs: # disable repair CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ENVIRONMENT: CMAKE_ARGS="${{ env.CMAKE_ARGS }}" #"-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" - CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" + #CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" + #CIBW_BEFORE_ALL_MACOS: "brew install openblas" + #CIBW_BEFORE_ALL_WINDOWS: "vcpkg install openblas" with: package-dir: . output-dir: wheelhouse @@ -89,6 +94,9 @@ jobs: CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ARCHS: "aarch64" CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" + CIBW_ENVIRONMENT_LINUX: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + CIBW_ENVIRONMENT_WINDOWS: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_TOOLCHAIN_FILE=C:/vcpkg/scripts/buildsystems/vcpkg.cmake" + CIBW_ENVIRONMENT_MACOS: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" CIBW_BEFORE_ALL_MACOS: "brew install openblas" CIBW_BEFORE_ALL_WINDOWS: "vcpkg install openblas" @@ -125,6 +133,9 @@ jobs: sudo apt-get update sudo apt-get install -y libopenblas-dev CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" + else + brew install openblas + CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" fi echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV python -m pip install --upgrade pip From c3d03325c8cb89ba99c08d4ad9851869e7aa8ca2 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 08:29:42 +0700 Subject: [PATCH 212/221] install pkgconf on windows --- .github/workflows/build-and-release.yaml | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index efa357d1bd..bc3776a910 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -50,7 +50,7 @@ jobs: CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_TOOLCHAIN_FILE=C:/vcpkg/scripts/buildsystems/vcpkg.cmake" run: | echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV - vcpkg install openblas + vcpkg install openblas pkgconf python -m pip install --upgrade pip python -m pip install uv python -m uv pip install -e .[all] --verbose @@ -64,7 +64,7 @@ jobs: CIBW_ENVIRONMENT: CMAKE_ARGS="${{ env.CMAKE_ARGS }}" #"-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" #CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" #CIBW_BEFORE_ALL_MACOS: "brew install openblas" - #CIBW_BEFORE_ALL_WINDOWS: "vcpkg install openblas" + #CIBW_BEFORE_ALL_WINDOWS: "vcpkg install openblas pkgconf" with: package-dir: . output-dir: wheelhouse @@ -99,7 +99,7 @@ jobs: CIBW_ENVIRONMENT_MACOS: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" CIBW_BEFORE_ALL_MACOS: "brew install openblas" - CIBW_BEFORE_ALL_WINDOWS: "vcpkg install openblas" + CIBW_BEFORE_ALL_WINDOWS: "vcpkg install openblas pkgconf" CIBW_BUILD: "cp39-* cp310-* cp311-* cp312-* cp313-* cp314-*" with: output-dir: wheelhouse @@ -151,7 +151,7 @@ jobs: CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_TOOLCHAIN_FILE=C:/vcpkg/scripts/buildsystems/vcpkg.cmake" run: | echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV - vcpkg install openblas + vcpkg install openblas pkgconf python -m pip install --upgrade pip python -m pip install uv python -m uv pip install -e .[all] --verbose From b89aab8c50cbe042cc3541c4ec438932c82c94e5 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 08:41:54 +0700 Subject: [PATCH 213/221] try with yum --- .github/workflows/build-and-release.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index bc3776a910..86a4c37f65 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -62,7 +62,7 @@ jobs: # disable repair CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ENVIRONMENT: CMAKE_ARGS="${{ env.CMAKE_ARGS }}" #"-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" - #CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" + CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" #CIBW_BEFORE_ALL_MACOS: "brew install openblas" #CIBW_BEFORE_ALL_WINDOWS: "vcpkg install openblas pkgconf" with: From 94c9b1e75d8295cd6dc1b8699619b748f7b9c1a8 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 08:53:20 +0700 Subject: [PATCH 214/221] disable openmp on macos since it's conflicting with openblas --- .github/workflows/build-and-release.yaml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 86a4c37f65..ce5cad06c3 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -35,7 +35,7 @@ jobs: CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" else brew install openblas - CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" + CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DGGML_OPENMP=OFF -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" fi echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV python -m pip install --upgrade pip @@ -96,7 +96,7 @@ jobs: CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" CIBW_ENVIRONMENT_LINUX: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" CIBW_ENVIRONMENT_WINDOWS: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_TOOLCHAIN_FILE=C:/vcpkg/scripts/buildsystems/vcpkg.cmake" - CIBW_ENVIRONMENT_MACOS: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" + CIBW_ENVIRONMENT_MACOS: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DGGML_OPENMP=OFF -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" CIBW_BEFORE_ALL_MACOS: "brew install openblas" CIBW_BEFORE_ALL_WINDOWS: "vcpkg install openblas pkgconf" @@ -135,7 +135,7 @@ jobs: CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" else brew install openblas - CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" + CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DGGML_OPENMP=OFF -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" fi echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV python -m pip install --upgrade pip From 4a363c27458a8b97f4fb8798d6193039e085aacb Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 09:12:58 +0700 Subject: [PATCH 215/221] let's just use ACCELERATE on macos instead of BLAS --- .github/workflows/build-and-release.yaml | 15 +++++++++------ 1 file changed, 9 insertions(+), 6 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index ce5cad06c3..7556f5fa0e 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -34,8 +34,9 @@ jobs: sudo apt-get install -y libopenblas-dev CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" else - brew install openblas - CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DGGML_OPENMP=OFF -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" + #brew install openblas + #CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DGGML_OPENMP=OFF -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" + CMAKE_ARGS="$CMAKE_ARGS -DGGML_ACCELERATE=ON" fi echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV python -m pip install --upgrade pip @@ -96,9 +97,10 @@ jobs: CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" CIBW_ENVIRONMENT_LINUX: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" CIBW_ENVIRONMENT_WINDOWS: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_TOOLCHAIN_FILE=C:/vcpkg/scripts/buildsystems/vcpkg.cmake" - CIBW_ENVIRONMENT_MACOS: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DGGML_OPENMP=OFF -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" + CIBW_ENVIRONMENT_MACOS: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_ACCELERATE=ON" + #CIBW_ENVIRONMENT_MACOS: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DGGML_OPENMP=OFF -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" + #CIBW_BEFORE_ALL_MACOS: "brew install openblas" CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" - CIBW_BEFORE_ALL_MACOS: "brew install openblas" CIBW_BEFORE_ALL_WINDOWS: "vcpkg install openblas pkgconf" CIBW_BUILD: "cp39-* cp310-* cp311-* cp312-* cp313-* cp314-*" with: @@ -134,8 +136,9 @@ jobs: sudo apt-get install -y libopenblas-dev CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" else - brew install openblas - CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DGGML_OPENMP=OFF -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" + #brew install openblas + #CMAKE_ARGS="$CMAKE_ARGS -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DGGML_OPENMP=OFF -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" + CMAKE_ARGS="$CMAKE_ARGS -DGGML_ACCELERATE=ON" fi echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV python -m pip install --upgrade pip From fbe19bfa3ec4606db63833974c2892446eea943e Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 09:37:33 +0700 Subject: [PATCH 216/221] try with apt-get --- .github/workflows/build-and-release.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 7556f5fa0e..1953d9b2c3 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -63,7 +63,7 @@ jobs: # disable repair CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ENVIRONMENT: CMAKE_ARGS="${{ env.CMAKE_ARGS }}" #"-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" - CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" + CIBW_BEFORE_ALL_LINUX: "sudo apt-get install -y libopenblas-dev" # "yum install -y openblas-devel" #CIBW_BEFORE_ALL_MACOS: "brew install openblas" #CIBW_BEFORE_ALL_WINDOWS: "vcpkg install openblas pkgconf" with: From fb909eed21380cf682f50ebcd60b9f98e461f0ed Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 09:50:45 +0700 Subject: [PATCH 217/221] oops --- .github/workflows/build-and-release.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 1953d9b2c3..09ee9f6686 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -63,7 +63,7 @@ jobs: # disable repair CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ENVIRONMENT: CMAKE_ARGS="${{ env.CMAKE_ARGS }}" #"-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" - CIBW_BEFORE_ALL_LINUX: "sudo apt-get install -y libopenblas-dev" # "yum install -y openblas-devel" + CIBW_BEFORE_ALL_LINUX: "apt-get install -y libopenblas-dev" # "yum install -y openblas-devel" #CIBW_BEFORE_ALL_MACOS: "brew install openblas" #CIBW_BEFORE_ALL_WINDOWS: "vcpkg install openblas pkgconf" with: From 188a6d8c755ca6fbaad93551cb8f0ada895c3fef Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 10:13:32 +0700 Subject: [PATCH 218/221] use OS-aware openBLAS installation --- .github/workflows/build-and-release.yaml | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 09ee9f6686..a1da0e6def 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -63,9 +63,12 @@ jobs: # disable repair CIBW_REPAIR_WHEEL_COMMAND: "" CIBW_ENVIRONMENT: CMAKE_ARGS="${{ env.CMAKE_ARGS }}" #"-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" - CIBW_BEFORE_ALL_LINUX: "apt-get install -y libopenblas-dev" # "yum install -y openblas-devel" + CIBW_BEFORE_BUILD: "rm -rf build/ llama_cpp/lib/*.so" #CIBW_BEFORE_ALL_MACOS: "brew install openblas" #CIBW_BEFORE_ALL_WINDOWS: "vcpkg install openblas pkgconf" + CIBW_BEFORE_ALL_LINUX: >- + if command -v yum >/dev/null 2>&1; then yum install -y openblas-devel; + elif command -v apk >/dev/null 2>&1; then apk add openblas-dev; fi with: package-dir: . output-dir: wheelhouse From 088bceeae06db7b14e9b0ad695bc3a51734a49da Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 13:52:08 +0700 Subject: [PATCH 219/221] remove jobs with wheel duplicates --- .github/workflows/build-and-release.yaml | 45 +++--------------------- 1 file changed, 5 insertions(+), 40 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index a1da0e6def..024ad8d944 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -60,10 +60,12 @@ jobs: - name: Build wheels uses: pypa/cibuildwheel@v3.3.1 env: + CIBW_SKIP: "*musllinux*" + #CIBW_BUILD: "cp39-* cp310-* cp311-* cp312-* cp313-* cp314-*" # disable repair CIBW_REPAIR_WHEEL_COMMAND: "" - CIBW_ENVIRONMENT: CMAKE_ARGS="${{ env.CMAKE_ARGS }}" #"-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" - CIBW_BEFORE_BUILD: "rm -rf build/ llama_cpp/lib/*.so" + CIBW_ENVIRONMENT: CMAKE_ARGS="${{ env.CMAKE_ARGS }}" #-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF + CIBW_BEFORE_BUILD_LINUX: "rm -rf build/ llama_cpp/lib/*.so" #CIBW_BEFORE_ALL_MACOS: "brew install openblas" #CIBW_BEFORE_ALL_WINDOWS: "vcpkg install openblas pkgconf" CIBW_BEFORE_ALL_LINUX: >- @@ -77,44 +79,7 @@ jobs: with: name: wheels-${{ matrix.os }} path: ./wheelhouse/*.whl - - build_wheels_arm64: - name: Build arm64 wheels - runs-on: ubuntu-latest - steps: - - uses: actions/checkout@v4 - with: - submodules: "recursive" - - - name: Set up QEMU - uses: docker/setup-qemu-action@v3 - with: - platforms: linux/arm64 - - - name: Build wheels - uses: pypa/cibuildwheel@v3.3.1 - env: - CIBW_SKIP: "*musllinux* pp*" - CIBW_REPAIR_WHEEL_COMMAND: "" - CIBW_ARCHS: "aarch64" - CIBW_ENVIRONMENT: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF" - CIBW_ENVIRONMENT_LINUX: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" - CIBW_ENVIRONMENT_WINDOWS: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_TOOLCHAIN_FILE=C:/vcpkg/scripts/buildsystems/vcpkg.cmake" - CIBW_ENVIRONMENT_MACOS: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_ACCELERATE=ON" - #CIBW_ENVIRONMENT_MACOS: CMAKE_ARGS="-DCMAKE_OSX_ARCHITECTURES=arm64 -DCMAKE_APPLE_SILICON_PROCESSOR=arm64 -DCMAKE_CROSSCOMPILING=ON -DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DGGML_OPENMP=OFF -DCMAKE_PREFIX_PATH=/opt/homebrew/opt/openblas" - #CIBW_BEFORE_ALL_MACOS: "brew install openblas" - CIBW_BEFORE_ALL_LINUX: "yum install -y openblas-devel" - CIBW_BEFORE_ALL_WINDOWS: "vcpkg install openblas pkgconf" - CIBW_BUILD: "cp39-* cp310-* cp311-* cp312-* cp313-* cp314-*" - with: - output-dir: wheelhouse - - - name: Upload wheels as artifacts - uses: actions/upload-artifact@v4 - with: - name: wheels_arm64 - path: ./wheelhouse/*.whl - + build_sdist: name: Build source distribution runs-on: ubuntu-latest From f29e5a3121f3f3363fef10bfa6fe82d000f95173 Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 13:56:57 +0700 Subject: [PATCH 220/221] oops --- .github/workflows/build-and-release.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 024ad8d944..549301fbea 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -140,7 +140,7 @@ jobs: release: name: Release - needs: [build_wheels, build_wheels_arm64, build_sdist] + needs: [build_wheels, build_sdist] runs-on: ubuntu-latest steps: From 2b2d70336f1cdc5b12e8cda71a379842af80aeea Mon Sep 17 00:00:00 2001 From: AdamN <7974720+anr2me@users.noreply.github.com> Date: Thu, 26 Feb 2026 16:52:44 +0700 Subject: [PATCH 221/221] oops 2 --- .github/workflows/build-and-release.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/build-and-release.yaml b/.github/workflows/build-and-release.yaml index 549301fbea..0dba2e9177 100644 --- a/.github/workflows/build-and-release.yaml +++ b/.github/workflows/build-and-release.yaml @@ -50,7 +50,7 @@ jobs: #RUST_LOG: trace CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_TOOLCHAIN_FILE=C:/vcpkg/scripts/buildsystems/vcpkg.cmake" run: | - echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV + (echo CMAKE_ARGS=%CMAKE_ARGS%)>>%GITHUB_ENV% vcpkg install openblas pkgconf python -m pip install --upgrade pip python -m pip install uv @@ -121,7 +121,7 @@ jobs: #RUST_LOG: trace CMAKE_ARGS: "-DGGML_NATIVE=OFF -DLLAMA_NATIVE=OFF -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_TOOLCHAIN_FILE=C:/vcpkg/scripts/buildsystems/vcpkg.cmake" run: | - echo "CMAKE_ARGS=$CMAKE_ARGS" >> $GITHUB_ENV + (echo CMAKE_ARGS=%CMAKE_ARGS%)>>%GITHUB_ENV% vcpkg install openblas pkgconf python -m pip install --upgrade pip python -m pip install uv