From 2fc4fa9843c0ecb0ba97239bbcdc6f357f95ffc9 Mon Sep 17 00:00:00 2001 From: turboderp <11859846+turboderp@users.noreply.github.com> Date: Sun, 12 Apr 2026 13:56:50 +0200 Subject: [PATCH] Build actions: Remove Torch 2.7-2.8 wheels for Python 3.14 --- .github/workflows/build.yml | 4 ---- exllamav3/exllamav3_ext/softcap.cu | 2 +- 2 files changed, 1 insertion(+), 5 deletions(-) diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index 960aea6..dcdcae5 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -52,8 +52,6 @@ jobs: - { artname: 'wheel', os: ubuntu-22.04, pyver: '3.13.3', cuda: '12.8.1', rocm: '', torch: '2.11.0', cudaarch: '8.0 8.6 8.9 9.0 10.0 12.0+PTX' } # Python 3.14 - - { artname: 'wheel', os: ubuntu-22.04, pyver: '3.14', cuda: '12.8.1', rocm: '', torch: '2.7.0', cudaarch: '8.0 8.6 8.9 9.0 10.0 12.0+PTX' } - - { artname: 'wheel', os: ubuntu-22.04, pyver: '3.14', cuda: '12.8.1', rocm: '', torch: '2.8.0', cudaarch: '8.0 8.6 8.9 9.0 10.0 12.0+PTX' } - { artname: 'wheel', os: ubuntu-22.04, pyver: '3.14', cuda: '12.8.1', rocm: '', torch: '2.9.0', cudaarch: '8.0 8.6 8.9 9.0 10.0 12.0+PTX' } - { artname: 'wheel', os: ubuntu-22.04, pyver: '3.14', cuda: '12.8.1', rocm: '', torch: '2.10.0', cudaarch: '8.0 8.6 8.9 9.0 10.0 12.0+PTX' } - { artname: 'wheel', os: ubuntu-22.04, pyver: '3.14', cuda: '12.8.1', rocm: '', torch: '2.11.0', cudaarch: '8.0 8.6 8.9 9.0 10.0 12.0+PTX' } @@ -87,8 +85,6 @@ jobs: - { artname: 'wheel', os: windows-2022, pyver: '3.13.3', cuda: '12.8.1', rocm: '', torch: '2.11.0', cudaarch: '8.0 8.6 8.9 9.0 10.0 12.0+PTX' } # Python 3.14 - - { artname: 'wheel', os: windows-2022, pyver: '3.14', cuda: '12.8.1', rocm: '', torch: '2.7.0', cudaarch: '8.0 8.6 8.9 9.0 10.0 12.0+PTX' } - - { artname: 'wheel', os: windows-2022, pyver: '3.14', cuda: '12.8.1', rocm: '', torch: '2.8.0', cudaarch: '8.0 8.6 8.9 9.0 10.0 12.0+PTX' } - { artname: 'wheel', os: windows-2022, pyver: '3.14', cuda: '12.8.1', rocm: '', torch: '2.9.0', cudaarch: '8.0 8.6 8.9 9.0 10.0 12.0+PTX' } - { artname: 'wheel', os: windows-2022, pyver: '3.14', cuda: '12.8.1', rocm: '', torch: '2.10.0', cudaarch: '8.0 8.6 8.9 9.0 10.0 12.0+PTX' } - { artname: 'wheel', os: windows-2022, pyver: '3.14', cuda: '12.8.1', rocm: '', torch: '2.11.0', cudaarch: '8.0 8.6 8.9 9.0 10.0 12.0+PTX' } diff --git a/exllamav3/exllamav3_ext/softcap.cu b/exllamav3/exllamav3_ext/softcap.cu index 2c6a2ef..c54c81b 100644 --- a/exllamav3/exllamav3_ext/softcap.cu +++ b/exllamav3/exllamav3_ext/softcap.cu @@ -16,7 +16,7 @@ __global__ void softcap_kernel const float scale ) { - uint64_t idx = (uint64_t)blockIdx.x * NUM_THREADS + (uint64_t)threadIdx.x; + uint64_t idx = (uint64_t)blockIdx.x * blockDim.x + (uint64_t)threadIdx.x; if (idx >= numel) return; float v = x[idx];