Fix new CUDA FA on Touring (#413)

Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
2026-01-26 17:20:01 +00:00 · 2025-05-12 15:09:33 +03:00
parent ceb8f513e4
commit be1d5c4b7e
1 changed files with 2 additions and 2 deletions
--- a/ggml/src/ggml-cuda/fattn-new-mma.cu
+++ b/ggml/src/ggml-cuda/fattn-new-mma.cu
@@ -273,11 +273,11 @@ struct fattn_mma_f16_config<576, 512> {
    }

    static constexpr __device__ int get_nbatch_V2_device(int ncols) {
-#if __CUDA_ARCH__ == GML_CUDA_CC_TURING
+#if __CUDA_ARCH__ == CC_TURING
        return ncols <= 16 ? 64 : 128;
 #else
        return ncols <= 16 ? 256 : 128;
-#endif // __CUDA_ARCH__ == GML_CUDA_CC_TURING
+#endif // __CUDA_ARCH__ == CC_TURING
    }

    static int get_nbatch_combine_host(const int /*cc*/, const int /*ncols*/) {