From: Johannes Gäßler
Date: Wed, 1 Apr 2026 19:28:19 +0000 (+0200)
Subject: CUDA: fix FA kernel selection logic (#21271)
X-Git-Tag: upstream/0.0.8681~57
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=86221cf6dace86f47d896a38e0de652db4aa81a8;p=pkg%2Fggml%2Fsources%2Fllama.cpp

CUDA: fix FA kernel selection logic (#21271)
---

diff --git a/ggml/src/ggml-cuda/fattn.cu b/ggml/src/ggml-cuda/fattn.cu
index a21c53610..addf93205 100644
--- a/ggml/src/ggml-cuda/fattn.cu
+++ b/ggml/src/ggml-cuda/fattn.cu
@@ -340,7 +340,14 @@ static best_fattn_kernel ggml_cuda_get_best_fattn_kernel(const int device, const
         case 128:
         case 112:
         case 256:
+            if (V->ne[0] != K->ne[0]) {
+                return BEST_FATTN_KERNEL_NONE;
+            }
+            break;
         case 512:
+            if (V->ne[0] != K->ne[0]) {
+                return BEST_FATTN_KERNEL_NONE;
+            }
             if (!gqa_opt_applies) {
                 return BEST_FATTN_KERNEL_NONE;
             }