git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
sycl : handle other FA case (#21377)
author Neo Zhang <redacted>
Mon, 6 Apr 2026 10:28:00 +0000 (18:28 +0800)
committer GitHub <redacted>
Mon, 6 Apr 2026 10:28:00 +0000 (13:28 +0300)
ggml/src/ggml-sycl/fattn-tile.hpp

index c4d24613a5577dd9373637b144b1574a1c114ae7..b4d4e0ae90e3ff97d98ed3b8158f0021c158bbb7 100644 (file)
@@ -1252,6 +1252,16 @@ static void launch_fattn_tile_switch_ncols1(ggml_backend_sycl_context & ctx, ggm
         return;
     }
 
+    {
+        constexpr int cols_per_block = ncols2*2;
+        const int nwarps    = ggml_sycl_fattn_tile_get_nthreads (DKQ, DV, cols_per_block, cc) / warp_size;
+        const int nbatch_fa = ggml_sycl_fattn_tile_get_nbatch_fa(DKQ, DV, cols_per_block, cc);
+        launch_fattn<DV, cols_per_block/ncols2, ncols2,
+            flash_attn_tile<DKQ, DV, cols_per_block / ncols2, ncols2, use_logit_softcap, warp_size>, warp_size>
+            (ctx, dst, nwarps, nbytes_shared, nbatch_fa, true, true, false);
+        return;
+    }
+
     GGML_ABORT("fatal error");
 }