return;
}
+ {
+ constexpr int cols_per_block = ncols2*2;
+ const int nwarps = ggml_sycl_fattn_tile_get_nthreads (DKQ, DV, cols_per_block, cc) / warp_size;
+ const int nbatch_fa = ggml_sycl_fattn_tile_get_nbatch_fa(DKQ, DV, cols_per_block, cc);
+ launch_fattn<DV, cols_per_block/ncols2, ncols2,
+ flash_attn_tile<DKQ, DV, cols_per_block / ncols2, ncols2, use_logit_softcap, warp_size>, warp_size>
+ (ctx, dst, nwarps, nbytes_shared, nbatch_fa, true, true, false);
+ return;
+ }
+
GGML_ABORT("fatal error");
}