From: Meng, Hengyu Date: Tue, 25 Jun 2024 02:19:20 +0000 (+0800) Subject: [SYCL] Re-enabled mul_mat_batched_sycl (#8095) X-Git-Tag: upstream/0.0.4488~1268 X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=083bacce14c1aaf9976aa40e8266cdc25ac749d3;p=pkg%2Fggml%2Fsources%2Fllama.cpp [SYCL] Re-enabled mul_mat_batched_sycl (#8095) --- diff --git a/ggml-sycl.cpp b/ggml-sycl.cpp index e5ddf4a3..db045336 100644 --- a/ggml-sycl.cpp +++ b/ggml-sycl.cpp @@ -4620,7 +4620,7 @@ static void ggml_sycl_mul_mat(ggml_backend_sycl_context & ctx, const ggml_tensor } else if (!split && src0->type == GGML_TYPE_F16 && !ggml_is_contiguous(src0) && !ggml_is_transposed(src1) && src1->ne[1] == 1) { // KQV single-batch ggml_sycl_mul_mat_vec_nc(ctx, src0, src1, dst); - } else if (!split && src0->type == GGML_TYPE_F16 && (src1->type == GGML_TYPE_F16) && !ggml_is_transposed(src0) && !ggml_is_transposed(src1) && src1->ne[2]*src1->ne[3] > 1) { + } else if (!split && src0->type == GGML_TYPE_F16 && !ggml_is_transposed(src0) && !ggml_is_transposed(src1) && src1->ne[2]*src1->ne[3] > 1) { // KQ + KQV multi-batch ggml_sycl_mul_mat_batched_sycl(ctx, src0, src1, dst); } else if (use_dequantize_mul_mat_vec) {