From: wangshuai09
Date: Mon, 5 Aug 2024 13:10:37 +0000 (+0800)
Subject: cann: fix buffer_num and runtime speed slowly error (llama/8865)
X-Git-Tag: upstream/0.0.1642~465
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=70f29c767ef2ab725c9570cb1ee72b5475f42712;p=pkg%2Fggml%2Fsources%2Fggml

cann: fix buffer_num and runtime speed slowly error (llama/8865)
---

diff --git a/ggml/src/ggml-cann.cpp b/ggml/src/ggml-cann.cpp
index a15bc8aa..81783b7b 100644
--- a/ggml/src/ggml-cann.cpp
+++ b/ggml/src/ggml-cann.cpp
@@ -1670,10 +1670,6 @@ GGML_CALL static bool ggml_backend_cann_supports_op(ggml_backend_t backend,
                     // TODO: fix me
                     // Current groupsize should not be greater than k-1 in
                     // aclnnWeightQuantBatchMatmulV2GetWorkspaceSize().
-                    if (op->src[0]->ne[0]-1 > QK8_0) {
-                        return true;
-                    }
-                    return false;
                 case GGML_TYPE_Q4_0:
                     return true;
                 default: