git.djapps.eu Git - pkg/ggml/sources/ggml/commitdiff
cann: fix buffer_num and runtime speed slowly error (llama/8865)
author wangshuai09 <redacted>
Mon, 5 Aug 2024 13:10:37 +0000 (21:10 +0800)
committer Georgi Gerganov <redacted>
Thu, 8 Aug 2024 10:45:29 +0000 (13:45 +0300)
ggml/src/ggml-cann.cpp

index a15bc8aa29fcb7649ab8de260e5b8d05237053c7..81783b7b147dd48397390c77b18ab796c1e7c058 100644 (file)
@@ -1670,10 +1670,6 @@ GGML_CALL static bool ggml_backend_cann_supports_op(ggml_backend_t backend,
                     // TODO: fix me
                     // Current groupsize should not be greater than k-1 in
                     // aclnnWeightQuantBatchMatmulV2GetWorkspaceSize().
-                    if (op->src[0]->ne[0]-1 > QK8_0) {
-                        return true;
-                    }
-                    return false;
                 case GGML_TYPE_Q4_0:
                     return true;
                 default: