git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
CANN: Replace aclrtMemsetSync with aclnnInplaceZero operator (#14002)
author: luyhcsu <redacted>
Fri, 4 Jul 2025 03:50:07 +0000 (11:50 +0800)
committer: GitHub <redacted>
Fri, 4 Jul 2025 03:50:07 +0000 (11:50 +0800)
Co-authored-by: luyuhong <redacted>
ggml/src/ggml-cann/aclnn_ops.cpp

index 69483de8f363ecf6b9ee3767b7920d44f4bdc818..4d5c2c182521f5ae77a3c4675a6b5428d232ee61 100755 (executable)
@@ -67,6 +67,7 @@
 #include <aclnnop/aclnn_pow.h>
 #include <aclnnop/aclnn_grouped_matmul_v3.h>
 #include <aclnnop/aclnn_fused_infer_attention_score_v2.h>
+#include <aclnnop/aclnn_zero.h>
 #include <float.h>
 
 #include <cmath>
@@ -804,10 +805,11 @@ static aclTensor* aclnn_zero(ggml_backend_cann_context& ctx, void* buffer,
         nb[i] = nb[i - 1] * ne[i - 1];
     }
 
-    ggml_cann_async_memset(ctx, buffer, n_bytes, 0);
     aclTensor* zero =
         ggml_cann_create_tensor(buffer, type, type_size, ne, nb, dims);
+    GGML_CANN_CALL_ACLNN_OP(ctx, InplaceZero, zero);
     return zero;
+    GGML_UNUSED(n_bytes);
 }
 
 /**