git.djapps.eu Git - pkg/ggml/sources/whisper.cpp/commitdiff
ggml: disable CUDA graphs for unsupported DUP and CONT node types (llama/12891)
author: Alan Gray <redacted>
Sun, 13 Apr 2025 21:12:21 +0000 (22:12 +0100)
committer: Georgi Gerganov <redacted>
Thu, 24 Apr 2025 17:39:16 +0000 (20:39 +0300)
Fixes #12798

ggml/src/ggml-cuda/ggml-cuda.cu

index fafe9633e202796d08ef988447143af712f6722c..4af1897017567205d842dfa0ffca75d87de78e24 100644 (file)
@@ -2488,10 +2488,10 @@ static bool check_node_graph_compatibility_and_refresh_copy_ops(ggml_backend_cud
 #endif
         }
 
-        if (node->op == GGML_OP_MUL_MAT_ID) {
+        if (node->op == GGML_OP_MUL_MAT_ID || node->op == GGML_OP_CONT || node->op == GGML_OP_DUP) {
             use_cuda_graph = false; // This node type is not supported by CUDA graph capture
 #ifndef NDEBUG
-            GGML_LOG_DEBUG("%s: disabling CUDA graphs due to mul_mat_id\n", __func__);
+            GGML_LOG_DEBUG("%s: disabling CUDA graphs due to unsupported node type\n", __func__);
 #endif
         }