From: Alan Gray
Date: Sun, 13 Apr 2025 21:12:21 +0000 (+0100)
Subject: ggml: disable CUDA graphs for unsupported DUP and CONT node types (llama/12891)
X-Git-Tag: upstream/0.0.1982~34
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=32c2b99d96e9254f364fb912b51a8b891ca8b7ac;p=pkg%2Fggml%2Fsources%2Fggml

ggml: disable CUDA graphs for unsupported DUP and CONT node types (llama/12891)

Fixes #12798
---

diff --git a/src/ggml-cuda/ggml-cuda.cu b/src/ggml-cuda/ggml-cuda.cu
index fafe9633..4af18970 100644
--- a/src/ggml-cuda/ggml-cuda.cu
+++ b/src/ggml-cuda/ggml-cuda.cu
@@ -2488,10 +2488,10 @@ static bool check_node_graph_compatibility_and_refresh_copy_ops(ggml_backend_cud
 #endif
         }
 
-        if (node->op == GGML_OP_MUL_MAT_ID) {
+        if (node->op == GGML_OP_MUL_MAT_ID || node->op == GGML_OP_CONT || node->op == GGML_OP_DUP) {
             use_cuda_graph = false; // This node type is not supported by CUDA graph capture
 #ifndef NDEBUG
-            GGML_LOG_DEBUG("%s: disabling CUDA graphs due to mul_mat_id\n", __func__);
+            GGML_LOG_DEBUG("%s: disabling CUDA graphs due to unsupported node type\n", __func__);
 #endif
         }
 