From: Alan Gray
Date: Sun, 13 Apr 2025 21:12:21 +0000 (+0100)
Subject: ggml: disable CUDA graphs for unsupported DUP and CONT node types (#12891)
X-Git-Tag: gguf-v0.16.1~28
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=307bfa253dea07c9270e78fa53b133504e9c3c9d;p=pkg%2Fggml%2Fsources%2Fllama.cpp

ggml: disable CUDA graphs for unsupported DUP and CONT node types (#12891)

Fixes #12798
---

diff --git a/ggml/src/ggml-cuda/ggml-cuda.cu b/ggml/src/ggml-cuda/ggml-cuda.cu
index fafe9633..4af18970 100644
--- a/ggml/src/ggml-cuda/ggml-cuda.cu
+++ b/ggml/src/ggml-cuda/ggml-cuda.cu
@@ -2488,10 +2488,10 @@ static bool check_node_graph_compatibility_and_refresh_copy_ops(ggml_backend_cud
 #endif
         }
 
-        if (node->op == GGML_OP_MUL_MAT_ID) {
+        if (node->op == GGML_OP_MUL_MAT_ID || node->op == GGML_OP_CONT || node->op == GGML_OP_DUP) {
             use_cuda_graph = false; // This node type is not supported by CUDA graph capture
 #ifndef NDEBUG
-            GGML_LOG_DEBUG("%s: disabling CUDA graphs due to mul_mat_id\n", __func__);
+            GGML_LOG_DEBUG("%s: disabling CUDA graphs due to unsupported node type\n", __func__);
 #endif
         }
 