git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
ggml-cuda: disable gdn for musa (#20278)
author Aman Gupta <redacted>
Mon, 9 Mar 2026 08:15:36 +0000 (16:15 +0800)
committer GitHub <redacted>
Mon, 9 Mar 2026 08:15:36 +0000 (16:15 +0800)
ggml/src/ggml-cuda/ggml-cuda.cu

index 0fafaf009318de3385423188b48214c7352a0810..cda275b8c580613aa77a8b5026d9c0ea4cd64c7f 100644 (file)
@@ -4992,9 +4992,15 @@ static bool ggml_backend_cuda_device_supports_op(ggml_backend_dev_t dev, const g
         case GGML_OP_LEAKY_RELU:
         case GGML_OP_RWKV_WKV6:
         case GGML_OP_GATED_LINEAR_ATTN:
-        case GGML_OP_GATED_DELTA_NET:
         case GGML_OP_RWKV_WKV7:
             return true;
+        case GGML_OP_GATED_DELTA_NET:
+            //TODO: enable once MUSA compiler is solved https://github.com/ggml-org/llama.cpp/pull/19504#issuecomment-4018634327
+#ifdef GGML_USE_MUSA
+            return false;
+#else
+            return true;
+#endif // GGML_USE_MUSA
         case GGML_OP_FLASH_ATTN_EXT:
             return ggml_cuda_flash_attn_ext_supported(dev_ctx->device, op);
         case GGML_OP_CROSS_ENTROPY_LOSS: