git.djapps.eu Git - pkg/ggml/sources/whisper.cpp/commitdiff
vulkan: tune MMVQ for Intel Windows (llama/19988)
author Ruben Ortlam <redacted>
Mon, 2 Mar 2026 14:58:25 +0000 (15:58 +0100)
committer Georgi Gerganov <redacted>
Mon, 16 Mar 2026 11:10:15 +0000 (13:10 +0200)
ggml/src/ggml-vulkan/ggml-vulkan.cpp

index 72b11d378a74a2a089705d043d9ccd017b22eee2..23d6d39e0e8c08270c2002841c5dee9ee5548495 100644 (file)
@@ -7574,6 +7574,18 @@ static bool ggml_vk_should_use_mmvq(const vk_device& device, uint32_t m, uint32_
             return false;
         }
 
+        if (device->driver_id == vk::DriverId::eIntelProprietaryWindows) {
+            // Intel Windows proprietary driver tuning
+            switch (src0_type) {
+            case GGML_TYPE_MXFP4:
+            case GGML_TYPE_Q4_K:
+            case GGML_TYPE_Q5_K:
+                return false;
+            default:
+                return true;
+            }
+        }
+
         switch (src0_type) {
         // From tests on A770 Linux, may need more tuning
         case GGML_TYPE_Q4_0: