CUDA: Changing the CUDA scheduling strategy to spin (#16585)

author Julius Tischbein <redacted>

Wed, 15 Oct 2025 11:54:15 +0000 (13:54 +0200)

committer GitHub <redacted>

Wed, 15 Oct 2025 11:54:15 +0000 (14:54 +0300)
author Julius Tischbein <redacted>
Wed, 15 Oct 2025 11:54:15 +0000 (13:54 +0200)
committer GitHub <redacted>
Wed, 15 Oct 2025 11:54:15 +0000 (14:54 +0300)
diff --git a/ggml/src/ggml-cuda/ggml-cuda.cu b/ggml/src/ggml-cuda/ggml-cuda.cu

index da312992c80390be16b44cd27bdc44afd38d491f..a5e77672f6e95e2fdd0531a5ef39bfb86bb47951 100644 (file)
--- a/ggml/src/ggml-cuda/ggml-cuda.cu
+++ b/ggml/src/ggml-cuda/ggml-cuda.cu
@@ -273,6 +273,15 @@ static ggml_cuda_device_info ggml_cuda_init() {
          } else if (device_name.substr(0, 21) == "NVIDIA GeForce GTX 16") {
              turing_devices_without_mma.push_back({ id, device_name });
          }
+
+        // Temporary performance fix:
+        // Setting device scheduling strategy for iGPUs with cc121 to "spinning" to avoid delays in cuda synchronize calls.
+        // TODO: Check for future drivers the default scheduling strategy and
+        // remove this call again when cudaDeviceScheduleSpin is default.
+        if (prop.major == 12 && prop.minor == 1) {
+            CUDA_CHECK(cudaSetDeviceFlags(cudaDeviceScheduleSpin));
+        }
+
  #endif  // defined(GGML_USE_HIP)
      }
author	Julius Tischbein <redacted>
	Wed, 15 Oct 2025 11:54:15 +0000 (13:54 +0200)
committer	GitHub <redacted>
	Wed, 15 Oct 2025 11:54:15 +0000 (14:54 +0300)