vulkan: Set limit for task concurrency (#5427)

author Neuman Vong <redacted>

Fri, 9 Feb 2024 18:30:19 +0000 (05:30 +1100)

committer GitHub <redacted>

Fri, 9 Feb 2024 18:30:19 +0000 (19:30 +0100)
author Neuman Vong <redacted>
Fri, 9 Feb 2024 18:30:19 +0000 (05:30 +1100)
committer GitHub <redacted>
Fri, 9 Feb 2024 18:30:19 +0000 (19:30 +0100)
diff --git a/ggml_vk_generate_shaders.py b/ggml_vk_generate_shaders.py

index 4abb0383f2d5dce7c347ec5db65ddcb51ffaeff7..b2e86e18213057243b5f0e46f4a53bc820f6ed95 100644 (file)
--- a/ggml_vk_generate_shaders.py
+++ b/ggml_vk_generate_shaders.py
@@ -2067,6 +2067,8 @@ type_names = {
  
  K_QUANTS_PER_ITERATION = 2
  
+ASYNCIO_CONCURRENCY = 64
+
  output_dir = gettempdir()
  
  lock = asyncio.Lock()
@@ -2291,7 +2293,14 @@ async def main():
      tasks.append(string_to_spv("rope_neox_f32", rope_neox_src, {"A_TYPE": "float", "D_TYPE": "float"}))
      tasks.append(string_to_spv("rope_neox_f16", rope_neox_src, {"A_TYPE": "float16_t", "D_TYPE": "float16_t"}))
  
-    await asyncio.gather(*tasks)
+    # Helper that awaits the given awaitable only while holding the semaphore.
+    async def withSemaphore(sem, task):
+        async with sem:
+            return await task
+
+    # Run tasks concurrently guarded by a concurrency limit.
+    sem = asyncio.Semaphore(ASYNCIO_CONCURRENCY)
+    await asyncio.gather(*(withSemaphore(sem, task) for task in tasks))
  
      with open("ggml-vulkan-shaders.hpp", "w") as f:
          f.write("#include <cstdint>\n\n")
author	Neuman Vong <redacted>
	Fri, 9 Feb 2024 18:30:19 +0000 (05:30 +1100)
committer	GitHub <redacted>
	Fri, 9 Feb 2024 18:30:19 +0000 (19:30 +0100)