Updates to webgpu get_memory (#18707)

author Reese Levine <redacted>

Fri, 9 Jan 2026 16:17:18 +0000 (08:17 -0800)

committer GitHub <redacted>

Fri, 9 Jan 2026 16:17:18 +0000 (08:17 -0800)
author Reese Levine <redacted>
Fri, 9 Jan 2026 16:17:18 +0000 (08:17 -0800)
committer GitHub <redacted>
Fri, 9 Jan 2026 16:17:18 +0000 (08:17 -0800)
diff --git a/ggml/src/ggml-webgpu/ggml-webgpu.cpp b/ggml/src/ggml-webgpu/ggml-webgpu.cpp

index f64f94b96f04f3bb2e4213adf79c6f001c4a6011..5b8f7f72d5713f361117063b0256148404a3b41c 100644 (file)
--- a/ggml/src/ggml-webgpu/ggml-webgpu.cpp
+++ b/ggml/src/ggml-webgpu/ggml-webgpu.cpp
@@ -19,6 +19,7 @@
  
  #include <atomic>
  #include <condition_variable>
+#include <cstdint>
  #include <cstring>
  #include <iostream>
  #include <map>
@@ -1880,9 +1881,18 @@ static const char * ggml_backend_webgpu_device_get_description(ggml_backend_dev_
  
  static void ggml_backend_webgpu_device_get_memory(ggml_backend_dev_t dev, size_t * free, size_t * total) {
      ggml_backend_webgpu_device_context * ctx = static_cast<ggml_backend_webgpu_device_context *>(dev->context);
-    // TODO: what do we actually want to return here? maxBufferSize might not be the full available memory.
-    *free                                    = ctx->webgpu_ctx->limits.maxBufferSize;
-    *total                                   = ctx->webgpu_ctx->limits.maxBufferSize;
+    // TODO: for now, return maxBufferSize as both free and total memory
+    // Track https://github.com/gpuweb/gpuweb/issues/5505 for updates.
+    uint64_t max_buffer_size = ctx->webgpu_ctx->limits.maxBufferSize;
+    // If we're on a 32-bit system, clamp to UINTPTR_MAX
+#if UINTPTR_MAX < UINT64_MAX
+    uint64_t max_ptr_size = static_cast<uint64_t>(UINTPTR_MAX);
+    if (max_buffer_size > max_ptr_size) {
+        max_buffer_size = max_ptr_size;
+    }
+#endif
+    *free  = static_cast<size_t>(max_buffer_size);
+    *total = static_cast<size_t>(max_buffer_size);
  }
  
  static enum ggml_backend_dev_type ggml_backend_webgpu_device_get_type(ggml_backend_dev_t dev) {
author	Reese Levine <redacted>
	Fri, 9 Jan 2026 16:17:18 +0000 (08:17 -0800)
committer	GitHub <redacted>
	Fri, 9 Jan 2026 16:17:18 +0000 (08:17 -0800)