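CUDA: fix DEBUG_CUDA_MALLOC (llama/5729)

The logging statements guarded by `#ifdef DEBUG_CUDA_MALLOC` in the CUDA pool
allocator referred to the device index as `id`, while the enclosing functions
(`ggml_cuda_pool_malloc_leg`, `ggml_cuda_pool_malloc_vmm`,
`ggml_cuda_pool_free_vmm`) receive it as the parameter `device`. The log
statements now use `device`. The "allocated" message in
`ggml_cuda_pool_malloc_vmm` also drops a trailing `[%s]` conversion that had no
corresponding argument.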

author Johannes Gäßler <redacted>

Mon, 26 Feb 2024 14:36:38 +0000 (15:36 +0100)

committer Georgi Gerganov <redacted>

Wed, 28 Feb 2024 11:00:29 +0000 (13:00 +0200)
author Johannes Gäßler <redacted>
Mon, 26 Feb 2024 14:36:38 +0000 (15:36 +0100)
committer Georgi Gerganov <redacted>
Wed, 28 Feb 2024 11:00:29 +0000 (13:00 +0200)
diff --git a/ggml-cuda.cu b/ggml-cuda.cu

index adad7e0fb333bad42dcffe9c36e51e64d8f8dcde..31736fd1b300f805dc2de88592951e688ce7395c 100644 (file)
--- a/ggml-cuda.cu
+++ b/ggml-cuda.cu
@@ -8079,8 +8079,8 @@ static void * ggml_cuda_pool_malloc_leg(int device, size_t size, size_t * actual
      *actual_size = look_ahead_size;
      g_cuda_pool_size[device] += look_ahead_size;
  #ifdef DEBUG_CUDA_MALLOC
-    fprintf(stderr, "%s[%d]: %d buffers, max_size = %u MB, pool_size = %u MB, requested %u MB\n", __func__, id, nnz,
-            (uint32_t)(max_size/1024/1024), (uint32_t)(g_cuda_pool_size[id]/1024/1024), (uint32_t)(size/1024/1024));
+    fprintf(stderr, "%s[%d]: %d buffers, max_size = %u MB, pool_size = %u MB, requested %u MB\n", __func__, device, nnz,
+            (uint32_t)(max_size/1024/1024), (uint32_t)(g_cuda_pool_size[device]/1024/1024), (uint32_t)(size/1024/1024));
  #endif
      return ptr;
  }
@@ -8166,7 +8166,7 @@ static void * ggml_cuda_pool_malloc_vmm(int device, size_t size, size_t * actual
      g_cuda_pool_used[device] += size;
  
  #ifdef DEBUG_CUDA_MALLOC
-    printf("cuda pool[%d]: allocated %llu bytes at %llx [%s]\n", id, (unsigned long long) size, ptr);
+    printf("cuda pool[%d]: allocated %llu bytes at %llx\n", device, (unsigned long long) size, ptr);
  #endif
  
      return ptr;
@@ -8176,7 +8176,7 @@ static void ggml_cuda_pool_free_vmm(int device, void * ptr, size_t size) {
      scoped_spin_lock lock(g_cuda_pool_lock);
  
  #ifdef DEBUG_CUDA_MALLOC
-    printf("cuda pool[%d]: freed %llu bytes at %llx\n", id, (unsigned long long) size, ptr);
+    printf("cuda pool[%d]: freed %llu bytes at %llx\n", device, (unsigned long long) size, ptr);
  #endif
  
      g_cuda_pool_used[device] -= size;
author	Johannes Gäßler <redacted>
	Mon, 26 Feb 2024 14:36:38 +0000 (15:36 +0100)
committer	Georgi Gerganov <redacted>
	Wed, 28 Feb 2024 11:00:29 +0000 (13:00 +0200)