git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
opencl: add `backend_synchronize` (#13939)
author lhez <redacted>
Mon, 2 Jun 2025 23:54:58 +0000 (16:54 -0700)
committer GitHub <redacted>
Mon, 2 Jun 2025 23:54:58 +0000 (16:54 -0700)
* This is not needed by the normal use where the result is read
  using `tensor_get`, but it allows perf mode of `test-backend-ops`
  to properly measure performance.

ggml/src/ggml-opencl/ggml-opencl.cpp

index 843acefc7152642201cab703010f2910c2c7e924..80a364380d05a7b5755cb0859ff8be624971655c 100644 (file)
@@ -2022,7 +2022,12 @@ static bool ggml_backend_opencl_cpy_tensor_async(ggml_backend_t backend, const g
 }
 
 static void ggml_backend_opencl_synchronize(ggml_backend_t backend) {
-    GGML_UNUSED(backend);
+    auto * backend_ctx = static_cast<ggml_backend_opencl_context *>(backend->context);
+
+    cl_event evt;
+    CL_CHECK(clEnqueueBarrierWithWaitList(backend_ctx->queue, 0, nullptr, &evt));
+    CL_CHECK(clWaitForEvents(1, &evt));
+    CL_CHECK(clReleaseEvent(evt));
 }
 
 // Syncronizes the 'backend_ctx's device with others so that commands
@@ -2225,7 +2230,7 @@ static ggml_backend_i ggml_backend_opencl_i = {
     /* .set_tensor_async        = */ NULL,  /* ggml_backend_opencl_set_tensor_async */
     /* .get_tensor_async        = */ NULL,  /* ggml_backend_opencl_get_tensor_async */
     /* .cpy_tensor_async        = */ NULL,  /* ggml_backend_opencl_cpy_tensor_async */
-    /* .synchronize             = */ NULL,  /* ggml_backend_opencl_synchronize */
+    /* .synchronize             = */ ggml_backend_opencl_synchronize,
     /* .graph_plan_create       = */ NULL,
     /* .graph_plan_free         = */ NULL,
     /* .graph_plan_update       = */ NULL,