Mtmd: add a way to select device for vision encoder (#14236)

author stduhpf <redacted>
Tue, 22 Jul 2025 10:51:03 +0000 (12:51 +0200)

committer GitHub <redacted>
Tue, 22 Jul 2025 10:51:03 +0000 (12:51 +0200)

diff --git a/tools/mtmd/clip.cpp b/tools/mtmd/clip.cpp

index 9146c9e9c448124e8ff7affaec4ec271cf6713e6..be191404cfc7506cb4d992b90d8801153dcedbf5 100644 (file)
--- a/tools/mtmd/clip.cpp
+++ b/tools/mtmd/clip.cpp
@@ -367,8 +367,8 @@ struct clip_ctx {
      std::vector<ggml_backend_t> backend_ptrs;
      std::vector<ggml_backend_buffer_type_t> backend_buft;
  
-    ggml_backend_t backend;
-    ggml_backend_t backend_cpu;
+    ggml_backend_t backend = nullptr;
+    ggml_backend_t backend_cpu = nullptr;
      ggml_backend_buffer_ptr buf;
  
      int max_nodes = 8192;
@@ -384,9 +384,18 @@ struct clip_ctx {
          if (!backend_cpu) {
              throw std::runtime_error("failed to initialize CPU backend");
          }
-        backend = ctx_params.use_gpu
-                    ? ggml_backend_init_by_type(GGML_BACKEND_DEVICE_TYPE_GPU, nullptr)
-                    : nullptr;
+        if (ctx_params.use_gpu) {
+            auto backend_name = std::getenv("MTMD_BACKEND_DEVICE");
+            if (backend_name != nullptr) {
+                backend = ggml_backend_init_by_name(backend_name, nullptr);
+                if (!backend) {
+                    LOG_WRN("%s: Warning: Failed to initialize \"%s\" backend, falling back to default GPU backend\n", __func__, backend_name);
+                }
+            }
+            if (!backend) {
+                backend = ggml_backend_init_by_type(GGML_BACKEND_DEVICE_TYPE_GPU, nullptr);
+            }
+        }
  
          if (backend) {
              LOG_INF("%s: CLIP using %s backend\n", __func__, ggml_backend_name(backend));
author	stduhpf <redacted>
	Tue, 22 Jul 2025 10:51:03 +0000 (12:51 +0200)
committer	GitHub <redacted>
	Tue, 22 Jul 2025 10:51:03 +0000 (12:51 +0200)