class ClipVision:
    PROJECTOR_TYPE = "clip.vision.projector_type"  # for models with mixed modalities
    IMAGE_SIZE = "clip.vision.image_size"
+    IMAGE_MIN_PIXELS = "clip.vision.image_min_pixels"
+    IMAGE_MAX_PIXELS = "clip.vision.image_max_pixels"
    PREPROC_IMAGE_SIZE = "clip.vision.preproc_image_size"
    PATCH_SIZE = "clip.vision.patch_size"
    EMBEDDING_LENGTH = "clip.vision.embedding_length"
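The two new keys bound the pixel budget for dynamic-resolution image preprocessing. As a rough sketch of how a preprocessor might consume them (the `smart_resize` name and the exact rounding policy are illustrative assumptions, not code from this change):

```python
import math

def smart_resize(height: int, width: int, patch_size: int,
                 min_pixels: int, max_pixels: int) -> tuple[int, int]:
    # Illustrative assumption: rescale so the total pixel count falls
    # inside [min_pixels, max_pixels] while keeping the aspect ratio.
    area = height * width
    if area > max_pixels:
        scale = math.sqrt(area / max_pixels)
        height, width = int(height / scale), int(width / scale)
    elif area < min_pixels:
        scale = math.sqrt(min_pixels / area)
        height, width = math.ceil(height * scale), math.ceil(width * scale)
    # Snap both sides to the patch grid; this can nudge the area slightly
    # outside the budget, which a real implementation would re-check.
    height = max(patch_size, round(height / patch_size) * patch_size)
    width = max(patch_size, round(width / patch_size) * patch_size)
    return height, width
```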
    def add_vision_image_size(self, value: int) -> None:
        self.add_uint32(Keys.ClipVision.IMAGE_SIZE, value)

+    def add_vision_min_pixels(self, value: int) -> None:
+        self.add_uint32(Keys.ClipVision.IMAGE_MIN_PIXELS, value)
+
+    def add_vision_max_pixels(self, value: int) -> None:
+        self.add_uint32(Keys.ClipVision.IMAGE_MAX_PIXELS, value)
+
    def add_vision_preproc_image_size(self, value: int) -> None:
        self.add_uint32(Keys.ClipVision.PREPROC_IMAGE_SIZE, value)
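For context, a converter would call the new setters next to the existing image-size one. A minimal usage sketch, where the file path, `arch` value, and pixel budgets are made-up illustrative values:

```python
from gguf import GGUFWriter

writer = GGUFWriter("vision-model.gguf", arch="clip")  # illustrative path and arch
writer.add_vision_image_size(1024)
writer.add_vision_min_pixels(56 * 56)          # e.g. smallest accepted pixel budget
writer.add_vision_max_pixels(28 * 28 * 1280)   # e.g. largest budget before downscaling
writer.write_header_to_file()
writer.write_kv_data_to_file()
writer.close()
```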
// vision-specific
#define KEY_VISION_PROJ_TYPE "clip.vision.projector_type" // for models with mixed modalities
#define KEY_IMAGE_SIZE "clip.vision.image_size"
+#define KEY_IMAGE_MIN_PIXELS "clip.vision.image_min_pixels"
+#define KEY_IMAGE_MAX_PIXELS "clip.vision.image_max_pixels"
#define KEY_PREPROC_IMAGE_SIZE "clip.vision.preproc_image_size"
#define KEY_PATCH_SIZE "clip.vision.patch_size"
#define KEY_IMAGE_MEAN "clip.vision.image_mean"
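The C defines mirror the Python key strings, so a file written as above can be checked from Python with gguf's reader. A quick sketch, where the file name is illustrative and the `parts`/`data` indexing assumes a scalar uint32 field:

```python
from gguf import GGUFReader

reader = GGUFReader("vision-model.gguf")  # illustrative path
for key in ("clip.vision.image_min_pixels", "clip.vision.image_max_pixels"):
    field = reader.get_field(key)
    if field is not None:
        # for a scalar field, the single value sits in the part
        # indexed by field.data[0]
        print(key, "=", int(field.parts[field.data[0]][0]))
```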