git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
mtmd: add min/max pixels gguf metadata (#19273)
author: Xuan-Son Nguyen <redacted>
Mon, 2 Feb 2026 19:59:06 +0000 (20:59 +0100)
committer: GitHub <redacted>
Mon, 2 Feb 2026 19:59:06 +0000 (20:59 +0100)
gguf-py/gguf/constants.py
gguf-py/gguf/gguf_writer.py
tools/mtmd/clip-impl.h

index 31273b2b5a715278496c44357582e9eaa9ab9cc3..6f56d36c59f8da9586c63355657fda0492ec138e 100644 (file)
@@ -284,6 +284,8 @@ class Keys:
     class ClipVision:
         PROJECTOR_TYPE      = "clip.vision.projector_type" # for mixed modality models
         IMAGE_SIZE          = "clip.vision.image_size"
+        IMAGE_MIN_PIXELS    = "clip.vision.image_min_pixels"
+        IMAGE_MAX_PIXELS    = "clip.vision.image_max_pixels"
         PREPROC_IMAGE_SIZE  = "clip.vision.preproc_image_size"
         PATCH_SIZE          = "clip.vision.patch_size"
         EMBEDDING_LENGTH    = "clip.vision.embedding_length"
index 7fbb78866bcb45fb387922f79ed0793498b590dd..0b9c650161e53880ac577aa9323e230f8dd3bd14 100644 (file)
@@ -1113,6 +1113,12 @@ class GGUFWriter:
     def add_vision_image_size(self, value: int) -> None:
         self.add_uint32(Keys.ClipVision.IMAGE_SIZE, value)
 
+    def add_vision_max_pixels(self, value: int) -> None:
+        self.add_uint32(Keys.ClipVision.IMAGE_MAX_PIXELS, value)
+
+    def add_vision_min_pixels(self, value: int) -> None:
+        self.add_uint32(Keys.ClipVision.IMAGE_MIN_PIXELS, value)
+
     def add_vision_preproc_image_size(self, value: int) -> None:
         self.add_uint32(Keys.ClipVision.PREPROC_IMAGE_SIZE, value)
 
index dd693623a266b9ff835158ff0b52cf387e7c420a..ad232178bf4b98b82f73bb454af91b380260ca3a 100644 (file)
@@ -36,6 +36,8 @@
 // vision-specific
 #define KEY_VISION_PROJ_TYPE    "clip.vision.projector_type" // for models with mixed modalities
 #define KEY_IMAGE_SIZE          "clip.vision.image_size"
+#define KEY_IMAGE_MIN_PIXELS    "clip.vision.image_min_pixels"
+#define KEY_IMAGE_MAX_PIXELS    "clip.vision.image_max_pixels"
 #define KEY_PREPROC_IMAGE_SIZE  "clip.vision.preproc_image_size"
 #define KEY_PATCH_SIZE          "clip.vision.patch_size"
 #define KEY_IMAGE_MEAN          "clip.vision.image_mean"