git.djapps.eu Git - pkg/ggml/sources/ggml/commitdiff
gguf : update type enum (#775)
author JacobLinCool <redacted>
Wed, 27 Mar 2024 17:48:56 +0000 (01:48 +0800)
committer GitHub <redacted>
Wed, 27 Mar 2024 17:48:56 +0000 (19:48 +0200)
* spec: add missing semicolons in GGUF structs

Co-Authored-By: 郝東彥 Arthur Hao <redacted>
* spec: update GGUF tensor types

---------

Co-authored-by: 郝東彥 Arthur Hao <redacted>
docs/gguf.md

index fa9abea74e778f695d45993390ebb80834d7fe2b..d6ad5e276cecdecd0ce0ffd96128508a961b38e4 100644 (file)
@@ -31,26 +31,36 @@ Models are little-endian by default. They can also come in big-endian for use wi
 
 ```c
 enum ggml_type: uint32_t {
-    GGML_TYPE_F32  = 0,
-    GGML_TYPE_F16  = 1,
-    GGML_TYPE_Q4_0 = 2,
-    GGML_TYPE_Q4_1 = 3,
+    GGML_TYPE_F32     = 0,
+    GGML_TYPE_F16     = 1,
+    GGML_TYPE_Q4_0    = 2,
+    GGML_TYPE_Q4_1    = 3,
     // GGML_TYPE_Q4_2 = 4, support has been removed
-    // GGML_TYPE_Q4_3 (5) support has been removed
-    GGML_TYPE_Q5_0 = 6,
-    GGML_TYPE_Q5_1 = 7,
-    GGML_TYPE_Q8_0 = 8,
-    GGML_TYPE_Q8_1 = 9,
-    // k-quantizations
-    GGML_TYPE_Q2_K = 10,
-    GGML_TYPE_Q3_K = 11,
-    GGML_TYPE_Q4_K = 12,
-    GGML_TYPE_Q5_K = 13,
-    GGML_TYPE_Q6_K = 14,
-    GGML_TYPE_Q8_K = 15,
-    GGML_TYPE_I8,
-    GGML_TYPE_I16,
-    GGML_TYPE_I32,
+    // GGML_TYPE_Q4_3 = 5, support has been removed
+    GGML_TYPE_Q5_0    = 6,
+    GGML_TYPE_Q5_1    = 7,
+    GGML_TYPE_Q8_0    = 8,
+    GGML_TYPE_Q8_1    = 9,
+    GGML_TYPE_Q2_K    = 10,
+    GGML_TYPE_Q3_K    = 11,
+    GGML_TYPE_Q4_K    = 12,
+    GGML_TYPE_Q5_K    = 13,
+    GGML_TYPE_Q6_K    = 14,
+    GGML_TYPE_Q8_K    = 15,
+    GGML_TYPE_IQ2_XXS = 16,
+    GGML_TYPE_IQ2_XS  = 17,
+    GGML_TYPE_IQ3_XXS = 18,
+    GGML_TYPE_IQ1_S   = 19,
+    GGML_TYPE_IQ4_NL  = 20,
+    GGML_TYPE_IQ3_S   = 21,
+    GGML_TYPE_IQ2_S   = 22,
+    GGML_TYPE_IQ4_XS  = 23,
+    GGML_TYPE_I8      = 24,
+    GGML_TYPE_I16     = 25,
+    GGML_TYPE_I32     = 26,
+    GGML_TYPE_I64     = 27,
+    GGML_TYPE_F64     = 28,
+    GGML_TYPE_IQ1_M   = 29,
     GGML_TYPE_COUNT,
 };
 
@@ -85,7 +95,7 @@ enum gguf_metadata_value_type: uint32_t {
     GGUF_METADATA_VALUE_TYPE_INT64 = 11,
     // The value is a 64-bit IEEE754 floating point number.
     GGUF_METADATA_VALUE_TYPE_FLOAT64 = 12,
-}
+};
 
 // A string in GGUF.
 struct gguf_string_t {
@@ -93,7 +103,7 @@ struct gguf_string_t {
     uint64_t len;
     // The string as a UTF-8 non-null-terminated string.
     char string[len];
-}
+};
 
 union gguf_metadata_value_t {
     uint8_t uint8;