gguf : enforce that tensor names are unique (#6905)

author Xuan Son Nguyen <redacted>

Sun, 28 Apr 2024 15:36:18 +0000 (17:36 +0200)

committer GitHub <redacted>

Sun, 28 Apr 2024 15:36:18 +0000 (17:36 +0200)
author Xuan Son Nguyen <redacted>
Sun, 28 Apr 2024 15:36:18 +0000 (17:36 +0200)
committer GitHub <redacted>
Sun, 28 Apr 2024 15:36:18 +0000 (17:36 +0200)
diff --git a/ggml.c b/ggml.c

index 34eef23fcf90fd8402796703830c2e804e8b7826..cb273061c5c535a4756c065dbdf75e9a8573dc36 100644 (file)
--- a/ggml.c
+++ b/ggml.c
@@ -20819,6 +20819,14 @@ struct gguf_context * gguf_init_from_file(const char * fname, struct gguf_init_p
              // TODO: return an error instead of crashing with GGML_ASSERT
              gguf_tensor_info_sanitize(info);
  
+            // make sure there is no duplicated tensor names
+            for (uint64_t j = 0; j < i; ++j) {
+                if (strcmp(info->name.data, ctx->infos[j].name.data) == 0) {
+                    fprintf(stderr, "%s: duplicated tensor name %s\n", __func__, info->name.data);
+                    ok = false;
+                }
+            }
+
              if (!ok) {
                  fprintf(stderr, "%s: failed to read tensor info\n", __func__);
                  fclose(file);
@@ -21355,6 +21363,10 @@ void gguf_set_kv(struct gguf_context * ctx, struct gguf_context * src) {
  void gguf_add_tensor(
               struct gguf_context * ctx,
          const struct ggml_tensor * tensor) {
+    if (gguf_find_tensor(ctx, tensor->name) != -1) {
+        GGML_ASSERT(false && "duplicated tensor name");
+    }
+
      const int idx = ctx->header.n_tensors;
      ctx->infos = realloc(ctx->infos, (idx + 1)*sizeof(struct gguf_tensor_info));
  
diff --git a/gguf-py/gguf/gguf_reader.py b/gguf-py/gguf/gguf_reader.py

index 33afac552ca7523b7da16f854ef34908fafc11f3..48ef6d4ae45dfa6a79f45eea1d4bf0d743e132a6 100644 (file)
--- a/gguf-py/gguf/gguf_reader.py
+++ b/gguf-py/gguf/gguf_reader.py
@@ -234,8 +234,14 @@ class GGUFReader:
  
      def _build_tensors(self, start_offs: int, fields: list[ReaderField]) -> None:
          tensors = []
+        tensor_names = set() # keep track of name to prevent duplicated tensors
          for field in fields:
              _name_len, name_data, _n_dims, dims, raw_dtype, offset_tensor = field.parts
+            # check if there's any tensor having same name already in the list
+            tensor_name = str(bytes(name_data), encoding = 'utf-8')
+            if tensor_name in tensor_names:
+                raise ValueError(f'Found duplicated tensor with name {tensor_name}')
+            tensor_names.add(tensor_name)
              ggml_type = GGMLQuantizationType(raw_dtype[0])
              n_elems = np.prod(dims)
              block_size, type_size = GGML_QUANT_SIZES[ggml_type]
@@ -267,7 +273,7 @@ class GGUFReader:
                  item_count = n_bytes
                  item_type = np.uint8
              tensors.append(ReaderTensor(
-                name = str(bytes(name_data), encoding = 'utf-8'),
+                name = tensor_name,
                  tensor_type = ggml_type,
                  shape = dims,
                  n_elements = n_elems,
diff --git a/gguf-py/gguf/gguf_writer.py b/gguf-py/gguf/gguf_writer.py

index e3dbca454ae052803d22039df24037c1c1566e5a..ec44ac9f3813dd254dc963eb40a6be84b737004d 100644 (file)
--- a/gguf-py/gguf/gguf_writer.py
+++ b/gguf-py/gguf/gguf_writer.py
@@ -63,6 +63,7 @@ class GGUFWriter:
          self.kv_data_count = 0
          self.ti_data = bytearray()
          self.ti_data_count = 0
+        self.ti_names = set()
          self.use_temp_file = use_temp_file
          self.temp_file = None
          self.tensors = []
@@ -197,6 +198,10 @@ class GGUFWriter:
          if self.state is not WriterState.EMPTY:
              raise ValueError(f'Expected output file to be empty, got {self.state}')
  
+        if name in self.ti_names:
+            raise ValueError(f'Duplicated tensor name {name}')
+        self.ti_names.add(name)
+
          encoded_name = name.encode("utf8")
          self.ti_data += self._pack("Q", len(encoded_name))
          self.ti_data += encoded_name
diff --git a/llama.cpp b/llama.cpp

index 49f2b559e965e4875b499ea73c781f15ccae4cd7..3c64622d7c8dc1c3ae422301adc033b5a6022306 100644 (file)
--- a/llama.cpp
+++ b/llama.cpp
@@ -3120,9 +3120,17 @@ struct llama_model_loader {
  
          fver = (enum llama_fver) gguf_get_version(meta);
  
+        std::set<std::string> tensor_names;
          for (auto & w : weights) {
              n_elements += ggml_nelements(w.tensor);
              n_bytes    += ggml_nbytes(w.tensor);
+            // make sure there is no duplicated tensor names
+            const std::string name(w.tensor->name);
+            auto found = tensor_names.find(name);
+            if (found != tensor_names.end()) {
+                throw std::runtime_error(format("invalid model: tensor '%s' is duplicated", w.tensor->name));
+            }
+            tensor_names.insert(name);
          }
  
          LLAMA_LOG_INFO("%s: loaded meta data with %d key-value pairs and %d tensors from %s (version %s)\n",
author	Xuan Son Nguyen <redacted>
	Sun, 28 Apr 2024 15:36:18 +0000 (17:36 +0200)
committer	GitHub <redacted>
	Sun, 28 Apr 2024 15:36:18 +0000 (17:36 +0200)
ggml.c		patch \| blob \| history
gguf-py/gguf/gguf_reader.py		patch \| blob \| history
gguf-py/gguf/gguf_writer.py		patch \| blob \| history
llama.cpp		patch \| blob \| history