train : add general name (#6752)

author Austin <redacted>

Fri, 19 Apr 2024 07:16:45 +0000 (03:16 -0400)

committer GitHub <redacted>

Fri, 19 Apr 2024 07:16:45 +0000 (10:16 +0300)
author Austin <redacted>
Fri, 19 Apr 2024 07:16:45 +0000 (03:16 -0400)
committer GitHub <redacted>
Fri, 19 Apr 2024 07:16:45 +0000 (10:16 +0300)
diff --git a/examples/train-text-from-scratch/train-text-from-scratch.cpp b/examples/train-text-from-scratch/train-text-from-scratch.cpp

index 7d06e401b462bea9bc3ff5b97e6bed46c4087ca9..587418cc739640ae0a1260951c4edc82d70b6fed 100644 (file)
--- a/examples/train-text-from-scratch/train-text-from-scratch.cpp
+++ b/examples/train-text-from-scratch/train-text-from-scratch.cpp
@@ -73,6 +73,7 @@ struct my_llama_model {
  static const char * LLM_KV_TRAINING_TYPE_TRAIN_MODEL     = "train_model";
  static const char * LLM_KV_TRAINING_TYPE                 = "training.type";
  
+static const char * LLM_KV_GENERAL_NAME                = "general.name";
  static const char * LLM_KV_GENERAL_ARCHITECTURE        = "general.architecture";
  static const char * LLM_KV_GENERAL_FILE_TYPE           = "general.file_type";
  
@@ -529,6 +530,7 @@ static void load_llama_model_gguf(struct gguf_context * fctx, struct ggml_contex
  
  static void save_llama_model_gguf(struct gguf_context * fctx, const char * fn_vocab_model, struct my_llama_model * model) {
      const char * arch = "llama";
+
      enum llama_ftype ftype = LLAMA_FTYPE_ALL_F32;
  
      std::vector<char> keybuf;
@@ -540,6 +542,7 @@ static void save_llama_model_gguf(struct gguf_context * fctx, const char * fn_vo
  
      // set arch
      gguf_set_val_str(fctx, LLM_KV_GENERAL_ARCHITECTURE, arch);
+    gguf_set_val_str(fctx, LLM_KV_GENERAL_NAME, arch);
      gguf_set_val_u32(fctx, LLM_KV_GENERAL_FILE_TYPE, ftype);
  
      // set hparams
author	Austin <redacted>
	Fri, 19 Apr 2024 07:16:45 +0000 (03:16 -0400)
committer	GitHub <redacted>
	Fri, 19 Apr 2024 07:16:45 +0000 (10:16 +0300)