common : add default embeddings presets (#11677)

author Daniel Bevenius <redacted>

Fri, 7 Feb 2025 08:15:22 +0000 (09:15 +0100)

committer GitHub <redacted>

Fri, 7 Feb 2025 08:15:22 +0000 (09:15 +0100)
author Daniel Bevenius <redacted>
Fri, 7 Feb 2025 08:15:22 +0000 (09:15 +0100)
committer GitHub <redacted>
Fri, 7 Feb 2025 08:15:22 +0000 (09:15 +0100)
diff --git a/common/arg.cpp b/common/arg.cpp

index 76b8988819cda0f169d4e5fba9597be5783404c8..152f671ab738e2c2b56a95951dc8b7a5d1d9eacb 100644 (file)
--- a/common/arg.cpp
+++ b/common/arg.cpp
@@ -2324,5 +2324,47 @@ common_params_context common_params_parser_init(common_params & params, llama_ex
          }
      ).set_examples({LLAMA_EXAMPLE_TTS}));
  
+    add_opt(common_arg(
+        {"--embd-bge-small-en-default"},
+        string_format("use default bge-small-en-v1.5 model (note: can download weights from the internet)"),
+        [](common_params & params) {
+            params.hf_repo = "ggml-org/bge-small-en-v1.5-Q8_0-GGUF";
+            params.hf_file = "bge-small-en-v1.5-q8_0.gguf";
+            params.pooling_type = LLAMA_POOLING_TYPE_NONE;
+            params.embd_normalize = 2;
+            params.n_ctx = 512;
+            params.verbose_prompt = true;
+            params.embedding = true;
+        }
+    ).set_examples({LLAMA_EXAMPLE_EMBEDDING, LLAMA_EXAMPLE_SERVER}));
+
+    add_opt(common_arg(
+        {"--embd-e5-small-en-default"},
+        string_format("use default e5-small-v2 model (note: can download weights from the internet)"),
+        [](common_params & params) {
+            params.hf_repo = "ggml-org/e5-small-v2-Q8_0-GGUF";
+            params.hf_file = "e5-small-v2-q8_0.gguf";
+            params.pooling_type = LLAMA_POOLING_TYPE_NONE;
+            params.embd_normalize = 2;
+            params.n_ctx = 512;
+            params.verbose_prompt = true;
+            params.embedding = true;
+        }
+    ).set_examples({LLAMA_EXAMPLE_EMBEDDING, LLAMA_EXAMPLE_SERVER}));
+
+    add_opt(common_arg(
+        {"--embd-gte-small-default"},
+        string_format("use default gte-small model (note: can download weights from the internet)"),
+        [](common_params & params) {
+            params.hf_repo = "ggml-org/gte-small-Q8_0-GGUF";
+            params.hf_file = "gte-small-q8_0.gguf";
+            params.pooling_type = LLAMA_POOLING_TYPE_NONE;
+            params.embd_normalize = 2;
+            params.n_ctx = 512;
+            params.verbose_prompt = true;
+            params.embedding = true;
+        }
+    ).set_examples({LLAMA_EXAMPLE_EMBEDDING, LLAMA_EXAMPLE_SERVER}));
+
      return ctx_arg;
  }
author	Daniel Bevenius <redacted>
	Fri, 7 Feb 2025 08:15:22 +0000 (09:15 +0100)
committer	GitHub <redacted>
	Fri, 7 Feb 2025 08:15:22 +0000 (09:15 +0100)