     ).set_env("LLAMA_ARG_CTX_SIZE"));
     add_opt(common_arg(
         {"-n", "--predict", "--n-predict"}, "N",
-        string_format("number of tokens to predict (default: %d, -1 = infinity, -2 = until context filled)", params.n_predict),
+        string_format(
+            ex == LLAMA_EXAMPLE_MAIN || ex == LLAMA_EXAMPLE_INFILL
+                ? "number of tokens to predict (default: %d, -1 = infinity, -2 = until context filled)"
+                : "number of tokens to predict (default: %d, -1 = infinity)",
+            params.n_predict),
         [](common_params & params, int value) {
             params.n_predict = value;
         }