git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
finetune : add training data file to log message (#4979)
author: Daniel Bevenius <redacted>
Tue, 16 Jan 2024 17:54:24 +0000 (18:54 +0100)
committer: GitHub <redacted>
Tue, 16 Jan 2024 17:54:24 +0000 (19:54 +0200)
This commit adds the name of the training data file to the log message
printed when the training data is tokenized.

The motivation for this change is that it can be useful to show which
file is being tokenized when running the finetune example.

Signed-off-by: Daniel Bevenius <redacted>
examples/finetune/finetune.cpp

index a6620fd73ca185e7d9a600cddbb309a7de7842a1..11fcbf443326ea22257491fd6fcfeb8e778d41c0 100644 (file)
@@ -1799,7 +1799,7 @@ int main(int argc, char ** argv) {
     std::vector<llama_token> train_tokens;
     std::vector<size_t> train_samples_begin;
     std::vector<size_t> train_samples_size;
-    printf("%s: tokenize training data\n", __func__);
+    printf("%s: tokenize training data from %s\n", __func__, params.common.fn_train_data);
     tokenize_file(lctx,
             params.common.fn_train_data,
             params.common.sample_start,