llama : clarify comment about pp and tg graphs [no ci] (#14895)

author Daniel Bevenius <redacted>

Sun, 27 Jul 2025 10:10:51 +0000 (12:10 +0200)

committer GitHub <redacted>

Sun, 27 Jul 2025 10:10:51 +0000 (12:10 +0200)
author Daniel Bevenius <redacted>
Sun, 27 Jul 2025 10:10:51 +0000 (12:10 +0200)
committer GitHub <redacted>
Sun, 27 Jul 2025 10:10:51 +0000 (12:10 +0200)
diff --git a/src/llama-context.cpp b/src/llama-context.cpp

index 84f9ccab4ec2f846a350b0cfa99732e507ce3b44..9e77fe6d869599255729b6ed0e908becf8be390d 100644 (file)
--- a/src/llama-context.cpp
+++ b/src/llama-context.cpp
@@ -298,7 +298,7 @@ llama_context::llama_context(
  
          cross.v_embd.clear();
  
-        // reserve pp graph first so that buffers are only allocated once
+        // reserve pp (prompt processing) graph first so that buffers are only allocated once
          {
              auto * gf = graph_reserve(n_tokens, n_seqs, n_tokens, mctx.get());
              if (!gf) {
@@ -309,7 +309,7 @@ llama_context::llama_context(
              n_nodes_pp  = ggml_graph_n_nodes(gf);
          }
  
-        // reserve with tg graph to get the number of splits and nodes
+        // reserve with tg (token generation) graph to get the number of splits and nodes
          {
              auto * gf = graph_reserve(n_seqs, n_seqs, n_seqs, mctx.get());
              if (!gf) {
author	Daniel Bevenius <redacted>
	Sun, 27 Jul 2025 10:10:51 +0000 (12:10 +0200)
committer	GitHub <redacted>
	Sun, 27 Jul 2025 10:10:51 +0000 (12:10 +0200)