simple : fix batch handling (#3803)

author Thibault Terrasson <redacted>

Fri, 27 Oct 2023 14:37:41 +0000 (16:37 +0200)

committer GitHub <redacted>

Fri, 27 Oct 2023 14:37:41 +0000 (08:37 -0600)
author Thibault Terrasson <redacted>
Fri, 27 Oct 2023 14:37:41 +0000 (16:37 +0200)
committer GitHub <redacted>
Fri, 27 Oct 2023 14:37:41 +0000 (08:37 -0600)
diff --git a/examples/simple/simple.cpp b/examples/simple/simple.cpp

index f376c050994d19dbb4da2c34f8331689cce8acdd..374aef6f16189c5efa7073fdc57b6edfd632001b 100644 (file)
--- a/examples/simple/simple.cpp
+++ b/examples/simple/simple.cpp
@@ -95,13 +95,8 @@ int main(int argc, char ** argv) {
      llama_batch batch = llama_batch_init(512, 0, 1);
  
      // evaluate the initial prompt
-    batch.n_tokens = tokens_list.size();
-
-    for (int32_t i = 0; i < batch.n_tokens; i++) {
-        batch.token[i]  = tokens_list[i];
-        batch.pos[i]    = i;
-        batch.seq_id[i] = 0;
-        batch.logits[i] = false;
+    for (size_t i = 0; i < tokens_list.size(); i++) {
+        llama_batch_add(batch, tokens_list[i], i, { 0 }, false);
      }
  
      // llama_decode will output logits only for the last token of the prompt
@@ -148,15 +143,10 @@ int main(int argc, char ** argv) {
              fflush(stdout);
  
              // prepare the next batch
-            batch.n_tokens = 0;
+            llama_batch_clear(batch);
  
              // push this new token for next evaluation
-            batch.token [batch.n_tokens] = new_token_id;
-            batch.pos   [batch.n_tokens] = n_cur;
-            batch.seq_id[batch.n_tokens] = 0;
-            batch.logits[batch.n_tokens] = true;
-
-            batch.n_tokens += 1;
+            llama_batch_add(batch, new_token_id, n_cur, { 0 }, true);
  
              n_decode += 1;
          }
author	Thibault Terrasson <redacted>
	Fri, 27 Oct 2023 14:37:41 +0000 (16:37 +0200)
committer	GitHub <redacted>
	Fri, 27 Oct 2023 14:37:41 +0000 (08:37 -0600)