git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
model-conversion : cast logits to float32 (#18009)
author: Georgi Gerganov <redacted>
Sun, 14 Dec 2025 06:58:13 +0000 (08:58 +0200)
committer: GitHub <redacted>
Sun, 14 Dec 2025 06:58:13 +0000 (08:58 +0200)
examples/model-conversion/scripts/causal/run-org-model.py

index 7d2b80057c0ec49cddcbeb7ef3dcfe1423e60701..da1132c003eb2d83689f6dd2c7ffe059b3d5055b 100755 (executable)
@@ -200,7 +200,7 @@ with torch.no_grad():
     logits = outputs.logits
 
     # Extract logits for the last token (next token prediction)
-    last_logits = logits[0, -1, :].cpu().numpy()
+    last_logits = logits[0, -1, :].float().cpu().numpy()
 
     print(f"Logits shape: {logits.shape}")
     print(f"Last token logits shape: {last_logits.shape}")