]> git.djapps.eu Git - pkg/ggml/sources/ggml/commitdiff
sycl : offload of get_rows set to 0 (llama/10432)
author Alberto Cabrera Pérez <redacted>
Fri, 29 Nov 2024 12:38:45 +0000 (12:38 +0000)
committer Georgi Gerganov <redacted>
Tue, 3 Dec 2024 19:05:37 +0000 (21:05 +0200)
src/ggml-sycl/ggml-sycl.cpp

index aabcdc22422fc104ded19bd91cd588ab38154ff5..808f74fa0b27e0f5c8733d3308c621dcfa16753b 100644 (file)
@@ -4493,7 +4493,7 @@ static bool ggml_backend_sycl_device_supports_buft(ggml_backend_dev_t dev, ggml_
 static int64_t get_op_batch_size(const ggml_tensor * op) {
     switch (op->op) {
         case GGML_OP_GET_ROWS:
-            return op->ne[1]; // this will increse the speed of prefill in test
+            return 0;
         case GGML_OP_MUL_MAT:
             return op->ne[1];
         case GGML_OP_MUL_MAT_ID: