git.djapps.eu Git - pkg/ggml/sources/ggml/commitdiff
CUDA: fixed row rounding for 0 tensor splits (llama/4594)
author: Johannes Gäßler <redacted>
Sat, 23 Dec 2023 08:16:33 +0000 (09:16 +0100)
committer: Georgi Gerganov <redacted>
Wed, 27 Dec 2023 09:40:50 +0000 (11:40 +0200)
src/ggml-cuda.cu

index 7c2a834e34382f44ca788ff006d3877f8bab1fa3..490081cac8c1b656aa1401230144cf53cb25b27b 100644 (file)
@@ -7937,12 +7937,16 @@ static void ggml_cuda_op_mul_mat(
 
             if (id != 0) {
                 row_low[id]  = ne01*g_tensor_split[id];
-                row_low[id] -= row_low[id] % rounding;
+                if (row_low[id] < ne01) {
+                    row_low[id] -= row_low[id] % rounding;
+                }
             }
 
             if (id != g_device_count - 1) {
                 row_high[id]  = ne01*g_tensor_split[id + 1];
-                row_high[id] -= row_high[id] % rounding;
+                if (row_high[id] < ne01) {
+                    row_high[id] -= row_high[id] % rounding;
+                }
             }
         }
     }