git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
metal : Fix dimension constraint violation in matmul2d descriptor (#21048)
author ren <redacted>
Fri, 27 Mar 2026 07:05:21 +0000 (00:05 -0700)
committer GitHub <redacted>
Fri, 27 Mar 2026 07:05:21 +0000 (09:05 +0200)
Updates Metal tensor API test probe to fix the dimension constraint violation in the matmul2d descriptor (at least one value must be a multiple of 16).

ggml/src/ggml-metal/ggml-metal-device.m

index cbef2fb4879ee82c9b2c0339cd828210782ed4d9..17d51b11b6e5932732e3fe917c4e18b12f18212d 100644 (file)
@@ -690,7 +690,7 @@ ggml_metal_device_t ggml_metal_device_init(int device) {
                     "    auto tB = B.slice((int)tgid.x, 0); \n"
                     " \n"
                     "    matmul2d< \n"
-                    "        matmul2d_descriptor(8, 8, dynamic_extent), \n"
+                    "        matmul2d_descriptor(16, 16, dynamic_extent), \n"
                     "        execution_simdgroups<4>> mm; \n"
                     " \n"
                     "    auto cT = mm.get_destination_cooperative_tensor<decltype(tA), decltype(tB), float>(); \n"
@@ -740,7 +740,7 @@ ggml_metal_device_t ggml_metal_device_init(int device) {
                     "    auto tB = B.slice((int)tgid.x, 0); \n"
                     " \n"
                     "    matmul2d< \n"
-                    "        matmul2d_descriptor(8, 8, dynamic_extent), \n"
+                    "        matmul2d_descriptor(16, 16, dynamic_extent), \n"
                     "        execution_simdgroups<4>> mm; \n"
                     " \n"
                     "    auto cT = mm.get_destination_cooperative_tensor<decltype(tA), decltype(tB), float>(); \n"