git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
cuda : mark BF16 CONT as unsupported
author Georgi Gerganov <redacted>
Wed, 28 Aug 2024 14:08:03 +0000 (17:08 +0300)
committer Georgi Gerganov <redacted>
Sun, 8 Sep 2024 08:05:55 +0000 (11:05 +0300)
ggml/src/ggml-cuda.cu

index d33988d0277f6f7ed053ffe1ba96f412a0cf381f..af1bd0518eb6aba18307edc48d13d138a8ba1160 100644 (file)
@@ -2887,7 +2887,9 @@ GGML_CALL static bool ggml_backend_cuda_supports_op(ggml_backend_t backend, cons
         case GGML_OP_SIN:
         case GGML_OP_COS:
         case GGML_OP_CLAMP:
+            return true;
         case GGML_OP_CONT:
+            return op->src[0]->type != GGML_TYPE_BF16;
         case GGML_OP_DIAG_MASK_INF:
         case GGML_OP_SOFT_MAX:
             return true;