From: lhez
Date: Mon, 25 Aug 2025 21:18:09 +0000 (-0700)
Subject: opencl: fix support ops condition for `rms_norm` (llama/15560)
X-Git-Tag: v0.9.1~152
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=d9f431b78f339e1950daf6b4908e50093b868fae;p=pkg%2Fggml%2Fsources%2Fggml

opencl: fix support ops condition for `rms_norm` (llama/15560)
---

diff --git a/src/ggml-opencl/ggml-opencl.cpp b/src/ggml-opencl/ggml-opencl.cpp
index df275013..36b18ddb 100644
--- a/src/ggml-opencl/ggml-opencl.cpp
+++ b/src/ggml-opencl/ggml-opencl.cpp
@@ -2647,8 +2647,9 @@ static bool ggml_opencl_supports_op(ggml_backend_dev_t dev, const struct ggml_te
             return op->src[0]->type == GGML_TYPE_F32;
         case GGML_OP_SOFT_MAX:
         case GGML_OP_NORM:
-        case GGML_OP_RMS_NORM:
             return true;
+        case GGML_OP_RMS_NORM:
+            return op->ne[0] % 4 == 0 && ggml_is_contiguous_rows(op->src[0]);
         case GGML_OP_REPEAT:
             return op->src[0]->type == GGML_TYPE_F32 && op->type == GGML_TYPE_F32; // Assuming F32 for now, can be expanded
         case GGML_OP_PAD: