From: Georgi Gerganov
Date: Wed, 3 Jan 2024 11:01:44 +0000 (+0200)
Subject: cuda : mark I16 and I32 ops as unsupported
X-Git-Tag: upstream/0.0.1642~1128
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=b2d18c3a9a447ab89e3aafcb78d72a9171d7700a;p=pkg%2Fggml%2Fsources%2Fggml

cuda : mark I16 and I32 ops as unsupported

ggml-ci
---

diff --git a/src/ggml-cuda.cu b/src/ggml-cuda.cu
index 8c271230..2e759d43 100644
--- a/src/ggml-cuda.cu
+++ b/src/ggml-cuda.cu
@@ -10039,14 +10039,22 @@ static bool ggml_backend_cuda_supports_op(ggml_backend_t backend, const ggml_ten
                 }
                 return false;
             } break;
+        case GGML_OP_DUP:
+        case GGML_OP_REPEAT:
+        case GGML_OP_CONCAT:
+            {
+                ggml_type src0_type = op->src[0]->type;
+                if (src0_type != GGML_TYPE_I32 && src0_type != GGML_TYPE_I16) {
+                    return true;
+                }
+                return false;
+            } break;
         case GGML_OP_NONE:
         case GGML_OP_RESHAPE:
         case GGML_OP_VIEW:
         case GGML_OP_PERMUTE:
         case GGML_OP_TRANSPOSE:
         case GGML_OP_NORM:
-        case GGML_OP_REPEAT:
-        case GGML_OP_DUP:
         case GGML_OP_ADD:
         case GGML_OP_MUL:
         case GGML_OP_DIV:
@@ -10063,7 +10071,6 @@ static bool ggml_backend_cuda_supports_op(ggml_backend_t backend, const ggml_ten
         case GGML_OP_SUM_ROWS:
         case GGML_OP_ARGSORT:
         case GGML_OP_ACC:
-        case GGML_OP_CONCAT:
         case GGML_OP_GROUP_NORM:
         case GGML_OP_UPSCALE:
         case GGML_OP_PAD: