From: R0CKSTAR
Date: Tue, 12 Aug 2025 02:02:51 +0000 (+0800)
Subject: musa: fix failures in test-backend-ops for mul_mat_id op (llama/15236)
X-Git-Tag: upstream/0.0.2446~17
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=5539b20bbc5d1af884f40b06dde7bfed61bc0677;p=pkg%2Fggml%2Fsources%2Fggml

musa: fix failures in test-backend-ops for mul_mat_id op (llama/15236)

* musa: fix failures in test-backend-ops for mul_mat_id op

Signed-off-by: Xiaodong Ye

* Address review comments

Signed-off-by: Xiaodong Ye

---------

Signed-off-by: Xiaodong Ye
---

diff --git a/src/ggml-cuda/common.cuh b/src/ggml-cuda/common.cuh
index 2e5d4879..a23da57e 100644
--- a/src/ggml-cuda/common.cuh
+++ b/src/ggml-cuda/common.cuh
@@ -312,11 +312,11 @@ static bool turing_mma_available(const int cc) {
 }
 
 static bool ampere_mma_available(const int cc) {
-    return cc < GGML_CUDA_CC_OFFSET_AMD && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
+    return GGML_CUDA_CC_IS_NVIDIA(cc) && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
 }
 
 static bool cp_async_available(const int cc) {
-    return cc < GGML_CUDA_CC_OFFSET_AMD && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
+    return GGML_CUDA_CC_IS_NVIDIA(cc) && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
 }
 
 static constexpr __device__ int ggml_cuda_get_physical_warp_size() {