musa: fix build warnings (llama/15611)

author R0CKSTAR <redacted>

Fri, 26 Sep 2025 00:56:10 +0000 (08:56 +0800)

committer Georgi Gerganov <redacted>

Mon, 29 Sep 2025 12:18:10 +0000 (15:18 +0300)
author R0CKSTAR <redacted>
Fri, 26 Sep 2025 00:56:10 +0000 (08:56 +0800)
committer Georgi Gerganov <redacted>
Mon, 29 Sep 2025 12:18:10 +0000 (15:18 +0300)
diff --git a/ggml/src/ggml-cuda/binbcast.cu b/ggml/src/ggml-cuda/binbcast.cu

index 725e1a81a1fc708f4b24b369e7b756635b2be685..60240102741f35135533943b576e5f755fd8aae5 100644 (file)
--- a/ggml/src/ggml-cuda/binbcast.cu
+++ b/ggml/src/ggml-cuda/binbcast.cu
@@ -54,7 +54,7 @@ static __global__ void k_bin_bcast(const src0_t *         src0,
      const uint32_t i2  = fastdiv((blockDim.z * blockIdx.z + threadIdx.z), ne3);
      const uint32_t i3  = (blockDim.z * blockIdx.z + threadIdx.z) - (i2 * ne3.z);
  
-    if (i0s >= ne0 || i1 >= ne1 || i2 >= ne2 || i3 >= ne3.z) {
+    if (i0s >= (uint32_t)ne0 || i1 >= (uint32_t)ne1 || i2 >= (uint32_t)ne2 || i3 >= ne3.z) {
          return;
      }
  
diff --git a/ggml/src/ggml-cuda/mmq.cu b/ggml/src/ggml-cuda/mmq.cu

index 714b23f9f49aaec6bb7ec108a36a61192da3a0b7..12bdc629bd6b200837cc238c05c6230490da42bd 100644 (file)
--- a/ggml/src/ggml-cuda/mmq.cu
+++ b/ggml/src/ggml-cuda/mmq.cu
@@ -81,7 +81,7 @@ static __global__ void mmq_ids_helper(
  #pragma unroll
              for (int offset = neu_padded; offset < warp_size; offset += neu_padded) {
                  const int tmp = __shfl_up_sync(0xFFFFFFFF, it_compact_add_self, offset, warp_size);
-                if (threadIdx.x >= offset) {
+                if (threadIdx.x >= static_cast<unsigned int>(offset)) {
                      it_compact_add_lower += tmp;
                  }
              }
@@ -110,7 +110,7 @@ static __global__ void mmq_ids_helper(
  
      expert_bounds[expert] = nex_prev;
  
-    if (expert < gridDim.x - 1) {
+    if (expert < static_cast<int>(gridDim.x) - 1) {
          return;
      }
  
diff --git a/ggml/src/ggml-cuda/mmvq.cu b/ggml/src/ggml-cuda/mmvq.cu

index 52de4e78d1321737dc58811afcdf279a123f40fa..3bf0c9ed25038785dfc16c859d3e1318f88de095 100644 (file)
--- a/ggml/src/ggml-cuda/mmvq.cu
+++ b/ggml/src/ggml-cuda/mmvq.cu
@@ -220,7 +220,7 @@ static __global__ void mul_mat_vec_q(
              tmp[j][i] = warp_reduce_sum<warp_size>(tmp[j][i]);
          }
  
-        if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + int(threadIdx.x) < stride_col_dst)) {
+        if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || uint32_t(row0 + threadIdx.x) < stride_col_dst)) {
              dst[j*stride_col_dst + threadIdx.x] = tmp[j][threadIdx.x];
          }
      }
diff --git a/ggml/src/ggml-cuda/pad_reflect_1d.cu b/ggml/src/ggml-cuda/pad_reflect_1d.cu

index 0478889da13fea01e14b3fc6341795596f3cc455..32993eb591307453cc1752a1c8b37075d691d749 100644 (file)
--- a/ggml/src/ggml-cuda/pad_reflect_1d.cu
+++ b/ggml/src/ggml-cuda/pad_reflect_1d.cu
@@ -51,6 +51,8 @@ static __global__ __launch_bounds__(CUDA_PAD_REFLECT_1D_BLOCK_SIZE, 1) void
      }
      const float value               = *(const float *) (src0_ptr + src_idx * nb00);
      *(float *) (dst_ptr + i0 * nb0) = value;
+
+    GGML_UNUSED(p1);
  }
  
  void ggml_cuda_op_pad_reflect_1d(ggml_backend_cuda_context & ctx, ggml_tensor * dst) {
author	R0CKSTAR <redacted>
	Fri, 26 Sep 2025 00:56:10 +0000 (08:56 +0800)
committer	Georgi Gerganov <redacted>
	Mon, 29 Sep 2025 12:18:10 +0000 (15:18 +0300)
ggml/src/ggml-cuda/binbcast.cu		patch \| blob \| history
ggml/src/ggml-cuda/mmq.cu		patch \| blob \| history
ggml/src/ggml-cuda/mmvq.cu		patch \| blob \| history
ggml/src/ggml-cuda/pad_reflect_1d.cu		patch \| blob \| history