cuda : remove nchannels_x argument from mul_mat_vec_nc_f16_f32 (#2028)

author Salvador E. Tropea <redacted>

Wed, 28 Jun 2023 17:27:31 +0000 (14:27 -0300)

committer GitHub <redacted>

Wed, 28 Jun 2023 17:27:31 +0000 (20:27 +0300)
author Salvador E. Tropea <redacted>
Wed, 28 Jun 2023 17:27:31 +0000 (14:27 -0300)
committer GitHub <redacted>
Wed, 28 Jun 2023 17:27:31 +0000 (20:27 +0300)
diff --git a/ggml-cuda.cu b/ggml-cuda.cu

index 5f05d9181862145be5154894adfea3e89d541e16..4e0d3dbdea4d499862ccc654461faefa3ebac85e 100644 (file)
--- a/ggml-cuda.cu
+++ b/ggml-cuda.cu
@@ -1292,7 +1292,7 @@ static __global__ void mul_mat_p021_f16_f32(const void * vx, const float * y, fl
  
  static __global__ void mul_mat_vec_nc_f16_f32( // nc == non-contiguous
      const void * vx, const float * y, float * dst, const int ncols_x, const int nrows_x,
-    const int row_stride_x, const int nchannels_x, const int channel_stride_x) {
+    const int row_stride_x, const int channel_stride_x) {
  
      const half * x = (const half *) vx;
  
@@ -1698,7 +1698,7 @@ static void ggml_mul_mat_vec_nc_f16_f32_cuda(
      const dim3 block_nums(1, nrows_x, nchannels_x);
      const dim3 block_dims(WARP_SIZE, 1, 1);
      mul_mat_vec_nc_f16_f32<<<block_nums, block_dims, 0, stream>>>
-        (vx, y, dst, ncols_x, nrows_x, row_stride_x, nchannels_x, channel_stride_x);
+        (vx, y, dst, ncols_x, nrows_x, row_stride_x, channel_stride_x);
  }
  
  static void ggml_cpy_f32_f32_cuda(
author	Salvador E. Tropea <redacted>
	Wed, 28 Jun 2023 17:27:31 +0000 (14:27 -0300)
committer	GitHub <redacted>
	Wed, 28 Jun 2023 17:27:31 +0000 (20:27 +0300)