git.djapps.eu Git - pkg/ggml/sources/ggml/commitdiff
CUDA: add unused vars to mmvf and mmvq (llama/16807)
author Aman Gupta <redacted>
Tue, 28 Oct 2025 02:31:21 +0000 (10:31 +0800)
committer Georgi Gerganov <redacted>
Sat, 1 Nov 2025 07:41:35 +0000 (09:41 +0200)
src/ggml-cuda/mmvf.cu
src/ggml-cuda/mmvq.cu

index c2c31cdaf231bc7f1a72426f88af6df4a74ccb07..4e31783436d80a4abc06645ecab14b3b3c1a0aee 100644 (file)
@@ -343,6 +343,10 @@ static __global__ void mul_mat_vec_f(
     }
 
     dst[tid*stride_col_dst + row] = value;
+
+    if constexpr (!has_fusion) {
+        GGML_UNUSED_VARS(use_gate, use_bias, use_gate_bias, glu_op, gate_x, x_bias, gate_bias, sumf_gate);
+    }
 }
 
 template<typename T, typename type_acc, int ncols_dst, int block_size>
index 7a783e4fcf9b45cbf206e17f9d9dcc274881892e..be04a85cc55154cb10963c6069b4b9eafd6db5c8 100644 (file)
@@ -310,6 +310,10 @@ static __global__ void mul_mat_vec_q(
             dst[j*stride_col_dst + threadIdx.x] = result;
         }
     }
+
+    if constexpr (!has_fusion) {
+        GGML_UNUSED_VARS(use_gate, use_bias, use_gate_bias, active_glu, gate_bias, x_bias, tmp_gate);
+    }
 }
 
 static std::pair<dim3, dim3> calc_launch_params(