CUDA: add unused vars to mmvf and mmvq (llama/16807)

2025-10-28 10:31:21 +08:00 · 2025-10-28 10:31:21 +08:00 · 0c8ff48103
parent 9664420a54
commit 0c8ff48103
2 changed files with 8 additions and 0 deletions
--- a/ggml/src/ggml-cuda/mmvf.cu
+++ b/ggml/src/ggml-cuda/mmvf.cu
@@ -343,6 +343,10 @@ static __global__ void mul_mat_vec_f(
    }

    dst[tid*stride_col_dst + row] = value;
+
+    if constexpr (!has_fusion) {
+        GGML_UNUSED_VARS(use_gate, use_bias, use_gate_bias, glu_op, gate_x, x_bias, gate_bias, sumf_gate);
+    }
 }

 template<typename T, typename type_acc, int ncols_dst, int block_size>
--- a/ggml/src/ggml-cuda/mmvq.cu
+++ b/ggml/src/ggml-cuda/mmvq.cu
@@ -310,6 +310,10 @@ static __global__ void mul_mat_vec_q(
            dst[j*stride_col_dst + threadIdx.x] = result;
        }
    }
+
+    if constexpr (!has_fusion) {
+        GGML_UNUSED_VARS(use_gate, use_bias, use_gate_bias, active_glu, gate_bias, x_bias, tmp_gate);
+    }
 }

 static std::pair<dim3, dim3> calc_launch_params(