CUDA: fix shared memory access condition for mmv

2024-12-09 19:29:22 +01:00 · 2024-12-09 19:29:22 +01:00 · 6768787dd3
commit 6768787dd3
parent c37fb4cf62
1 changed file with 1 addition and 1 deletion
--- a/ggml/src/ggml-cuda/mmv.cu
+++ b/ggml/src/ggml-cuda/mmv.cu
@@ -57,7 +57,7 @@ static __global__ void mul_mat_vec(
    if (block_size > WARP_SIZE) {
        buf_iw[tid/WARP_SIZE] = sumf;
        __syncthreads();
-        if (tid > WARP_SIZE) {
+        if (tid >= WARP_SIZE) {
            return;
        }
        sumf = buf_iw[tid];