Update ggml-cuda.cu
Co-authored-by: slaren <slarengh@gmail.com>
This commit is contained in:
parent
a3a46580f7
commit
763083e567
1 changed file with 1 addition and 1 deletion
|
@@ -6898,7 +6898,7 @@ static void mul_mat_vec_q_cuda(
|
|||
const dim3 block_nums(nblocks, 1, 1);
|
||||
const dim3 block_dims(WARP_SIZE, nwarps, 1);
|
||||
|
||||
-switch(ncols_y) {
|
||||
+switch (ncols_y) {
|
||||
case 1:
|
||||
mul_mat_vec_q<1, qk, qi, block_q_t, vdr, vec_dot>
|
||||
<<<block_nums, block_dims, 0, stream>>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst);
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue