iq4_nl: another fix after merging with master

This commit is contained in:
Iwan Kawrakow 2024-02-19 11:40:35 +02:00
parent 1d90021241
commit e7b999c3dc

View file

@@ -6852,6 +6852,7 @@ static void dequantize_row_iq1_s_cuda(const void * vx, dst_t * y, const int k, c
dequantize_block_iq1_s<<<nb, 32, 0, stream>>>(vx, y);
}
template<typename dst_t>
static void dequantize_row_iq4_nl_cuda(const void * vx, dst_t * y, const int k, cudaStream_t stream) {
const int nb = (k + QK_K - 1) / QK_K;
dequantize_block_iq4_nl<<<nb, 32, 0, stream>>>(vx, y);