ggml : fix Q4_3 cuBLAS

This commit is contained in:
Georgi Gerganov 2023-04-22 16:31:56 +03:00
parent 857308d1e8
commit 0e018fe008
No known key found for this signature in database
GPG key ID: 449E073F9DC10735
2 changed files with 5 additions and 0 deletions

3
ggml.c
View file

@@ -7992,6 +7992,9 @@ static void ggml_compute_forward_mul_mat_q_f32(
else if (type == GGML_TYPE_Q4_2) {
dequantize_row_q_cuda = dequantize_row_q4_2_cuda;
}
else if (type == GGML_TYPE_Q4_3) {
dequantize_row_q_cuda = dequantize_row_q4_3_cuda;
}
else {
GGML_ASSERT(false);
}