From 6683eb496061c4d7b9055c55f94ae6f5f944272f Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Henrik=20Forst=C3=A9n?=
Date: Tue, 2 Jan 2024 20:07:34 +0200
Subject: [PATCH] Fix buffer size

---
 ggml-quants.c | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/ggml-quants.c b/ggml-quants.c
index 91cd2f0d9..aea9bae04 100644
--- a/ggml-quants.c
+++ b/ggml-quants.c
@@ -1336,7 +1336,7 @@ static void quantize_q_k_1(const float * x, int bits, int scale_bits, int block_
     float mins[QK_K/block_size];
 
     for (int j = 0; j < QK_K/block_size; j++) {
-        uint8_t q[QK_K/block_size];
+        uint8_t q[block_size];
         // First find least squares solution for min and scale for each block.
         quantize_1(&x[block_size*j], block_size, bits, q, &mins[j], &scales[j]);
         // Flip the sign because quantize_1 assumes that min is added, but min