Merge branch 'master' into gg/flash-attn

2024-01-28 10:53:16 +02:00 · 2024-01-28 10:53:16 +02:00 · b3dd7d975f
commit b3dd7d975f
parent 6fea843b24 b2b2bf988c
75 changed files with 4927 additions and 1996 deletions
--- a/tests/test-backend-ops.cpp
+++ b/tests/test-backend-ops.cpp
@@ -102,7 +102,6 @@ static std::vector<float> tensor_to_float(const ggml_tensor * t) {
                    } else if (t->type == GGML_TYPE_I8) {
                        tv.push_back((float)*(int8_t *) &buf[i]);
                    } else if (quantized) {
-                        std::vector<float> vq(ggml_blck_size(t->type));
                        tt.to_float(&buf[i], vq.data(), ggml_blck_size(t->type));
                        tv.insert(tv.end(), vq.begin(), vq.end());
                    } else {