diff --git a/utils.cpp b/utils.cpp index 5213ecb07..1105a2f2b 100644 --- a/utils.cpp +++ b/utils.cpp @@ -5,6 +5,12 @@ #include #include + #if defined(_MSC_VER) || defined(__MINGW32__) + #include // using malloc.h with MSC/MINGW + #elif !defined(__FreeBSD__) + #include + #endif + bool gpt_params_parse(int argc, char ** argv, gpt_params & params) { for (int i = 1; i < argc; i++) { std::string arg = argv[i]; @@ -453,8 +459,8 @@ size_t ggml_quantize_q4_0(float * src, void * dst, int n, int k, int qk, int64_t assert(k % qk == 0); - std::vector pp; - pp.reserve(qk/2); + const size_t pp_size = qk / 2; + uint8_t *pp = static_cast(alloca(pp_size)); char * pdst = (char *) dst; @@ -493,7 +499,7 @@ size_t ggml_quantize_q4_0(float * src, void * dst, int n, int k, int qk, int64_t pp[l/2] = vi0 | (vi1 << 4); } - memcpy(pb, pp.data(), pp.size()); + memcpy(pb, pp, pp_size); pb += bs; } } @@ -508,8 +514,8 @@ size_t ggml_quantize_q4_1(float * src, void * dst, int n, int k, int qk, int64_t assert(k % qk == 0); - std::vector pp; - pp.reserve(qk/2); + const size_t pp_size = qk / 2; + uint8_t *pp = static_cast(alloca(pp_size)); char * pdst = (char *) dst; @@ -553,7 +559,7 @@ size_t ggml_quantize_q4_1(float * src, void * dst, int n, int k, int qk, int64_t pp[l/2] = vi0 | (vi1 << 4); } - memcpy(pb + i*qk/2, pp.data(), pp.size()); + memcpy(pb + i*qk/2, pp, pp_size); } } }