Allow "quantizing" to f16 and f32 (#1787)

* Allow "quantizing" to f16 and f32 Fix an issue where quantizing didn't respect LLAMA_NO_K_QUANTS Add brief help to the list of quantization types in the quantize tool Ignore case for quantization type arguments in the quantize tool
2023-06-13 04:23:23 -06:00 · 2023-06-13 04:23:23 -06:00 · 74d4cfa343
commit 74d4cfa343
parent 74a6d922f1
4 changed files with 154 additions and 48 deletions
--- a/1
+++ b/1
@ -127,6 +127,7 @@ endif

 ifndef LLAMA_NO_K_QUANTS
 	CFLAGS   += -DGGML_USE_K_QUANTS
+	CXXFLAGS += -DGGML_USE_K_QUANTS
 	OBJS     += k_quants.o
 endif