iq1_s: CUDA is working

2024-02-11 13:08:26 +02:00 · 2024-02-11 13:08:26 +02:00 · a9d48e9718
commit a9d48e9718
parent 80cd5bae99
6 changed files with 412 additions and 9 deletions
--- a/llama.h
+++ b/llama.h
@@ -100,6 +100,7 @@ extern "C" {
        LLAMA_FTYPE_MOSTLY_Q2_K_S        = 21, // except 1d tensors
        LLAMA_FTYPE_MOSTLY_Q3_K_XS       = 22, // except 1d tensors
        LLAMA_FTYPE_MOSTLY_IQ3_XXS       = 23, // except 1d tensors
+        LLAMA_FTYPE_MOSTLY_IQ1_S         = 24, // except 1d tensors

        LLAMA_FTYPE_GUESSED = 1024, // not specified in the model file
    };