iq2_xs: CUDA and scalar CPU works

This commit is contained in:
Iwan Kawrakow 2024-01-09 18:19:02 +02:00
parent 9f21b82e4b
commit 9b6e38d8c0
5 changed files with 669 additions and 111 deletions

View file

@@ -134,8 +134,9 @@ int main(int argc, char * argv[]) {
continue;
}
-if ((ggml_type)i == GGML_TYPE_IQ2_XXS) {
-printf("Skip %s due to missing quantization functionality\n", ggml_type_name((ggml_type) i));
+const ggml_type ei = (ggml_type)i;
+if (ei == GGML_TYPE_IQ2_XXS || ei == GGML_TYPE_IQ2_XS) {
+printf("Skip %s due to missing quantization functionality\n", ggml_type_name(ei));
continue;
}