Compare commits
3 commits
master
...
gg/hf-test
Author | SHA1 | Date | |
---|---|---|---|
|
62d7b6c87f | ||
|
503983a69a | ||
|
ae41fd2e65 |
102 changed files with 65 additions and 570 deletions
7
Makefile
7
Makefile
|
@ -434,10 +434,8 @@ endif
|
||||||
|
|
||||||
ifndef RISCV
|
ifndef RISCV
|
||||||
|
|
||||||
ifeq ($(UNAME_M),$(filter $(UNAME_M),x86_64 i686 amd64))
|
MK_CFLAGS += -mfma -mf16c -mavx -mavx2
|
||||||
# Use all CPU extensions that are available:
|
HOST_CXXFLAGS += -mfma -mf16c -mavx -mavx2
|
||||||
MK_CFLAGS += -march=native -mtune=native
|
|
||||||
HOST_CXXFLAGS += -march=native -mtune=native
|
|
||||||
|
|
||||||
# Usage AVX-only
|
# Usage AVX-only
|
||||||
#MK_CFLAGS += -mfma -mf16c -mavx
|
#MK_CFLAGS += -mfma -mf16c -mavx
|
||||||
|
@ -446,7 +444,6 @@ ifeq ($(UNAME_M),$(filter $(UNAME_M),x86_64 i686 amd64))
|
||||||
# Usage SSSE3-only (Not is SSE3!)
|
# Usage SSSE3-only (Not is SSE3!)
|
||||||
#MK_CFLAGS += -mssse3
|
#MK_CFLAGS += -mssse3
|
||||||
#MK_CXXFLAGS += -mssse3
|
#MK_CXXFLAGS += -mssse3
|
||||||
endif
|
|
||||||
|
|
||||||
ifneq '' '$(findstring mingw,$(shell $(CC) -dumpmachine))'
|
ifneq '' '$(findstring mingw,$(shell $(CC) -dumpmachine))'
|
||||||
# The stack is only 16-byte aligned on Windows, so don't let gcc emit aligned moves.
|
# The stack is only 16-byte aligned on Windows, so don't let gcc emit aligned moves.
|
||||||
|
|
|
@ -208,13 +208,7 @@ static void ggml_cuda_flash_attn_ext_vec_f16(ggml_backend_cuda_context & ctx, gg
|
||||||
|
|
||||||
FATTN_VEC_F16_CASE(256, GGML_TYPE_F16, GGML_TYPE_F16)
|
FATTN_VEC_F16_CASE(256, GGML_TYPE_F16, GGML_TYPE_F16)
|
||||||
#else
|
#else
|
||||||
FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0)
|
|
||||||
|
|
||||||
FATTN_VEC_F16_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0)
|
|
||||||
|
|
||||||
FATTN_VEC_F16_CASE( 64, GGML_TYPE_F16, GGML_TYPE_F16)
|
|
||||||
FATTN_VEC_F16_CASE(128, GGML_TYPE_F16, GGML_TYPE_F16)
|
FATTN_VEC_F16_CASE(128, GGML_TYPE_F16, GGML_TYPE_F16)
|
||||||
FATTN_VEC_F16_CASE(256, GGML_TYPE_F16, GGML_TYPE_F16)
|
|
||||||
#endif // GGML_CUDA_FA_ALL_QUANTS
|
#endif // GGML_CUDA_FA_ALL_QUANTS
|
||||||
|
|
||||||
on_no_fattn_vec_case(Q->ne[0]);
|
on_no_fattn_vec_case(Q->ne[0]);
|
||||||
|
@ -283,13 +277,7 @@ static void ggml_cuda_flash_attn_ext_vec_f32(ggml_backend_cuda_context & ctx, gg
|
||||||
|
|
||||||
FATTN_VEC_F32_CASE(256, GGML_TYPE_F16, GGML_TYPE_F16)
|
FATTN_VEC_F32_CASE(256, GGML_TYPE_F16, GGML_TYPE_F16)
|
||||||
#else
|
#else
|
||||||
FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0)
|
|
||||||
|
|
||||||
FATTN_VEC_F32_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0)
|
|
||||||
|
|
||||||
FATTN_VEC_F32_CASE( 64, GGML_TYPE_F16, GGML_TYPE_F16)
|
|
||||||
FATTN_VEC_F32_CASE(128, GGML_TYPE_F16, GGML_TYPE_F16)
|
FATTN_VEC_F32_CASE(128, GGML_TYPE_F16, GGML_TYPE_F16)
|
||||||
FATTN_VEC_F32_CASE(256, GGML_TYPE_F16, GGML_TYPE_F16)
|
|
||||||
#endif // GGML_CUDA_FA_ALL_QUANTS
|
#endif // GGML_CUDA_FA_ALL_QUANTS
|
||||||
|
|
||||||
on_no_fattn_vec_case(Q->ne[0]);
|
on_no_fattn_vec_case(Q->ne[0]);
|
||||||
|
|
|
@ -32,57 +32,57 @@ void ggml_cuda_op_mul_mat_q(
|
||||||
case GGML_TYPE_Q4_0:
|
case GGML_TYPE_Q4_0:
|
||||||
mul_mat_q_case<GGML_TYPE_Q4_0>(ctx, args, stream);
|
mul_mat_q_case<GGML_TYPE_Q4_0>(ctx, args, stream);
|
||||||
break;
|
break;
|
||||||
case GGML_TYPE_Q4_1:
|
// case GGML_TYPE_Q4_1:
|
||||||
mul_mat_q_case<GGML_TYPE_Q4_1>(ctx, args, stream);
|
// mul_mat_q_case<GGML_TYPE_Q4_1>(ctx, args, stream);
|
||||||
break;
|
// break;
|
||||||
case GGML_TYPE_Q5_0:
|
// case GGML_TYPE_Q5_0:
|
||||||
mul_mat_q_case<GGML_TYPE_Q5_0>(ctx, args, stream);
|
// mul_mat_q_case<GGML_TYPE_Q5_0>(ctx, args, stream);
|
||||||
break;
|
// break;
|
||||||
case GGML_TYPE_Q5_1:
|
// case GGML_TYPE_Q5_1:
|
||||||
mul_mat_q_case<GGML_TYPE_Q5_1>(ctx, args, stream);
|
// mul_mat_q_case<GGML_TYPE_Q5_1>(ctx, args, stream);
|
||||||
break;
|
// break;
|
||||||
case GGML_TYPE_Q8_0:
|
case GGML_TYPE_Q8_0:
|
||||||
mul_mat_q_case<GGML_TYPE_Q8_0>(ctx, args, stream);
|
mul_mat_q_case<GGML_TYPE_Q8_0>(ctx, args, stream);
|
||||||
break;
|
break;
|
||||||
case GGML_TYPE_Q2_K:
|
// case GGML_TYPE_Q2_K:
|
||||||
mul_mat_q_case<GGML_TYPE_Q2_K>(ctx, args, stream);
|
// mul_mat_q_case<GGML_TYPE_Q2_K>(ctx, args, stream);
|
||||||
break;
|
// break;
|
||||||
case GGML_TYPE_Q3_K:
|
// case GGML_TYPE_Q3_K:
|
||||||
mul_mat_q_case<GGML_TYPE_Q3_K>(ctx, args, stream);
|
// mul_mat_q_case<GGML_TYPE_Q3_K>(ctx, args, stream);
|
||||||
break;
|
// break;
|
||||||
case GGML_TYPE_Q4_K:
|
case GGML_TYPE_Q4_K:
|
||||||
mul_mat_q_case<GGML_TYPE_Q4_K>(ctx, args, stream);
|
mul_mat_q_case<GGML_TYPE_Q4_K>(ctx, args, stream);
|
||||||
break;
|
break;
|
||||||
case GGML_TYPE_Q5_K:
|
// case GGML_TYPE_Q5_K:
|
||||||
mul_mat_q_case<GGML_TYPE_Q5_K>(ctx, args, stream);
|
// mul_mat_q_case<GGML_TYPE_Q5_K>(ctx, args, stream);
|
||||||
break;
|
// break;
|
||||||
case GGML_TYPE_Q6_K:
|
case GGML_TYPE_Q6_K:
|
||||||
mul_mat_q_case<GGML_TYPE_Q6_K>(ctx, args, stream);
|
mul_mat_q_case<GGML_TYPE_Q6_K>(ctx, args, stream);
|
||||||
break;
|
break;
|
||||||
case GGML_TYPE_IQ2_XXS:
|
// case GGML_TYPE_IQ2_XXS:
|
||||||
mul_mat_q_case<GGML_TYPE_IQ2_XXS>(ctx, args, stream);
|
// mul_mat_q_case<GGML_TYPE_IQ2_XXS>(ctx, args, stream);
|
||||||
break;
|
// break;
|
||||||
case GGML_TYPE_IQ2_XS:
|
// case GGML_TYPE_IQ2_XS:
|
||||||
mul_mat_q_case<GGML_TYPE_IQ2_XS>(ctx, args, stream);
|
// mul_mat_q_case<GGML_TYPE_IQ2_XS>(ctx, args, stream);
|
||||||
break;
|
// break;
|
||||||
case GGML_TYPE_IQ2_S:
|
// case GGML_TYPE_IQ2_S:
|
||||||
mul_mat_q_case<GGML_TYPE_IQ2_S>(ctx, args, stream);
|
// mul_mat_q_case<GGML_TYPE_IQ2_S>(ctx, args, stream);
|
||||||
break;
|
// break;
|
||||||
case GGML_TYPE_IQ3_XXS:
|
// case GGML_TYPE_IQ3_XXS:
|
||||||
mul_mat_q_case<GGML_TYPE_IQ3_XXS>(ctx, args, stream);
|
// mul_mat_q_case<GGML_TYPE_IQ3_XXS>(ctx, args, stream);
|
||||||
break;
|
// break;
|
||||||
case GGML_TYPE_IQ3_S:
|
// case GGML_TYPE_IQ3_S:
|
||||||
mul_mat_q_case<GGML_TYPE_IQ3_S>(ctx, args, stream);
|
// mul_mat_q_case<GGML_TYPE_IQ3_S>(ctx, args, stream);
|
||||||
break;
|
// break;
|
||||||
case GGML_TYPE_IQ1_S:
|
// case GGML_TYPE_IQ1_S:
|
||||||
mul_mat_q_case<GGML_TYPE_IQ1_S>(ctx, args, stream);
|
// mul_mat_q_case<GGML_TYPE_IQ1_S>(ctx, args, stream);
|
||||||
break;
|
// break;
|
||||||
case GGML_TYPE_IQ4_XS:
|
// case GGML_TYPE_IQ4_XS:
|
||||||
mul_mat_q_case<GGML_TYPE_IQ4_XS>(ctx, args, stream);
|
// mul_mat_q_case<GGML_TYPE_IQ4_XS>(ctx, args, stream);
|
||||||
break;
|
// break;
|
||||||
case GGML_TYPE_IQ4_NL:
|
// case GGML_TYPE_IQ4_NL:
|
||||||
mul_mat_q_case<GGML_TYPE_IQ4_NL>(ctx, args, stream);
|
// mul_mat_q_case<GGML_TYPE_IQ4_NL>(ctx, args, stream);
|
||||||
break;
|
// break;
|
||||||
default:
|
default:
|
||||||
GGML_ABORT("fatal error");
|
GGML_ABORT("fatal error");
|
||||||
break;
|
break;
|
||||||
|
|
|
@ -2906,24 +2906,24 @@ void mul_mat_q_case(ggml_backend_cuda_context & ctx, const mmq_args & args, cuda
|
||||||
#define DECL_MMQ_CASE(type) \
|
#define DECL_MMQ_CASE(type) \
|
||||||
template void mul_mat_q_case<type>(ggml_backend_cuda_context & ctx, const mmq_args & args, cudaStream_t stream) \
|
template void mul_mat_q_case<type>(ggml_backend_cuda_context & ctx, const mmq_args & args, cudaStream_t stream) \
|
||||||
|
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_Q4_0);
|
//extern DECL_MMQ_CASE(GGML_TYPE_Q4_0);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_Q4_1);
|
//extern DECL_MMQ_CASE(GGML_TYPE_Q4_1);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_Q5_0);
|
//extern DECL_MMQ_CASE(GGML_TYPE_Q5_0);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_Q5_1);
|
//extern DECL_MMQ_CASE(GGML_TYPE_Q5_1);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_Q8_0);
|
extern DECL_MMQ_CASE(GGML_TYPE_Q8_0);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_Q2_K);
|
//extern DECL_MMQ_CASE(GGML_TYPE_Q2_K);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_Q3_K);
|
//extern DECL_MMQ_CASE(GGML_TYPE_Q3_K);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_Q4_K);
|
extern DECL_MMQ_CASE(GGML_TYPE_Q4_K);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_Q5_K);
|
//extern DECL_MMQ_CASE(GGML_TYPE_Q5_K);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_Q6_K);
|
extern DECL_MMQ_CASE(GGML_TYPE_Q6_K);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_IQ2_XXS);
|
//extern DECL_MMQ_CASE(GGML_TYPE_IQ2_XXS);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_IQ2_XS);
|
//extern DECL_MMQ_CASE(GGML_TYPE_IQ2_XS);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_IQ2_S);
|
//extern DECL_MMQ_CASE(GGML_TYPE_IQ2_S);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_IQ3_XXS);
|
//extern DECL_MMQ_CASE(GGML_TYPE_IQ3_XXS);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_IQ3_S);
|
//extern DECL_MMQ_CASE(GGML_TYPE_IQ3_S);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_IQ1_S);
|
//extern DECL_MMQ_CASE(GGML_TYPE_IQ1_S);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_IQ4_NL);
|
//extern DECL_MMQ_CASE(GGML_TYPE_IQ4_NL);
|
||||||
extern DECL_MMQ_CASE(GGML_TYPE_IQ4_XS);
|
//extern DECL_MMQ_CASE(GGML_TYPE_IQ4_XS);
|
||||||
|
|
||||||
// -------------------------------------------------------------------------------------------------------------------------
|
// -------------------------------------------------------------------------------------------------------------------------
|
||||||
|
|
||||||
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q4_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q4_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q5_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q5_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q8_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_F16);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q4_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q5_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q5_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q8_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_F16);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q4_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q4_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q5_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q5_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q8_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_F16);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q4_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q4_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q5_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q5_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q8_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_F16);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q4_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q4_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q5_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q5_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q8_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_F16);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q4_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q4_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q5_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q5_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(256, GGML_TYPE_F16, GGML_TYPE_F16);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(64, GGML_TYPE_F16, GGML_TYPE_F16);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q4_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q4_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q5_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q5_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f16.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F16_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q8_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q4_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q4_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q5_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q5_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q8_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_F16);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q4_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q5_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q5_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q8_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_F16);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q4_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q4_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q5_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q5_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q8_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_F16);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q4_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q4_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q5_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q5_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q8_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_F16);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q4_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q4_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q5_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q5_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q8_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_F16);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q4_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q4_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q5_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q5_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(256, GGML_TYPE_F16, GGML_TYPE_F16);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(64, GGML_TYPE_F16, GGML_TYPE_F16);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q4_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q4_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q5_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q5_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../fattn-vec-f32.cuh"
|
|
||||||
|
|
||||||
DECL_FATTN_VEC_F32_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q8_0);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../mmq.cuh"
|
|
||||||
|
|
||||||
DECL_MMQ_CASE(GGML_TYPE_IQ1_S);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../mmq.cuh"
|
|
||||||
|
|
||||||
DECL_MMQ_CASE(GGML_TYPE_IQ2_S);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../mmq.cuh"
|
|
||||||
|
|
||||||
DECL_MMQ_CASE(GGML_TYPE_IQ2_XS);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../mmq.cuh"
|
|
||||||
|
|
||||||
DECL_MMQ_CASE(GGML_TYPE_IQ2_XXS);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../mmq.cuh"
|
|
||||||
|
|
||||||
DECL_MMQ_CASE(GGML_TYPE_IQ3_S);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../mmq.cuh"
|
|
||||||
|
|
||||||
DECL_MMQ_CASE(GGML_TYPE_IQ3_XXS);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../mmq.cuh"
|
|
||||||
|
|
||||||
DECL_MMQ_CASE(GGML_TYPE_IQ4_NL);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../mmq.cuh"
|
|
||||||
|
|
||||||
DECL_MMQ_CASE(GGML_TYPE_IQ4_XS);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../mmq.cuh"
|
|
||||||
|
|
||||||
DECL_MMQ_CASE(GGML_TYPE_Q2_K);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../mmq.cuh"
|
|
||||||
|
|
||||||
DECL_MMQ_CASE(GGML_TYPE_Q3_K);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../mmq.cuh"
|
|
||||||
|
|
||||||
DECL_MMQ_CASE(GGML_TYPE_Q4_1);
|
|
|
@ -1,5 +0,0 @@
|
||||||
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
||||||
|
|
||||||
#include "../mmq.cuh"
|
|
||||||
|
|
||||||
DECL_MMQ_CASE(GGML_TYPE_Q5_0);
|
|
Some files were not shown because too many files have changed in this diff Show more
Loading…
Add table
Add a link
Reference in a new issue