Speed up the AVX-512 implementation of ggml_vec_dot_q4_0() (#933)
This commit is contained in:
parent
47f61aaa5f
commit
f266259ad9
4 changed files with 235 additions and 44 deletions
2
ggml.h
2
ggml.h
|
@@ -808,6 +808,8 @@ size_t ggml_quantize_q4_1(const float * src, void * dst, int n, int k, int64_t *
|
|||
int ggml_cpu_has_avx(void);
|
||||
int ggml_cpu_has_avx2(void);
|
||||
int ggml_cpu_has_avx512(void);
|
||||
int ggml_cpu_has_avx512_vbmi(void);
|
||||
int ggml_cpu_has_avx512_vnni(void);
|
||||
int ggml_cpu_has_fma(void);
|
||||
int ggml_cpu_has_neon(void);
|
||||
int ggml_cpu_has_arm_fma(void);
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue