Merge branch 'master' into jon/tall-and-skinny-matmul
This commit is contained in:
commit
b208c252a2
3 changed files with 505 additions and 358 deletions
2
Makefile
2
Makefile
|
@ -133,7 +133,7 @@ $(info I CC: $(CCV))
|
||||||
$(info I CXX: $(CXXV))
|
$(info I CXX: $(CXXV))
|
||||||
$(info )
|
$(info )
|
||||||
|
|
||||||
default: main quantize perplexity embedding
|
default: main quantize quantize-stats perplexity embedding
|
||||||
|
|
||||||
#
|
#
|
||||||
# Build library
|
# Build library
|
||||||
|
|
2
ggml.h
2
ggml.h
|
@ -204,6 +204,7 @@ enum ggml_type {
|
||||||
GGML_TYPE_F16 = 1,
|
GGML_TYPE_F16 = 1,
|
||||||
GGML_TYPE_Q4_0 = 2,
|
GGML_TYPE_Q4_0 = 2,
|
||||||
GGML_TYPE_Q4_1 = 3,
|
GGML_TYPE_Q4_1 = 3,
|
||||||
|
GGML_TYPE_Q8_0 = 4,
|
||||||
GGML_TYPE_I8,
|
GGML_TYPE_I8,
|
||||||
GGML_TYPE_I16,
|
GGML_TYPE_I16,
|
||||||
GGML_TYPE_I32,
|
GGML_TYPE_I32,
|
||||||
|
@ -836,6 +837,7 @@ typedef struct {
|
||||||
dequantize_row_q_t dequantize_row_q;
|
dequantize_row_q_t dequantize_row_q;
|
||||||
quantize_row_q_t quantize_row_q;
|
quantize_row_q_t quantize_row_q;
|
||||||
quantize_row_q_t quantize_row_q_reference;
|
quantize_row_q_t quantize_row_q_reference;
|
||||||
|
quantize_row_q_t quantize_row_q_dot;
|
||||||
vec_dot_q_t vec_dot_q;
|
vec_dot_q_t vec_dot_q;
|
||||||
} quantize_fns_t;
|
} quantize_fns_t;
|
||||||
|
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue