llamafile : disable sgemm for batch-size 1 (#9330)
This commit is contained in:
parent
1b9ae5189c
commit
e536426ded
1 changed file with 4 additions and 0 deletions
|
@@ -1006,6 +1006,10 @@ bool llamafile_sgemm(int64_t m, int64_t n, int64_t k, const void *A, int64_t lda
|
||||||
assert(nth > 0);
|
assert(nth > 0);
|
||||||
assert(ith < nth);
|
assert(ith < nth);
|
||||||
|
|
||||||
|
// only enable sgemm for prompt processing
|
||||||
|
if (n < 2)
|
||||||
|
return false;
|
||||||
|
|
||||||
if (Ctype != GGML_TYPE_F32)
|
if (Ctype != GGML_TYPE_F32)
|
||||||
return false;
|
return false;
|
||||||
|
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue