rebase to new embed
This commit is contained in:
parent
805ae529c4
commit
97936078b7
3 changed files with 18 additions and 20 deletions
1
llama.h
1
llama.h
|
@@ -262,6 +262,7 @@ extern "C" {
|
|||
bool logits_all; // the llama_decode() call computes all logits, not just the last one (DEPRECATED - set llama_batch.logits instead)
|
||||
bool embeddings; // if true, extract embeddings (together with logits)
|
||||
bool offload_kqv; // whether to offload the KQV ops (including the KV cache) to GPU
|
||||
bool causal_attn; // whether to use causal attention
|
||||
|
||||
// Abort callback
|
||||
// if it returns true, execution of llama_decode() will be aborted
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue