ggml : sync ggml (add GPT-NeoX RoPE implementation)
This commit is contained in:
parent
9ff334f3c9
commit
12b5900dbc
3 changed files with 49 additions and 17 deletions
3
ggml.h
3
ggml.h
|
@ -630,7 +630,8 @@ struct ggml_tensor * ggml_soft_max(
|
|||
|
||||
// rotary position embedding
|
||||
// in-place, returns view(a)
|
||||
// if mode == 1, skip n_past elements
|
||||
// if (mode & 1) != 0, skip n_past elements
|
||||
// if (mode & 2) != 0, GPT-NeoX style
|
||||
// TODO: avoid creating a new tensor every time
|
||||
struct ggml_tensor * ggml_rope(
|
||||
struct ggml_context * ctx,
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue