ggml : fix num dimensions in ggml_flash_attn_ext
This commit is contained in:
parent
a39217d428
commit
cb76d747d1
1 changed file with 1 addition and 1 deletion
2
ggml.c
2
ggml.c
|
@@ -6321,7 +6321,7 @@ struct ggml_tensor * ggml_flash_attn_ext(
|
||||||
|
|
||||||
// permute(0, 2, 1, 3)
|
// permute(0, 2, 1, 3)
|
||||||
int64_t ne[4] = { q->ne[0], q->ne[2], q->ne[1], q->ne[3] };
|
int64_t ne[4] = { q->ne[0], q->ne[2], q->ne[1], q->ne[3] };
|
||||||
struct ggml_tensor * result = ggml_new_tensor(ctx, GGML_TYPE_F32, GGML_MAX_DIMS, ne);
|
struct ggml_tensor * result = ggml_new_tensor(ctx, GGML_TYPE_F32, 4, ne);
|
||||||
|
|
||||||
float params[] = { scale };
|
float params[] = { scale };
|
||||||
ggml_set_op_params(result, params, sizeof(params));
|
ggml_set_op_params(result, params, sizeof(params));
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue