cuda : implement soft_max_ext
This commit is contained in:
parent
e89597c062
commit
88519fbf97
3 changed files with 28 additions and 14 deletions
6
ggml.c
6
ggml.c
|
@@ -4829,6 +4829,12 @@ static struct ggml_tensor * ggml_soft_max_impl(
|
|||
struct ggml_tensor * mask,
|
||||
float scale,
|
||||
bool inplace) {
|
||||
if (mask) {
|
||||
GGML_ASSERT(mask->ne[2] == 1);
|
||||
GGML_ASSERT(mask->ne[3] == 1);
|
||||
GGML_ASSERT(ggml_can_repeat_rows(mask, a));
|
||||
}
|
||||
|
||||
bool is_node = false;
|
||||
|
||||
if (a->grad) {
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue