ggml : revert FA K/Q names

This commit is contained in:
Georgi Gerganov 2024-07-11 12:57:48 +03:00
parent 2a3cd5de2c
commit f07f1b8afa
No known key found for this signature in database
GPG key ID: BF970631944C16B7

View file

@@ -15198,8 +15198,8 @@ static void ggml_compute_forward_flash_attn_ext_f16(
const float m0 = powf(2.0f, -(max_bias ) / n_head_log2);
const float m1 = powf(2.0f, -(max_bias / 2.0f) / n_head_log2);
-enum ggml_type const kq_vec_dot_type = type_traits[k->type].vec_dot_type;
-ggml_from_float_t const kq_from_float = type_traits[kq_vec_dot_type].from_float;
+enum ggml_type const k_vec_dot_type = type_traits[k->type].vec_dot_type;
+ggml_from_float_t const q_to_vec_dot = type_traits[k_vec_dot_type].from_float;
ggml_vec_dot_t const kq_vec_dot = type_traits[k->type].vec_dot;
ggml_to_float_t const v_to_float = type_traits[v->type].to_float;
@@ -15238,7 +15238,7 @@ static void ggml_compute_forward_flash_attn_ext_f16(
const int iv2 = iq2 / rv2;
const float * pq = (const float *) ((char *) q->data + (iq1*nbq1 + iq2*nbq2 + iq3*nbq3));
-kq_from_float(pq, Q_q, D);
+q_to_vec_dot(pq, Q_q, D);
// online softmax / attention
// loop over n_kv and n_head_kv