YaRN : correction to GPT-NeoX implementation
ggml-ci
This commit is contained in:
parent
a6fc554e26
commit
f824902623
3 changed files with 7 additions and 12 deletions
6
ggml.c
6
ggml.c
|
@ -11084,8 +11084,7 @@ static void ggml_compute_forward_rope_f32(
|
|||
theta_base *= freq_scale;
|
||||
for (int64_t ib = 0; ib < ne0/n_dims; ++ib) {
|
||||
for (int64_t ic = 0; ic < n_dims; ic += 2) {
|
||||
// simplified from `(ib * n_dims + ic) * inv_ndims`
|
||||
float cur_rot = inv_ndims * ic - ib;
|
||||
int64_t cur_rot = ib * n_dims + ic;
|
||||
|
||||
float cos_theta, sin_theta;
|
||||
rope_yarn(
|
||||
|
@ -11237,8 +11236,7 @@ static void ggml_compute_forward_rope_f16(
|
|||
theta_base *= freq_scale;
|
||||
for (int64_t ib = 0; ib < ne0/n_dims; ++ib) {
|
||||
for (int64_t ic = 0; ic < n_dims; ic += 2) {
|
||||
// simplified from `(ib * n_dims + ic) * inv_ndims`
|
||||
float cur_rot = inv_ndims * ic - ib;
|
||||
int64_t cur_rot = ib * n_dims + ic;
|
||||
|
||||
float cos_theta, sin_theta;
|
||||
rope_yarn(
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue