From ddac1ef6813132eb9e817460ef389bf7fe3c12a3 Mon Sep 17 00:00:00 2001 From: Georgi Gerganov Date: Sun, 2 Jun 2024 19:58:50 +0300 Subject: [PATCH] cuda : fix array size + indents ggml-ci --- ggml-cuda/rope.cu | 2 +- ggml.c | 4 ++-- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/ggml-cuda/rope.cu b/ggml-cuda/rope.cu index 919884834..596fb7c13 100644 --- a/ggml-cuda/rope.cu +++ b/ggml-cuda/rope.cu @@ -1,7 +1,7 @@ #include "rope.cuh" struct rope_corr_dims { - float v[4]; // TODO: is there any reson for this to be 4 instead of 2? + float v[2]; }; static __device__ float rope_yarn_ramp(const float low, const float high, const int i0) { diff --git a/ggml.c b/ggml.c index 0ebe8ae85..b0984ae7a 100644 --- a/ggml.c +++ b/ggml.c @@ -14371,7 +14371,7 @@ static void ggml_compute_forward_rope_f32( const float sin_theta = cache[i0 + 1]; const float * const src = (float *)((char *) src0->data + i3*nb03 + i2*nb02 + i1*nb01 + i0*nb00); - float * dst_data = (float *)((char *) dst->data + i3*nb3 + i2*nb2 + i1*nb1 + i0*nb0); + float * dst_data = (float *)((char *) dst->data + i3*nb3 + i2*nb2 + i1*nb1 + i0*nb0); const float x0 = src[0]; const float x1 = src[1]; @@ -14500,7 +14500,7 @@ static void ggml_compute_forward_rope_f16( const float sin_theta = cache[i0 + 1]; const ggml_fp16_t * const src = (ggml_fp16_t *)((char *) src0->data + i3*nb03 + i2*nb02 + i1*nb01 + i0*nb00); - ggml_fp16_t * dst_data = (ggml_fp16_t *)((char *) dst->data + i3*nb3 + i2*nb2 + i1*nb1 + i0*nb0); + ggml_fp16_t * dst_data = (ggml_fp16_t *)((char *) dst->data + i3*nb3 + i2*nb2 + i1*nb1 + i0*nb0); const float x0 = GGML_FP16_TO_FP32(src[0]); const float x1 = GGML_FP16_TO_FP32(src[1]);