backends : add dev messages to support rope freq. factors

2024-05-16 13:23:30 +03:00 · 2024-05-16 13:23:30 +03:00 · 352c3859a7
commit 352c3859a7
parent 471d8170bc
3 changed files with 11 additions and 0 deletions
--- a/ggml-kompute.cpp
+++ b/ggml-kompute.cpp
@@ -1677,6 +1677,10 @@ static void ggml_vk_graph_compute(struct ggml_kompute_context * ctx, struct ggml
                    } break;
                case GGML_OP_ROPE:
                    {
 #pragma message("TODO: implement phi3 frequency factors support");
 #pragma message("      https://github.com/ggerganov/llama.cpp/pull/7225");
                        GGML_ASSERT(dst->src[2] == nullptr && "phi3 frequency factors not implemented yet");
                        GGML_ASSERT(ne10 == ne02);
                        GGML_ASSERT(src0t == dstt);
                        // const int n_past = ((int32_t *) dst->op_params)[0];
--- a/ggml-sycl.cpp
+++ b/ggml-sycl.cpp
@@ -14454,6 +14454,9 @@ inline void ggml_sycl_op_rope(const ggml_tensor *src0, const ggml_tensor *src1,
                              ggml_tensor *dst, const float *src0_dd,
                              const float *src1_dd, float *dst_dd,
                              const dpct::queue_ptr &main_stream) {
 #pragma message("TODO: implement phi3 frequency factors support");
 #pragma message("      https://github.com/ggerganov/llama.cpp/pull/7225");
    GGML_ASSERT(dst->src[2] == nullptr && "phi3 frequency factors not implemented yet");
    GGML_ASSERT(src0->type == GGML_TYPE_F32 || src0->type == GGML_TYPE_F16);
    GGML_ASSERT( dst->type == GGML_TYPE_F32 ||  dst->type == GGML_TYPE_F16);
--- a/ggml-vulkan.cpp
+++ b/ggml-vulkan.cpp
@@ -4238,6 +4238,10 @@ static void ggml_vk_soft_max(ggml_backend_vk_context * ctx, vk_context * subctx,
 }
 static void ggml_vk_rope(ggml_backend_vk_context * ctx, vk_context * subctx, const ggml_tensor * src0, const ggml_tensor * src1, ggml_tensor * dst) {
 #pragma message("TODO: implement phi3 frequency factors support");
 #pragma message("      https://github.com/ggerganov/llama.cpp/pull/7225");
    GGML_ASSERT(dst->src[2] == nullptr && "phi3 frequency factors not implemented yet");
    const int n_dims        = ((int32_t *) dst->op_params)[1];
    const int mode          = ((int32_t *) dst->op_params)[2];
    // const int n_ctx         = ((int32_t *) dst->op_params)[3];