From 156b9b676a803d45454e450843e42d7439ec5262 Mon Sep 17 00:00:00 2001 From: Julia Longtin Date: Fri, 10 May 2024 16:28:53 +0000 Subject: [PATCH] remove useless prefetches. --- ggml-phi-knc.c | 12 +----------- 1 file changed, 1 insertion(+), 11 deletions(-) diff --git a/ggml-phi-knc.c b/ggml-phi-knc.c index 9d7a34199..00bc860f1 100644 --- a/ggml-phi-knc.c +++ b/ggml-phi-knc.c @@ -47,22 +47,12 @@ inline static void GGML_F32x16_VEC_FMA(const float32x16_t *mvec1, const float32x "vprefetch1\t64(%[VEC2])\n\t" "vprefetch0\t128(%[VEC2])\n\t" "vprefetch1\t192(%[VEC2])\n\t" - "mov\t%[ITER],%%r8\n\t" // How many vector sized chunks we are responsible for. + "mov\t%[ITER],%%r8\n\t" // How many vector sized chunks are we responsible for? "mov\t%[VEC1],%%r10\n\t" // Where do we start work in mvec1? "mov\t%[VEC2],%%r12\n\t" // Where do we start work in mvec2? "cmp\t$0,%[CLR]\n\t" // Should we clear the sum before we start? "jz\t4f\n\t" "vbroadcastss\t%[Z]%{uint8%},\t%%zmm0\n\t" // if so, use an upscaling operator to do it. - "vprefetchnta\t(%%r10)\n\t" - "vprefetchnta\t(%%r12)\n\t" - "vprefetch1\t128(%%r10)\n\t" - "vprefetch1\t128(%%r12)\n\t" - "vprefetch1\t256(%%r10)\n\t" - "vprefetch1\t256(%%r12)\n\t" - "vprefetch1\t384(%%r10)\n\t" - "vprefetch1\t384(%%r12)\n\t" - "vprefetch1\t512(%%r10)\n\t" - "vprefetch1\t512(%%r12)\n\t" "jmp\t1f\n\t" "4:\n\t" "vprefetch0\t(%[RES])\n\t"