Remove useless prefetches.
This commit is contained in:
parent
d8d574c56f
commit
204bc1ffdc
1 changed file with 1 addition and 11 deletions
|
@@ -47,22 +47,12 @@ inline static void GGML_F32x16_VEC_FMA(const float32x16_t *mvec1, const float32x
|
|||
"vprefetch1\t64(%[VEC2])\n\t"
|
||||
"vprefetch0\t128(%[VEC2])\n\t"
|
||||
"vprefetch1\t192(%[VEC2])\n\t"
|
||||
"mov\t%[ITER],%%r8\n\t" // How many vector sized chunks we are responsible for.
|
||||
"mov\t%[ITER],%%r8\n\t" // How many vector sized chunks are we responsible for?
|
||||
"mov\t%[VEC1],%%r10\n\t" // Where do we start work in mvec1?
|
||||
"mov\t%[VEC2],%%r12\n\t" // Where do we start work in mvec2?
|
||||
"cmp\t$0,%[CLR]\n\t" // Should we clear the sum before we start?
|
||||
"jz\t4f\n\t"
|
||||
"vbroadcastss\t%[Z]%{uint8%},\t%%zmm0\n\t" // if so, use an upscaling operator to do it.
|
||||
"vprefetchnta\t(%%r10)\n\t"
|
||||
"vprefetchnta\t(%%r12)\n\t"
|
||||
"vprefetch1\t128(%%r10)\n\t"
|
||||
"vprefetch1\t128(%%r12)\n\t"
|
||||
"vprefetch1\t256(%%r10)\n\t"
|
||||
"vprefetch1\t256(%%r12)\n\t"
|
||||
"vprefetch1\t384(%%r10)\n\t"
|
||||
"vprefetch1\t384(%%r12)\n\t"
|
||||
"vprefetch1\t512(%%r10)\n\t"
|
||||
"vprefetch1\t512(%%r12)\n\t"
|
||||
"jmp\t1f\n\t"
|
||||
"4:\n\t"
|
||||
"vprefetch0\t(%[RES])\n\t"
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue