mirror of
https://github.com/jart/cosmopolitan.git
synced 2025-05-29 16:52:28 +00:00
Speed up fmaf() on x86
This commit is contained in:
parent
640668931d
commit
40b7da8422
1 changed files with 10 additions and 0 deletions
|
@ -100,6 +100,16 @@ float fmaf(float x, float y, float z)
|
||||||
|
|
||||||
#else
|
#else
|
||||||
|
|
||||||
|
#ifdef __x86_64__
|
||||||
|
if (X86_HAVE(FMA)) {
|
||||||
|
asm("vfmadd132ss\t%1,%2,%0" : "+x"(x) : "x"(y), "x"(z));
|
||||||
|
return x;
|
||||||
|
} else if (X86_HAVE(FMA4)) {
|
||||||
|
asm("vfmaddss\t%3,%2,%1,%0" : "=x"(x) : "x"(x), "x"(y), "x"(z));
|
||||||
|
return x;
|
||||||
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
/* A double has more than twice as much precision than a float,
|
/* A double has more than twice as much precision than a float,
|
||||||
so direct double-precision arithmetic suffices, except where
|
so direct double-precision arithmetic suffices, except where
|
||||||
double rounding occurs. */
|
double rounding occurs. */
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue