mirror of
https://github.com/jart/cosmopolitan.git
synced 2025-01-31 11:37:35 +00:00
5660ec4741
This release is an atomic upgrade to GCC 14.1.0 with C23 and C++23
101 lines
3.3 KiB
C
101 lines
3.3 KiB
C
#if defined(__x86_64__) && !(__ASSEMBLER__ + __LINKER__ + 0)
|
|
#ifndef _IMMINTRIN_H_INCLUDED
|
|
#error "Never use <avxneconvertintrin.h> directly; include <immintrin.h> instead."
|
|
#endif
|
|
#ifndef _AVXNECONVERTINTRIN_H_INCLUDED
|
|
#define _AVXNECONVERTINTRIN_H_INCLUDED
|
|
#ifndef __AVXNECONVERT__
|
|
#pragma GCC push_options
|
|
#pragma GCC target ("avxneconvert")
|
|
#define __DISABLE_AVXNECONVERT__
|
|
#endif
|
|
extern __inline __m128
|
|
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
_mm_bcstnebf16_ps (const void *__P)
|
|
{
|
|
return (__m128) __builtin_ia32_vbcstnebf162ps128 ((const __bf16 *) __P);
|
|
}
|
|
extern __inline __m256
|
|
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
_mm256_bcstnebf16_ps (const void *__P)
|
|
{
|
|
return (__m256) __builtin_ia32_vbcstnebf162ps256 ((const __bf16 *) __P);
|
|
}
|
|
extern __inline __m128
|
|
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
_mm_bcstnesh_ps (const void *__P)
|
|
{
|
|
return (__m128) __builtin_ia32_vbcstnesh2ps128 ((const _Float16 *) __P);
|
|
}
|
|
extern __inline __m256
|
|
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
_mm256_bcstnesh_ps (const void *__P)
|
|
{
|
|
return (__m256) __builtin_ia32_vbcstnesh2ps256 ((const _Float16 *) __P);
|
|
}
|
|
extern __inline __m128
|
|
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
_mm_cvtneebf16_ps (const __m128bh *__A)
|
|
{
|
|
return (__m128) __builtin_ia32_vcvtneebf162ps128 ((const __v8bf *) __A);
|
|
}
|
|
extern __inline __m256
|
|
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
_mm256_cvtneebf16_ps (const __m256bh *__A)
|
|
{
|
|
return (__m256) __builtin_ia32_vcvtneebf162ps256 ((const __v16bf *) __A);
|
|
}
|
|
extern __inline __m128
|
|
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
_mm_cvtneeph_ps (const __m128h *__A)
|
|
{
|
|
return (__m128) __builtin_ia32_vcvtneeph2ps128 ((const __v8hf *) __A);
|
|
}
|
|
extern __inline __m256
|
|
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
_mm256_cvtneeph_ps (const __m256h *__A)
|
|
{
|
|
return (__m256) __builtin_ia32_vcvtneeph2ps256 ((const __v16hf *) __A);
|
|
}
|
|
extern __inline __m128
|
|
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
_mm_cvtneobf16_ps (const __m128bh *__A)
|
|
{
|
|
return (__m128) __builtin_ia32_vcvtneobf162ps128 ((const __v8bf *) __A);
|
|
}
|
|
extern __inline __m256
|
|
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
_mm256_cvtneobf16_ps (const __m256bh *__A)
|
|
{
|
|
return (__m256) __builtin_ia32_vcvtneobf162ps256 ((const __v16bf *) __A);
|
|
}
|
|
extern __inline __m128
|
|
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
_mm_cvtneoph_ps (const __m128h *__A)
|
|
{
|
|
return (__m128) __builtin_ia32_vcvtneoph2ps128 ((const __v8hf *) __A);
|
|
}
|
|
extern __inline __m256
|
|
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
_mm256_cvtneoph_ps (const __m256h *__A)
|
|
{
|
|
return (__m256) __builtin_ia32_vcvtneoph2ps256 ((const __v16hf *) __A);
|
|
}
|
|
extern __inline __m128bh
|
|
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
_mm_cvtneps_avx_pbh (__m128 __A)
|
|
{
|
|
return (__m128bh) __builtin_ia32_cvtneps2bf16_v4sf (__A);
|
|
}
|
|
extern __inline __m128bh
|
|
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
_mm256_cvtneps_avx_pbh (__m256 __A)
|
|
{
|
|
return (__m128bh) __builtin_ia32_cvtneps2bf16_v8sf (__A);
|
|
}
|
|
#ifdef __DISABLE_AVXNECONVERT__
|
|
#undef __DISABLE_AVXNECONVERT__
|
|
#pragma GCC pop_options
|
|
#endif
|
|
#endif
|
|
#endif
|