mirror of
https://github.com/jart/cosmopolitan.git
synced 2025-01-31 03:27:39 +00:00
100 lines
3.6 KiB
C
100 lines
3.6 KiB
C
#ifndef _IMMINTRIN_H_INCLUDED
|
|
#error "Never use <avx512cdintrin.h> directly; include <immintrin.h> instead."
|
|
#endif
|
|
|
|
#ifndef _AVX512CDINTRIN_H_INCLUDED
|
|
#define _AVX512CDINTRIN_H_INCLUDED
|
|
|
|
#ifndef __AVX512CD__
|
|
#pragma GCC push_options
|
|
#pragma GCC target("avx512cd")
|
|
#define __DISABLE_AVX512CD__
|
|
#endif /* __AVX512CD__ */
|
|
|
|
typedef long long __v8di __attribute__((__vector_size__(64)));
|
|
typedef int __v16si __attribute__((__vector_size__(64)));
|
|
|
|
typedef long long __m512i __attribute__((__vector_size__(64), __may_alias__));
|
|
typedef double __m512d __attribute__((__vector_size__(64), __may_alias__));
|
|
|
|
typedef unsigned char __mmask8;
|
|
typedef unsigned short __mmask16;
|
|
|
|
__funline __m512i _mm512_conflict_epi32(__m512i __A) {
|
|
return (__m512i)__builtin_ia32_vpconflictsi_512_mask(
|
|
(__v16si)__A, (__v16si)_mm512_setzero_si512(), (__mmask16)-1);
|
|
}
|
|
|
|
__funline __m512i _mm512_mask_conflict_epi32(__m512i __W, __mmask16 __U,
|
|
__m512i __A) {
|
|
return (__m512i)__builtin_ia32_vpconflictsi_512_mask(
|
|
(__v16si)__A, (__v16si)__W, (__mmask16)__U);
|
|
}
|
|
|
|
__funline __m512i _mm512_maskz_conflict_epi32(__mmask16 __U, __m512i __A) {
|
|
return (__m512i)__builtin_ia32_vpconflictsi_512_mask(
|
|
(__v16si)__A, (__v16si)_mm512_setzero_si512(), (__mmask16)__U);
|
|
}
|
|
|
|
__funline __m512i _mm512_conflict_epi64(__m512i __A) {
|
|
return (__m512i)__builtin_ia32_vpconflictdi_512_mask(
|
|
(__v8di)__A, (__v8di)_mm512_setzero_si512(), (__mmask8)-1);
|
|
}
|
|
|
|
__funline __m512i _mm512_mask_conflict_epi64(__m512i __W, __mmask8 __U,
|
|
__m512i __A) {
|
|
return (__m512i)__builtin_ia32_vpconflictdi_512_mask((__v8di)__A, (__v8di)__W,
|
|
(__mmask8)__U);
|
|
}
|
|
|
|
__funline __m512i _mm512_maskz_conflict_epi64(__mmask8 __U, __m512i __A) {
|
|
return (__m512i)__builtin_ia32_vpconflictdi_512_mask(
|
|
(__v8di)__A, (__v8di)_mm512_setzero_si512(), (__mmask8)__U);
|
|
}
|
|
|
|
__funline __m512i _mm512_lzcnt_epi64(__m512i __A) {
|
|
return (__m512i)__builtin_ia32_vplzcntq_512_mask(
|
|
(__v8di)__A, (__v8di)_mm512_setzero_si512(), (__mmask8)-1);
|
|
}
|
|
|
|
__funline __m512i _mm512_mask_lzcnt_epi64(__m512i __W, __mmask8 __U,
|
|
__m512i __A) {
|
|
return (__m512i)__builtin_ia32_vplzcntq_512_mask((__v8di)__A, (__v8di)__W,
|
|
(__mmask8)__U);
|
|
}
|
|
|
|
__funline __m512i _mm512_maskz_lzcnt_epi64(__mmask8 __U, __m512i __A) {
|
|
return (__m512i)__builtin_ia32_vplzcntq_512_mask(
|
|
(__v8di)__A, (__v8di)_mm512_setzero_si512(), (__mmask8)__U);
|
|
}
|
|
|
|
__funline __m512i _mm512_lzcnt_epi32(__m512i __A) {
|
|
return (__m512i)__builtin_ia32_vplzcntd_512_mask(
|
|
(__v16si)__A, (__v16si)_mm512_setzero_si512(), (__mmask16)-1);
|
|
}
|
|
|
|
__funline __m512i _mm512_mask_lzcnt_epi32(__m512i __W, __mmask16 __U,
|
|
__m512i __A) {
|
|
return (__m512i)__builtin_ia32_vplzcntd_512_mask((__v16si)__A, (__v16si)__W,
|
|
(__mmask16)__U);
|
|
}
|
|
|
|
__funline __m512i _mm512_maskz_lzcnt_epi32(__mmask16 __U, __m512i __A) {
|
|
return (__m512i)__builtin_ia32_vplzcntd_512_mask(
|
|
(__v16si)__A, (__v16si)_mm512_setzero_si512(), (__mmask16)__U);
|
|
}
|
|
|
|
__funline __m512i _mm512_broadcastmb_epi64(__mmask8 __A) {
|
|
return (__m512i)__builtin_ia32_broadcastmb512(__A);
|
|
}
|
|
|
|
__funline __m512i _mm512_broadcastmw_epi32(__mmask16 __A) {
|
|
return (__m512i)__builtin_ia32_broadcastmw512(__A);
|
|
}
|
|
|
|
#ifdef __DISABLE_AVX512CD__
|
|
#undef __DISABLE_AVX512CD__
|
|
#pragma GCC pop_options
|
|
#endif /* __DISABLE_AVX512CD__ */
|
|
|
|
#endif /* _AVX512CDINTRIN_H_INCLUDED */
|