Home
last modified time | relevance | path

Searched refs:__m512i (Results 1 – 21 of 21) sorted by relevance

/freebsd/contrib/llvm-project/clang/lib/Headers/
H A Davx10_2_512niintrin.h50 ((__m512i)__builtin_ia32_mpsadbw512((__v64qi)(__m512i)(A), \
51 (__v64qi)(__m512i)(B), (int)(imm)))
54 ((__m512i)__builtin_ia32_selectw_512( \
56 (__v32hi)(__m512i)(W)))
59 ((__m512i)__builtin_ia32_selectw_512( \
64 static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_dpbssd_epi32(__m512i __W, in _mm512_dpbssd_epi32()
65 __m512i __A, in _mm512_dpbssd_epi32()
66 __m512i __B) { in _mm512_dpbssd_epi32()
67 return (__m512i)__builtin_ia32_vpdpbssd512((__v16si)__W, (__v16si)__A, in _mm512_dpbssd_epi32()
71 static __inline__ __m512i __DEFAULT_FN_ATTRS
[all …]
H A Davx10_2_512satcvtdsintrin.h96 static __inline__ __m512i __DEFAULT_FN_ATTRS
98 return ((__m512i)__builtin_ia32_vcvttpd2qqs512_round_mask( in _mm512_cvtts_pd_epi64()
102 static __inline__ __m512i __DEFAULT_FN_ATTRS
103 _mm512_mask_cvtts_pd_epi64(__m512i __W, __mmask8 __U, __m512d __A) { in _mm512_mask_cvtts_pd_epi64()
104 return ((__m512i)__builtin_ia32_vcvttpd2qqs512_round_mask( in _mm512_mask_cvtts_pd_epi64()
107 static __inline__ __m512i __DEFAULT_FN_ATTRS
109 return ((__m512i)__builtin_ia32_vcvttpd2qqs512_round_mask( in _mm512_maskz_cvtts_pd_epi64()
115 ((__m512i)__builtin_ia32_vcvttpd2qqs512_round_mask( \
120 ((__m512i)__builtin_ia32_vcvttpd2qqs512_round_mask( \
121 (__v8df)(__m512d)(__A), (__v8di)(__m512i)(__W), (__mmask8)(__U), \
[all …]
H A Davx10_2_512satcvtintrin.h18 ((__m512i)__builtin_ia32_vcvtbf162ibs512((__v32bf)(__m512bh)(A)))
21 ((__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
23 (__v32hi)(__m512i)(W)))
26 ((__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
31 ((__m512i)__builtin_ia32_vcvtbf162iubs512((__v32bf)(__m512bh)(A)))
34 ((__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
36 (__v32hi)(__m512i)(W)))
39 ((__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
44 ((__m512i)__builtin_ia32_vcvttbf162ibs512((__v32bf)(__m512bh)(A)))
47 ((__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
[all …]
H A Davx512bitalgintrin.h23 static __inline__ __m512i __DEFAULT_FN_ATTRS
24 _mm512_popcnt_epi16(__m512i __A) in _mm512_popcnt_epi16()
26 return (__m512i)__builtin_elementwise_popcount((__v32hu)__A); in _mm512_popcnt_epi16()
29 static __inline__ __m512i __DEFAULT_FN_ATTRS
30 _mm512_mask_popcnt_epi16(__m512i __A, __mmask32 __U, __m512i __B) in _mm512_mask_popcnt_epi16()
32 return (__m512i) __builtin_ia32_selectw_512((__mmask32) __U, in _mm512_mask_popcnt_epi16()
37 static __inline__ __m512i __DEFAULT_FN_ATTRS
38 _mm512_maskz_popcnt_epi16(__mmask32 __U, __m512i __B) in _mm512_maskz_popcnt_epi16()
40 return _mm512_mask_popcnt_epi16((__m512i) _mm512_setzero_si512(), in _mm512_maskz_popcnt_epi16()
45 static __inline__ __m512i __DEFAULT_FN_ATTRS
[all …]
H A Dmovrs_avx10_2_512intrin.h23 static __inline__ __m512i __DEFAULT_FN_ATTRS512
25 return (__m512i)__builtin_ia32_vmovrsb512((const __v64qi *)(__A)); in _mm512_loadrs_epi8()
28 static __inline__ __m512i __DEFAULT_FN_ATTRS512
29 _mm512_mask_loadrs_epi8(__m512i __W, __mmask64 __U, void const *__A) { in _mm512_mask_loadrs_epi8()
30 return (__m512i)__builtin_ia32_selectb_512( in _mm512_mask_loadrs_epi8()
34 static __inline__ __m512i __DEFAULT_FN_ATTRS512
36 return (__m512i)__builtin_ia32_selectb_512((__mmask64)__U, in _mm512_maskz_loadrs_epi8()
41 static __inline__ __m512i __DEFAULT_FN_ATTRS512
43 return (__m512i)__builtin_ia32_vmovrsd512((const __v16si *)(__A)); in _mm512_loadrs_epi32()
46 static __inline__ __m512i __DEFAULT_FN_ATTRS512
[all …]
H A Davx512fintrin.h35 typedef long long __m512i __attribute__((__vector_size__(64), __aligned__(64))); typedef
190 static __inline __m512i __DEFAULT_FN_ATTRS512_CONSTEXPR
192 return __extension__(__m512i)(__v8di){0, 0, 0, 0, 0, 0, 0, 0}; in _mm512_setzero_si512()
215 static __inline__ __m512i __DEFAULT_FN_ATTRS512
218 return (__m512i)__builtin_ia32_undef512(); in _mm512_undefined_epi32()
221 static __inline__ __m512i __DEFAULT_FN_ATTRS512
224 return (__m512i)__builtin_shufflevector((__v4si) __A, (__v4si) __A, in _mm512_broadcastd_epi32()
228 static __inline__ __m512i __DEFAULT_FN_ATTRS512
229 _mm512_mask_broadcastd_epi32 (__m512i __O, __mmask16 __M, __m128i __A) in _mm512_mask_broadcastd_epi32()
231 return (__m512i)__builtin_ia32_selectd_512(__M, in _mm512_mask_broadcastd_epi32()
[all …]
H A Davx512vpopcntdqintrin.h30 static __inline__ __m512i __DEFAULT_FN_ATTRS_CONSTEXPR
31 _mm512_popcnt_epi64(__m512i __A) { in _mm512_popcnt_epi64()
32 return (__m512i)__builtin_elementwise_popcount((__v8du)__A); in _mm512_popcnt_epi64()
35 static __inline__ __m512i __DEFAULT_FN_ATTRS
36 _mm512_mask_popcnt_epi64(__m512i __W, __mmask8 __U, __m512i __A) { in _mm512_mask_popcnt_epi64()
37 return (__m512i)__builtin_ia32_selectq_512( in _mm512_mask_popcnt_epi64()
41 static __inline__ __m512i __DEFAULT_FN_ATTRS
42 _mm512_maskz_popcnt_epi64(__mmask8 __U, __m512i __A) { in _mm512_maskz_popcnt_epi64()
43 return _mm512_mask_popcnt_epi64((__m512i)_mm512_setzero_si512(), __U, __A); in _mm512_maskz_popcnt_epi64()
46 static __inline__ __m512i __DEFAULT_FN_ATTRS_CONSTEXPR
[all …]
H A Davx10_2_512convertintrin.h61 _mm512_cvtbiasph_bf8(__m512i __A, __m512h __B) { in _mm512_cvtbiasph_bf8()
68 __m256i __W, __mmask32 __U, __m512i __A, __m512h __B) { in _mm512_mask_cvtbiasph_bf8()
74 _mm512_maskz_cvtbiasph_bf8(__mmask32 __U, __m512i __A, __m512h __B) { in _mm512_maskz_cvtbiasph_bf8()
81 _mm512_cvts_biasph_bf8(__m512i __A, __m512h __B) { in _mm512_cvts_biasph_bf8()
88 __m256i __W, __mmask32 __U, __m512i __A, __m512h __B) { in _mm512_mask_cvts_biasph_bf8()
94 _mm512_maskz_cvts_biasph_bf8(__mmask32 __U, __m512i __A, __m512h __B) { in _mm512_maskz_cvts_biasph_bf8()
101 _mm512_cvtbiasph_hf8(__m512i __A, __m512h __B) { in _mm512_cvtbiasph_hf8()
108 __m256i __W, __mmask32 __U, __m512i __A, __m512h __B) { in _mm512_mask_cvtbiasph_hf8()
114 _mm512_maskz_cvtbiasph_hf8(__mmask32 __U, __m512i __A, __m512h __B) { in _mm512_maskz_cvtbiasph_hf8()
121 _mm512_cvts_biasph_hf8(__m512i __A, __m512h __B) { in _mm512_cvts_biasph_hf8()
[all …]
H A Dgfniintrin.h109 ((__m512i)__builtin_ia32_vgf2p8affineinvqb_v64qi((__v64qi)(__m512i)(A), \
110 (__v64qi)(__m512i)(B), \
114 ((__m512i)__builtin_ia32_selectb_512((__mmask64)(U), \
116 (__v64qi)(__m512i)(S)))
119 _mm512_mask_gf2p8affineinv_epi64_epi8((__m512i)_mm512_setzero_si512(), \
123 ((__m512i)__builtin_ia32_vgf2p8affineqb_v64qi((__v64qi)(__m512i)(A), \
124 (__v64qi)(__m512i)(B), \
128 ((__m512i)__builtin_ia32_selectb_512((__mmask64)(U), \
130 (__v64qi)(__m512i)(S)))
133 _mm512_mask_gf2p8affine_epi64_epi8((__m512i)_mm512_setzero_si512(), \
[all …]
H A Dsm4evexintrin.h20 static __inline__ __m512i __DEFAULT_FN_ATTRS512
21 _mm512_sm4key4_epi32(__m512i __A, __m512i __B) { in _mm512_sm4key4_epi32()
22 return (__m512i)__builtin_ia32_vsm4key4512((__v16su)__A, (__v16su)__B); in _mm512_sm4key4_epi32()
25 static __inline__ __m512i __DEFAULT_FN_ATTRS512
26 _mm512_sm4rnds4_epi32(__m512i __A, __m512i __B) { in _mm512_sm4rnds4_epi32()
27 return (__m512i)__builtin_ia32_vsm4rnds4512((__v16su)__A, (__v16su)__B); in _mm512_sm4rnds4_epi32()
H A Davx512fp16intrin.h136 static __inline__ __m512i __DEFAULT_FN_ATTRS512
138 return (__m512i)__a; in _mm512_castph_si512()
175 _mm512_castsi512_ph(__m512i __a) { in _mm512_castsi512_ph()
552 return (__m512h)_mm512_and_epi32(_mm512_set1_epi32(0x7FFF7FFF), (__m512i)__A); in _mm512_abs_ph()
556 return (__m512h)_mm512_xor_epi32((__m512i)__A, in _mm512_conj_pch()
1674 ((__m512i)__builtin_ia32_vcvtph2w512_mask((__v32hf)(A), \
1679 ((__m512i)__builtin_ia32_vcvtph2w512_mask((__v32hf)(A), (__v32hi)(W), \
1683 ((__m512i)__builtin_ia32_vcvtph2w512_mask((__v32hf)(A), \
1687 static __inline__ __m512i __DEFAULT_FN_ATTRS512
1689 return (__m512i)__builtin_ia32_vcvtph2w512_mask( in _mm512_cvtph_epi16()
[all …]
H A Damxavx512intrin.h231 #define _tile_movrow(a, b) ((__m512i)__builtin_ia32_tilemovrow(a, b))
262 static __inline__ __m512i __DEFAULT_FN_ATTRS_AVX512 _tile_movrow_internal( in _tile_movrow_internal()
264 return (__m512i)__builtin_ia32_tilemovrow_internal(m, n, src, u); in _tile_movrow_internal()
377 static __m512i __tile_movrow(__tile1024i src0, unsigned src1) { in __tile_movrow()
378 return (__m512i)_tile_movrow_internal(src0.row, src0.col, src0.tile, src1); in __tile_movrow()
H A Dvpclmulqdqintrin.h24 ((__m512i)__builtin_ia32_pclmulqdq512((__v8di)(__m512i)(A), \
25 (__v8di)(__m512i)(B), \
H A Davx10_2_512bf16intrin.h74 static __inline__ __m512i __DEFAULT_FN_ATTRS512
76 return (__m512i)__a; in _mm512_castbf16_si512()
89 _mm512_castsi512_pbh(__m512i __a) { in _mm512_castsi512_pbh()
135 (__m512i)__A); in _mm512_abs_pbh()
171 _mm512_permutex2var_pbh(__m512bh __A, __m512i __I, __m512bh __B) { in _mm512_permutex2var_pbh()
177 _mm512_permutexvar_pbh(__m512i __A, __m512bh __B) { in _mm512_permutexvar_pbh()
/freebsd/contrib/llvm-project/llvm/lib/Support/BLAKE3/
H A Dblake3_avx512.c17 INLINE __m512i loadu_512(const uint8_t src[64]) { in loadu_512()
18 return _mm512_loadu_si512((const __m512i *)src); in loadu_512()
29 INLINE void storeu_512(__m512i src, uint8_t dest[64]) { in storeu_512()
30 _mm512_storeu_si512((__m512i *)dest, src); in storeu_512()
37 INLINE __m512i add_512(__m512i a, __m512i b) { return _mm512_add_epi32(a, b); } in add_512()
43 INLINE __m512i xor_512(__m512i a, __m512i b) { return _mm512_xor_si512(a, b); } in xor_512()
49 INLINE __m512i set1_512(uint32_t x) { return _mm512_set1_epi32((int32_t)x); } in set1_512()
59 INLINE __m512i rot16_512(__m512i x) { return _mm512_ror_epi32(x, 16); } in rot16_512()
65 INLINE __m512i rot12_512(__m512i x) { return _mm512_ror_epi32(x, 12); } in rot12_512()
71 INLINE __m512i rot8_512(__m512i x) { return _mm512_ror_epi32(x, 8); } in rot8_512()
[all …]
/freebsd/sys/contrib/libsodium/src/libsodium/crypto_pwhash/argon2/
H A Dargon2-fill-block-avx512f.c45 fill_block(__m512i *state, const uint8_t *ref_block, uint8_t *next_block) in fill_block()
47 __m512i block_XY[ARGON2_512BIT_WORDS_IN_BLOCK]; in fill_block()
52 state[i], _mm512_loadu_si512((__m512i const *) (&ref_block[64 * i]))); in fill_block()
69 _mm512_storeu_si512((__m512i *) (&next_block[64 * i]), state[i]); in fill_block()
74 fill_block_with_xor(__m512i *state, const uint8_t *ref_block, in fill_block_with_xor()
77 __m512i block_XY[ARGON2_512BIT_WORDS_IN_BLOCK]; in fill_block_with_xor()
82 state[i], _mm512_loadu_si512((__m512i const *) (&ref_block[64 * i]))); in fill_block_with_xor()
84 state[i], _mm512_loadu_si512((__m512i const *) (&next_block[64 * i]))); in fill_block_with_xor()
101 _mm512_storeu_si512((__m512i *) (&next_block[64 * i]), state[i]); in fill_block_with_xor()
126 __m512i zero_block[ARGON2_512BIT_WORDS_IN_BLOCK]; in generate_addresses()
[all …]
H A Dblamka-round-avx512f.h9 static inline __m512i
10 muladd(__m512i x, __m512i y) in muladd()
12 __m512i z = _mm512_mul_epu32(x, y); in muladd()
98 __m512i t0, t1; \
/freebsd/sys/contrib/openzfs/module/zstd/lib/common/
H A Dxxhash.h4902 __m512i* const xacc = (__m512i *) acc; in XXH3_accumulate_512_avx512()
4904 XXH_STATIC_ASSERT(XXH_STRIPE_LEN == sizeof(__m512i)); in XXH3_accumulate_512_avx512()
4908 __m512i const data_vec = _mm512_loadu_si512 (input); in XXH3_accumulate_512_avx512()
4910 __m512i const key_vec = _mm512_loadu_si512 (secret); in XXH3_accumulate_512_avx512()
4912 __m512i const data_key = _mm512_xor_si512 (data_vec, key_vec); in XXH3_accumulate_512_avx512()
4914 __m512i const data_key_lo = _mm512_srli_epi64 (data_key, 32); in XXH3_accumulate_512_avx512()
4916 __m512i const product = _mm512_mul_epu32 (data_key, data_key_lo); in XXH3_accumulate_512_avx512()
4918__m512i const data_swap = _mm512_shuffle_epi32(data_vec, (_MM_PERM_ENUM)_MM_SHUFFLE(1, 0, 3, 2)); in XXH3_accumulate_512_avx512()
4919 __m512i const sum = _mm512_add_epi64(*xacc, data_swap); in XXH3_accumulate_512_avx512()
4951 XXH_STATIC_ASSERT(XXH_STRIPE_LEN == sizeof(__m512i)); in XXH3_ACCUMULATE_TEMPLATE()
[all …]
/freebsd/sys/contrib/zstd/lib/common/
H A Dxxhash.h4901 __m512i* const xacc = (__m512i *) acc; in XXH3_accumulate_512_avx512()
4903 XXH_STATIC_ASSERT(XXH_STRIPE_LEN == sizeof(__m512i)); in XXH3_accumulate_512_avx512()
4907 __m512i const data_vec = _mm512_loadu_si512 (input); in XXH3_accumulate_512_avx512()
4909 __m512i const key_vec = _mm512_loadu_si512 (secret); in XXH3_accumulate_512_avx512()
4911 __m512i const data_key = _mm512_xor_si512 (data_vec, key_vec); in XXH3_accumulate_512_avx512()
4913 __m512i const data_key_lo = _mm512_srli_epi64 (data_key, 32); in XXH3_accumulate_512_avx512()
4915 __m512i const product = _mm512_mul_epu32 (data_key, data_key_lo); in XXH3_accumulate_512_avx512()
4917__m512i const data_swap = _mm512_shuffle_epi32(data_vec, (_MM_PERM_ENUM)_MM_SHUFFLE(1, 0, 3, 2)); in XXH3_accumulate_512_avx512()
4918 __m512i const sum = _mm512_add_epi64(*xacc, data_swap); in XXH3_accumulate_512_avx512()
4950 XXH_STATIC_ASSERT(XXH_STRIPE_LEN == sizeof(__m512i)); in XXH3_ACCUMULATE_TEMPLATE()
[all …]
/freebsd/sys/contrib/libsodium/
H A Dconfigure.ac492 __m512i x = _mm512_setzero_epi32();
493 __m512i y = _mm512_permutexvar_epi64(_mm512_setr_epi64(0, 1, 4, 5, 2, 3, 6, 7), x);
/freebsd/contrib/llvm-project/llvm/lib/Target/X86/
H A DX86CallingConv.td156 // __m512, __m512i, __m512d --> ZMM
228 // __m512, __m512i, __m512d --> ZMM