| /freebsd/contrib/llvm-project/clang/lib/Headers/ |
| H A D | avx10_2_512niintrin.h | 50 ((__m512i)__builtin_ia32_mpsadbw512((__v64qi)(__m512i)(A), \ 51 (__v64qi)(__m512i)(B), (int)(imm))) 54 ((__m512i)__builtin_ia32_selectw_512( \ 56 (__v32hi)(__m512i)(W))) 59 ((__m512i)__builtin_ia32_selectw_512( \ 64 static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_dpbssd_epi32(__m512i __W, in _mm512_dpbssd_epi32() 65 __m512i __A, in _mm512_dpbssd_epi32() 66 __m512i __B) { in _mm512_dpbssd_epi32() 67 return (__m512i)__builtin_ia32_vpdpbssd512((__v16si)__W, (__v16si)__A, in _mm512_dpbssd_epi32() 71 static __inline__ __m512i __DEFAULT_FN_ATTRS [all …]
|
| H A D | avx10_2_512satcvtdsintrin.h | 96 static __inline__ __m512i __DEFAULT_FN_ATTRS 98 return ((__m512i)__builtin_ia32_vcvttpd2qqs512_round_mask( in _mm512_cvtts_pd_epi64() 102 static __inline__ __m512i __DEFAULT_FN_ATTRS 103 _mm512_mask_cvtts_pd_epi64(__m512i __W, __mmask8 __U, __m512d __A) { in _mm512_mask_cvtts_pd_epi64() 104 return ((__m512i)__builtin_ia32_vcvttpd2qqs512_round_mask( in _mm512_mask_cvtts_pd_epi64() 107 static __inline__ __m512i __DEFAULT_FN_ATTRS 109 return ((__m512i)__builtin_ia32_vcvttpd2qqs512_round_mask( in _mm512_maskz_cvtts_pd_epi64() 115 ((__m512i)__builtin_ia32_vcvttpd2qqs512_round_mask( \ 120 ((__m512i)__builtin_ia32_vcvttpd2qqs512_round_mask( \ 121 (__v8df)(__m512d)(__A), (__v8di)(__m512i)(__W), (__mmask8)(__U), \ [all …]
|
| H A D | avx10_2_512satcvtintrin.h | 18 ((__m512i)__builtin_ia32_vcvtbf162ibs512((__v32bf)(__m512bh)(A))) 21 ((__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \ 23 (__v32hi)(__m512i)(W))) 26 ((__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \ 31 ((__m512i)__builtin_ia32_vcvtbf162iubs512((__v32bf)(__m512bh)(A))) 34 ((__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \ 36 (__v32hi)(__m512i)(W))) 39 ((__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \ 44 ((__m512i)__builtin_ia32_vcvttbf162ibs512((__v32bf)(__m512bh)(A))) 47 ((__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \ [all …]
|
| H A D | avx512bitalgintrin.h | 23 static __inline__ __m512i __DEFAULT_FN_ATTRS 24 _mm512_popcnt_epi16(__m512i __A) in _mm512_popcnt_epi16() 26 return (__m512i)__builtin_elementwise_popcount((__v32hu)__A); in _mm512_popcnt_epi16() 29 static __inline__ __m512i __DEFAULT_FN_ATTRS 30 _mm512_mask_popcnt_epi16(__m512i __A, __mmask32 __U, __m512i __B) in _mm512_mask_popcnt_epi16() 32 return (__m512i) __builtin_ia32_selectw_512((__mmask32) __U, in _mm512_mask_popcnt_epi16() 37 static __inline__ __m512i __DEFAULT_FN_ATTRS 38 _mm512_maskz_popcnt_epi16(__mmask32 __U, __m512i __B) in _mm512_maskz_popcnt_epi16() 40 return _mm512_mask_popcnt_epi16((__m512i) _mm512_setzero_si512(), in _mm512_maskz_popcnt_epi16() 45 static __inline__ __m512i __DEFAULT_FN_ATTRS [all …]
|
| H A D | movrs_avx10_2_512intrin.h | 23 static __inline__ __m512i __DEFAULT_FN_ATTRS512 25 return (__m512i)__builtin_ia32_vmovrsb512((const __v64qi *)(__A)); in _mm512_loadrs_epi8() 28 static __inline__ __m512i __DEFAULT_FN_ATTRS512 29 _mm512_mask_loadrs_epi8(__m512i __W, __mmask64 __U, void const *__A) { in _mm512_mask_loadrs_epi8() 30 return (__m512i)__builtin_ia32_selectb_512( in _mm512_mask_loadrs_epi8() 34 static __inline__ __m512i __DEFAULT_FN_ATTRS512 36 return (__m512i)__builtin_ia32_selectb_512((__mmask64)__U, in _mm512_maskz_loadrs_epi8() 41 static __inline__ __m512i __DEFAULT_FN_ATTRS512 43 return (__m512i)__builtin_ia32_vmovrsd512((const __v16si *)(__A)); in _mm512_loadrs_epi32() 46 static __inline__ __m512i __DEFAULT_FN_ATTRS512 [all …]
|
| H A D | avx512fintrin.h | 35 typedef long long __m512i __attribute__((__vector_size__(64), __aligned__(64))); typedef 190 static __inline __m512i __DEFAULT_FN_ATTRS512_CONSTEXPR 192 return __extension__(__m512i)(__v8di){0, 0, 0, 0, 0, 0, 0, 0}; in _mm512_setzero_si512() 215 static __inline__ __m512i __DEFAULT_FN_ATTRS512 218 return (__m512i)__builtin_ia32_undef512(); in _mm512_undefined_epi32() 221 static __inline__ __m512i __DEFAULT_FN_ATTRS512 224 return (__m512i)__builtin_shufflevector((__v4si) __A, (__v4si) __A, in _mm512_broadcastd_epi32() 228 static __inline__ __m512i __DEFAULT_FN_ATTRS512 229 _mm512_mask_broadcastd_epi32 (__m512i __O, __mmask16 __M, __m128i __A) in _mm512_mask_broadcastd_epi32() 231 return (__m512i)__builtin_ia32_selectd_512(__M, in _mm512_mask_broadcastd_epi32() [all …]
|
| H A D | avx512vpopcntdqintrin.h | 30 static __inline__ __m512i __DEFAULT_FN_ATTRS_CONSTEXPR 31 _mm512_popcnt_epi64(__m512i __A) { in _mm512_popcnt_epi64() 32 return (__m512i)__builtin_elementwise_popcount((__v8du)__A); in _mm512_popcnt_epi64() 35 static __inline__ __m512i __DEFAULT_FN_ATTRS 36 _mm512_mask_popcnt_epi64(__m512i __W, __mmask8 __U, __m512i __A) { in _mm512_mask_popcnt_epi64() 37 return (__m512i)__builtin_ia32_selectq_512( in _mm512_mask_popcnt_epi64() 41 static __inline__ __m512i __DEFAULT_FN_ATTRS 42 _mm512_maskz_popcnt_epi64(__mmask8 __U, __m512i __A) { in _mm512_maskz_popcnt_epi64() 43 return _mm512_mask_popcnt_epi64((__m512i)_mm512_setzero_si512(), __U, __A); in _mm512_maskz_popcnt_epi64() 46 static __inline__ __m512i __DEFAULT_FN_ATTRS_CONSTEXPR [all …]
|
| H A D | avx10_2_512convertintrin.h | 61 _mm512_cvtbiasph_bf8(__m512i __A, __m512h __B) { in _mm512_cvtbiasph_bf8() 68 __m256i __W, __mmask32 __U, __m512i __A, __m512h __B) { in _mm512_mask_cvtbiasph_bf8() 74 _mm512_maskz_cvtbiasph_bf8(__mmask32 __U, __m512i __A, __m512h __B) { in _mm512_maskz_cvtbiasph_bf8() 81 _mm512_cvts_biasph_bf8(__m512i __A, __m512h __B) { in _mm512_cvts_biasph_bf8() 88 __m256i __W, __mmask32 __U, __m512i __A, __m512h __B) { in _mm512_mask_cvts_biasph_bf8() 94 _mm512_maskz_cvts_biasph_bf8(__mmask32 __U, __m512i __A, __m512h __B) { in _mm512_maskz_cvts_biasph_bf8() 101 _mm512_cvtbiasph_hf8(__m512i __A, __m512h __B) { in _mm512_cvtbiasph_hf8() 108 __m256i __W, __mmask32 __U, __m512i __A, __m512h __B) { in _mm512_mask_cvtbiasph_hf8() 114 _mm512_maskz_cvtbiasph_hf8(__mmask32 __U, __m512i __A, __m512h __B) { in _mm512_maskz_cvtbiasph_hf8() 121 _mm512_cvts_biasph_hf8(__m512i __A, __m512h __B) { in _mm512_cvts_biasph_hf8() [all …]
|
| H A D | gfniintrin.h | 109 ((__m512i)__builtin_ia32_vgf2p8affineinvqb_v64qi((__v64qi)(__m512i)(A), \ 110 (__v64qi)(__m512i)(B), \ 114 ((__m512i)__builtin_ia32_selectb_512((__mmask64)(U), \ 116 (__v64qi)(__m512i)(S))) 119 _mm512_mask_gf2p8affineinv_epi64_epi8((__m512i)_mm512_setzero_si512(), \ 123 ((__m512i)__builtin_ia32_vgf2p8affineqb_v64qi((__v64qi)(__m512i)(A), \ 124 (__v64qi)(__m512i)(B), \ 128 ((__m512i)__builtin_ia32_selectb_512((__mmask64)(U), \ 130 (__v64qi)(__m512i)(S))) 133 _mm512_mask_gf2p8affine_epi64_epi8((__m512i)_mm512_setzero_si512(), \ [all …]
|
| H A D | sm4evexintrin.h | 20 static __inline__ __m512i __DEFAULT_FN_ATTRS512 21 _mm512_sm4key4_epi32(__m512i __A, __m512i __B) { in _mm512_sm4key4_epi32() 22 return (__m512i)__builtin_ia32_vsm4key4512((__v16su)__A, (__v16su)__B); in _mm512_sm4key4_epi32() 25 static __inline__ __m512i __DEFAULT_FN_ATTRS512 26 _mm512_sm4rnds4_epi32(__m512i __A, __m512i __B) { in _mm512_sm4rnds4_epi32() 27 return (__m512i)__builtin_ia32_vsm4rnds4512((__v16su)__A, (__v16su)__B); in _mm512_sm4rnds4_epi32()
|
| H A D | avx512fp16intrin.h | 136 static __inline__ __m512i __DEFAULT_FN_ATTRS512 138 return (__m512i)__a; in _mm512_castph_si512() 175 _mm512_castsi512_ph(__m512i __a) { in _mm512_castsi512_ph() 552 return (__m512h)_mm512_and_epi32(_mm512_set1_epi32(0x7FFF7FFF), (__m512i)__A); in _mm512_abs_ph() 556 return (__m512h)_mm512_xor_epi32((__m512i)__A, in _mm512_conj_pch() 1674 ((__m512i)__builtin_ia32_vcvtph2w512_mask((__v32hf)(A), \ 1679 ((__m512i)__builtin_ia32_vcvtph2w512_mask((__v32hf)(A), (__v32hi)(W), \ 1683 ((__m512i)__builtin_ia32_vcvtph2w512_mask((__v32hf)(A), \ 1687 static __inline__ __m512i __DEFAULT_FN_ATTRS512 1689 return (__m512i)__builtin_ia32_vcvtph2w512_mask( in _mm512_cvtph_epi16() [all …]
|
| H A D | amxavx512intrin.h | 231 #define _tile_movrow(a, b) ((__m512i)__builtin_ia32_tilemovrow(a, b)) 262 static __inline__ __m512i __DEFAULT_FN_ATTRS_AVX512 _tile_movrow_internal( in _tile_movrow_internal() 264 return (__m512i)__builtin_ia32_tilemovrow_internal(m, n, src, u); in _tile_movrow_internal() 377 static __m512i __tile_movrow(__tile1024i src0, unsigned src1) { in __tile_movrow() 378 return (__m512i)_tile_movrow_internal(src0.row, src0.col, src0.tile, src1); in __tile_movrow()
|
| H A D | vpclmulqdqintrin.h | 24 ((__m512i)__builtin_ia32_pclmulqdq512((__v8di)(__m512i)(A), \ 25 (__v8di)(__m512i)(B), \
|
| H A D | avx10_2_512bf16intrin.h | 74 static __inline__ __m512i __DEFAULT_FN_ATTRS512 76 return (__m512i)__a; in _mm512_castbf16_si512() 89 _mm512_castsi512_pbh(__m512i __a) { in _mm512_castsi512_pbh() 135 (__m512i)__A); in _mm512_abs_pbh() 171 _mm512_permutex2var_pbh(__m512bh __A, __m512i __I, __m512bh __B) { in _mm512_permutex2var_pbh() 177 _mm512_permutexvar_pbh(__m512i __A, __m512bh __B) { in _mm512_permutexvar_pbh()
|
| /freebsd/contrib/llvm-project/llvm/lib/Support/BLAKE3/ |
| H A D | blake3_avx512.c | 17 INLINE __m512i loadu_512(const uint8_t src[64]) { in loadu_512() 18 return _mm512_loadu_si512((const __m512i *)src); in loadu_512() 29 INLINE void storeu_512(__m512i src, uint8_t dest[64]) { in storeu_512() 30 _mm512_storeu_si512((__m512i *)dest, src); in storeu_512() 37 INLINE __m512i add_512(__m512i a, __m512i b) { return _mm512_add_epi32(a, b); } in add_512() 43 INLINE __m512i xor_512(__m512i a, __m512i b) { return _mm512_xor_si512(a, b); } in xor_512() 49 INLINE __m512i set1_512(uint32_t x) { return _mm512_set1_epi32((int32_t)x); } in set1_512() 59 INLINE __m512i rot16_512(__m512i x) { return _mm512_ror_epi32(x, 16); } in rot16_512() 65 INLINE __m512i rot12_512(__m512i x) { return _mm512_ror_epi32(x, 12); } in rot12_512() 71 INLINE __m512i rot8_512(__m512i x) { return _mm512_ror_epi32(x, 8); } in rot8_512() [all …]
|
| /freebsd/sys/contrib/libsodium/src/libsodium/crypto_pwhash/argon2/ |
| H A D | argon2-fill-block-avx512f.c | 45 fill_block(__m512i *state, const uint8_t *ref_block, uint8_t *next_block) in fill_block() 47 __m512i block_XY[ARGON2_512BIT_WORDS_IN_BLOCK]; in fill_block() 52 state[i], _mm512_loadu_si512((__m512i const *) (&ref_block[64 * i]))); in fill_block() 69 _mm512_storeu_si512((__m512i *) (&next_block[64 * i]), state[i]); in fill_block() 74 fill_block_with_xor(__m512i *state, const uint8_t *ref_block, in fill_block_with_xor() 77 __m512i block_XY[ARGON2_512BIT_WORDS_IN_BLOCK]; in fill_block_with_xor() 82 state[i], _mm512_loadu_si512((__m512i const *) (&ref_block[64 * i]))); in fill_block_with_xor() 84 state[i], _mm512_loadu_si512((__m512i const *) (&next_block[64 * i]))); in fill_block_with_xor() 101 _mm512_storeu_si512((__m512i *) (&next_block[64 * i]), state[i]); in fill_block_with_xor() 126 __m512i zero_block[ARGON2_512BIT_WORDS_IN_BLOCK]; in generate_addresses() [all …]
|
| H A D | blamka-round-avx512f.h | 9 static inline __m512i 10 muladd(__m512i x, __m512i y) in muladd() 12 __m512i z = _mm512_mul_epu32(x, y); in muladd() 98 __m512i t0, t1; \
|
| /freebsd/sys/contrib/openzfs/module/zstd/lib/common/ |
| H A D | xxhash.h | 4902 __m512i* const xacc = (__m512i *) acc; in XXH3_accumulate_512_avx512() 4904 XXH_STATIC_ASSERT(XXH_STRIPE_LEN == sizeof(__m512i)); in XXH3_accumulate_512_avx512() 4908 __m512i const data_vec = _mm512_loadu_si512 (input); in XXH3_accumulate_512_avx512() 4910 __m512i const key_vec = _mm512_loadu_si512 (secret); in XXH3_accumulate_512_avx512() 4912 __m512i const data_key = _mm512_xor_si512 (data_vec, key_vec); in XXH3_accumulate_512_avx512() 4914 __m512i const data_key_lo = _mm512_srli_epi64 (data_key, 32); in XXH3_accumulate_512_avx512() 4916 __m512i const product = _mm512_mul_epu32 (data_key, data_key_lo); in XXH3_accumulate_512_avx512() 4918 … __m512i const data_swap = _mm512_shuffle_epi32(data_vec, (_MM_PERM_ENUM)_MM_SHUFFLE(1, 0, 3, 2)); in XXH3_accumulate_512_avx512() 4919 __m512i const sum = _mm512_add_epi64(*xacc, data_swap); in XXH3_accumulate_512_avx512() 4951 XXH_STATIC_ASSERT(XXH_STRIPE_LEN == sizeof(__m512i)); in XXH3_ACCUMULATE_TEMPLATE() [all …]
|
| /freebsd/sys/contrib/zstd/lib/common/ |
| H A D | xxhash.h | 4901 __m512i* const xacc = (__m512i *) acc; in XXH3_accumulate_512_avx512() 4903 XXH_STATIC_ASSERT(XXH_STRIPE_LEN == sizeof(__m512i)); in XXH3_accumulate_512_avx512() 4907 __m512i const data_vec = _mm512_loadu_si512 (input); in XXH3_accumulate_512_avx512() 4909 __m512i const key_vec = _mm512_loadu_si512 (secret); in XXH3_accumulate_512_avx512() 4911 __m512i const data_key = _mm512_xor_si512 (data_vec, key_vec); in XXH3_accumulate_512_avx512() 4913 __m512i const data_key_lo = _mm512_srli_epi64 (data_key, 32); in XXH3_accumulate_512_avx512() 4915 __m512i const product = _mm512_mul_epu32 (data_key, data_key_lo); in XXH3_accumulate_512_avx512() 4917 … __m512i const data_swap = _mm512_shuffle_epi32(data_vec, (_MM_PERM_ENUM)_MM_SHUFFLE(1, 0, 3, 2)); in XXH3_accumulate_512_avx512() 4918 __m512i const sum = _mm512_add_epi64(*xacc, data_swap); in XXH3_accumulate_512_avx512() 4950 XXH_STATIC_ASSERT(XXH_STRIPE_LEN == sizeof(__m512i)); in XXH3_ACCUMULATE_TEMPLATE() [all …]
|
| /freebsd/sys/contrib/libsodium/ |
| H A D | configure.ac | 492 __m512i x = _mm512_setzero_epi32(); 493 __m512i y = _mm512_permutexvar_epi64(_mm512_setr_epi64(0, 1, 4, 5, 2, 3, 6, 7), x);
|
| /freebsd/contrib/llvm-project/llvm/lib/Target/X86/ |
| H A D | X86CallingConv.td | 156 // __m512, __m512i, __m512d --> ZMM 228 // __m512, __m512i, __m512d --> ZMM
|