Home
last modified time | relevance | path

Searched refs:__m256 (Results 1 – 19 of 19) sorted by relevance

/freebsd/contrib/llvm-project/clang/lib/Headers/
H A Davxintrin.h34 typedef float __m256 __attribute__ ((__vector_size__ (32), __aligned__(32))); typedef
108 static __inline __m256 __DEFAULT_FN_ATTRS
109 _mm256_add_ps(__m256 __a, __m256 __b) in _mm256_add_ps()
111 return (__m256)((__v8sf)__a+(__v8sf)__b); in _mm256_add_ps()
144 static __inline __m256 __DEFAULT_FN_ATTRS
145 _mm256_sub_ps(__m256 __a, __m256 __b) in _mm256_sub_ps()
147 return (__m256)((__v8sf)__a-(__v8sf)__b); in _mm256_sub_ps()
182 static __inline __m256 __DEFAULT_FN_ATTRS
183 _mm256_addsub_ps(__m256 __a, __m256 __b) in _mm256_addsub_ps()
185 return (__m256)__builtin_ia32_addsubps256((__v8sf)__a, (__v8sf)__b); in _mm256_addsub_ps()
[all …]
H A Dfmaintrin.h531 static __inline__ __m256 __DEFAULT_FN_ATTRS256
532 _mm256_fmadd_ps(__m256 __A, __m256 __B, __m256 __C) in _mm256_fmadd_ps()
534 return (__m256)__builtin_ia32_vfmaddps256((__v8sf)__A, (__v8sf)__B, (__v8sf)__C); in _mm256_fmadd_ps()
571 static __inline__ __m256 __DEFAULT_FN_ATTRS256
572 _mm256_fmsub_ps(__m256 __A, __m256 __B, __m256 __C) in _mm256_fmsub_ps()
574 return (__m256)__builtin_ia32_vfmaddps256((__v8sf)__A, (__v8sf)__B, -(__v8sf)__C); in _mm256_fmsub_ps()
611 static __inline__ __m256 __DEFAULT_FN_ATTRS256
612 _mm256_fnmadd_ps(__m256 __A, __m256 __B, __m256 __C) in _mm256_fnmadd_ps()
614 return (__m256)__builtin_ia32_vfmaddps256(-(__v8sf)__A, (__v8sf)__B, (__v8sf)__C); in _mm256_fnmadd_ps()
651 static __inline__ __m256 __DEFAULT_FN_ATTRS256
[all …]
H A Dfma4intrin.h143 static __inline__ __m256 __DEFAULT_FN_ATTRS256
144 _mm256_macc_ps(__m256 __A, __m256 __B, __m256 __C) in _mm256_macc_ps()
146 return (__m256)__builtin_ia32_vfmaddps256((__v8sf)__A, (__v8sf)__B, (__v8sf)__C); in _mm256_macc_ps()
155 static __inline__ __m256 __DEFAULT_FN_ATTRS256
156 _mm256_msub_ps(__m256 __A, __m256 __B, __m256 __C) in _mm256_msub_ps()
158 return (__m256)__builtin_ia32_vfmaddps256((__v8sf)__A, (__v8sf)__B, -(__v8sf)__C); in _mm256_msub_ps()
167 static __inline__ __m256 __DEFAULT_FN_ATTRS256
168 _mm256_nmacc_ps(__m256 __A, __m256 __B, __m256 __C) in _mm256_nmacc_ps()
170 return (__m256)__builtin_ia32_vfmaddps256(-(__v8sf)__A, (__v8sf)__B, (__v8sf)__C); in _mm256_nmacc_ps()
179 static __inline__ __m256 __DEFAULT_FN_ATTRS256
[all …]
H A Davxneconvertintrin.h89 static __inline__ __m256 __DEFAULT_FN_ATTRS256
91 return (__m256)__builtin_ia32_vbcstnebf162ps256((const __bf16 *)__A); in _mm256_bcstnebf16_ps()
155 static __inline__ __m256 __DEFAULT_FN_ATTRS256
157 return (__m256)__builtin_ia32_vbcstnesh2ps256((const _Float16 *)__A); in _mm256_bcstnesh_ps()
221 static __inline__ __m256 __DEFAULT_FN_ATTRS256
223 return (__m256)__builtin_ia32_vcvtneebf162ps256((const __v16bf *)__A); in _mm256_cvtneebf16_ps()
287 static __inline__ __m256 __DEFAULT_FN_ATTRS256
289 return (__m256)__builtin_ia32_vcvtneeph2ps256((const __v16hf *)__A); in _mm256_cvtneeph_ps()
353 static __inline__ __m256 __DEFAULT_FN_ATTRS256
355 return (__m256)__builtin_ia32_vcvtneobf162ps256((const __v16bf *)__A); in _mm256_cvtneobf16_ps()
[all …]
H A Dlasxintrin.h39 typedef float __m256 __attribute__((__vector_size__(32), __may_alias__)); typedef
1586 __attribute__((__gnu_inline__, __always_inline__, __artificial__)) __m256
1587 __lasx_xvfadd_s(__m256 _1, __m256 _2) { in __lasx_xvfadd_s()
1588 return (__m256)__builtin_lasx_xvfadd_s((v8f32)_1, (v8f32)_2); in __lasx_xvfadd_s()
1598 __attribute__((__gnu_inline__, __always_inline__, __artificial__)) __m256
1599 __lasx_xvfsub_s(__m256 _1, __m256 _2) { in __lasx_xvfsub_s()
1600 return (__m256)__builtin_lasx_xvfsub_s((v8f32)_1, (v8f32)_2); in __lasx_xvfsub_s()
1610 __attribute__((__gnu_inline__, __always_inline__, __artificial__)) __m256
1611 __lasx_xvfmul_s(__m256 _1, __m256 _2) { in __lasx_xvfmul_s()
1612 return (__m256)__builtin_lasx_xvfmul_s((v8f32)_1, (v8f32)_2); in __lasx_xvfmul_s()
[all …]
H A Davx10_2_512satcvtdsintrin.h237 static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_cvtts_ps_epi64(__m256 __A) { in _mm512_cvtts_ps_epi64()
244 _mm512_mask_cvtts_ps_epi64(__m512i __W, __mmask8 __U, __m256 __A) { in _mm512_mask_cvtts_ps_epi64()
250 _mm512_maskz_cvtts_ps_epi64(__mmask8 __U, __m256 __A) { in _mm512_maskz_cvtts_ps_epi64()
258 (__v8sf)(__m256)(__A), (__v8di)_mm512_undefined_epi32(), (__mmask8) - 1, \
263 (__v8sf)(__m256)(__A), (__v8di)(__m512i)(__W), (__mmask8)(__U), \
268 (__v8sf)(__m256)(__A), (__v8di)_mm512_setzero_si512(), (__mmask8)(__U), \
272 static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_cvtts_ps_epu64(__m256 __A) { in _mm512_cvtts_ps_epu64()
279 _mm512_mask_cvtts_ps_epu64(__m512i __W, __mmask8 __U, __m256 __A) { in _mm512_mask_cvtts_ps_epu64()
285 _mm512_maskz_cvtts_ps_epu64(__mmask8 __U, __m256 __A) { in _mm512_maskz_cvtts_ps_epu64()
293 (__v8sf)(__m256)(__A), (__v8di)_mm512_undefined_epi32(), (__mmask8) - 1, \
[all …]
H A Davx10_2satcvtintrin.h131 (__v8sf)(__m256)(A), (__v8su)_mm256_setzero_si256(), (__mmask8)-1))
134 ((__m256i)__builtin_ia32_vcvtps2ibs256_mask((__v8sf)(__m256)(A), \
139 (__v8sf)(__m256)(A), (__v8su)(_mm256_setzero_si256()), (__mmask8)(U)))
155 (__v8sf)(__m256)(A), (__v8su)_mm256_setzero_si256(), (__mmask8)-1))
158 ((__m256i)__builtin_ia32_vcvtps2iubs256_mask((__v8sf)(__m256)(A), \
163 (__v8sf)(__m256)(A), (__v8su)(_mm256_setzero_si256()), (__mmask8)(U)))
279 (__v8sf)(__m256)(A), (__v8su)_mm256_setzero_si256(), (__mmask8)-1))
282 ((__m256i)__builtin_ia32_vcvttps2ibs256_mask((__v8sf)(__m256)(A), \
287 (__v8sf)(__m256)(A), (__v8su)(_mm256_setzero_si256()), (__mmask8)(U)))
303 (__v8sf)(__m256)(A), (__v8su)_mm256_setzero_si256(), (__mmask8)-1))
[all …]
H A Davx10_2minmaxintrin.h129 ((__m256)__builtin_ia32_vminmaxps256_mask( \
130 (__v8sf)(__m256)(A), (__v8sf)(__m256)(B), (int)(C), \
134 ((__m256)__builtin_ia32_vminmaxps256_mask( \
135 (__v8sf)(__m256)(A), (__v8sf)(__m256)(B), (int)(C), (__v8sf)(__m256)(W), \
139 ((__m256)__builtin_ia32_vminmaxps256_mask( \
140 (__v8sf)(__m256)(A), (__v8sf)(__m256)(B), (int)(C), \
H A Df16cintrin.h139 ((__m128i)__builtin_ia32_vcvtps2ph256((__v8sf)(__m256)(a), (imm)))
153 static __inline __m256 __DEFAULT_FN_ATTRS256
156 return (__m256)__builtin_ia32_vcvtph2ps256((__v8hi)__a); in _mm256_cvtph_ps()
H A Davx10_2niintrin.h50 static __inline__ __m256 __DEFAULT_FN_ATTRS256 _mm256_dpph_ps(__m256 __W, in _mm256_dpph_ps()
53 return (__m256)__builtin_ia32_vdpphps256((__v8sf)__W, (__v16hf)__A, in _mm256_dpph_ps()
57 static __inline__ __m256 __DEFAULT_FN_ATTRS256
58 _mm256_mask_dpph_ps(__m256 __W, __mmask8 __U, __m256h __A, __m256h __B) { in _mm256_mask_dpph_ps()
59 return (__m256)__builtin_ia32_selectps_256( in _mm256_mask_dpph_ps()
63 static __inline__ __m256 __DEFAULT_FN_ATTRS256
64 _mm256_maskz_dpph_ps(__mmask8 __U, __m256 __W, __m256h __A, __m256h __B) { in _mm256_maskz_dpph_ps()
65 return (__m256)__builtin_ia32_selectps_256( in _mm256_maskz_dpph_ps()
H A Davx10_2satcvtdsintrin.h246 _mm256_cvtts_ps_epi32(__m256 __A) { in _mm256_cvtts_ps_epi32()
252 _mm256_mask_cvtts_ps_epi32(__m256i __W, __mmask8 __U, __m256 __A) { in _mm256_mask_cvtts_ps_epi32()
258 _mm256_maskz_cvtts_ps_epi32(__mmask8 __U, __m256 __A) { in _mm256_maskz_cvtts_ps_epi32()
284 _mm256_cvtts_ps_epu32(__m256 __A) { in _mm256_cvtts_ps_epu32()
290 _mm256_mask_cvtts_ps_epu32(__m256i __W, __mmask8 __U, __m256 __A) { in _mm256_mask_cvtts_ps_epu32()
296 _mm256_maskz_cvtts_ps_epu32(__mmask8 __U, __m256 __A) { in _mm256_maskz_cvtts_ps_epu32()
H A Dxopintrin.h727 ((__m256)__builtin_ia32_vpermil2ps256((__v8sf)(__m256)(X), \
728 (__v8sf)(__m256)(Y), \
755 static __inline__ __m256 __DEFAULT_FN_ATTRS256
756 _mm256_frcz_ps(__m256 __A) in _mm256_frcz_ps()
758 return (__m256)__builtin_ia32_vfrczps256((__v8sf)__A); in _mm256_frcz_ps()
H A Davx10_2convertintrin.h178 static __inline__ __m256h __DEFAULT_FN_ATTRS256 _mm256_cvtx2ps_ph(__m256 __A, in _mm256_cvtx2ps_ph()
179 __m256 __B) { in _mm256_cvtx2ps_ph()
223 _mm256_mask_cvtx2ps_ph(__m256h __W, __mmask16 __U, __m256 __A, __m256 __B) { in _mm256_mask_cvtx2ps_ph()
265 _mm256_maskz_cvtx2ps_ph(__mmask16 __U, __m256 __A, __m256 __B) { in _mm256_maskz_cvtx2ps_ph()
H A Davx2intrin.h3046 static __inline__ __m256 __DEFAULT_FN_ATTRS256
3049 return (__m256)__builtin_shufflevector((__v4sf)__X, (__v4sf)__X, 0, 0, 0, 0, 0, 0, 0, 0); in _mm256_broadcastss_ps()
3369 static __inline__ __m256 __DEFAULT_FN_ATTRS256
3370 _mm256_permutevar8x32_ps(__m256 __a, __m256i __b) in _mm256_permutevar8x32_ps()
3372 return (__m256)__builtin_ia32_permvarsf256((__v8sf)__a, (__v8si)__b); in _mm256_permutevar8x32_ps()
4249 ((__m256)__builtin_ia32_gatherd_ps256((__v8sf)(__m256)(a), \
4252 (__v8sf)(__m256)(mask), (s)))
4947 ((__m256)__builtin_ia32_gatherd_ps256((__v8sf)_mm256_undefined_ps(), \
H A Davx512fintrin.h414 _mm512_castps256_ps512(__m256 __a) in _mm512_castps256_ps512()
438 static __inline __m256 __DEFAULT_FN_ATTRS512
480 __m256 __B = __builtin_nondeterministic_value(__B); in _mm512_castps128_ps512()
606 _mm512_zextps256_ps512(__m256 __a) in _mm512_zextps256_ps512()
3731 ((__m256)__builtin_ia32_cvtpd2ps512_mask((__v8df)(__m512d)(A), \
3736 ((__m256)__builtin_ia32_cvtpd2ps512_mask((__v8df)(__m512d)(A), \
3737 (__v8sf)(__m256)(W), (__mmask8)(U), \
3741 ((__m256)__builtin_ia32_cvtpd2ps512_mask((__v8df)(__m512d)(A), \
3745 static __inline__ __m256 __DEFAULT_FN_ATTRS512
3748 return (__m256) __builtin_ia32_cvtpd2ps512_mask ((__v8df) __A, in _mm512_cvtpd_ps()
[all …]
H A Davx10_2bf16intrin.h42 static __inline__ __m256 __DEFAULT_FN_ATTRS256
44 return (__m256)__a; in _mm256_castbf16_ps()
70 static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_castps_pbh(__m256 __a) { in _mm256_castps_pbh()
H A Davx512fp16intrin.h107 static __inline__ __m256 __DEFAULT_FN_ATTRS256 _mm256_castph_ps(__m256h __a) { in _mm256_castph_ps()
108 return (__m256)__a; in _mm256_castph_ps()
145 static __inline__ __m256h __DEFAULT_FN_ATTRS256 _mm256_castps_ph(__m256 __a) { in _mm256_castps_ph()
/freebsd/sys/contrib/libsodium/
H A Dconfigure.ac459 __m256 x = _mm256_set1_ps(3.14);
460 __m256 y = _mm256_permutevar8x32_ps(x, _mm256_set1_epi32(42));
/freebsd/contrib/llvm-project/llvm/lib/Target/X86/
H A DX86CallingConv.td151 // __m256, __m256i, __m256d --> YMM
224 // __m256, __m256i, __m256d --> YMM