| /freebsd/contrib/llvm-project/clang/lib/Headers/ |
| H A D | xmmintrin.h | 19 typedef float __v4sf __attribute__((__vector_size__(16))); typedef 106 return (__m128)((__v4sf)__a + (__v4sf)__b); in _mm_add_ps() 147 return (__m128)((__v4sf)__a - (__v4sf)__b); in _mm_sub_ps() 187 return (__m128)((__v4sf)__a * (__v4sf)__b); in _mm_mul_ps() 226 return (__m128)((__v4sf)__a / (__v4sf)__b); in _mm_div_ps() 244 return (__m128)__builtin_ia32_sqrtss((__v4sf)__a); in _mm_sqrt_ss() 261 return __builtin_ia32_sqrtps((__v4sf)__a); in _mm_sqrt_ps() 279 return (__m128)__builtin_ia32_rcpss((__v4sf)__a); in _mm_rcp_ss() 296 return (__m128)__builtin_ia32_rcpps((__v4sf)__a); in _mm_rcp_ps() 315 return __builtin_ia32_rsqrtss((__v4sf)__a); in _mm_rsqrt_ss() [all …]
|
| H A D | fmaintrin.h | 38 return (__m128)__builtin_ia32_vfmaddps((__v4sf)__A, (__v4sf)__B, (__v4sf)__C); in _mm_fmadd_ps() 87 return (__m128)__builtin_ia32_vfmaddss3((__v4sf)__A, (__v4sf)__B, (__v4sf)__C); in _mm_fmadd_ss() 136 return (__m128)__builtin_ia32_vfmaddps((__v4sf)__A, (__v4sf)__B, -(__v4sf)__C); in _mm_fmsub_ps() 185 return (__m128)__builtin_ia32_vfmaddss3((__v4sf)__A, (__v4sf)__B, -(__v4sf)__C); in _mm_fmsub_ss() 234 return (__m128)__builtin_ia32_vfmaddps(-(__v4sf)__A, (__v4sf)__B, (__v4sf)__C); in _mm_fnmadd_ps() 283 return (__m128)__builtin_ia32_vfmaddss3((__v4sf)__A, -(__v4sf)__B, (__v4sf)__C); in _mm_fnmadd_ss() 332 return (__m128)__builtin_ia32_vfmaddps(-(__v4sf)__A, (__v4sf)__B, -(__v4sf)__C); in _mm_fnmsub_ps() 381 return (__m128)__builtin_ia32_vfmaddss3((__v4sf)__A, -(__v4sf)__B, -(__v4sf)__C); in _mm_fnmsub_ss() 437 return (__m128)__builtin_ia32_vfmaddsubps((__v4sf)__A, (__v4sf)__B, (__v4sf)__C); in _mm_fmaddsub_ps() 489 return (__m128)__builtin_ia32_vfmaddsubps((__v4sf)__A, (__v4sf)__B, -(__v4sf)__C); in _mm_fmsubadd_ps()
|
| H A D | fma4intrin.h | 26 return (__m128)__builtin_ia32_vfmaddps((__v4sf)__A, (__v4sf)__B, (__v4sf)__C); in _mm_macc_ps() 38 return (__m128)__builtin_ia32_vfmaddss((__v4sf)__A, (__v4sf)__B, (__v4sf)__C); in _mm_macc_ss() 50 return (__m128)__builtin_ia32_vfmaddps((__v4sf)__A, (__v4sf)__B, -(__v4sf)__C); in _mm_msub_ps() 62 return (__m128)__builtin_ia32_vfmaddss((__v4sf)__A, (__v4sf)__B, -(__v4sf)__C); in _mm_msub_ss() 74 return (__m128)__builtin_ia32_vfmaddps(-(__v4sf)__A, (__v4sf)__B, (__v4sf)__C); in _mm_nmacc_ps() 86 return (__m128)__builtin_ia32_vfmaddss(-(__v4sf)__A, (__v4sf)__B, (__v4sf)__C); in _mm_nmacc_ss() 98 return (__m128)__builtin_ia32_vfmaddps(-(__v4sf)__A, (__v4sf)__B, -(__v4sf)__C); in _mm_nmsub_ps() 110 return (__m128)__builtin_ia32_vfmaddss(-(__v4sf)__A, (__v4sf)__B, -(__v4sf)__C); in _mm_nmsub_ss() 122 return (__m128)__builtin_ia32_vfmaddsubps((__v4sf)__A, (__v4sf)__B, (__v4sf)__C); in _mm_maddsub_ps() 134 return (__m128)__builtin_ia32_vfmaddsubps((__v4sf)__A, (__v4sf)__B, -(__v4sf)__C); in _mm_msubadd_ps()
|
| H A D | avx10_2minmaxintrin.h | 115 (__v4sf)(__m128)(A), (__v4sf)(__m128)(B), (int)(C), \ 116 (__v4sf)_mm_setzero_ps(), (__mmask8)-1)) 120 (__v4sf)(__m128)(A), (__v4sf)(__m128)(B), (int)(C), (__v4sf)(__m128)(W), \ 125 (__v4sf)(__m128)(A), (__v4sf)(__m128)(B), (int)(C), \ 126 (__v4sf)_mm_setzero_ps(), (__mmask8)(U))) 205 (__v4sf)(__m128)(A), (__v4sf)(__m128)(B), (int)(C), \ 206 (__v4sf)_mm_undefined_ps(), (__mmask8)-1, _MM_FROUND_CUR_DIRECTION)) 210 (__v4sf)(__m128)(A), (__v4sf)(__m128)(B), (int)(C), (__v4sf)(W), \ 215 (__v4sf)(__m128)(A), (__v4sf)(__m128)(B), (int)(C), \ 216 (__v4sf)_mm_setzero_ps(), (__mmask8)(U), _MM_FROUND_CUR_DIRECTION)) [all …]
|
| H A D | pmmintrin.h | 72 return __builtin_ia32_addsubps((__v4sf)__a, (__v4sf)__b); in _mm_addsub_ps() 95 return __builtin_ia32_haddps((__v4sf)__a, (__v4sf)__b); in _mm_hadd_ps() 118 return __builtin_ia32_hsubps((__v4sf)__a, (__v4sf)__b); in _mm_hsub_ps() 140 return __builtin_shufflevector((__v4sf)__a, (__v4sf)__a, 1, 1, 3, 3); in _mm_movehdup_ps() 161 return __builtin_shufflevector((__v4sf)__a, (__v4sf)__a, 0, 0, 2, 2); in _mm_moveldup_ps()
|
| H A D | avx10_2satcvtdsintrin.h | 38 ((int)__builtin_ia32_vcvttss2sis32((__v4sf)(__m128)(__A), (const int)(__R))) 41 ((int)__builtin_ia32_vcvttss2sis32((__v4sf)(__m128)(__A), (const int)(__R))) 44 ((unsigned int)__builtin_ia32_vcvttss2usis32((__v4sf)(__m128)(__A), \ 49 ((unsigned long long)__builtin_ia32_vcvttss2usis64((__v4sf)(__m128)(__A), \ 57 ((long long)__builtin_ia32_vcvttss2sis64((__v4sf)(__m128)(__A), \ 61 ((long long)__builtin_ia32_vcvttss2sis64((__v4sf)(__m128)(__A), \ 229 (__v4sf)__A, (__v4si)(__m128i)_mm_undefined_si128(), (__mmask8)(-1))); in _mm_cvtts_ps_epi32() 234 return ((__m128i)__builtin_ia32_vcvttps2dqs128_mask((__v4sf)__A, (__v4si)__W, in _mm_mask_cvtts_ps_epi32() 241 (__v4sf)__A, (__v4si)(__m128i)_mm_setzero_si128(), (__mmask8)__U)); in _mm_maskz_cvtts_ps_epi32() 266 (__v4sf)__A, (__v4si)(__m128i)_mm_undefined_si128(), (__mmask8)(-1))); in _mm_cvtts_ps_epu32() [all …]
|
| H A D | avx512fintrin.h | 350 return (__m512)__builtin_shufflevector((__v4sf) __A, (__v4sf) __A, in _mm512_broadcastss_ps() 590 …return __builtin_shufflevector((__v4sf)__a, (__v4sf)_mm_setzero_ps(), 0, 1, 2, 3, 4, 5, 6, 7, 4, 5… in _mm512_zextps128_ps512() 1038 return (__m128) __builtin_ia32_maxss_round_mask ((__v4sf) __A, in _mm_mask_max_ss() 1039 (__v4sf) __B, in _mm_mask_max_ss() 1040 (__v4sf) __W, in _mm_mask_max_ss() 1047 return (__m128) __builtin_ia32_maxss_round_mask ((__v4sf) __A, in _mm_maskz_max_ss() 1048 (__v4sf) __B, in _mm_maskz_max_ss() 1049 (__v4sf) _mm_setzero_ps (), in _mm_maskz_max_ss() 1055 ((__m128)__builtin_ia32_maxss_round_mask((__v4sf)(__m128)(A), \ 1056 (__v4sf)(__m128)(B), \ [all …]
|
| H A D | avx10_2satcvtintrin.h | 119 (__v4sf)(__m128)(A), (__v4su)_mm_setzero_si128(), (__mmask8)-1)) 122 ((__m128i)__builtin_ia32_vcvtps2ibs128_mask((__v4sf)(__m128)(A), \ 127 (__v4sf)(__m128)(A), (__v4su)(_mm_setzero_si128()), (__mmask8)(U))) 143 (__v4sf)(__m128)(A), (__v4su)_mm_setzero_si128(), (__mmask8)-1)) 146 ((__m128i)__builtin_ia32_vcvtps2iubs128_mask((__v4sf)(__m128)(A), \ 151 (__v4sf)(__m128)(A), (__v4su)(_mm_setzero_si128()), (__mmask8)(U))) 267 (__v4sf)(__m128)(A), (__v4su)_mm_setzero_si128(), (__mmask8)-1)) 270 ((__m128i)__builtin_ia32_vcvttps2ibs128_mask((__v4sf)(__m128)(A), \ 275 (__v4sf)(__m128)(A), (__v4su)(_mm_setzero_si128()), (__mmask8)(U))) 291 (__v4sf)(__m128)(A), (__v4su)_mm_setzero_si128(), (__mmask8)-1)) [all …]
|
| H A D | avx512fp16intrin.h | 1524 ((__m128)__builtin_ia32_vcvtsh2ss_round_mask((__v4sf)(A), (__v8hf)(B), \ 1525 (__v4sf)_mm_undefined_ps(), \ 1530 (__v4sf)(A), (__v8hf)(B), (__v4sf)(W), (__mmask8)(U), (int)(R))) 1533 ((__m128)__builtin_ia32_vcvtsh2ss_round_mask((__v4sf)(A), (__v8hf)(B), \ 1534 (__v4sf)_mm_setzero_ps(), \ 1540 (__v4sf)__A, (__v8hf)__B, (__v4sf)_mm_undefined_ps(), (__mmask8)-1, in _mm_cvtsh_ss() 1548 return (__m128)__builtin_ia32_vcvtsh2ss_round_mask((__v4sf)__A, (__v8hf)__B, in _mm_mask_cvtsh_ss() 1549 (__v4sf)__W, (__mmask8)__U, in _mm_mask_cvtsh_ss() 1557 (__v4sf)__A, (__v8hf)__B, (__v4sf)_mm_setzero_ps(), (__mmask8)__U, in _mm_maskz_cvtsh_ss() 1562 ((__m128h)__builtin_ia32_vcvtss2sh_round_mask((__v8hf)(A), (__v4sf)(B), \ [all …]
|
| H A D | smmintrin.h | 246 ((__m128)__builtin_ia32_roundps((__v4sf)(__m128)(X), (M))) 287 ((__m128)__builtin_ia32_roundss((__v4sf)(__m128)(X), (__v4sf)(__m128)(Y), \ 419 ((__m128)__builtin_ia32_blendps((__v4sf)(__m128)(V1), (__v4sf)(__m128)(V2), \ 472 return (__m128)__builtin_ia32_blendvps((__v4sf)__V1, (__v4sf)__V2, in _mm_blendv_ps() 473 (__v4sf)__M); in _mm_blendv_ps() 603 ((__m128)__builtin_ia32_dpps((__v4sf)(__m128)(X), (__v4sf)(__m128)(Y), (M))) 870 int, __builtin_ia32_vec_ext_v4sf((__v4sf)(__m128)(X), (int)(N))) 876 (D) = __builtin_ia32_vec_ext_v4sf((__v4sf)(__m128)(X), (int)(N)); \
|
| H A D | f16cintrin.h | 42 __v4sf __r = __builtin_ia32_vcvtph2ps(__v); in _cvtsh_ss() 69 (unsigned short)(((__v8hi)__builtin_ia32_vcvtps2ph((__v4sf){a, 0, 0, 0}, \ 96 ((__m128i)__builtin_ia32_vcvtps2ph((__v4sf)(__m128)(a), (imm)))
|
| H A D | avxintrin.h | 910 return (__m128)__builtin_ia32_vpermilvarps((__v4sf)__a, (__v4si)__c); in _mm_permutevar_ps() 1128 ((__m128)__builtin_ia32_vpermilps((__v4sf)(__m128)(A), (int)(C))) 2262 return (__m256d)__builtin_convertvector((__v4sf)__a, __v4df); in _mm256_cvtps_pd() 2662 return __builtin_ia32_vtestzps((__v4sf)__a, (__v4sf)__b); in _mm_testz_ps() 2691 return __builtin_ia32_vtestcps((__v4sf)__a, (__v4sf)__b); in _mm_testc_ps() 2721 return __builtin_ia32_vtestnzcps((__v4sf)__a, (__v4sf)__b); in _mm_testnzc_ps() 3142 return (__m256)__builtin_shufflevector((__v4sf)__b, (__v4sf)__b, in _mm256_broadcast_ps() 3462 return (__m128)__builtin_ia32_maskloadps((const __v4sf *)__p, (__v4si)__m); in _mm_maskload_ps() 3583 __builtin_ia32_maskstoreps((__v4sf *)__p, (__v4si)__m, (__v4sf)__a); in _mm_maskstore_ps() 4563 return __builtin_shufflevector((__v4sf)__a, in _mm256_castps128_ps256() [all …]
|
| H A D | avx2intrin.h | 3015 return (__m128)__builtin_shufflevector((__v4sf)__X, (__v4sf)__X, 0, 0, 0, 0); in _mm_broadcastss_ps() 3049 return (__m256)__builtin_shufflevector((__v4sf)__X, (__v4sf)__X, 0, 0, 0, 0, 0, 0, 0, 0); in _mm256_broadcastss_ps() 4201 ((__m128)__builtin_ia32_gatherd_ps((__v4sf)(__m128)(a), \ 4204 (__v4sf)(__m128)(mask), (s))) 4300 ((__m128)__builtin_ia32_gatherq_ps((__v4sf)(__m128)(a), \ 4303 (__v4sf)(__m128)(mask), (s))) 4348 ((__m128)__builtin_ia32_gatherq_ps256((__v4sf)(__m128)(a), \ 4351 (__v4sf)(__m128)(mask), (s))) 4912 ((__m128)__builtin_ia32_gatherd_ps((__v4sf)_mm_undefined_ps(), \ 4915 (__v4sf)_mm_cmpeq_ps(_mm_setzero_ps(), \ [all …]
|
| H A D | avx10_2niintrin.h | 29 return (__m128)__builtin_ia32_vdpphps128((__v4sf)__W, (__v8hf)__A, in _mm_dpph_ps() 38 (__mmask8)__U, (__v4sf)_mm_dpph_ps(__W, __A, __B), (__v4sf)__W); in _mm_mask_dpph_ps() 46 (__v4sf)_mm_dpph_ps(__W, __A, __B), in _mm_maskz_dpph_ps() 47 (__v4sf)_mm_setzero_ps()); in _mm_maskz_dpph_ps()
|
| H A D | avx10_2convertintrin.h | 61 (__v4sf)__A, (__v4sf)__B, (__v8hf)_mm_setzero_ph(), (__mmask8)(-1)); in _mm_cvtx2ps_ph() 105 (__v4sf)__A, (__v4sf)__B, (__v8hf)__W, (__mmask8)__U); in _mm_mask_cvtx2ps_ph() 147 (__v4sf)__A, (__v4sf)__B, (__v8hf)_mm_setzero_ph(), (__mmask8)__U); in _mm_maskz_cvtx2ps_ph()
|
| H A D | avxneconvertintrin.h | 449 return (__m128bh)__builtin_ia32_vcvtneps2bf16128((__v4sf)__A); in _mm_cvtneps_avx_pbh()
|
| H A D | xopintrin.h | 723 ((__m128)__builtin_ia32_vpermil2ps((__v4sf)(__m128)(X), (__v4sf)(__m128)(Y), \ 734 return (__m128)__builtin_ia32_vfrczss((__v4sf)__A); in _mm_frcz_ss() 746 return (__m128)__builtin_ia32_vfrczps((__v4sf)__A); in _mm_frcz_ps()
|
| H A D | emmintrin.h | 1308 __builtin_shufflevector((__v4sf)__a, (__v4sf)__a, 0, 1), __v2df); in _mm_cvtps_pd() 1394 return (__m128)__builtin_ia32_cvtsd2ss((__v4sf)__a, (__v2df)__b); in _mm_cvtsd_ss() 3328 return (__m128) __builtin_convertvector((__v4si)__a, __v4sf); in _mm_cvtepi32_ps() 3346 return (__m128i)__builtin_ia32_cvtps2dq((__v4sf)__a); in _mm_cvtps_epi32() 3365 return (__m128i)__builtin_ia32_cvttps2dq((__v4sf)__a); in _mm_cvttps_epi32()
|
| /freebsd/contrib/llvm-project/clang/lib/Headers/ppc_wrappers/ |
| H A D | xmmintrin.h | 73 typedef vector float __v4sf; typedef 94 return ((__m128)vec_ld(0, (__v4sf *)__P)); in _mm_load_ps() 108 __v4sf __tmp; in _mm_loadr_ps() 114 __tmp = vec_ld(0, (__v4sf *)__P); in _mm_loadr_ps() 123 return __extension__(__m128)(__v4sf){__F, __F, __F, __F}; in _mm_set1_ps() 136 return __extension__(__m128)(__v4sf){__W, __X, __Y, __Z}; in _mm_set_ps() 143 return __extension__(__m128)(__v4sf){__Z, __Y, __X, __W}; in _mm_setr_ps() 150 vec_st((__v4sf)__A, 0, (__v4sf *)__P); in _mm_store_ps() 164 __v4sf __tmp; in _mm_storer_ps() 178 __v4sf __va = vec_splat((__v4sf)__A, 0); in _mm_store1_ps() [all …]
|
| H A D | pmmintrin.h | 51 const __v4sf __even_n0 = {-0.0, 0.0, -0.0, 0.0}; in _mm_addsub_ps() 52 __v4sf __even_neg_Y = vec_xor(__Y, __even_n0); in _mm_addsub_ps() 73 return (__m128)vec_add(vec_perm((__v4sf)__X, (__v4sf)__Y, __xform2), in _mm_hadd_ps() 74 vec_perm((__v4sf)__X, (__v4sf)__Y, __xform1)); in _mm_hadd_ps() 86 return (__m128)vec_sub(vec_perm((__v4sf)__X, (__v4sf)__Y, __xform2), in _mm_hsub_ps() 87 vec_perm((__v4sf)__X, (__v4sf)__Y, __xform1)); in _mm_hsub_ps()
|
| H A D | emmintrin.h | 881 __v4sf __result; in _mm_cvtpd_ps() 893 __result = (__v4sf)vec_vpkudum((__vector long long)__temp, in _mm_cvtpd_ps() 899 __result = (__v4sf)vec_perm((__v16qu)__temp, (__v16qu)__vzero, __pkperm); in _mm_cvtpd_ps() 967 __v4sf __rounded; in _mm_cvtps_epi32() 970 __rounded = vec_rint((__v4sf)__A); in _mm_cvtps_epi32() 980 __result = vec_cts((__v4sf)__A, 0); in _mm_cvttps_epi32() 989 return (__m128d)vec_doubleh((__v4sf)__A); in _mm_cvtps_pd() 993 __v4sf __a = (__v4sf)__A; in _mm_cvtps_pd() 994 __v4sf __temp; in _mm_cvtps_pd() 1067 __v4sf __result = (__v4sf)__A; in _mm_cvtsd_ss() [all …]
|