Lines Matching refs:__A

285 static __inline__ int __DEFAULT_FN_ATTRS128 _mm_comieq_sh(__m128h __A,  in _mm_comieq_sh()  argument
287 return __builtin_ia32_vcomish((__v8hf)__A, (__v8hf)__B, _CMP_EQ_OS, in _mm_comieq_sh()
291 static __inline__ int __DEFAULT_FN_ATTRS128 _mm_comilt_sh(__m128h __A, in _mm_comilt_sh() argument
293 return __builtin_ia32_vcomish((__v8hf)__A, (__v8hf)__B, _CMP_LT_OS, in _mm_comilt_sh()
297 static __inline__ int __DEFAULT_FN_ATTRS128 _mm_comile_sh(__m128h __A, in _mm_comile_sh() argument
299 return __builtin_ia32_vcomish((__v8hf)__A, (__v8hf)__B, _CMP_LE_OS, in _mm_comile_sh()
303 static __inline__ int __DEFAULT_FN_ATTRS128 _mm_comigt_sh(__m128h __A, in _mm_comigt_sh() argument
305 return __builtin_ia32_vcomish((__v8hf)__A, (__v8hf)__B, _CMP_GT_OS, in _mm_comigt_sh()
309 static __inline__ int __DEFAULT_FN_ATTRS128 _mm_comige_sh(__m128h __A, in _mm_comige_sh() argument
311 return __builtin_ia32_vcomish((__v8hf)__A, (__v8hf)__B, _CMP_GE_OS, in _mm_comige_sh()
315 static __inline__ int __DEFAULT_FN_ATTRS128 _mm_comineq_sh(__m128h __A, in _mm_comineq_sh() argument
317 return __builtin_ia32_vcomish((__v8hf)__A, (__v8hf)__B, _CMP_NEQ_US, in _mm_comineq_sh()
321 static __inline__ int __DEFAULT_FN_ATTRS128 _mm_ucomieq_sh(__m128h __A, in _mm_ucomieq_sh() argument
323 return __builtin_ia32_vcomish((__v8hf)__A, (__v8hf)__B, _CMP_EQ_OQ, in _mm_ucomieq_sh()
327 static __inline__ int __DEFAULT_FN_ATTRS128 _mm_ucomilt_sh(__m128h __A, in _mm_ucomilt_sh() argument
329 return __builtin_ia32_vcomish((__v8hf)__A, (__v8hf)__B, _CMP_LT_OQ, in _mm_ucomilt_sh()
333 static __inline__ int __DEFAULT_FN_ATTRS128 _mm_ucomile_sh(__m128h __A, in _mm_ucomile_sh() argument
335 return __builtin_ia32_vcomish((__v8hf)__A, (__v8hf)__B, _CMP_LE_OQ, in _mm_ucomile_sh()
339 static __inline__ int __DEFAULT_FN_ATTRS128 _mm_ucomigt_sh(__m128h __A, in _mm_ucomigt_sh() argument
341 return __builtin_ia32_vcomish((__v8hf)__A, (__v8hf)__B, _CMP_GT_OQ, in _mm_ucomigt_sh()
345 static __inline__ int __DEFAULT_FN_ATTRS128 _mm_ucomige_sh(__m128h __A, in _mm_ucomige_sh() argument
347 return __builtin_ia32_vcomish((__v8hf)__A, (__v8hf)__B, _CMP_GE_OQ, in _mm_ucomige_sh()
351 static __inline__ int __DEFAULT_FN_ATTRS128 _mm_ucomineq_sh(__m128h __A, in _mm_ucomineq_sh() argument
353 return __builtin_ia32_vcomish((__v8hf)__A, (__v8hf)__B, _CMP_NEQ_UQ, in _mm_ucomineq_sh()
357 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_add_ph(__m512h __A, in _mm512_add_ph() argument
359 return (__m512h)((__v32hf)__A + (__v32hf)__B); in _mm512_add_ph()
363 _mm512_mask_add_ph(__m512h __W, __mmask32 __U, __m512h __A, __m512h __B) { in _mm512_mask_add_ph() argument
365 (__mmask32)__U, (__v32hf)_mm512_add_ph(__A, __B), (__v32hf)__W); in _mm512_mask_add_ph()
369 _mm512_maskz_add_ph(__mmask32 __U, __m512h __A, __m512h __B) { in _mm512_maskz_add_ph() argument
371 (__v32hf)_mm512_add_ph(__A, __B), in _mm512_maskz_add_ph()
389 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_sub_ph(__m512h __A, in _mm512_sub_ph() argument
391 return (__m512h)((__v32hf)__A - (__v32hf)__B); in _mm512_sub_ph()
395 _mm512_mask_sub_ph(__m512h __W, __mmask32 __U, __m512h __A, __m512h __B) { in _mm512_mask_sub_ph() argument
397 (__mmask32)__U, (__v32hf)_mm512_sub_ph(__A, __B), (__v32hf)__W); in _mm512_mask_sub_ph()
401 _mm512_maskz_sub_ph(__mmask32 __U, __m512h __A, __m512h __B) { in _mm512_maskz_sub_ph() argument
403 (__v32hf)_mm512_sub_ph(__A, __B), in _mm512_maskz_sub_ph()
421 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_mul_ph(__m512h __A, in _mm512_mul_ph() argument
423 return (__m512h)((__v32hf)__A * (__v32hf)__B); in _mm512_mul_ph()
427 _mm512_mask_mul_ph(__m512h __W, __mmask32 __U, __m512h __A, __m512h __B) { in _mm512_mask_mul_ph() argument
429 (__mmask32)__U, (__v32hf)_mm512_mul_ph(__A, __B), (__v32hf)__W); in _mm512_mask_mul_ph()
433 _mm512_maskz_mul_ph(__mmask32 __U, __m512h __A, __m512h __B) { in _mm512_maskz_mul_ph() argument
435 (__v32hf)_mm512_mul_ph(__A, __B), in _mm512_maskz_mul_ph()
453 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_div_ph(__m512h __A, in _mm512_div_ph() argument
455 return (__m512h)((__v32hf)__A / (__v32hf)__B); in _mm512_div_ph()
459 _mm512_mask_div_ph(__m512h __W, __mmask32 __U, __m512h __A, __m512h __B) { in _mm512_mask_div_ph() argument
461 (__mmask32)__U, (__v32hf)_mm512_div_ph(__A, __B), (__v32hf)__W); in _mm512_mask_div_ph()
465 _mm512_maskz_div_ph(__mmask32 __U, __m512h __A, __m512h __B) { in _mm512_maskz_div_ph() argument
467 (__v32hf)_mm512_div_ph(__A, __B), in _mm512_maskz_div_ph()
485 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_min_ph(__m512h __A, in _mm512_min_ph() argument
487 return (__m512h)__builtin_ia32_minph512((__v32hf)__A, (__v32hf)__B, in _mm512_min_ph()
492 _mm512_mask_min_ph(__m512h __W, __mmask32 __U, __m512h __A, __m512h __B) { in _mm512_mask_min_ph() argument
494 (__mmask32)__U, (__v32hf)_mm512_min_ph(__A, __B), (__v32hf)__W); in _mm512_mask_min_ph()
498 _mm512_maskz_min_ph(__mmask32 __U, __m512h __A, __m512h __B) { in _mm512_maskz_min_ph() argument
500 (__v32hf)_mm512_min_ph(__A, __B), in _mm512_maskz_min_ph()
518 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_max_ph(__m512h __A, in _mm512_max_ph() argument
520 return (__m512h)__builtin_ia32_maxph512((__v32hf)__A, (__v32hf)__B, in _mm512_max_ph()
525 _mm512_mask_max_ph(__m512h __W, __mmask32 __U, __m512h __A, __m512h __B) { in _mm512_mask_max_ph() argument
527 (__mmask32)__U, (__v32hf)_mm512_max_ph(__A, __B), (__v32hf)__W); in _mm512_mask_max_ph()
531 _mm512_maskz_max_ph(__mmask32 __U, __m512h __A, __m512h __B) { in _mm512_maskz_max_ph() argument
533 (__v32hf)_mm512_max_ph(__A, __B), in _mm512_maskz_max_ph()
551 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_abs_ph(__m512h __A) { in _mm512_abs_ph() argument
552 return (__m512h)_mm512_and_epi32(_mm512_set1_epi32(0x7FFF7FFF), (__m512i)__A); in _mm512_abs_ph()
555 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_conj_pch(__m512h __A) { in _mm512_conj_pch() argument
556 return (__m512h)_mm512_xor_ps((__m512)__A, _mm512_set1_ps(-0.0f)); in _mm512_conj_pch()
560 _mm512_mask_conj_pch(__m512h __W, __mmask16 __U, __m512h __A) { in _mm512_mask_conj_pch() argument
562 (__mmask16)__U, (__v16sf)_mm512_conj_pch(__A), (__v16sf)__W); in _mm512_mask_conj_pch()
566 _mm512_maskz_conj_pch(__mmask16 __U, __m512h __A) { in _mm512_maskz_conj_pch() argument
568 (__v16sf)_mm512_conj_pch(__A), in _mm512_maskz_conj_pch()
572 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_add_sh(__m128h __A, in _mm_add_sh() argument
574 __A[0] += __B[0]; in _mm_add_sh()
575 return __A; in _mm_add_sh()
580 __m128h __A, in _mm_mask_add_sh() argument
582 __A = _mm_add_sh(__A, __B); in _mm_mask_add_sh()
583 return __builtin_ia32_selectsh_128(__U, __A, __W); in _mm_mask_add_sh()
587 __m128h __A, in _mm_maskz_add_sh() argument
589 __A = _mm_add_sh(__A, __B); in _mm_maskz_add_sh()
590 return __builtin_ia32_selectsh_128(__U, __A, _mm_setzero_ph()); in _mm_maskz_add_sh()
608 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_sub_sh(__m128h __A, in _mm_sub_sh() argument
610 __A[0] -= __B[0]; in _mm_sub_sh()
611 return __A; in _mm_sub_sh()
616 __m128h __A, in _mm_mask_sub_sh() argument
618 __A = _mm_sub_sh(__A, __B); in _mm_mask_sub_sh()
619 return __builtin_ia32_selectsh_128(__U, __A, __W); in _mm_mask_sub_sh()
623 __m128h __A, in _mm_maskz_sub_sh() argument
625 __A = _mm_sub_sh(__A, __B); in _mm_maskz_sub_sh()
626 return __builtin_ia32_selectsh_128(__U, __A, _mm_setzero_ph()); in _mm_maskz_sub_sh()
644 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_mul_sh(__m128h __A, in _mm_mul_sh() argument
646 __A[0] *= __B[0]; in _mm_mul_sh()
647 return __A; in _mm_mul_sh()
652 __m128h __A, in _mm_mask_mul_sh() argument
654 __A = _mm_mul_sh(__A, __B); in _mm_mask_mul_sh()
655 return __builtin_ia32_selectsh_128(__U, __A, __W); in _mm_mask_mul_sh()
659 __m128h __A, in _mm_maskz_mul_sh() argument
661 __A = _mm_mul_sh(__A, __B); in _mm_maskz_mul_sh()
662 return __builtin_ia32_selectsh_128(__U, __A, _mm_setzero_ph()); in _mm_maskz_mul_sh()
680 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_div_sh(__m128h __A, in _mm_div_sh() argument
682 __A[0] /= __B[0]; in _mm_div_sh()
683 return __A; in _mm_div_sh()
688 __m128h __A, in _mm_mask_div_sh() argument
690 __A = _mm_div_sh(__A, __B); in _mm_mask_div_sh()
691 return __builtin_ia32_selectsh_128(__U, __A, __W); in _mm_mask_div_sh()
695 __m128h __A, in _mm_maskz_div_sh() argument
697 __A = _mm_div_sh(__A, __B); in _mm_maskz_div_sh()
698 return __builtin_ia32_selectsh_128(__U, __A, _mm_setzero_ph()); in _mm_maskz_div_sh()
716 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_min_sh(__m128h __A, in _mm_min_sh() argument
719 (__v8hf)__A, (__v8hf)__B, (__v8hf)_mm_setzero_ph(), (__mmask8)-1, in _mm_min_sh()
725 __m128h __A, in _mm_mask_min_sh() argument
727 return (__m128h)__builtin_ia32_minsh_round_mask((__v8hf)__A, (__v8hf)__B, in _mm_mask_min_sh()
733 __m128h __A, in _mm_maskz_min_sh() argument
736 (__v8hf)__A, (__v8hf)__B, (__v8hf)_mm_setzero_ph(), (__mmask8)__U, in _mm_maskz_min_sh()
755 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_max_sh(__m128h __A, in _mm_max_sh() argument
758 (__v8hf)__A, (__v8hf)__B, (__v8hf)_mm_setzero_ph(), (__mmask8)-1, in _mm_max_sh()
764 __m128h __A, in _mm_mask_max_sh() argument
766 return (__m128h)__builtin_ia32_maxsh_round_mask((__v8hf)__A, (__v8hf)__B, in _mm_mask_max_sh()
772 __m128h __A, in _mm_maskz_max_sh() argument
775 (__v8hf)__A, (__v8hf)__B, (__v8hf)_mm_setzero_ph(), (__mmask8)__U, in _mm_maskz_max_sh()
839 _mm_mask_load_sh(__m128h __W, __mmask8 __U, const void *__A) { in _mm_mask_load_sh() argument
843 return (__m128h)__builtin_ia32_loadsh128_mask((const __v8hf *)__A, src, __U & 1); in _mm_mask_load_sh()
847 _mm_maskz_load_sh(__mmask8 __U, const void *__A) { in _mm_maskz_load_sh() argument
849 (const __v8hf *)__A, (__v8hf)_mm_setzero_ph(), __U & 1); in _mm_maskz_load_sh()
900 __m128h __A) { in _mm_mask_store_sh() argument
901 __builtin_ia32_storesh128_mask((__v8hf *)__W, __A, __U & 1); in _mm_mask_store_sh()
905 __m512h __A) { in _mm512_store_ph() argument
906 *(__m512h *)__P = __A; in _mm512_store_ph()
910 __m256h __A) { in _mm256_store_ph() argument
911 *(__m256h *)__P = __A; in _mm256_store_ph()
915 __m128h __A) { in _mm_store_ph() argument
916 *(__m128h *)__P = __A; in _mm_store_ph()
920 __m512h __A) { in _mm512_storeu_ph() argument
924 ((struct __storeu_ph *)__P)->__v = __A; in _mm512_storeu_ph()
928 __m256h __A) { in _mm256_storeu_ph() argument
932 ((struct __storeu_ph *)__P)->__v = __A; in _mm256_storeu_ph()
936 __m128h __A) { in _mm_storeu_ph() argument
940 ((struct __storeu_ph *)__P)->__v = __A; in _mm_storeu_ph()
952 __m128h __A, in _mm_mask_move_sh() argument
954 return __builtin_ia32_selectsh_128(__U, _mm_move_sh(__A, __B), __W); in _mm_mask_move_sh()
958 __m128h __A, in _mm_maskz_move_sh() argument
960 return __builtin_ia32_selectsh_128(__U, _mm_move_sh(__A, __B), in _mm_maskz_move_sh()
974 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_rcp_ph(__m512h __A) { in _mm512_rcp_ph() argument
976 (__v32hf)__A, (__v32hf)_mm512_undefined_ph(), (__mmask32)-1); in _mm512_rcp_ph()
980 _mm512_mask_rcp_ph(__m512h __W, __mmask32 __U, __m512h __A) { in _mm512_mask_rcp_ph() argument
981 return (__m512h)__builtin_ia32_rcpph512_mask((__v32hf)__A, (__v32hf)__W, in _mm512_mask_rcp_ph()
986 _mm512_maskz_rcp_ph(__mmask32 __U, __m512h __A) { in _mm512_maskz_rcp_ph() argument
988 (__v32hf)__A, (__v32hf)_mm512_setzero_ph(), (__mmask32)__U); in _mm512_maskz_rcp_ph()
991 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_rsqrt_ph(__m512h __A) { in _mm512_rsqrt_ph() argument
993 (__v32hf)__A, (__v32hf)_mm512_undefined_ph(), (__mmask32)-1); in _mm512_rsqrt_ph()
997 _mm512_mask_rsqrt_ph(__m512h __W, __mmask32 __U, __m512h __A) { in _mm512_mask_rsqrt_ph() argument
998 return (__m512h)__builtin_ia32_rsqrtph512_mask((__v32hf)__A, (__v32hf)__W, in _mm512_mask_rsqrt_ph()
1003 _mm512_maskz_rsqrt_ph(__mmask32 __U, __m512h __A) { in _mm512_maskz_rsqrt_ph() argument
1005 (__v32hf)__A, (__v32hf)_mm512_setzero_ph(), (__mmask32)__U); in _mm512_maskz_rsqrt_ph()
1039 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_getexp_ph(__m512h __A) { in _mm512_getexp_ph() argument
1041 (__v32hf)__A, (__v32hf)_mm512_undefined_ph(), (__mmask32)-1, in _mm512_getexp_ph()
1046 _mm512_mask_getexp_ph(__m512h __W, __mmask32 __U, __m512h __A) { in _mm512_mask_getexp_ph() argument
1048 (__v32hf)__A, (__v32hf)__W, (__mmask32)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_getexp_ph()
1052 _mm512_maskz_getexp_ph(__mmask32 __U, __m512h __A) { in _mm512_maskz_getexp_ph() argument
1054 (__v32hf)__A, (__v32hf)_mm512_setzero_ph(), (__mmask32)__U, in _mm512_maskz_getexp_ph()
1072 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_scalef_ph(__m512h __A, in _mm512_scalef_ph() argument
1075 (__v32hf)__A, (__v32hf)__B, (__v32hf)_mm512_undefined_ph(), (__mmask32)-1, in _mm512_scalef_ph()
1080 _mm512_mask_scalef_ph(__m512h __W, __mmask32 __U, __m512h __A, __m512h __B) { in _mm512_mask_scalef_ph() argument
1081 return (__m512h)__builtin_ia32_scalefph512_mask((__v32hf)__A, (__v32hf)__B, in _mm512_mask_scalef_ph()
1087 _mm512_maskz_scalef_ph(__mmask32 __U, __m512h __A, __m512h __B) { in _mm512_maskz_scalef_ph() argument
1089 (__v32hf)__A, (__v32hf)__B, (__v32hf)_mm512_setzero_ph(), (__mmask32)__U, in _mm512_maskz_scalef_ph()
1168 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_rcp_sh(__m128h __A, in _mm_rcp_sh() argument
1171 (__v8hf)__A, (__v8hf)__B, (__v8hf)_mm_setzero_ph(), (__mmask8)-1); in _mm_rcp_sh()
1176 __m128h __A, in _mm_mask_rcp_sh() argument
1178 return (__m128h)__builtin_ia32_rcpsh_mask((__v8hf)__A, (__v8hf)__B, in _mm_mask_rcp_sh()
1183 __m128h __A, in _mm_maskz_rcp_sh() argument
1186 (__v8hf)__A, (__v8hf)__B, (__v8hf)_mm_setzero_ph(), (__mmask8)__U); in _mm_maskz_rcp_sh()
1189 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_rsqrt_sh(__m128h __A, in _mm_rsqrt_sh() argument
1192 (__v8hf)__A, (__v8hf)__B, (__v8hf)_mm_setzero_ph(), (__mmask8)-1); in _mm_rsqrt_sh()
1197 __m128h __A, in _mm_mask_rsqrt_sh() argument
1199 return (__m128h)__builtin_ia32_rsqrtsh_mask((__v8hf)__A, (__v8hf)__B, in _mm_mask_rsqrt_sh()
1204 _mm_maskz_rsqrt_sh(__mmask8 __U, __m128h __A, __m128h __B) { in _mm_maskz_rsqrt_sh() argument
1206 (__v8hf)__A, (__v8hf)__B, (__v8hf)_mm_setzero_ph(), (__mmask8)__U); in _mm_maskz_rsqrt_sh()
1244 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_getexp_sh(__m128h __A, in _mm_getexp_sh() argument
1247 (__v8hf)__A, (__v8hf)__B, (__v8hf)_mm_setzero_ph(), (__mmask8)-1, in _mm_getexp_sh()
1252 _mm_mask_getexp_sh(__m128h __W, __mmask8 __U, __m128h __A, __m128h __B) { in _mm_mask_getexp_sh() argument
1254 (__v8hf)__A, (__v8hf)__B, (__v8hf)__W, (__mmask8)__U, in _mm_mask_getexp_sh()
1264 _mm_maskz_getexp_sh(__mmask8 __U, __m128h __A, __m128h __B) { in _mm_maskz_getexp_sh() argument
1266 (__v8hf)__A, (__v8hf)__B, (__v8hf)_mm_setzero_ph(), (__mmask8)__U, in _mm_maskz_getexp_sh()
1280 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_scalef_sh(__m128h __A, in _mm_scalef_sh() argument
1283 (__v8hf)__A, (__v8hf)(__B), (__v8hf)_mm_setzero_ph(), (__mmask8)-1, in _mm_scalef_sh()
1288 _mm_mask_scalef_sh(__m128h __W, __mmask8 __U, __m128h __A, __m128h __B) { in _mm_mask_scalef_sh() argument
1289 return (__m128h)__builtin_ia32_scalefsh_round_mask((__v8hf)__A, (__v8hf)__B, in _mm_mask_scalef_sh()
1300 _mm_maskz_scalef_sh(__mmask8 __U, __m128h __A, __m128h __B) { in _mm_maskz_scalef_sh() argument
1302 (__v8hf)__A, (__v8hf)__B, (__v8hf)_mm_setzero_ph(), (__mmask8)__U, in _mm_maskz_scalef_sh()
1384 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_sqrt_ph(__m512h __A) { in _mm512_sqrt_ph() argument
1385 return (__m512h)__builtin_ia32_sqrtph512((__v32hf)__A, in _mm512_sqrt_ph()
1390 _mm512_mask_sqrt_ph(__m512h __W, __mmask32 __U, __m512h __A) { in _mm512_mask_sqrt_ph() argument
1393 (__v32hf)__builtin_ia32_sqrtph512((__A), (_MM_FROUND_CUR_DIRECTION)), in _mm512_mask_sqrt_ph()
1398 _mm512_maskz_sqrt_ph(__mmask32 __U, __m512h __A) { in _mm512_maskz_sqrt_ph() argument
1401 (__v32hf)__builtin_ia32_sqrtph512((__A), (_MM_FROUND_CUR_DIRECTION)), in _mm512_maskz_sqrt_ph()
1420 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_sqrt_sh(__m128h __A, in _mm_sqrt_sh() argument
1423 (__v8hf)(__m128h)(__A), (__v8hf)(__m128h)(__B), (__v8hf)_mm_setzero_ph(), in _mm_sqrt_sh()
1429 __m128h __A, in _mm_mask_sqrt_sh() argument
1432 (__v8hf)(__m128h)(__A), (__v8hf)(__m128h)(__B), (__v8hf)(__m128h)(__W), in _mm_mask_sqrt_sh()
1437 __m128h __A, in _mm_maskz_sqrt_sh() argument
1440 (__v8hf)(__m128h)(__A), (__v8hf)(__m128h)(__B), (__v8hf)_mm_setzero_ph(), in _mm_maskz_sqrt_sh()
1472 static __inline__ __m128h __DEFAULT_FN_ATTRS512 _mm512_cvtpd_ph(__m512d __A) { in _mm512_cvtpd_ph() argument
1474 (__v8df)__A, (__v8hf)_mm_setzero_ph(), (__mmask8)-1, in _mm512_cvtpd_ph()
1479 _mm512_mask_cvtpd_ph(__m128h __W, __mmask8 __U, __m512d __A) { in _mm512_mask_cvtpd_ph() argument
1481 (__v8df)__A, (__v8hf)__W, (__mmask8)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvtpd_ph()
1485 _mm512_maskz_cvtpd_ph(__mmask8 __U, __m512d __A) { in _mm512_maskz_cvtpd_ph() argument
1487 (__v8df)__A, (__v8hf)_mm_setzero_ph(), (__mmask8)__U, in _mm512_maskz_cvtpd_ph()
1503 static __inline__ __m512d __DEFAULT_FN_ATTRS512 _mm512_cvtph_pd(__m128h __A) { in _mm512_cvtph_pd() argument
1505 (__v8hf)__A, (__v8df)_mm512_setzero_pd(), (__mmask8)-1, in _mm512_cvtph_pd()
1510 _mm512_mask_cvtph_pd(__m512d __W, __mmask8 __U, __m128h __A) { in _mm512_mask_cvtph_pd() argument
1512 (__v8hf)__A, (__v8df)__W, (__mmask8)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvtph_pd()
1516 _mm512_maskz_cvtph_pd(__mmask8 __U, __m128h __A) { in _mm512_maskz_cvtph_pd() argument
1518 (__v8hf)__A, (__v8df)_mm512_setzero_pd(), (__mmask8)__U, in _mm512_maskz_cvtph_pd()
1536 static __inline__ __m128 __DEFAULT_FN_ATTRS128 _mm_cvtsh_ss(__m128 __A, in _mm_cvtsh_ss() argument
1539 (__v4sf)__A, (__v8hf)__B, (__v4sf)_mm_undefined_ps(), (__mmask8)-1, in _mm_cvtsh_ss()
1545 __m128 __A, in _mm_mask_cvtsh_ss() argument
1547 return (__m128)__builtin_ia32_vcvtsh2ss_round_mask((__v4sf)__A, (__v8hf)__B, in _mm_mask_cvtsh_ss()
1553 __m128 __A, in _mm_maskz_cvtsh_ss() argument
1556 (__v4sf)__A, (__v8hf)__B, (__v4sf)_mm_setzero_ps(), (__mmask8)__U, in _mm_maskz_cvtsh_ss()
1574 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_cvtss_sh(__m128h __A, in _mm_cvtss_sh() argument
1577 (__v8hf)__A, (__v4sf)__B, (__v8hf)_mm_undefined_ph(), (__mmask8)-1, in _mm_cvtss_sh()
1583 __m128h __A, in _mm_mask_cvtss_sh() argument
1586 (__v8hf)__A, (__v4sf)__B, (__v8hf)__W, (__mmask8)__U, in _mm_mask_cvtss_sh()
1591 __m128h __A, in _mm_maskz_cvtss_sh() argument
1594 (__v8hf)__A, (__v4sf)__B, (__v8hf)_mm_setzero_ph(), (__mmask8)__U, in _mm_maskz_cvtss_sh()
1612 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_cvtsd_sh(__m128h __A, in _mm_cvtsd_sh() argument
1615 (__v8hf)__A, (__v2df)__B, (__v8hf)_mm_undefined_ph(), (__mmask8)-1, in _mm_cvtsd_sh()
1621 __m128h __A, in _mm_mask_cvtsd_sh() argument
1624 (__v8hf)__A, (__v2df)__B, (__v8hf)__W, (__mmask8)__U, in _mm_mask_cvtsd_sh()
1629 _mm_maskz_cvtsd_sh(__mmask8 __U, __m128h __A, __m128d __B) { in _mm_maskz_cvtsd_sh() argument
1631 (__v8hf)__A, (__v2df)__B, (__v8hf)_mm_setzero_ph(), (__mmask8)__U, in _mm_maskz_cvtsd_sh()
1649 static __inline__ __m128d __DEFAULT_FN_ATTRS128 _mm_cvtsh_sd(__m128d __A, in _mm_cvtsh_sd() argument
1652 (__v2df)__A, (__v8hf)__B, (__v2df)_mm_undefined_pd(), (__mmask8)-1, in _mm_cvtsh_sd()
1658 __m128d __A, in _mm_mask_cvtsh_sd() argument
1661 (__v2df)__A, (__v8hf)__B, (__v2df)__W, (__mmask8)__U, in _mm_mask_cvtsh_sd()
1666 _mm_maskz_cvtsh_sd(__mmask8 __U, __m128d __A, __m128h __B) { in _mm_maskz_cvtsh_sd() argument
1668 (__v2df)__A, (__v8hf)__B, (__v2df)_mm_setzero_pd(), (__mmask8)__U, in _mm_maskz_cvtsh_sd()
1687 _mm512_cvtph_epi16(__m512h __A) { in _mm512_cvtph_epi16() argument
1689 (__v32hf)__A, (__v32hi)_mm512_setzero_epi32(), (__mmask32)-1, in _mm512_cvtph_epi16()
1694 _mm512_mask_cvtph_epi16(__m512i __W, __mmask32 __U, __m512h __A) { in _mm512_mask_cvtph_epi16() argument
1696 (__v32hf)__A, (__v32hi)__W, (__mmask32)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvtph_epi16()
1700 _mm512_maskz_cvtph_epi16(__mmask32 __U, __m512h __A) { in _mm512_maskz_cvtph_epi16() argument
1702 (__v32hf)__A, (__v32hi)_mm512_setzero_epi32(), (__mmask32)__U, in _mm512_maskz_cvtph_epi16()
1721 _mm512_cvttph_epi16(__m512h __A) { in _mm512_cvttph_epi16() argument
1723 (__v32hf)__A, (__v32hi)_mm512_setzero_epi32(), (__mmask32)-1, in _mm512_cvttph_epi16()
1728 _mm512_mask_cvttph_epi16(__m512i __W, __mmask32 __U, __m512h __A) { in _mm512_mask_cvttph_epi16() argument
1730 (__v32hf)__A, (__v32hi)__W, (__mmask32)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvttph_epi16()
1734 _mm512_maskz_cvttph_epi16(__mmask32 __U, __m512h __A) { in _mm512_maskz_cvttph_epi16() argument
1736 (__v32hf)__A, (__v32hi)_mm512_setzero_epi32(), (__mmask32)__U, in _mm512_maskz_cvttph_epi16()
1754 _mm512_cvtepi16_ph(__m512i __A) { in _mm512_cvtepi16_ph() argument
1756 (__v32hi)__A, (__v32hf)_mm512_setzero_ph(), (__mmask32)-1, in _mm512_cvtepi16_ph()
1761 _mm512_mask_cvtepi16_ph(__m512h __W, __mmask32 __U, __m512i __A) { in _mm512_mask_cvtepi16_ph() argument
1763 (__v32hi)__A, (__v32hf)__W, (__mmask32)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvtepi16_ph()
1767 _mm512_maskz_cvtepi16_ph(__mmask32 __U, __m512i __A) { in _mm512_maskz_cvtepi16_ph() argument
1769 (__v32hi)__A, (__v32hf)_mm512_setzero_ph(), (__mmask32)__U, in _mm512_maskz_cvtepi16_ph()
1788 _mm512_cvtph_epu16(__m512h __A) { in _mm512_cvtph_epu16() argument
1790 (__v32hf)__A, (__v32hu)_mm512_setzero_epi32(), (__mmask32)-1, in _mm512_cvtph_epu16()
1795 _mm512_mask_cvtph_epu16(__m512i __W, __mmask32 __U, __m512h __A) { in _mm512_mask_cvtph_epu16() argument
1797 (__v32hf)__A, (__v32hu)__W, (__mmask32)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvtph_epu16()
1801 _mm512_maskz_cvtph_epu16(__mmask32 __U, __m512h __A) { in _mm512_maskz_cvtph_epu16() argument
1803 (__v32hf)__A, (__v32hu)_mm512_setzero_epi32(), (__mmask32)__U, in _mm512_maskz_cvtph_epu16()
1822 _mm512_cvttph_epu16(__m512h __A) { in _mm512_cvttph_epu16() argument
1824 (__v32hf)__A, (__v32hu)_mm512_setzero_epi32(), (__mmask32)-1, in _mm512_cvttph_epu16()
1829 _mm512_mask_cvttph_epu16(__m512i __W, __mmask32 __U, __m512h __A) { in _mm512_mask_cvttph_epu16() argument
1831 (__v32hf)__A, (__v32hu)__W, (__mmask32)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvttph_epu16()
1835 _mm512_maskz_cvttph_epu16(__mmask32 __U, __m512h __A) { in _mm512_maskz_cvttph_epu16() argument
1837 (__v32hf)__A, (__v32hu)_mm512_setzero_epi32(), (__mmask32)__U, in _mm512_maskz_cvttph_epu16()
1855 _mm512_cvtepu16_ph(__m512i __A) { in _mm512_cvtepu16_ph() argument
1857 (__v32hu)__A, (__v32hf)_mm512_setzero_ph(), (__mmask32)-1, in _mm512_cvtepu16_ph()
1862 _mm512_mask_cvtepu16_ph(__m512h __W, __mmask32 __U, __m512i __A) { in _mm512_mask_cvtepu16_ph() argument
1864 (__v32hu)__A, (__v32hf)__W, (__mmask32)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvtepu16_ph()
1868 _mm512_maskz_cvtepu16_ph(__mmask32 __U, __m512i __A) { in _mm512_maskz_cvtepu16_ph() argument
1870 (__v32hu)__A, (__v32hf)_mm512_setzero_ph(), (__mmask32)__U, in _mm512_maskz_cvtepu16_ph()
1889 _mm512_cvtph_epi32(__m256h __A) { in _mm512_cvtph_epi32() argument
1891 (__v16hf)__A, (__v16si)_mm512_setzero_epi32(), (__mmask16)-1, in _mm512_cvtph_epi32()
1896 _mm512_mask_cvtph_epi32(__m512i __W, __mmask16 __U, __m256h __A) { in _mm512_mask_cvtph_epi32() argument
1898 (__v16hf)__A, (__v16si)__W, (__mmask16)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvtph_epi32()
1902 _mm512_maskz_cvtph_epi32(__mmask16 __U, __m256h __A) { in _mm512_maskz_cvtph_epi32() argument
1904 (__v16hf)__A, (__v16si)_mm512_setzero_epi32(), (__mmask16)__U, in _mm512_maskz_cvtph_epi32()
1923 _mm512_cvtph_epu32(__m256h __A) { in _mm512_cvtph_epu32() argument
1925 (__v16hf)__A, (__v16su)_mm512_setzero_epi32(), (__mmask16)-1, in _mm512_cvtph_epu32()
1930 _mm512_mask_cvtph_epu32(__m512i __W, __mmask16 __U, __m256h __A) { in _mm512_mask_cvtph_epu32() argument
1932 (__v16hf)__A, (__v16su)__W, (__mmask16)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvtph_epu32()
1936 _mm512_maskz_cvtph_epu32(__mmask16 __U, __m256h __A) { in _mm512_maskz_cvtph_epu32() argument
1938 (__v16hf)__A, (__v16su)_mm512_setzero_epi32(), (__mmask16)__U, in _mm512_maskz_cvtph_epu32()
1956 _mm512_cvtepi32_ph(__m512i __A) { in _mm512_cvtepi32_ph() argument
1958 (__v16si)__A, (__v16hf)_mm256_setzero_ph(), (__mmask16)-1, in _mm512_cvtepi32_ph()
1963 _mm512_mask_cvtepi32_ph(__m256h __W, __mmask16 __U, __m512i __A) { in _mm512_mask_cvtepi32_ph() argument
1965 (__v16si)__A, (__v16hf)__W, (__mmask16)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvtepi32_ph()
1969 _mm512_maskz_cvtepi32_ph(__mmask16 __U, __m512i __A) { in _mm512_maskz_cvtepi32_ph() argument
1971 (__v16si)__A, (__v16hf)_mm256_setzero_ph(), (__mmask16)__U, in _mm512_maskz_cvtepi32_ph()
1989 _mm512_cvtepu32_ph(__m512i __A) { in _mm512_cvtepu32_ph() argument
1991 (__v16su)__A, (__v16hf)_mm256_setzero_ph(), (__mmask16)-1, in _mm512_cvtepu32_ph()
1996 _mm512_mask_cvtepu32_ph(__m256h __W, __mmask16 __U, __m512i __A) { in _mm512_mask_cvtepu32_ph() argument
1998 (__v16su)__A, (__v16hf)__W, (__mmask16)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvtepu32_ph()
2002 _mm512_maskz_cvtepu32_ph(__mmask16 __U, __m512i __A) { in _mm512_maskz_cvtepu32_ph() argument
2004 (__v16su)__A, (__v16hf)_mm256_setzero_ph(), (__mmask16)__U, in _mm512_maskz_cvtepu32_ph()
2023 _mm512_cvttph_epi32(__m256h __A) { in _mm512_cvttph_epi32() argument
2025 (__v16hf)__A, (__v16si)_mm512_setzero_epi32(), (__mmask16)-1, in _mm512_cvttph_epi32()
2030 _mm512_mask_cvttph_epi32(__m512i __W, __mmask16 __U, __m256h __A) { in _mm512_mask_cvttph_epi32() argument
2032 (__v16hf)__A, (__v16si)__W, (__mmask16)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvttph_epi32()
2036 _mm512_maskz_cvttph_epi32(__mmask16 __U, __m256h __A) { in _mm512_maskz_cvttph_epi32() argument
2038 (__v16hf)__A, (__v16si)_mm512_setzero_epi32(), (__mmask16)__U, in _mm512_maskz_cvttph_epi32()
2057 _mm512_cvttph_epu32(__m256h __A) { in _mm512_cvttph_epu32() argument
2059 (__v16hf)__A, (__v16su)_mm512_setzero_epi32(), (__mmask16)-1, in _mm512_cvttph_epu32()
2064 _mm512_mask_cvttph_epu32(__m512i __W, __mmask16 __U, __m256h __A) { in _mm512_mask_cvttph_epu32() argument
2066 (__v16hf)__A, (__v16su)__W, (__mmask16)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvttph_epu32()
2070 _mm512_maskz_cvttph_epu32(__mmask16 __U, __m256h __A) { in _mm512_maskz_cvttph_epu32() argument
2072 (__v16hf)__A, (__v16su)_mm512_setzero_epi32(), (__mmask16)__U, in _mm512_maskz_cvttph_epu32()
2089 _mm512_cvtepi64_ph(__m512i __A) { in _mm512_cvtepi64_ph() argument
2091 (__v8di)__A, (__v8hf)_mm_setzero_ph(), (__mmask8)-1, in _mm512_cvtepi64_ph()
2096 _mm512_mask_cvtepi64_ph(__m128h __W, __mmask8 __U, __m512i __A) { in _mm512_mask_cvtepi64_ph() argument
2098 (__v8di)__A, (__v8hf)__W, (__mmask8)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvtepi64_ph()
2102 _mm512_maskz_cvtepi64_ph(__mmask8 __U, __m512i __A) { in _mm512_maskz_cvtepi64_ph() argument
2104 (__v8di)__A, (__v8hf)_mm_setzero_ph(), (__mmask8)__U, in _mm512_maskz_cvtepi64_ph()
2122 _mm512_cvtph_epi64(__m128h __A) { in _mm512_cvtph_epi64() argument
2124 (__v8hf)__A, (__v8di)_mm512_setzero_epi32(), (__mmask8)-1, in _mm512_cvtph_epi64()
2129 _mm512_mask_cvtph_epi64(__m512i __W, __mmask8 __U, __m128h __A) { in _mm512_mask_cvtph_epi64() argument
2131 (__v8hf)__A, (__v8di)__W, (__mmask8)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvtph_epi64()
2135 _mm512_maskz_cvtph_epi64(__mmask8 __U, __m128h __A) { in _mm512_maskz_cvtph_epi64() argument
2137 (__v8hf)__A, (__v8di)_mm512_setzero_epi32(), (__mmask8)__U, in _mm512_maskz_cvtph_epi64()
2154 _mm512_cvtepu64_ph(__m512i __A) { in _mm512_cvtepu64_ph() argument
2156 (__v8du)__A, (__v8hf)_mm_setzero_ph(), (__mmask8)-1, in _mm512_cvtepu64_ph()
2161 _mm512_mask_cvtepu64_ph(__m128h __W, __mmask8 __U, __m512i __A) { in _mm512_mask_cvtepu64_ph() argument
2163 (__v8du)__A, (__v8hf)__W, (__mmask8)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvtepu64_ph()
2167 _mm512_maskz_cvtepu64_ph(__mmask8 __U, __m512i __A) { in _mm512_maskz_cvtepu64_ph() argument
2169 (__v8du)__A, (__v8hf)_mm_setzero_ph(), (__mmask8)__U, in _mm512_maskz_cvtepu64_ph()
2187 _mm512_cvtph_epu64(__m128h __A) { in _mm512_cvtph_epu64() argument
2189 (__v8hf)__A, (__v8du)_mm512_setzero_epi32(), (__mmask8)-1, in _mm512_cvtph_epu64()
2194 _mm512_mask_cvtph_epu64(__m512i __W, __mmask8 __U, __m128h __A) { in _mm512_mask_cvtph_epu64() argument
2196 (__v8hf)__A, (__v8du)__W, (__mmask8)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvtph_epu64()
2200 _mm512_maskz_cvtph_epu64(__mmask8 __U, __m128h __A) { in _mm512_maskz_cvtph_epu64() argument
2202 (__v8hf)__A, (__v8du)_mm512_setzero_epi32(), (__mmask8)__U, in _mm512_maskz_cvtph_epu64()
2220 _mm512_cvttph_epi64(__m128h __A) { in _mm512_cvttph_epi64() argument
2222 (__v8hf)__A, (__v8di)_mm512_setzero_epi32(), (__mmask8)-1, in _mm512_cvttph_epi64()
2227 _mm512_mask_cvttph_epi64(__m512i __W, __mmask8 __U, __m128h __A) { in _mm512_mask_cvttph_epi64() argument
2229 (__v8hf)__A, (__v8di)__W, (__mmask8)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvttph_epi64()
2233 _mm512_maskz_cvttph_epi64(__mmask8 __U, __m128h __A) { in _mm512_maskz_cvttph_epi64() argument
2235 (__v8hf)__A, (__v8di)_mm512_setzero_epi32(), (__mmask8)__U, in _mm512_maskz_cvttph_epi64()
2253 _mm512_cvttph_epu64(__m128h __A) { in _mm512_cvttph_epu64() argument
2255 (__v8hf)__A, (__v8du)_mm512_setzero_epi32(), (__mmask8)-1, in _mm512_cvttph_epu64()
2260 _mm512_mask_cvttph_epu64(__m512i __W, __mmask8 __U, __m128h __A) { in _mm512_mask_cvttph_epu64() argument
2262 (__v8hf)__A, (__v8du)__W, (__mmask8)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvttph_epu64()
2266 _mm512_maskz_cvttph_epu64(__mmask8 __U, __m128h __A) { in _mm512_maskz_cvttph_epu64() argument
2268 (__v8hf)__A, (__v8du)_mm512_setzero_epi32(), (__mmask8)__U, in _mm512_maskz_cvttph_epu64()
2275 static __inline__ int __DEFAULT_FN_ATTRS128 _mm_cvtsh_i32(__m128h __A) { in _mm_cvtsh_i32() argument
2276 return (int)__builtin_ia32_vcvtsh2si32((__v8hf)__A, _MM_FROUND_CUR_DIRECTION); in _mm_cvtsh_i32()
2283 _mm_cvtsh_u32(__m128h __A) { in _mm_cvtsh_u32() argument
2284 return (unsigned int)__builtin_ia32_vcvtsh2usi32((__v8hf)__A, in _mm_cvtsh_u32()
2292 static __inline__ long long __DEFAULT_FN_ATTRS128 _mm_cvtsh_i64(__m128h __A) { in _mm_cvtsh_i64() argument
2293 return (long long)__builtin_ia32_vcvtsh2si64((__v8hf)__A, in _mm_cvtsh_i64()
2301 _mm_cvtsh_u64(__m128h __A) { in _mm_cvtsh_u64() argument
2303 (__v8hf)__A, _MM_FROUND_CUR_DIRECTION); in _mm_cvtsh_u64()
2311 _mm_cvtu32_sh(__m128h __A, unsigned int __B) { in _mm_cvtu32_sh() argument
2312 __A[0] = __B; in _mm_cvtu32_sh()
2313 return __A; in _mm_cvtu32_sh()
2322 _mm_cvtu64_sh(__m128h __A, unsigned long long __B) { in _mm_cvtu64_sh() argument
2323 __A[0] = __B; in _mm_cvtu64_sh()
2324 return __A; in _mm_cvtu64_sh()
2331 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_cvti32_sh(__m128h __A, in _mm_cvti32_sh() argument
2333 __A[0] = __B; in _mm_cvti32_sh()
2334 return __A; in _mm_cvti32_sh()
2341 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_cvti64_sh(__m128h __A, in _mm_cvti64_sh() argument
2343 __A[0] = __B; in _mm_cvti64_sh()
2344 return __A; in _mm_cvti64_sh()
2351 static __inline__ int __DEFAULT_FN_ATTRS128 _mm_cvttsh_i32(__m128h __A) { in _mm_cvttsh_i32() argument
2352 return (int)__builtin_ia32_vcvttsh2si32((__v8hf)__A, in _mm_cvttsh_i32()
2360 static __inline__ long long __DEFAULT_FN_ATTRS128 _mm_cvttsh_i64(__m128h __A) { in _mm_cvttsh_i64() argument
2361 return (long long)__builtin_ia32_vcvttsh2si64((__v8hf)__A, in _mm_cvttsh_i64()
2370 _mm_cvttsh_u32(__m128h __A) { in _mm_cvttsh_u32() argument
2371 return (unsigned int)__builtin_ia32_vcvttsh2usi32((__v8hf)__A, in _mm_cvttsh_u32()
2380 _mm_cvttsh_u64(__m128h __A) { in _mm_cvttsh_u64() argument
2382 (__v8hf)__A, _MM_FROUND_CUR_DIRECTION); in _mm_cvttsh_u64()
2399 static __inline__ __m512 __DEFAULT_FN_ATTRS512 _mm512_cvtxph_ps(__m256h __A) { in _mm512_cvtxph_ps() argument
2401 (__v16hf)__A, (__v16sf)_mm512_setzero_ps(), (__mmask16)-1, in _mm512_cvtxph_ps()
2406 _mm512_mask_cvtxph_ps(__m512 __W, __mmask16 __U, __m256h __A) { in _mm512_mask_cvtxph_ps() argument
2408 (__v16hf)__A, (__v16sf)__W, (__mmask16)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvtxph_ps()
2412 _mm512_maskz_cvtxph_ps(__mmask16 __U, __m256h __A) { in _mm512_maskz_cvtxph_ps() argument
2414 (__v16hf)__A, (__v16sf)_mm512_setzero_ps(), (__mmask16)__U, in _mm512_maskz_cvtxph_ps()
2431 static __inline__ __m256h __DEFAULT_FN_ATTRS512 _mm512_cvtxps_ph(__m512 __A) { in _mm512_cvtxps_ph() argument
2433 (__v16sf)__A, (__v16hf)_mm256_setzero_ph(), (__mmask16)-1, in _mm512_cvtxps_ph()
2438 _mm512_mask_cvtxps_ph(__m256h __W, __mmask16 __U, __m512 __A) { in _mm512_mask_cvtxps_ph() argument
2440 (__v16sf)__A, (__v16hf)__W, (__mmask16)__U, _MM_FROUND_CUR_DIRECTION); in _mm512_mask_cvtxps_ph()
2444 _mm512_maskz_cvtxps_ph(__mmask16 __U, __m512 __A) { in _mm512_maskz_cvtxps_ph() argument
2446 (__v16sf)__A, (__v16hf)_mm256_setzero_ph(), (__mmask16)__U, in _mm512_maskz_cvtxps_ph()
2510 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_fmadd_ph(__m512h __A, in _mm512_fmadd_ph() argument
2513 return (__m512h)__builtin_ia32_vfmaddph512_mask((__v32hf)__A, (__v32hf)__B, in _mm512_fmadd_ph()
2519 _mm512_mask_fmadd_ph(__m512h __A, __mmask32 __U, __m512h __B, __m512h __C) { in _mm512_mask_fmadd_ph() argument
2520 return (__m512h)__builtin_ia32_vfmaddph512_mask((__v32hf)__A, (__v32hf)__B, in _mm512_mask_fmadd_ph()
2526 _mm512_mask3_fmadd_ph(__m512h __A, __m512h __B, __m512h __C, __mmask32 __U) { in _mm512_mask3_fmadd_ph() argument
2527 return (__m512h)__builtin_ia32_vfmaddph512_mask3((__v32hf)__A, (__v32hf)__B, in _mm512_mask3_fmadd_ph()
2533 _mm512_maskz_fmadd_ph(__mmask32 __U, __m512h __A, __m512h __B, __m512h __C) { in _mm512_maskz_fmadd_ph() argument
2534 return (__m512h)__builtin_ia32_vfmaddph512_maskz((__v32hf)__A, (__v32hf)__B, in _mm512_maskz_fmadd_ph()
2539 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_fmsub_ph(__m512h __A, in _mm512_fmsub_ph() argument
2542 return (__m512h)__builtin_ia32_vfmaddph512_mask((__v32hf)__A, (__v32hf)__B, in _mm512_fmsub_ph()
2548 _mm512_mask_fmsub_ph(__m512h __A, __mmask32 __U, __m512h __B, __m512h __C) { in _mm512_mask_fmsub_ph() argument
2549 return (__m512h)__builtin_ia32_vfmaddph512_mask((__v32hf)__A, (__v32hf)__B, in _mm512_mask_fmsub_ph()
2555 _mm512_maskz_fmsub_ph(__mmask32 __U, __m512h __A, __m512h __B, __m512h __C) { in _mm512_maskz_fmsub_ph() argument
2557 (__v32hf)__A, (__v32hf)__B, -(__v32hf)__C, (__mmask32)__U, in _mm512_maskz_fmsub_ph()
2561 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_fnmadd_ph(__m512h __A, in _mm512_fnmadd_ph() argument
2564 return (__m512h)__builtin_ia32_vfmaddph512_mask((__v32hf)__A, -(__v32hf)__B, in _mm512_fnmadd_ph()
2570 _mm512_mask3_fnmadd_ph(__m512h __A, __m512h __B, __m512h __C, __mmask32 __U) { in _mm512_mask3_fnmadd_ph() argument
2571 return (__m512h)__builtin_ia32_vfmaddph512_mask3(-(__v32hf)__A, (__v32hf)__B, in _mm512_mask3_fnmadd_ph()
2577 _mm512_maskz_fnmadd_ph(__mmask32 __U, __m512h __A, __m512h __B, __m512h __C) { in _mm512_maskz_fnmadd_ph() argument
2578 return (__m512h)__builtin_ia32_vfmaddph512_maskz(-(__v32hf)__A, (__v32hf)__B, in _mm512_maskz_fnmadd_ph()
2583 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_fnmsub_ph(__m512h __A, in _mm512_fnmsub_ph() argument
2586 return (__m512h)__builtin_ia32_vfmaddph512_mask((__v32hf)__A, -(__v32hf)__B, in _mm512_fnmsub_ph()
2592 _mm512_maskz_fnmsub_ph(__mmask32 __U, __m512h __A, __m512h __B, __m512h __C) { in _mm512_maskz_fnmsub_ph() argument
2594 -(__v32hf)__A, (__v32hf)__B, -(__v32hf)__C, (__mmask32)__U, in _mm512_maskz_fnmsub_ph()
2634 _mm512_fmaddsub_ph(__m512h __A, __m512h __B, __m512h __C) { in _mm512_fmaddsub_ph() argument
2636 (__v32hf)__A, (__v32hf)__B, (__v32hf)__C, (__mmask32)-1, in _mm512_fmaddsub_ph()
2641 _mm512_mask_fmaddsub_ph(__m512h __A, __mmask32 __U, __m512h __B, __m512h __C) { in _mm512_mask_fmaddsub_ph() argument
2643 (__v32hf)__A, (__v32hf)__B, (__v32hf)__C, (__mmask32)__U, in _mm512_mask_fmaddsub_ph()
2648 _mm512_mask3_fmaddsub_ph(__m512h __A, __m512h __B, __m512h __C, __mmask32 __U) { in _mm512_mask3_fmaddsub_ph() argument
2650 (__v32hf)__A, (__v32hf)__B, (__v32hf)__C, (__mmask32)__U, in _mm512_mask3_fmaddsub_ph()
2655 _mm512_maskz_fmaddsub_ph(__mmask32 __U, __m512h __A, __m512h __B, __m512h __C) { in _mm512_maskz_fmaddsub_ph() argument
2657 (__v32hf)__A, (__v32hf)__B, (__v32hf)__C, (__mmask32)__U, in _mm512_maskz_fmaddsub_ph()
2662 _mm512_fmsubadd_ph(__m512h __A, __m512h __B, __m512h __C) { in _mm512_fmsubadd_ph() argument
2664 (__v32hf)__A, (__v32hf)__B, -(__v32hf)__C, (__mmask32)-1, in _mm512_fmsubadd_ph()
2669 _mm512_mask_fmsubadd_ph(__m512h __A, __mmask32 __U, __m512h __B, __m512h __C) { in _mm512_mask_fmsubadd_ph() argument
2671 (__v32hf)__A, (__v32hf)__B, -(__v32hf)__C, (__mmask32)__U, in _mm512_mask_fmsubadd_ph()
2676 _mm512_maskz_fmsubadd_ph(__mmask32 __U, __m512h __A, __m512h __B, __m512h __C) { in _mm512_maskz_fmsubadd_ph() argument
2678 (__v32hf)__A, (__v32hf)__B, -(__v32hf)__C, (__mmask32)__U, in _mm512_maskz_fmsubadd_ph()
2688 _mm512_mask3_fmsub_ph(__m512h __A, __m512h __B, __m512h __C, __mmask32 __U) { in _mm512_mask3_fmsub_ph() argument
2689 return (__m512h)__builtin_ia32_vfmsubph512_mask3((__v32hf)__A, (__v32hf)__B, in _mm512_mask3_fmsub_ph()
2700 _mm512_mask3_fmsubadd_ph(__m512h __A, __m512h __B, __m512h __C, __mmask32 __U) { in _mm512_mask3_fmsubadd_ph() argument
2702 (__v32hf)__A, (__v32hf)__B, (__v32hf)__C, (__mmask32)__U, in _mm512_mask3_fmsubadd_ph()
2712 _mm512_mask_fnmadd_ph(__m512h __A, __mmask32 __U, __m512h __B, __m512h __C) { in _mm512_mask_fnmadd_ph() argument
2713 return (__m512h)__builtin_ia32_vfmaddph512_mask((__v32hf)__A, -(__v32hf)__B, in _mm512_mask_fnmadd_ph()
2729 _mm512_mask_fnmsub_ph(__m512h __A, __mmask32 __U, __m512h __B, __m512h __C) { in _mm512_mask_fnmsub_ph() argument
2730 return (__m512h)__builtin_ia32_vfmaddph512_mask((__v32hf)__A, -(__v32hf)__B, in _mm512_mask_fnmsub_ph()
2736 _mm512_mask3_fnmsub_ph(__m512h __A, __m512h __B, __m512h __C, __mmask32 __U) { in _mm512_mask3_fnmsub_ph() argument
2737 return (__m512h)__builtin_ia32_vfmsubph512_mask3(-(__v32hf)__A, (__v32hf)__B, in _mm512_mask3_fnmsub_ph()
2743 __m128h __A, in _mm_fmadd_sh() argument
2745 return __builtin_ia32_vfmaddsh3_mask((__v8hf)__W, (__v8hf)__A, (__v8hf)__B, in _mm_fmadd_sh()
2751 __m128h __A, in _mm_mask_fmadd_sh() argument
2753 return __builtin_ia32_vfmaddsh3_mask((__v8hf)__W, (__v8hf)__A, (__v8hf)__B, in _mm_mask_fmadd_sh()
2768 _mm_maskz_fmadd_sh(__mmask8 __U, __m128h __A, __m128h __B, __m128h __C) { in _mm_maskz_fmadd_sh() argument
2769 return __builtin_ia32_vfmaddsh3_maskz((__v8hf)__A, (__v8hf)__B, (__v8hf)__C, in _mm_maskz_fmadd_sh()
2792 __m128h __A, in _mm_fmsub_sh() argument
2794 return (__m128h)__builtin_ia32_vfmaddsh3_mask((__v8hf)__W, (__v8hf)__A, in _mm_fmsub_sh()
2801 __m128h __A, in _mm_mask_fmsub_sh() argument
2803 return (__m128h)__builtin_ia32_vfmaddsh3_mask((__v8hf)__W, (__v8hf)__A, in _mm_mask_fmsub_sh()
2819 _mm_maskz_fmsub_sh(__mmask8 __U, __m128h __A, __m128h __B, __m128h __C) { in _mm_maskz_fmsub_sh() argument
2820 return (__m128h)__builtin_ia32_vfmaddsh3_maskz((__v8hf)__A, (__v8hf)__B, in _mm_maskz_fmsub_sh()
2843 __m128h __A, in _mm_fnmadd_sh() argument
2845 return __builtin_ia32_vfmaddsh3_mask((__v8hf)__W, -(__v8hf)__A, (__v8hf)__B, in _mm_fnmadd_sh()
2850 _mm_mask_fnmadd_sh(__m128h __W, __mmask8 __U, __m128h __A, __m128h __B) { in _mm_mask_fnmadd_sh() argument
2851 return __builtin_ia32_vfmaddsh3_mask((__v8hf)__W, -(__v8hf)__A, (__v8hf)__B, in _mm_mask_fnmadd_sh()
2866 _mm_maskz_fnmadd_sh(__mmask8 __U, __m128h __A, __m128h __B, __m128h __C) { in _mm_maskz_fnmadd_sh() argument
2867 return __builtin_ia32_vfmaddsh3_maskz((__v8hf)__A, -(__v8hf)__B, (__v8hf)__C, in _mm_maskz_fnmadd_sh()
2890 __m128h __A, in _mm_fnmsub_sh() argument
2892 return __builtin_ia32_vfmaddsh3_mask((__v8hf)__W, -(__v8hf)__A, -(__v8hf)__B, in _mm_fnmsub_sh()
2897 _mm_mask_fnmsub_sh(__m128h __W, __mmask8 __U, __m128h __A, __m128h __B) { in _mm_mask_fnmsub_sh() argument
2898 return __builtin_ia32_vfmaddsh3_mask((__v8hf)__W, -(__v8hf)__A, -(__v8hf)__B, in _mm_mask_fnmsub_sh()
2913 _mm_maskz_fnmsub_sh(__mmask8 __U, __m128h __A, __m128h __B, __m128h __C) { in _mm_maskz_fnmsub_sh() argument
2914 return __builtin_ia32_vfmaddsh3_maskz((__v8hf)__A, -(__v8hf)__B, -(__v8hf)__C, in _mm_maskz_fnmsub_sh()
2936 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_fcmadd_sch(__m128h __A, in _mm_fcmadd_sch() argument
2939 return (__m128h)__builtin_ia32_vfcmaddcsh_mask((__v4sf)__A, (__v4sf)__B, in _mm_fcmadd_sch()
2945 _mm_mask_fcmadd_sch(__m128h __A, __mmask8 __U, __m128h __B, __m128h __C) { in _mm_mask_fcmadd_sch() argument
2947 (__v4sf)__A, (__v4sf)(__B), (__v4sf)(__C), __U, _MM_FROUND_CUR_DIRECTION); in _mm_mask_fcmadd_sch()
2951 _mm_maskz_fcmadd_sch(__mmask8 __U, __m128h __A, __m128h __B, __m128h __C) { in _mm_maskz_fcmadd_sch() argument
2952 return (__m128h)__builtin_ia32_vfcmaddcsh_maskz((__v4sf)__A, (__v4sf)__B, in _mm_maskz_fcmadd_sch()
2958 _mm_mask3_fcmadd_sch(__m128h __A, __m128h __B, __m128h __C, __mmask8 __U) { in _mm_mask3_fcmadd_sch() argument
2960 (__v4sf)__A, (__v4sf)__B, (__v4sf)__C, __U, _MM_FROUND_CUR_DIRECTION); in _mm_mask3_fcmadd_sch()
2983 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_fmadd_sch(__m128h __A, in _mm_fmadd_sch() argument
2986 return (__m128h)__builtin_ia32_vfmaddcsh_mask((__v4sf)__A, (__v4sf)__B, in _mm_fmadd_sch()
2992 _mm_mask_fmadd_sch(__m128h __A, __mmask8 __U, __m128h __B, __m128h __C) { in _mm_mask_fmadd_sch() argument
2994 (__v4sf)__A, (__v4sf)(__B), (__v4sf)(__C), __U, _MM_FROUND_CUR_DIRECTION); in _mm_mask_fmadd_sch()
2998 _mm_maskz_fmadd_sch(__mmask8 __U, __m128h __A, __m128h __B, __m128h __C) { in _mm_maskz_fmadd_sch() argument
2999 return (__m128h)__builtin_ia32_vfmaddcsh_maskz((__v4sf)__A, (__v4sf)__B, in _mm_maskz_fmadd_sch()
3005 _mm_mask3_fmadd_sch(__m128h __A, __m128h __B, __m128h __C, __mmask8 __U) { in _mm_mask3_fmadd_sch() argument
3007 (__v4sf)__A, (__v4sf)__B, (__v4sf)__C, __U, _MM_FROUND_CUR_DIRECTION); in _mm_mask3_fmadd_sch()
3030 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_fcmul_sch(__m128h __A, in _mm_fcmul_sch() argument
3033 (__v4sf)__A, (__v4sf)__B, (__v4sf)_mm_undefined_ph(), (__mmask8)-1, in _mm_fcmul_sch()
3038 _mm_mask_fcmul_sch(__m128h __W, __mmask8 __U, __m128h __A, __m128h __B) { in _mm_mask_fcmul_sch() argument
3039 return (__m128h)__builtin_ia32_vfcmulcsh_mask((__v4sf)__A, (__v4sf)__B, in _mm_mask_fcmul_sch()
3045 _mm_maskz_fcmul_sch(__mmask8 __U, __m128h __A, __m128h __B) { in _mm_maskz_fcmul_sch() argument
3047 (__v4sf)__A, (__v4sf)__B, (__v4sf)_mm_setzero_ph(), (__mmask8)__U, in _mm_maskz_fcmul_sch()
3066 static __inline__ __m128h __DEFAULT_FN_ATTRS128 _mm_fmul_sch(__m128h __A, in _mm_fmul_sch() argument
3069 (__v4sf)__A, (__v4sf)__B, (__v4sf)_mm_undefined_ph(), (__mmask8)-1, in _mm_fmul_sch()
3075 __m128h __A, in _mm_mask_fmul_sch() argument
3077 return (__m128h)__builtin_ia32_vfmulcsh_mask((__v4sf)__A, (__v4sf)__B, in _mm_mask_fmul_sch()
3083 _mm_maskz_fmul_sch(__mmask8 __U, __m128h __A, __m128h __B) { in _mm_maskz_fmul_sch() argument
3085 (__v4sf)__A, (__v4sf)__B, (__v4sf)_mm_setzero_ph(), (__mmask8)__U, in _mm_maskz_fmul_sch()
3104 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_fcmul_pch(__m512h __A, in _mm512_fcmul_pch() argument
3107 (__v16sf)__A, (__v16sf)__B, (__v16sf)_mm512_undefined_ph(), (__mmask16)-1, in _mm512_fcmul_pch()
3112 _mm512_mask_fcmul_pch(__m512h __W, __mmask16 __U, __m512h __A, __m512h __B) { in _mm512_mask_fcmul_pch() argument
3113 return (__m512h)__builtin_ia32_vfcmulcph512_mask((__v16sf)__A, (__v16sf)__B, in _mm512_mask_fcmul_pch()
3119 _mm512_maskz_fcmul_pch(__mmask16 __U, __m512h __A, __m512h __B) { in _mm512_maskz_fcmul_pch() argument
3121 (__v16sf)__A, (__v16sf)__B, (__v16sf)_mm512_setzero_ph(), (__mmask16)__U, in _mm512_maskz_fcmul_pch()
3140 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_fmul_pch(__m512h __A, in _mm512_fmul_pch() argument
3143 (__v16sf)__A, (__v16sf)__B, (__v16sf)_mm512_undefined_ph(), (__mmask16)-1, in _mm512_fmul_pch()
3148 _mm512_mask_fmul_pch(__m512h __W, __mmask16 __U, __m512h __A, __m512h __B) { in _mm512_mask_fmul_pch() argument
3149 return (__m512h)__builtin_ia32_vfmulcph512_mask((__v16sf)__A, (__v16sf)__B, in _mm512_mask_fmul_pch()
3155 _mm512_maskz_fmul_pch(__mmask16 __U, __m512h __A, __m512h __B) { in _mm512_maskz_fmul_pch() argument
3157 (__v16sf)__A, (__v16sf)__B, (__v16sf)_mm512_setzero_ph(), (__mmask16)__U, in _mm512_maskz_fmul_pch()
3176 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_fcmadd_pch(__m512h __A, in _mm512_fcmadd_pch() argument
3180 (__v16sf)__A, (__v16sf)__B, (__v16sf)__C, (__mmask16)-1, in _mm512_fcmadd_pch()
3185 _mm512_mask_fcmadd_pch(__m512h __A, __mmask16 __U, __m512h __B, __m512h __C) { in _mm512_mask_fcmadd_pch() argument
3187 (__v16sf)__A, (__v16sf)__B, (__v16sf)__C, (__mmask16)__U, in _mm512_mask_fcmadd_pch()
3192 _mm512_mask3_fcmadd_pch(__m512h __A, __m512h __B, __m512h __C, __mmask16 __U) { in _mm512_mask3_fcmadd_pch() argument
3194 (__v16sf)__A, (__v16sf)__B, (__v16sf)__C, (__mmask16)__U, in _mm512_mask3_fcmadd_pch()
3199 _mm512_maskz_fcmadd_pch(__mmask16 __U, __m512h __A, __m512h __B, __m512h __C) { in _mm512_maskz_fcmadd_pch() argument
3201 (__v16sf)__A, (__v16sf)__B, (__v16sf)__C, (__mmask16)__U, in _mm512_maskz_fcmadd_pch()
3225 static __inline__ __m512h __DEFAULT_FN_ATTRS512 _mm512_fmadd_pch(__m512h __A, in _mm512_fmadd_pch() argument
3228 return (__m512h)__builtin_ia32_vfmaddcph512_mask3((__v16sf)__A, (__v16sf)__B, in _mm512_fmadd_pch()
3234 _mm512_mask_fmadd_pch(__m512h __A, __mmask16 __U, __m512h __B, __m512h __C) { in _mm512_mask_fmadd_pch() argument
3235 return (__m512h)__builtin_ia32_vfmaddcph512_mask((__v16sf)__A, (__v16sf)__B, in _mm512_mask_fmadd_pch()
3241 _mm512_mask3_fmadd_pch(__m512h __A, __m512h __B, __m512h __C, __mmask16 __U) { in _mm512_mask3_fmadd_pch() argument
3243 (__v16sf)__A, (__v16sf)__B, (__v16sf)__C, (__mmask16)__U, in _mm512_mask3_fmadd_pch()
3248 _mm512_maskz_fmadd_pch(__mmask16 __U, __m512h __A, __m512h __B, __m512h __C) { in _mm512_maskz_fmadd_pch() argument
3250 (__v16sf)__A, (__v16sf)__B, (__v16sf)__C, (__mmask16)__U, in _mm512_maskz_fmadd_pch()
3295 _mm512_mask_blend_ph(__mmask32 __U, __m512h __A, __m512h __W) { in _mm512_mask_blend_ph() argument
3297 (__v32hf)__A); in _mm512_mask_blend_ph()
3301 _mm512_permutex2var_ph(__m512h __A, __m512i __I, __m512h __B) { in _mm512_permutex2var_ph() argument
3302 return (__m512h)__builtin_ia32_vpermi2varhi512((__v32hi)__A, (__v32hi)__I, in _mm512_permutex2var_ph()
3307 _mm512_permutexvar_ph(__m512i __A, __m512h __B) { in _mm512_permutexvar_ph() argument
3308 return (__m512h)__builtin_ia32_permvarhi512((__v32hi)__B, (__v32hi)__A); in _mm512_permutexvar_ph()