15f757f3fSDimitry Andric // -*- C++ -*- 25f757f3fSDimitry Andric //===----------------------------------------------------------------------===// 35f757f3fSDimitry Andric // 45f757f3fSDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 55f757f3fSDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 65f757f3fSDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 75f757f3fSDimitry Andric // 85f757f3fSDimitry Andric //===----------------------------------------------------------------------===// 95f757f3fSDimitry Andric 105f757f3fSDimitry Andric #ifndef _LIBCPP_EXPERIMENTAL___SIMD_VEC_EXT_H 115f757f3fSDimitry Andric #define _LIBCPP_EXPERIMENTAL___SIMD_VEC_EXT_H 125f757f3fSDimitry Andric 13*0fca6ea1SDimitry Andric #include <__assert> 145f757f3fSDimitry Andric #include <__bit/bit_ceil.h> 155f757f3fSDimitry Andric #include <__utility/forward.h> 165f757f3fSDimitry Andric #include <__utility/integer_sequence.h> 175f757f3fSDimitry Andric #include <cstddef> 185f757f3fSDimitry Andric #include <experimental/__config> 19cb14a3feSDimitry Andric #include <experimental/__simd/declaration.h> 205f757f3fSDimitry Andric #include <experimental/__simd/traits.h> 215f757f3fSDimitry Andric #include <experimental/__simd/utility.h> 225f757f3fSDimitry Andric 235f757f3fSDimitry Andric #if _LIBCPP_STD_VER >= 17 && defined(_LIBCPP_ENABLE_EXPERIMENTAL) 245f757f3fSDimitry Andric 255f757f3fSDimitry Andric _LIBCPP_BEGIN_NAMESPACE_EXPERIMENTAL 265f757f3fSDimitry Andric inline namespace parallelism_v2 { 275f757f3fSDimitry Andric namespace simd_abi { 285f757f3fSDimitry Andric template <int _Np> 295f757f3fSDimitry Andric struct __vec_ext { 305f757f3fSDimitry Andric static constexpr size_t __simd_size = _Np; 315f757f3fSDimitry Andric }; 325f757f3fSDimitry Andric } // namespace simd_abi 335f757f3fSDimitry Andric 345f757f3fSDimitry Andric template <int _Np> 355f757f3fSDimitry Andric inline constexpr bool is_abi_tag_v<simd_abi::__vec_ext<_Np>> = _Np > 0 && _Np <= 32; 365f757f3fSDimitry Andric 375f757f3fSDimitry Andric template <class _Tp, int _Np> 385f757f3fSDimitry Andric struct __simd_storage<_Tp, simd_abi::__vec_ext<_Np>> { 395f757f3fSDimitry Andric _Tp __data __attribute__((__vector_size__(std::__bit_ceil((sizeof(_Tp) * _Np))))); 405f757f3fSDimitry Andric 415f757f3fSDimitry Andric _LIBCPP_HIDE_FROM_ABI _Tp __get(size_t __idx) const noexcept { 42cb14a3feSDimitry Andric _LIBCPP_ASSERT_VALID_ELEMENT_ACCESS(__idx >= 0 && __idx < _Np, "Index is out of bounds"); 435f757f3fSDimitry Andric return __data[__idx]; 445f757f3fSDimitry Andric } 455f757f3fSDimitry Andric _LIBCPP_HIDE_FROM_ABI void __set(size_t __idx, _Tp __v) noexcept { 46cb14a3feSDimitry Andric _LIBCPP_ASSERT_VALID_ELEMENT_ACCESS(__idx >= 0 && __idx < _Np, "Index is out of bounds"); 475f757f3fSDimitry Andric __data[__idx] = __v; 485f757f3fSDimitry Andric } 495f757f3fSDimitry Andric }; 505f757f3fSDimitry Andric 515f757f3fSDimitry Andric template <class _Tp, int _Np> 525f757f3fSDimitry Andric struct __mask_storage<_Tp, simd_abi::__vec_ext<_Np>> 535f757f3fSDimitry Andric : __simd_storage<decltype(experimental::__choose_mask_type<_Tp>()), simd_abi::__vec_ext<_Np>> {}; 545f757f3fSDimitry Andric 555f757f3fSDimitry Andric template <class _Tp, int _Np> 565f757f3fSDimitry Andric struct __simd_operations<_Tp, simd_abi::__vec_ext<_Np>> { 575f757f3fSDimitry Andric using _SimdStorage = __simd_storage<_Tp, simd_abi::__vec_ext<_Np>>; 585f757f3fSDimitry Andric using _MaskStorage = __mask_storage<_Tp, simd_abi::__vec_ext<_Np>>; 595f757f3fSDimitry Andric 605f757f3fSDimitry Andric static _LIBCPP_HIDE_FROM_ABI _SimdStorage __broadcast(_Tp __v) noexcept { 615f757f3fSDimitry Andric _SimdStorage __result; 625f757f3fSDimitry Andric for (int __i = 0; __i < _Np; ++__i) { 635f757f3fSDimitry Andric __result.__set(__i, __v); 645f757f3fSDimitry Andric } 655f757f3fSDimitry Andric return __result; 665f757f3fSDimitry Andric } 675f757f3fSDimitry Andric 685f757f3fSDimitry Andric template <class _Generator, size_t... _Is> 695f757f3fSDimitry Andric static _LIBCPP_HIDE_FROM_ABI _SimdStorage __generate_init(_Generator&& __g, std::index_sequence<_Is...>) { 705f757f3fSDimitry Andric return _SimdStorage{{__g(std::integral_constant<size_t, _Is>())...}}; 715f757f3fSDimitry Andric } 725f757f3fSDimitry Andric 735f757f3fSDimitry Andric template <class _Generator> 745f757f3fSDimitry Andric static _LIBCPP_HIDE_FROM_ABI _SimdStorage __generate(_Generator&& __g) noexcept { 755f757f3fSDimitry Andric return __generate_init(std::forward<_Generator>(__g), std::make_index_sequence<_Np>()); 765f757f3fSDimitry Andric } 777a6dacacSDimitry Andric 787a6dacacSDimitry Andric template <class _Up> 797a6dacacSDimitry Andric static _LIBCPP_HIDE_FROM_ABI void __load(_SimdStorage& __s, const _Up* __mem) noexcept { 807a6dacacSDimitry Andric for (size_t __i = 0; __i < _Np; __i++) 817a6dacacSDimitry Andric __s.__data[__i] = static_cast<_Tp>(__mem[__i]); 827a6dacacSDimitry Andric } 83*0fca6ea1SDimitry Andric 84*0fca6ea1SDimitry Andric template <class _Up> 85*0fca6ea1SDimitry Andric static _LIBCPP_HIDE_FROM_ABI void __store(_SimdStorage __s, _Up* __mem) noexcept { 86*0fca6ea1SDimitry Andric for (size_t __i = 0; __i < _Np; __i++) 87*0fca6ea1SDimitry Andric __mem[__i] = static_cast<_Up>(__s.__data[__i]); 88*0fca6ea1SDimitry Andric } 895f757f3fSDimitry Andric }; 905f757f3fSDimitry Andric 915f757f3fSDimitry Andric template <class _Tp, int _Np> 925f757f3fSDimitry Andric struct __mask_operations<_Tp, simd_abi::__vec_ext<_Np>> { 935f757f3fSDimitry Andric using _MaskStorage = __mask_storage<_Tp, simd_abi::__vec_ext<_Np>>; 945f757f3fSDimitry Andric 955f757f3fSDimitry Andric static _LIBCPP_HIDE_FROM_ABI _MaskStorage __broadcast(bool __v) noexcept { 965f757f3fSDimitry Andric _MaskStorage __result; 975f757f3fSDimitry Andric auto __all_bits_v = experimental::__set_all_bits<_Tp>(__v); 985f757f3fSDimitry Andric for (int __i = 0; __i < _Np; ++__i) { 995f757f3fSDimitry Andric __result.__set(__i, __all_bits_v); 1005f757f3fSDimitry Andric } 1015f757f3fSDimitry Andric return __result; 1025f757f3fSDimitry Andric } 1037a6dacacSDimitry Andric 1047a6dacacSDimitry Andric static _LIBCPP_HIDE_FROM_ABI void __load(_MaskStorage& __s, const bool* __mem) noexcept { 1057a6dacacSDimitry Andric for (size_t __i = 0; __i < _Np; __i++) 1067a6dacacSDimitry Andric __s.__data[__i] = experimental::__set_all_bits<_Tp>(__mem[__i]); 1077a6dacacSDimitry Andric } 108*0fca6ea1SDimitry Andric 109*0fca6ea1SDimitry Andric static _LIBCPP_HIDE_FROM_ABI void __store(_MaskStorage __s, bool* __mem) noexcept { 110*0fca6ea1SDimitry Andric for (size_t __i = 0; __i < _Np; __i++) 111*0fca6ea1SDimitry Andric __mem[__i] = static_cast<bool>(__s.__data[__i]); 112*0fca6ea1SDimitry Andric } 1135f757f3fSDimitry Andric }; 1145f757f3fSDimitry Andric 1155f757f3fSDimitry Andric } // namespace parallelism_v2 1165f757f3fSDimitry Andric _LIBCPP_END_NAMESPACE_EXPERIMENTAL 1175f757f3fSDimitry Andric 1185f757f3fSDimitry Andric #endif // _LIBCPP_STD_VER >= 17 && defined(_LIBCPP_ENABLE_EXPERIMENTAL) 1195f757f3fSDimitry Andric #endif // _LIBCPP_EXPERIMENTAL___SIMD_VEC_EXT_H 120