xref: /freebsd/contrib/llvm-project/libcxx/include/experimental/__simd/vec_ext.h (revision 0fca6ea1d4eea4c934cfff25ac9ee8ad6fe95583)
15f757f3fSDimitry Andric // -*- C++ -*-
25f757f3fSDimitry Andric //===----------------------------------------------------------------------===//
35f757f3fSDimitry Andric //
45f757f3fSDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
55f757f3fSDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
65f757f3fSDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
75f757f3fSDimitry Andric //
85f757f3fSDimitry Andric //===----------------------------------------------------------------------===//
95f757f3fSDimitry Andric 
105f757f3fSDimitry Andric #ifndef _LIBCPP_EXPERIMENTAL___SIMD_VEC_EXT_H
115f757f3fSDimitry Andric #define _LIBCPP_EXPERIMENTAL___SIMD_VEC_EXT_H
125f757f3fSDimitry Andric 
13*0fca6ea1SDimitry Andric #include <__assert>
145f757f3fSDimitry Andric #include <__bit/bit_ceil.h>
155f757f3fSDimitry Andric #include <__utility/forward.h>
165f757f3fSDimitry Andric #include <__utility/integer_sequence.h>
175f757f3fSDimitry Andric #include <cstddef>
185f757f3fSDimitry Andric #include <experimental/__config>
19cb14a3feSDimitry Andric #include <experimental/__simd/declaration.h>
205f757f3fSDimitry Andric #include <experimental/__simd/traits.h>
215f757f3fSDimitry Andric #include <experimental/__simd/utility.h>
225f757f3fSDimitry Andric 
235f757f3fSDimitry Andric #if _LIBCPP_STD_VER >= 17 && defined(_LIBCPP_ENABLE_EXPERIMENTAL)
245f757f3fSDimitry Andric 
255f757f3fSDimitry Andric _LIBCPP_BEGIN_NAMESPACE_EXPERIMENTAL
265f757f3fSDimitry Andric inline namespace parallelism_v2 {
275f757f3fSDimitry Andric namespace simd_abi {
285f757f3fSDimitry Andric template <int _Np>
295f757f3fSDimitry Andric struct __vec_ext {
305f757f3fSDimitry Andric   static constexpr size_t __simd_size = _Np;
315f757f3fSDimitry Andric };
325f757f3fSDimitry Andric } // namespace simd_abi
335f757f3fSDimitry Andric 
345f757f3fSDimitry Andric template <int _Np>
355f757f3fSDimitry Andric inline constexpr bool is_abi_tag_v<simd_abi::__vec_ext<_Np>> = _Np > 0 && _Np <= 32;
365f757f3fSDimitry Andric 
375f757f3fSDimitry Andric template <class _Tp, int _Np>
385f757f3fSDimitry Andric struct __simd_storage<_Tp, simd_abi::__vec_ext<_Np>> {
395f757f3fSDimitry Andric   _Tp __data __attribute__((__vector_size__(std::__bit_ceil((sizeof(_Tp) * _Np)))));
405f757f3fSDimitry Andric 
415f757f3fSDimitry Andric   _LIBCPP_HIDE_FROM_ABI _Tp __get(size_t __idx) const noexcept {
42cb14a3feSDimitry Andric     _LIBCPP_ASSERT_VALID_ELEMENT_ACCESS(__idx >= 0 && __idx < _Np, "Index is out of bounds");
435f757f3fSDimitry Andric     return __data[__idx];
445f757f3fSDimitry Andric   }
455f757f3fSDimitry Andric   _LIBCPP_HIDE_FROM_ABI void __set(size_t __idx, _Tp __v) noexcept {
46cb14a3feSDimitry Andric     _LIBCPP_ASSERT_VALID_ELEMENT_ACCESS(__idx >= 0 && __idx < _Np, "Index is out of bounds");
475f757f3fSDimitry Andric     __data[__idx] = __v;
485f757f3fSDimitry Andric   }
495f757f3fSDimitry Andric };
505f757f3fSDimitry Andric 
515f757f3fSDimitry Andric template <class _Tp, int _Np>
525f757f3fSDimitry Andric struct __mask_storage<_Tp, simd_abi::__vec_ext<_Np>>
535f757f3fSDimitry Andric     : __simd_storage<decltype(experimental::__choose_mask_type<_Tp>()), simd_abi::__vec_ext<_Np>> {};
545f757f3fSDimitry Andric 
555f757f3fSDimitry Andric template <class _Tp, int _Np>
565f757f3fSDimitry Andric struct __simd_operations<_Tp, simd_abi::__vec_ext<_Np>> {
575f757f3fSDimitry Andric   using _SimdStorage = __simd_storage<_Tp, simd_abi::__vec_ext<_Np>>;
585f757f3fSDimitry Andric   using _MaskStorage = __mask_storage<_Tp, simd_abi::__vec_ext<_Np>>;
595f757f3fSDimitry Andric 
605f757f3fSDimitry Andric   static _LIBCPP_HIDE_FROM_ABI _SimdStorage __broadcast(_Tp __v) noexcept {
615f757f3fSDimitry Andric     _SimdStorage __result;
625f757f3fSDimitry Andric     for (int __i = 0; __i < _Np; ++__i) {
635f757f3fSDimitry Andric       __result.__set(__i, __v);
645f757f3fSDimitry Andric     }
655f757f3fSDimitry Andric     return __result;
665f757f3fSDimitry Andric   }
675f757f3fSDimitry Andric 
685f757f3fSDimitry Andric   template <class _Generator, size_t... _Is>
695f757f3fSDimitry Andric   static _LIBCPP_HIDE_FROM_ABI _SimdStorage __generate_init(_Generator&& __g, std::index_sequence<_Is...>) {
705f757f3fSDimitry Andric     return _SimdStorage{{__g(std::integral_constant<size_t, _Is>())...}};
715f757f3fSDimitry Andric   }
725f757f3fSDimitry Andric 
735f757f3fSDimitry Andric   template <class _Generator>
745f757f3fSDimitry Andric   static _LIBCPP_HIDE_FROM_ABI _SimdStorage __generate(_Generator&& __g) noexcept {
755f757f3fSDimitry Andric     return __generate_init(std::forward<_Generator>(__g), std::make_index_sequence<_Np>());
765f757f3fSDimitry Andric   }
777a6dacacSDimitry Andric 
787a6dacacSDimitry Andric   template <class _Up>
797a6dacacSDimitry Andric   static _LIBCPP_HIDE_FROM_ABI void __load(_SimdStorage& __s, const _Up* __mem) noexcept {
807a6dacacSDimitry Andric     for (size_t __i = 0; __i < _Np; __i++)
817a6dacacSDimitry Andric       __s.__data[__i] = static_cast<_Tp>(__mem[__i]);
827a6dacacSDimitry Andric   }
83*0fca6ea1SDimitry Andric 
84*0fca6ea1SDimitry Andric   template <class _Up>
85*0fca6ea1SDimitry Andric   static _LIBCPP_HIDE_FROM_ABI void __store(_SimdStorage __s, _Up* __mem) noexcept {
86*0fca6ea1SDimitry Andric     for (size_t __i = 0; __i < _Np; __i++)
87*0fca6ea1SDimitry Andric       __mem[__i] = static_cast<_Up>(__s.__data[__i]);
88*0fca6ea1SDimitry Andric   }
895f757f3fSDimitry Andric };
905f757f3fSDimitry Andric 
915f757f3fSDimitry Andric template <class _Tp, int _Np>
925f757f3fSDimitry Andric struct __mask_operations<_Tp, simd_abi::__vec_ext<_Np>> {
935f757f3fSDimitry Andric   using _MaskStorage = __mask_storage<_Tp, simd_abi::__vec_ext<_Np>>;
945f757f3fSDimitry Andric 
955f757f3fSDimitry Andric   static _LIBCPP_HIDE_FROM_ABI _MaskStorage __broadcast(bool __v) noexcept {
965f757f3fSDimitry Andric     _MaskStorage __result;
975f757f3fSDimitry Andric     auto __all_bits_v = experimental::__set_all_bits<_Tp>(__v);
985f757f3fSDimitry Andric     for (int __i = 0; __i < _Np; ++__i) {
995f757f3fSDimitry Andric       __result.__set(__i, __all_bits_v);
1005f757f3fSDimitry Andric     }
1015f757f3fSDimitry Andric     return __result;
1025f757f3fSDimitry Andric   }
1037a6dacacSDimitry Andric 
1047a6dacacSDimitry Andric   static _LIBCPP_HIDE_FROM_ABI void __load(_MaskStorage& __s, const bool* __mem) noexcept {
1057a6dacacSDimitry Andric     for (size_t __i = 0; __i < _Np; __i++)
1067a6dacacSDimitry Andric       __s.__data[__i] = experimental::__set_all_bits<_Tp>(__mem[__i]);
1077a6dacacSDimitry Andric   }
108*0fca6ea1SDimitry Andric 
109*0fca6ea1SDimitry Andric   static _LIBCPP_HIDE_FROM_ABI void __store(_MaskStorage __s, bool* __mem) noexcept {
110*0fca6ea1SDimitry Andric     for (size_t __i = 0; __i < _Np; __i++)
111*0fca6ea1SDimitry Andric       __mem[__i] = static_cast<bool>(__s.__data[__i]);
112*0fca6ea1SDimitry Andric   }
1135f757f3fSDimitry Andric };
1145f757f3fSDimitry Andric 
1155f757f3fSDimitry Andric } // namespace parallelism_v2
1165f757f3fSDimitry Andric _LIBCPP_END_NAMESPACE_EXPERIMENTAL
1175f757f3fSDimitry Andric 
1185f757f3fSDimitry Andric #endif // _LIBCPP_STD_VER >= 17 && defined(_LIBCPP_ENABLE_EXPERIMENTAL)
1195f757f3fSDimitry Andric #endif // _LIBCPP_EXPERIMENTAL___SIMD_VEC_EXT_H
120