1// -*- C++ -*- 2//===------------------------------- simd ---------------------------------===// 3// 4// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 5// See https://llvm.org/LICENSE.txt for license information. 6// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 7// 8//===----------------------------------------------------------------------===// 9#ifndef _LIBCPP_EXPERIMENTAL_SIMD 10#define _LIBCPP_EXPERIMENTAL_SIMD 11 12/* 13 experimental/simd synopsis 14 15namespace std::experimental { 16 17inline namespace parallelism_v2 { 18 19namespace simd_abi { 20 21struct scalar {}; 22template <int N> struct fixed_size {}; 23template <typename T> inline constexpr int max_fixed_size = implementation-defined; 24template <typename T> using compatible = implementation-defined; 25template <typename T> using native = implementation-defined; 26 27} // simd_abi 28 29struct element_aligned_tag {}; 30struct vector_aligned_tag {}; 31template <size_t> struct overaligned_tag {}; 32inline constexpr element_aligned_tag element_aligned{}; 33inline constexpr vector_aligned_tag vector_aligned{}; 34template <size_t N> inline constexpr overaligned_tag<N> overaligned{}; 35 36// traits [simd.traits] 37template <class T> struct is_abi_tag; 38template <class T> inline constexpr bool is_abi_tag_v = is_abi_tag<T>::value; 39 40template <class T> struct is_simd; 41template <class T> inline constexpr bool is_simd_v = is_simd<T>::value; 42 43template <class T> struct is_simd_mask; 44template <class T> inline constexpr bool is_simd_mask_v = is_simd_mask<T>::value; 45 46template <class T> struct is_simd_flag_type; 47template <class T> inline constexpr bool is_simd_flag_type_v = is_simd_flag_type<T>::value; 48 49template <class T, size_t N> struct abi_for_size { using type = see below; }; 50template <class T, size_t N> using abi_for_size_t = typename abi_for_size<T, N>::type; 51 52template <class T, class Abi = simd_abi::compatible<T>> struct simd_size; 53template 
<class T, class Abi = simd_abi::compatible<T>> 54inline constexpr size_t simd_size_v = simd_size<T, Abi>::value; 55 56template <class T, class U = typename T::value_type> struct memory_alignment; 57template <class T, class U = typename T::value_type> 58inline constexpr size_t memory_alignment_v = memory_alignment<T, U>::value; 59 60// class template simd [simd.class] 61template <class T, class Abi = simd_abi::compatible<T>> class simd; 62template <class T> using native_simd = simd<T, simd_abi::native<T>>; 63template <class T, int N> using fixed_size_simd = simd<T, simd_abi::fixed_size<N>>; 64 65// class template simd_mask [simd.mask.class] 66template <class T, class Abi = simd_abi::compatible<T>> class simd_mask; 67template <class T> using native_simd_mask = simd_mask<T, simd_abi::native<T>>; 68template <class T, int N> using fixed_size_simd_mask = simd_mask<T, simd_abi::fixed_size<N>>; 69 70// casts [simd.casts] 71template <class T, class U, class Abi> see below simd_cast(const simd<U, Abi>&); 72template <class T, class U, class Abi> see below static_simd_cast(const simd<U, Abi>&); 73 74template <class T, class Abi> 75fixed_size_simd<T, simd_size_v<T, Abi>> to_fixed_size(const simd<T, Abi>&) noexcept; 76template <class T, class Abi> 77fixed_size_simd_mask<T, simd_size_v<T, Abi>> to_fixed_size(const simd_mask<T, Abi>&) noexcept; 78template <class T, size_t N> native_simd<T> to_native(const fixed_size_simd<T, N>&) noexcept; 79template <class T, size_t N> 80native_simd_mask<T> to_native(const fixed_size_simd_mask<T, N>&) noexcept; 81template <class T, size_t N> simd<T> to_compatible(const fixed_size_simd<T, N>&) noexcept; 82template <class T, size_t N> simd_mask<T> to_compatible(const fixed_size_simd_mask<T, N>&) noexcept; 83 84template <size_t... Sizes, class T, class Abi> 85tuple<simd<T, abi_for_size_t<T, Sizes>>...> split(const simd<T, Abi>&); 86template <size_t... 
Sizes, class T, class Abi> 87tuple<simd_mask<T, abi_for_size_t<T, Sizes>>...> split(const simd_mask<T, Abi>&); 88template <class V, class Abi> 89array<V, simd_size_v<typename V::value_type, Abi> / V::size()> split( 90const simd<typename V::value_type, Abi>&); 91template <class V, class Abi> 92array<V, simd_size_v<typename V::value_type, Abi> / V::size()> split( 93const simd_mask<typename V::value_type, Abi>&); 94 95template <class T, class... Abis> 96simd<T, abi_for_size_t<T, (simd_size_v<T, Abis> + ...)>> concat(const simd<T, Abis>&...); 97template <class T, class... Abis> 98simd_mask<T, abi_for_size_t<T, (simd_size_v<T, Abis> + ...)>> concat(const simd_mask<T, Abis>&...); 99 100// reductions [simd.mask.reductions] 101template <class T, class Abi> bool all_of(const simd_mask<T, Abi>&) noexcept; 102template <class T, class Abi> bool any_of(const simd_mask<T, Abi>&) noexcept; 103template <class T, class Abi> bool none_of(const simd_mask<T, Abi>&) noexcept; 104template <class T, class Abi> bool some_of(const simd_mask<T, Abi>&) noexcept; 105template <class T, class Abi> int popcount(const simd_mask<T, Abi>&) noexcept; 106template <class T, class Abi> int find_first_set(const simd_mask<T, Abi>&); 107template <class T, class Abi> int find_last_set(const simd_mask<T, Abi>&); 108 109bool all_of(see below) noexcept; 110bool any_of(see below) noexcept; 111bool none_of(see below) noexcept; 112bool some_of(see below) noexcept; 113int popcount(see below) noexcept; 114int find_first_set(see below) noexcept; 115int find_last_set(see below) noexcept; 116 117// masked assignment [simd.whereexpr] 118template <class M, class T> class const_where_expression; 119template <class M, class T> class where_expression; 120 121// masked assignment [simd.mask.where] 122template <class T> struct nodeduce { using type = T; }; // exposition only 123 124template <class T> using nodeduce_t = typename nodeduce<T>::type; // exposition only 125 126template <class T, class Abi> 
127where_expression<simd_mask<T, Abi>, simd<T, Abi>> 128where(const typename simd<T, Abi>::mask_type&, simd<T, Abi>&) noexcept; 129 130template <class T, class Abi> 131const_where_expression<simd_mask<T, Abi>, const simd<T, Abi>> 132where(const typename simd<T, Abi>::mask_type&, const simd<T, Abi>&) noexcept; 133 134template <class T, class Abi> 135where_expression<simd_mask<T, Abi>, simd_mask<T, Abi>> 136where(const nodeduce_t<simd_mask<T, Abi>>&, simd_mask<T, Abi>&) noexcept; 137 138template <class T, class Abi> 139const_where_expression<simd_mask<T, Abi>, const simd_mask<T, Abi>> 140where(const nodeduce_t<simd_mask<T, Abi>>&, const simd_mask<T, Abi>&) noexcept; 141 142template <class T> where_expression<bool, T> where(see below k, T& d) noexcept; 143 144template <class T> 145const_where_expression<bool, const T> where(see below k, const T& d) noexcept; 146 147// reductions [simd.reductions] 148template <class T, class Abi, class BinaryOperation = std::plus<>> 149T reduce(const simd<T, Abi>&, BinaryOperation = BinaryOperation()); 150 151template <class M, class V, class BinaryOperation> 152typename V::value_type reduce(const const_where_expression<M, V>& x, 153typename V::value_type neutral_element, BinaryOperation binary_op); 154 155template <class M, class V> 156typename V::value_type reduce(const const_where_expression<M, V>& x, plus<> binary_op = plus<>()); 157 158template <class M, class V> 159typename V::value_type reduce(const const_where_expression<M, V>& x, multiplies<> binary_op); 160 161template <class M, class V> 162typename V::value_type reduce(const const_where_expression<M, V>& x, bit_and<> binary_op); 163 164template <class M, class V> 165typename V::value_type reduce(const const_where_expression<M, V>& x, bit_or<> binary_op); 166 167template <class M, class V> 168typename V::value_type reduce(const const_where_expression<M, V>& x, bit_xor<> binary_op); 169 170template <class T, class Abi> T hmin(const simd<T, Abi>&); 171template <class M, class 
V> typename V::value_type hmin(const const_where_expression<M, V>&); 172template <class T, class Abi> T hmax(const simd<T, Abi>&); 173template <class M, class V> typename V::value_type hmax(const const_where_expression<M, V>&); 174 175// algorithms [simd.alg] 176template <class T, class Abi> simd<T, Abi> min(const simd<T, Abi>&, const simd<T, Abi>&) noexcept; 177 178template <class T, class Abi> simd<T, Abi> max(const simd<T, Abi>&, const simd<T, Abi>&) noexcept; 179 180template <class T, class Abi> 181std::pair<simd<T, Abi>, simd<T, Abi>> minmax(const simd<T, Abi>&, const simd<T, Abi>&) noexcept; 182 183template <class T, class Abi> 184simd<T, Abi> clamp(const simd<T, Abi>& v, const simd<T, Abi>& lo, const simd<T, Abi>& hi); 185 186// [simd.whereexpr] 187template <class M, class T> 188class const_where_expression { 189 const M& mask; // exposition only 190 T& data; // exposition only 191public: 192 const_where_expression(const const_where_expression&) = delete; 193 const_where_expression& operator=(const const_where_expression&) = delete; 194 remove_const_t<T> operator-() const &&; 195 template <class U, class Flags> void copy_to(U* mem, Flags f) const &&; 196}; 197 198template <class M, class T> 199class where_expression : public const_where_expression<M, T> { 200public: 201 where_expression(const where_expression&) = delete; 202 where_expression& operator=(const where_expression&) = delete; 203 template <class U> void operator=(U&& x); 204 template <class U> void operator+=(U&& x); 205 template <class U> void operator-=(U&& x); 206 template <class U> void operator*=(U&& x); 207 template <class U> void operator/=(U&& x); 208 template <class U> void operator%=(U&& x); 209 template <class U> void operator&=(U&& x); 210 template <class U> void operator|=(U&& x); 211 template <class U> void operator^=(U&& x); 212 template <class U> void operator<<=(U&& x); 213 template <class U> void operator>>=(U&& x); 214 void operator++(); 215 void operator++(int); 216 void operator--(); 217 void operator--(int); 218 
template <class U, class Flags> void copy_from(const U* mem, Flags); 219}; 220 221// [simd.class] 222template <class T, class Abi> class simd { 223public: 224 using value_type = T; 225 using reference = see below; 226 using mask_type = simd_mask<T, Abi>; 227 228 using abi_type = Abi; 229 static constexpr size_t size() noexcept; 230 simd() = default; 231 232 // implicit type conversion constructor 233 template <class U> simd(const simd<U, simd_abi::fixed_size<size()>>&); 234 235 // implicit broadcast constructor (see below for constraints) 236 template <class U> simd(U&& value); 237 238 // generator constructor (see below for constraints) 239 template <class G> explicit simd(G&& gen); 240 241 // load constructor 242 template <class U, class Flags> simd(const U* mem, Flags f); 243 244 // loads [simd.load] 245 template <class U, class Flags> void copy_from(const U* mem, Flags f); 246 247 // stores [simd.store] 248 template <class U, class Flags> void copy_to(U* mem, Flags f) const; 249 250 // scalar access [simd.subscr] 251 reference operator[](size_t); 252 value_type operator[](size_t) const; 253 254 // unary operators [simd.unary] 255 simd& operator++(); 256 simd operator++(int); 257 simd& operator--(); 258 simd operator--(int); 259 mask_type operator!() const; 260 simd operator~() const; // see below 261 simd operator+() const; 262 simd operator-() const; 263 264 // binary operators [simd.binary] 265 friend simd operator+ (const simd&, const simd&); 266 friend simd operator- (const simd&, const simd&); 267 friend simd operator* (const simd&, const simd&); 268 friend simd operator/ (const simd&, const simd&); 269 friend simd operator% (const simd&, const simd&); 270 friend simd operator& (const simd&, const simd&); 271 friend simd operator| (const simd&, const simd&); 272 friend simd operator^ (const simd&, const simd&); 273 friend simd operator<<(const simd&, const simd&); 274 friend simd operator>>(const simd&, const simd&); 275 friend simd operator<<(const simd&, 
int); 276 friend simd operator>>(const simd&, int); 277 278 // compound assignment [simd.cassign] 279 friend simd& operator+= (simd&, const simd&); 280 friend simd& operator-= (simd&, const simd&); 281 friend simd& operator*= (simd&, const simd&); 282 friend simd& operator/= (simd&, const simd&); 283 friend simd& operator%= (simd&, const simd&); 284 285 friend simd& operator&= (simd&, const simd&); 286 friend simd& operator|= (simd&, const simd&); 287 friend simd& operator^= (simd&, const simd&); 288 friend simd& operator<<=(simd&, const simd&); 289 friend simd& operator>>=(simd&, const simd&); 290 friend simd& operator<<=(simd&, int); 291 friend simd& operator>>=(simd&, int); 292 293 // compares [simd.comparison] 294 friend mask_type operator==(const simd&, const simd&); 295 friend mask_type operator!=(const simd&, const simd&); 296 friend mask_type operator>=(const simd&, const simd&); 297 friend mask_type operator<=(const simd&, const simd&); 298 friend mask_type operator> (const simd&, const simd&); 299 friend mask_type operator< (const simd&, const simd&); 300}; 301 302// [simd.math] 303template <class Abi> using scharv = simd<signed char, Abi>; // exposition only 304template <class Abi> using shortv = simd<short, Abi>; // exposition only 305template <class Abi> using intv = simd<int, Abi>; // exposition only 306template <class Abi> using longv = simd<long int, Abi>; // exposition only 307template <class Abi> using llongv = simd<long long int, Abi>; // exposition only 308template <class Abi> using floatv = simd<float, Abi>; // exposition only 309template <class Abi> using doublev = simd<double, Abi>; // exposition only 310template <class Abi> using ldoublev = simd<long double, Abi>; // exposition only 311template <class T, class V> using samesize = fixed_size_simd<T, V::size()>; // exposition only 312 313template <class Abi> floatv<Abi> acos(floatv<Abi> x); 314template <class Abi> doublev<Abi> acos(doublev<Abi> x); 315template <class Abi> ldoublev<Abi> 
acos(ldoublev<Abi> x); 316 317template <class Abi> floatv<Abi> asin(floatv<Abi> x); 318template <class Abi> doublev<Abi> asin(doublev<Abi> x); 319template <class Abi> ldoublev<Abi> asin(ldoublev<Abi> x); 320 321template <class Abi> floatv<Abi> atan(floatv<Abi> x); 322template <class Abi> doublev<Abi> atan(doublev<Abi> x); 323template <class Abi> ldoublev<Abi> atan(ldoublev<Abi> x); 324 325template <class Abi> floatv<Abi> atan2(floatv<Abi> y, floatv<Abi> x); 326template <class Abi> doublev<Abi> atan2(doublev<Abi> y, doublev<Abi> x); 327template <class Abi> ldoublev<Abi> atan2(ldoublev<Abi> y, ldoublev<Abi> x); 328 329template <class Abi> floatv<Abi> cos(floatv<Abi> x); 330template <class Abi> doublev<Abi> cos(doublev<Abi> x); 331template <class Abi> ldoublev<Abi> cos(ldoublev<Abi> x); 332 333template <class Abi> floatv<Abi> sin(floatv<Abi> x); 334template <class Abi> doublev<Abi> sin(doublev<Abi> x); 335template <class Abi> ldoublev<Abi> sin(ldoublev<Abi> x); 336 337template <class Abi> floatv<Abi> tan(floatv<Abi> x); 338template <class Abi> doublev<Abi> tan(doublev<Abi> x); 339template <class Abi> ldoublev<Abi> tan(ldoublev<Abi> x); 340 341template <class Abi> floatv<Abi> acosh(floatv<Abi> x); 342template <class Abi> doublev<Abi> acosh(doublev<Abi> x); 343template <class Abi> ldoublev<Abi> acosh(ldoublev<Abi> x); 344 345template <class Abi> floatv<Abi> asinh(floatv<Abi> x); 346template <class Abi> doublev<Abi> asinh(doublev<Abi> x); 347template <class Abi> ldoublev<Abi> asinh(ldoublev<Abi> x); 348 349template <class Abi> floatv<Abi> atanh(floatv<Abi> x); 350template <class Abi> doublev<Abi> atanh(doublev<Abi> x); 351template <class Abi> ldoublev<Abi> atanh(ldoublev<Abi> x); 352 353template <class Abi> floatv<Abi> cosh(floatv<Abi> x); 354template <class Abi> doublev<Abi> cosh(doublev<Abi> x); 355template <class Abi> ldoublev<Abi> cosh(ldoublev<Abi> x); 356 357template <class Abi> floatv<Abi> sinh(floatv<Abi> x); 358template <class Abi> doublev<Abi> sinh(doublev<Abi> 
x); 359template <class Abi> ldoublev<Abi> sinh(ldoublev<Abi> x); 360 361template <class Abi> floatv<Abi> tanh(floatv<Abi> x); 362template <class Abi> doublev<Abi> tanh(doublev<Abi> x); 363template <class Abi> ldoublev<Abi> tanh(ldoublev<Abi> x); 364 365template <class Abi> floatv<Abi> exp(floatv<Abi> x); 366template <class Abi> doublev<Abi> exp(doublev<Abi> x); 367template <class Abi> ldoublev<Abi> exp(ldoublev<Abi> x); 368 369template <class Abi> floatv<Abi> exp2(floatv<Abi> x); 370template <class Abi> doublev<Abi> exp2(doublev<Abi> x); 371template <class Abi> ldoublev<Abi> exp2(ldoublev<Abi> x); 372 373template <class Abi> floatv<Abi> expm1(floatv<Abi> x); 374template <class Abi> doublev<Abi> expm1(doublev<Abi> x); 375template <class Abi> ldoublev<Abi> expm1(ldoublev<Abi> x); 376 377template <class Abi> floatv<Abi> frexp(floatv<Abi> value, samesize<int, floatv<Abi>>* exp); 378template <class Abi> doublev<Abi> frexp(doublev<Abi> value, samesize<int, doublev<Abi>>* exp); 379template <class Abi> ldoublev<Abi> frexp(ldoublev<Abi> value, samesize<int, ldoublev<Abi>>* exp); 380 381template <class Abi> samesize<int, floatv<Abi>> ilogb(floatv<Abi> x); 382template <class Abi> samesize<int, doublev<Abi>> ilogb(doublev<Abi> x); 383template <class Abi> samesize<int, ldoublev<Abi>> ilogb(ldoublev<Abi> x); 384 385template <class Abi> floatv<Abi> ldexp(floatv<Abi> x, samesize<int, floatv<Abi>> exp); 386template <class Abi> doublev<Abi> ldexp(doublev<Abi> x, samesize<int, doublev<Abi>> exp); 387template <class Abi> ldoublev<Abi> ldexp(ldoublev<Abi> x, samesize<int, ldoublev<Abi>> exp); 388 389template <class Abi> floatv<Abi> log(floatv<Abi> x); 390template <class Abi> doublev<Abi> log(doublev<Abi> x); 391template <class Abi> ldoublev<Abi> log(ldoublev<Abi> x); 392 393template <class Abi> floatv<Abi> log10(floatv<Abi> x); 394template <class Abi> doublev<Abi> log10(doublev<Abi> x); 395template <class Abi> ldoublev<Abi> log10(ldoublev<Abi> x); 396 397template <class Abi> 
floatv<Abi> log1p(floatv<Abi> x); 398template <class Abi> doublev<Abi> log1p(doublev<Abi> x); 399template <class Abi> ldoublev<Abi> log1p(ldoublev<Abi> x); 400 401template <class Abi> floatv<Abi> log2(floatv<Abi> x); 402template <class Abi> doublev<Abi> log2(doublev<Abi> x); 403template <class Abi> ldoublev<Abi> log2(ldoublev<Abi> x); 404 405template <class Abi> floatv<Abi> logb(floatv<Abi> x); 406template <class Abi> doublev<Abi> logb(doublev<Abi> x); 407template <class Abi> ldoublev<Abi> logb(ldoublev<Abi> x); 408 409template <class Abi> floatv<Abi> modf(floatv<Abi> value, floatv<Abi>* iptr); 410template <class Abi> doublev<Abi> modf(doublev<Abi> value, doublev<Abi>* iptr); 411template <class Abi> ldoublev<Abi> modf(ldoublev<Abi> value, ldoublev<Abi>* iptr); 412 413template <class Abi> floatv<Abi> scalbn(floatv<Abi> x, samesize<int, floatv<Abi>> n); 414template <class Abi> doublev<Abi> scalbn(doublev<Abi> x, samesize<int, doublev<Abi>> n); 415template <class Abi> ldoublev<Abi> scalbn(ldoublev<Abi> x, samesize<int, ldoublev<Abi>> n); 416template <class Abi> floatv<Abi> scalbln(floatv<Abi> x, samesize<long int, floatv<Abi>> n); 417template <class Abi> doublev<Abi> scalbln(doublev<Abi> x, samesize<long int, doublev<Abi>> n); 418template <class Abi> ldoublev<Abi> scalbln(ldoublev<Abi> x, samesize<long int, ldoublev<Abi>> n); 419 420template <class Abi> floatv<Abi> cbrt(floatv<Abi> x); 421template <class Abi> doublev<Abi> cbrt(doublev<Abi> x); 422template <class Abi> ldoublev<Abi> cbrt(ldoublev<Abi> x); 423 424template <class Abi> scharv<Abi> abs(scharv<Abi> j); 425template <class Abi> shortv<Abi> abs(shortv<Abi> j); 426template <class Abi> intv<Abi> abs(intv<Abi> j); 427template <class Abi> longv<Abi> abs(longv<Abi> j); 428template <class Abi> llongv<Abi> abs(llongv<Abi> j); 429template <class Abi> floatv<Abi> abs(floatv<Abi> j); 430template <class Abi> doublev<Abi> abs(doublev<Abi> j); 431template <class Abi> ldoublev<Abi> abs(ldoublev<Abi> j); 432 433template 
<class Abi> floatv<Abi> hypot(floatv<Abi> x, floatv<Abi> y); 434template <class Abi> doublev<Abi> hypot(doublev<Abi> x, doublev<Abi> y); 435template <class Abi> ldoublev<Abi> hypot(ldoublev<Abi> x, ldoublev<Abi> y); 436template <class Abi> floatv<Abi> hypot(floatv<Abi> x, floatv<Abi> y, floatv<Abi> z); 437template <class Abi> doublev<Abi> hypot(doublev<Abi> x, doublev<Abi> y, doublev<Abi> z); 438template <class Abi> ldoublev<Abi> hypot(ldoublev<Abi> x, ldoublev<Abi> y, ldoublev<Abi> z); 439 440template <class Abi> floatv<Abi> pow(floatv<Abi> x, floatv<Abi> y); 441template <class Abi> doublev<Abi> pow(doublev<Abi> x, doublev<Abi> y); 442template <class Abi> ldoublev<Abi> pow(ldoublev<Abi> x, ldoublev<Abi> y); 443 444template <class Abi> floatv<Abi> sqrt(floatv<Abi> x); 445template <class Abi> doublev<Abi> sqrt(doublev<Abi> x); 446template <class Abi> ldoublev<Abi> sqrt(ldoublev<Abi> x); 447 448template <class Abi> floatv<Abi> erf(floatv<Abi> x); 449template <class Abi> doublev<Abi> erf(doublev<Abi> x); 450template <class Abi> ldoublev<Abi> erf(ldoublev<Abi> x); 451template <class Abi> floatv<Abi> erfc(floatv<Abi> x); 452template <class Abi> doublev<Abi> erfc(doublev<Abi> x); 453template <class Abi> ldoublev<Abi> erfc(ldoublev<Abi> x); 454 455template <class Abi> floatv<Abi> lgamma(floatv<Abi> x); 456template <class Abi> doublev<Abi> lgamma(doublev<Abi> x); 457template <class Abi> ldoublev<Abi> lgamma(ldoublev<Abi> x); 458 459template <class Abi> floatv<Abi> tgamma(floatv<Abi> x); 460template <class Abi> doublev<Abi> tgamma(doublev<Abi> x); 461template <class Abi> ldoublev<Abi> tgamma(ldoublev<Abi> x); 462 463template <class Abi> floatv<Abi> ceil(floatv<Abi> x); 464template <class Abi> doublev<Abi> ceil(doublev<Abi> x); 465template <class Abi> ldoublev<Abi> ceil(ldoublev<Abi> x); 466 467template <class Abi> floatv<Abi> floor(floatv<Abi> x); 468template <class Abi> doublev<Abi> floor(doublev<Abi> x); 469template <class Abi> ldoublev<Abi> floor(ldoublev<Abi> x); 470 
471template <class Abi> floatv<Abi> nearbyint(floatv<Abi> x); 472template <class Abi> doublev<Abi> nearbyint(doublev<Abi> x); 473template <class Abi> ldoublev<Abi> nearbyint(ldoublev<Abi> x); 474 475template <class Abi> floatv<Abi> rint(floatv<Abi> x); 476template <class Abi> doublev<Abi> rint(doublev<Abi> x); 477template <class Abi> ldoublev<Abi> rint(ldoublev<Abi> x); 478 479template <class Abi> samesize<long int, floatv<Abi>> lrint(floatv<Abi> x); 480template <class Abi> samesize<long int, doublev<Abi>> lrint(doublev<Abi> x); 481template <class Abi> samesize<long int, ldoublev<Abi>> lrint(ldoublev<Abi> x); 482template <class Abi> samesize<long long int, floatv<Abi>> llrint(floatv<Abi> x); 483template <class Abi> samesize<long long int, doublev<Abi>> llrint(doublev<Abi> x); 484template <class Abi> samesize<long long int, ldoublev<Abi>> llrint(ldoublev<Abi> x); 485 486template <class Abi> floatv<Abi> round(floatv<Abi> x); 487template <class Abi> doublev<Abi> round(doublev<Abi> x); 488template <class Abi> ldoublev<Abi> round(ldoublev<Abi> x); 489template <class Abi> samesize<long int, floatv<Abi>> lround(floatv<Abi> x); 490template <class Abi> samesize<long int, doublev<Abi>> lround(doublev<Abi> x); 491template <class Abi> samesize<long int, ldoublev<Abi>> lround(ldoublev<Abi> x); 492template <class Abi> samesize<long long int, floatv<Abi>> llround(floatv<Abi> x); 493template <class Abi> samesize<long long int, doublev<Abi>> llround(doublev<Abi> x); 494template <class Abi> samesize<long long int, ldoublev<Abi>> llround(ldoublev<Abi> x); 495 496template <class Abi> floatv<Abi> trunc(floatv<Abi> x); 497template <class Abi> doublev<Abi> trunc(doublev<Abi> x); 498template <class Abi> ldoublev<Abi> trunc(ldoublev<Abi> x); 499 500template <class Abi> floatv<Abi> fmod(floatv<Abi> x, floatv<Abi> y); 501template <class Abi> doublev<Abi> fmod(doublev<Abi> x, doublev<Abi> y); 502template <class Abi> ldoublev<Abi> fmod(ldoublev<Abi> x, ldoublev<Abi> y); 503 504template <class 
Abi> floatv<Abi> remainder(floatv<Abi> x, floatv<Abi> y); 505template <class Abi> doublev<Abi> remainder(doublev<Abi> x, doublev<Abi> y); 506template <class Abi> ldoublev<Abi> remainder(ldoublev<Abi> x, ldoublev<Abi> y); 507 508template <class Abi> floatv<Abi> remquo(floatv<Abi> x, floatv<Abi> y, samesize<int, floatv<Abi>>* quo); 509template <class Abi> doublev<Abi> remquo(doublev<Abi> x, doublev<Abi> y, samesize<int, doublev<Abi>>* quo); 510template <class Abi> ldoublev<Abi> remquo(ldoublev<Abi> x, ldoublev<Abi> y, samesize<int, ldoublev<Abi>>* quo); 511 512template <class Abi> floatv<Abi> copysign(floatv<Abi> x, floatv<Abi> y); 513template <class Abi> doublev<Abi> copysign(doublev<Abi> x, doublev<Abi> y); 514template <class Abi> ldoublev<Abi> copysign(ldoublev<Abi> x, ldoublev<Abi> y); 515 516template <class Abi> doublev<Abi> nan(const char* tagp); 517template <class Abi> floatv<Abi> nanf(const char* tagp); 518template <class Abi> ldoublev<Abi> nanl(const char* tagp); 519 520template <class Abi> floatv<Abi> nextafter(floatv<Abi> x, floatv<Abi> y); 521template <class Abi> doublev<Abi> nextafter(doublev<Abi> x, doublev<Abi> y); 522template <class Abi> ldoublev<Abi> nextafter(ldoublev<Abi> x, ldoublev<Abi> y); 523 524template <class Abi> floatv<Abi> nexttoward(floatv<Abi> x, ldoublev<Abi> y); 525template <class Abi> doublev<Abi> nexttoward(doublev<Abi> x, ldoublev<Abi> y); 526template <class Abi> ldoublev<Abi> nexttoward(ldoublev<Abi> x, ldoublev<Abi> y); 527 528template <class Abi> floatv<Abi> fdim(floatv<Abi> x, floatv<Abi> y); 529template <class Abi> doublev<Abi> fdim(doublev<Abi> x, doublev<Abi> y); 530template <class Abi> ldoublev<Abi> fdim(ldoublev<Abi> x, ldoublev<Abi> y); 531 532template <class Abi> floatv<Abi> fmax(floatv<Abi> x, floatv<Abi> y); 533template <class Abi> doublev<Abi> fmax(doublev<Abi> x, doublev<Abi> y); 534template <class Abi> ldoublev<Abi> fmax(ldoublev<Abi> x, ldoublev<Abi> y); 535 536template <class Abi> floatv<Abi> fmin(floatv<Abi> x, 
floatv<Abi> y); 537template <class Abi> doublev<Abi> fmin(doublev<Abi> x, doublev<Abi> y); 538template <class Abi> ldoublev<Abi> fmin(ldoublev<Abi> x, ldoublev<Abi> y); 539 540template <class Abi> floatv<Abi> fma(floatv<Abi> x, floatv<Abi> y, floatv<Abi> z); 541template <class Abi> doublev<Abi> fma(doublev<Abi> x, doublev<Abi> y, doublev<Abi> z); 542template <class Abi> ldoublev<Abi> fma(ldoublev<Abi> x, ldoublev<Abi> y, ldoublev<Abi> z); 543 544template <class Abi> samesize<int, floatv<Abi>> fpclassify(floatv<Abi> x); 545template <class Abi> samesize<int, doublev<Abi>> fpclassify(doublev<Abi> x); 546template <class Abi> samesize<int, ldoublev<Abi>> fpclassify(ldoublev<Abi> x); 547 548template <class Abi> simd_mask<float, Abi> isfinite(floatv<Abi> x); 549template <class Abi> simd_mask<double, Abi> isfinite(doublev<Abi> x); 550template <class Abi> simd_mask<long double, Abi> isfinite(ldoublev<Abi> x); 551 552template <class Abi> simd_mask<float, Abi> isinf(floatv<Abi> x); 553template <class Abi> simd_mask<double, Abi> isinf(doublev<Abi> x); 554template <class Abi> simd_mask<long double, Abi> isinf(ldoublev<Abi> x); 555 556template <class Abi> simd_mask<float, Abi> isnan(floatv<Abi> x); 557template <class Abi> simd_mask<double, Abi> isnan(doublev<Abi> x); 558template <class Abi> simd_mask<long double, Abi> isnan(ldoublev<Abi> x); 559 560template <class Abi> simd_mask<float, Abi> isnormal(floatv<Abi> x); 561template <class Abi> simd_mask<double, Abi> isnormal(doublev<Abi> x); 562template <class Abi> simd_mask<long double, Abi> isnormal(ldoublev<Abi> x); 563 564template <class Abi> simd_mask<float, Abi> signbit(floatv<Abi> x); 565template <class Abi> simd_mask<double, Abi> signbit(doublev<Abi> x); 566template <class Abi> simd_mask<long double, Abi> signbit(ldoublev<Abi> x); 567 568template <class Abi> simd_mask<float, Abi> isgreater(floatv<Abi> x, floatv<Abi> y); 569template <class Abi> simd_mask<double, Abi> isgreater(doublev<Abi> x, doublev<Abi> y); 570template 
<class Abi> simd_mask<long double, Abi> isgreater(ldoublev<Abi> x, ldoublev<Abi> y); 571 572template <class Abi> simd_mask<float, Abi> isgreaterequal(floatv<Abi> x, floatv<Abi> y); 573template <class Abi> simd_mask<double, Abi> isgreaterequal(doublev<Abi> x, doublev<Abi> y); 574template <class Abi> simd_mask<long double, Abi> isgreaterequal(ldoublev<Abi> x, ldoublev<Abi> y); 575 576template <class Abi> simd_mask<float, Abi> isless(floatv<Abi> x, floatv<Abi> y); 577template <class Abi> simd_mask<double, Abi> isless(doublev<Abi> x, doublev<Abi> y); 578template <class Abi> simd_mask<long double, Abi> isless(ldoublev<Abi> x, ldoublev<Abi> y); 579 580template <class Abi> simd_mask<float, Abi> islessequal(floatv<Abi> x, floatv<Abi> y); 581template <class Abi> simd_mask<double, Abi> islessequal(doublev<Abi> x, doublev<Abi> y); 582template <class Abi> simd_mask<long double, Abi> islessequal(ldoublev<Abi> x, ldoublev<Abi> y); 583 584template <class Abi> simd_mask<float, Abi> islessgreater(floatv<Abi> x, floatv<Abi> y); 585template <class Abi> simd_mask<double, Abi> islessgreater(doublev<Abi> x, doublev<Abi> y); 586template <class Abi> simd_mask<long double, Abi> islessgreater(ldoublev<Abi> x, ldoublev<Abi> y); 587 588template <class Abi> simd_mask<float, Abi> isunordered(floatv<Abi> x, floatv<Abi> y); 589template <class Abi> simd_mask<double, Abi> isunordered(doublev<Abi> x, doublev<Abi> y); 590template <class Abi> simd_mask<long double, Abi> isunordered(ldoublev<Abi> x, ldoublev<Abi> y); 591 592template <class V> struct simd_div_t { V quot, rem; }; 593template <class Abi> simd_div_t<scharv<Abi>> div(scharv<Abi> numer, scharv<Abi> denom); 594template <class Abi> simd_div_t<shortv<Abi>> div(shortv<Abi> numer, shortv<Abi> denom); 595template <class Abi> simd_div_t<intv<Abi>> div(intv<Abi> numer, intv<Abi> denom); 596template <class Abi> simd_div_t<longv<Abi>> div(longv<Abi> numer, longv<Abi> denom); 597template <class Abi> simd_div_t<llongv<Abi>> div(llongv<Abi> numer, 
llongv<Abi> denom); 598 599// [simd.mask.class] 600template <class T, class Abi> 601class simd_mask { 602public: 603 using value_type = bool; 604 using reference = see below; 605 using simd_type = simd<T, Abi>; 606 using abi_type = Abi; 607 static constexpr size_t size() noexcept; 608 simd_mask() = default; 609 610 // broadcast constructor 611 explicit simd_mask(value_type) noexcept; 612 613 // implicit type conversion constructor 614 template <class U> simd_mask(const simd_mask<U, simd_abi::fixed_size<size()>>&) noexcept; 615 616 // load constructor 617 template <class Flags> simd_mask(const value_type* mem, Flags); 618 619 // loads [simd.mask.copy] 620 template <class Flags> void copy_from(const value_type* mem, Flags); 621 template <class Flags> void copy_to(value_type* mem, Flags) const; 622 623 // scalar access [simd.mask.subscr] 624 reference operator[](size_t); 625 value_type operator[](size_t) const; 626 627 // unary operators [simd.mask.unary] 628 simd_mask operator!() const noexcept; 629 630 // simd_mask binary operators [simd.mask.binary] 631 friend simd_mask operator&&(const simd_mask&, const simd_mask&) noexcept; 632 friend simd_mask operator||(const simd_mask&, const simd_mask&) noexcept; 633 friend simd_mask operator& (const simd_mask&, const simd_mask&) noexcept; 634 friend simd_mask operator| (const simd_mask&, const simd_mask&) noexcept; 635 friend simd_mask operator^ (const simd_mask&, const simd_mask&) noexcept; 636 637 // simd_mask compound assignment [simd.mask.cassign] 638 friend simd_mask& operator&=(simd_mask&, const simd_mask&) noexcept; 639 friend simd_mask& operator|=(simd_mask&, const simd_mask&) noexcept; 640 friend simd_mask& operator^=(simd_mask&, const simd_mask&) noexcept; 641 642 // simd_mask compares [simd.mask.comparison] 643 friend simd_mask operator==(const simd_mask&, const simd_mask&) noexcept; 644 friend simd_mask operator!=(const simd_mask&, const simd_mask&) noexcept; 645}; 646 647} // parallelism_v2 648} // 
std::experimental 649 650*/ 651 652#include <experimental/__config> 653#include <algorithm> 654#include <array> 655#include <cstddef> 656#include <functional> 657 658#if !defined(_LIBCPP_HAS_NO_PRAGMA_SYSTEM_HEADER) 659#pragma GCC system_header 660#endif 661 662_LIBCPP_BEGIN_NAMESPACE_EXPERIMENTAL_SIMD 663 664#if _LIBCPP_STD_VER >= 17 665 666enum class _StorageKind { 667 _Scalar, 668 _Array, 669 _VecExt, 670}; 671 672template <_StorageKind __kind, int _Np> 673struct __simd_abi {}; 674 675template <class _Tp, class _Abi> 676class __simd_storage {}; 677 678template <class _Tp, int __num_element> 679class __simd_storage<_Tp, __simd_abi<_StorageKind::_Array, __num_element>> { 680 std::array<_Tp, __num_element> __storage_; 681 682 template <class, class> 683 friend struct simd; 684 685 template <class, class> 686 friend struct simd_mask; 687 688public: 689 _Tp __get(size_t __index) const noexcept { return __storage_[__index]; }; 690 void __set(size_t __index, _Tp __val) noexcept { 691 __storage_[__index] = __val; 692 } 693}; 694 695template <class _Tp> 696class __simd_storage<_Tp, __simd_abi<_StorageKind::_Scalar, 1>> { 697 _Tp __storage_; 698 699 template <class, class> 700 friend struct simd; 701 702 template <class, class> 703 friend struct simd_mask; 704 705public: 706 _Tp __get(size_t __index) const noexcept { return (&__storage_)[__index]; }; 707 void __set(size_t __index, _Tp __val) noexcept { 708 (&__storage_)[__index] = __val; 709 } 710}; 711 712#ifndef _LIBCPP_HAS_NO_VECTOR_EXTENSION 713 714constexpr size_t __floor_pow_of_2(size_t __val) { 715 return ((__val - 1) & __val) == 0 ? __val 716 : __floor_pow_of_2((__val - 1) & __val); 717} 718 719constexpr size_t __ceil_pow_of_2(size_t __val) { 720 return __val == 1 ? 
1 : __floor_pow_of_2(__val - 1) << 1; 721} 722 723template <class _Tp, size_t __bytes> 724struct __vec_ext_traits { 725#if !defined(_LIBCPP_COMPILER_CLANG) 726 typedef _Tp type __attribute__((vector_size(__ceil_pow_of_2(__bytes)))); 727#endif 728}; 729 730#if defined(_LIBCPP_COMPILER_CLANG) 731#define _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, _NUM_ELEMENT) \ 732 template <> \ 733 struct __vec_ext_traits<_TYPE, sizeof(_TYPE) * _NUM_ELEMENT> { \ 734 using type = \ 735 _TYPE __attribute__((vector_size(sizeof(_TYPE) * _NUM_ELEMENT))); \ 736 } 737 738#define _LIBCPP_SPECIALIZE_VEC_EXT_32(_TYPE) \ 739 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 1); \ 740 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 2); \ 741 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 3); \ 742 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 4); \ 743 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 5); \ 744 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 6); \ 745 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 7); \ 746 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 8); \ 747 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 9); \ 748 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 10); \ 749 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 11); \ 750 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 12); \ 751 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 13); \ 752 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 14); \ 753 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 15); \ 754 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 16); \ 755 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 17); \ 756 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 18); \ 757 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 19); \ 758 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 20); \ 759 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 21); \ 760 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 22); \ 761 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 23); \ 762 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 24); \ 763 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 25); \ 764 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 26); \ 765 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 27); \ 766 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 28); \ 767 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 29); \ 768 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 30); \ 769 _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 31); \ 770 
_LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 32); 771 772_LIBCPP_SPECIALIZE_VEC_EXT_32(char); 773_LIBCPP_SPECIALIZE_VEC_EXT_32(char16_t); 774_LIBCPP_SPECIALIZE_VEC_EXT_32(char32_t); 775_LIBCPP_SPECIALIZE_VEC_EXT_32(wchar_t); 776_LIBCPP_SPECIALIZE_VEC_EXT_32(signed char); 777_LIBCPP_SPECIALIZE_VEC_EXT_32(signed short); 778_LIBCPP_SPECIALIZE_VEC_EXT_32(signed int); 779_LIBCPP_SPECIALIZE_VEC_EXT_32(signed long); 780_LIBCPP_SPECIALIZE_VEC_EXT_32(signed long long); 781_LIBCPP_SPECIALIZE_VEC_EXT_32(unsigned char); 782_LIBCPP_SPECIALIZE_VEC_EXT_32(unsigned short); 783_LIBCPP_SPECIALIZE_VEC_EXT_32(unsigned int); 784_LIBCPP_SPECIALIZE_VEC_EXT_32(unsigned long); 785_LIBCPP_SPECIALIZE_VEC_EXT_32(unsigned long long); 786_LIBCPP_SPECIALIZE_VEC_EXT_32(float); 787_LIBCPP_SPECIALIZE_VEC_EXT_32(double); 788_LIBCPP_SPECIALIZE_VEC_EXT_32(long double); 789 790#undef _LIBCPP_SPECIALIZE_VEC_EXT_32 791#undef _LIBCPP_SPECIALIZE_VEC_EXT 792#endif 793 794template <class _Tp, int __num_element> 795class __simd_storage<_Tp, __simd_abi<_StorageKind::_VecExt, __num_element>> { 796 using _StorageType = 797 typename __vec_ext_traits<_Tp, sizeof(_Tp) * __num_element>::type; 798 799 _StorageType __storage_; 800 801 template <class, class> 802 friend struct simd; 803 804 template <class, class> 805 friend struct simd_mask; 806 807public: 808 _Tp __get(size_t __index) const noexcept { return __storage_[__index]; }; 809 void __set(size_t __index, _Tp __val) noexcept { 810 __storage_[__index] = __val; 811 } 812}; 813 814#endif // _LIBCPP_HAS_NO_VECTOR_EXTENSION 815 816template <class _Vp, class _Tp, class _Abi> 817class __simd_reference { 818 static_assert(std::is_same<_Vp, _Tp>::value, ""); 819 820 template <class, class> 821 friend struct simd; 822 823 template <class, class> 824 friend struct simd_mask; 825 826 __simd_storage<_Tp, _Abi>* __ptr_; 827 size_t __index_; 828 829 __simd_reference(__simd_storage<_Tp, _Abi>* __ptr, size_t __index) 830 : __ptr_(__ptr), __index_(__index) {} 831 832 
__simd_reference(const __simd_reference&) = default; 833 834public: 835 __simd_reference() = delete; 836 __simd_reference& operator=(const __simd_reference&) = delete; 837 838 operator _Vp() const { return __ptr_->__get(__index_); } 839 840 __simd_reference operator=(_Vp __value) && { 841 __ptr_->__set(__index_, __value); 842 return *this; 843 } 844 845 __simd_reference operator++() && { 846 return std::move(*this) = __ptr_->__get(__index_) + 1; 847 } 848 849 _Vp operator++(int) && { 850 auto __val = __ptr_->__get(__index_); 851 __ptr_->__set(__index_, __val + 1); 852 return __val; 853 } 854 855 __simd_reference operator--() && { 856 return std::move(*this) = __ptr_->__get(__index_) - 1; 857 } 858 859 _Vp operator--(int) && { 860 auto __val = __ptr_->__get(__index_); 861 __ptr_->__set(__index_, __val - 1); 862 return __val; 863 } 864 865 __simd_reference operator+=(_Vp __value) && { 866 return std::move(*this) = __ptr_->__get(__index_) + __value; 867 } 868 869 __simd_reference operator-=(_Vp __value) && { 870 return std::move(*this) = __ptr_->__get(__index_) - __value; 871 } 872 873 __simd_reference operator*=(_Vp __value) && { 874 return std::move(*this) = __ptr_->__get(__index_) * __value; 875 } 876 877 __simd_reference operator/=(_Vp __value) && { 878 return std::move(*this) = __ptr_->__get(__index_) / __value; 879 } 880 881 __simd_reference operator%=(_Vp __value) && { 882 return std::move(*this) = __ptr_->__get(__index_) % __value; 883 } 884 885 __simd_reference operator>>=(_Vp __value) && { 886 return std::move(*this) = __ptr_->__get(__index_) >> __value; 887 } 888 889 __simd_reference operator<<=(_Vp __value) && { 890 return std::move(*this) = __ptr_->__get(__index_) << __value; 891 } 892 893 __simd_reference operator&=(_Vp __value) && { 894 return std::move(*this) = __ptr_->__get(__index_) & __value; 895 } 896 897 __simd_reference operator|=(_Vp __value) && { 898 return std::move(*this) = __ptr_->__get(__index_) | __value; 899 } 900 901 __simd_reference 
operator^=(_Vp __value) && { 902 return std::move(*this) = __ptr_->__get(__index_) ^ __value; 903 } 904}; 905 906template <class _To, class _From> 907constexpr decltype(_To{std::declval<_From>()}, true) 908__is_non_narrowing_convertible_impl(_From) { 909 return true; 910} 911 912template <class _To> 913constexpr bool __is_non_narrowing_convertible_impl(...) { 914 return false; 915} 916 917template <class _From, class _To> 918constexpr typename std::enable_if<std::is_arithmetic<_To>::value && 919 std::is_arithmetic<_From>::value, 920 bool>::type 921__is_non_narrowing_arithmetic_convertible() { 922 return __is_non_narrowing_convertible_impl<_To>(_From{}); 923} 924 925template <class _From, class _To> 926constexpr typename std::enable_if<!(std::is_arithmetic<_To>::value && 927 std::is_arithmetic<_From>::value), 928 bool>::type 929__is_non_narrowing_arithmetic_convertible() { 930 return false; 931} 932 933template <class _Tp> 934constexpr _Tp __variadic_sum() { 935 return _Tp{}; 936} 937 938template <class _Tp, class _Up, class... _Args> 939constexpr _Tp __variadic_sum(_Up __first, _Args... 
__rest) { 940 return static_cast<_Tp>(__first) + __variadic_sum<_Tp>(__rest...); 941} 942 943template <class _Tp> 944struct __nodeduce { 945 using type = _Tp; 946}; 947 948template <class _Tp> 949constexpr bool __vectorizable() { 950 return std::is_arithmetic<_Tp>::value && !std::is_const<_Tp>::value && 951 !std::is_volatile<_Tp>::value && !std::is_same<_Tp, bool>::value; 952} 953 954_LIBCPP_END_NAMESPACE_EXPERIMENTAL_SIMD 955_LIBCPP_BEGIN_NAMESPACE_EXPERIMENTAL_SIMD_ABI 956 957using scalar = __simd_abi<_StorageKind::_Scalar, 1>; 958 959template <int _Np> 960using fixed_size = __simd_abi<_StorageKind::_Array, _Np>; 961 962template <class _Tp> 963_LIBCPP_INLINE_VAR constexpr size_t max_fixed_size = 32; 964 965template <class _Tp> 966using compatible = fixed_size<16 / sizeof(_Tp)>; 967 968#ifndef _LIBCPP_HAS_NO_VECTOR_EXTENSION 969template <class _Tp> 970using native = __simd_abi<_StorageKind::_VecExt, 971 _LIBCPP_NATIVE_SIMD_WIDTH_IN_BYTES / sizeof(_Tp)>; 972#else 973template <class _Tp> 974using native = 975 fixed_size<_Tp, _LIBCPP_NATIVE_SIMD_WIDTH_IN_BYTES / sizeof(_Tp)>; 976#endif // _LIBCPP_HAS_NO_VECTOR_EXTENSION 977 978_LIBCPP_END_NAMESPACE_EXPERIMENTAL_SIMD_ABI 979_LIBCPP_BEGIN_NAMESPACE_EXPERIMENTAL_SIMD 980 981template <class _Tp, class _Abi = simd_abi::compatible<_Tp>> 982class simd; 983template <class _Tp, class _Abi = simd_abi::compatible<_Tp>> 984class simd_mask; 985 986struct element_aligned_tag {}; 987struct vector_aligned_tag {}; 988template <size_t> 989struct overaligned_tag {}; 990_LIBCPP_INLINE_VAR constexpr element_aligned_tag element_aligned{}; 991_LIBCPP_INLINE_VAR constexpr vector_aligned_tag vector_aligned{}; 992template <size_t _Np> 993_LIBCPP_INLINE_VAR constexpr overaligned_tag<_Np> overaligned{}; 994 995// traits [simd.traits] 996template <class _Tp> 997struct is_abi_tag : std::integral_constant<bool, false> {}; 998 999template <_StorageKind __kind, int _Np> 1000struct is_abi_tag<__simd_abi<__kind, _Np>> 1001 : 
std::integral_constant<bool, true> {}; 1002 1003template <class _Tp> 1004struct is_simd : std::integral_constant<bool, false> {}; 1005 1006template <class _Tp, class _Abi> 1007struct is_simd<simd<_Tp, _Abi>> : std::integral_constant<bool, true> {}; 1008 1009template <class _Tp> 1010struct is_simd_mask : std::integral_constant<bool, false> {}; 1011 1012template <class _Tp, class _Abi> 1013struct is_simd_mask<simd_mask<_Tp, _Abi>> : std::integral_constant<bool, true> { 1014}; 1015 1016template <class _Tp> 1017struct is_simd_flag_type : std::integral_constant<bool, false> {}; 1018 1019template <> 1020struct is_simd_flag_type<element_aligned_tag> 1021 : std::integral_constant<bool, true> {}; 1022 1023template <> 1024struct is_simd_flag_type<vector_aligned_tag> 1025 : std::integral_constant<bool, true> {}; 1026 1027template <size_t _Align> 1028struct is_simd_flag_type<overaligned_tag<_Align>> 1029 : std::integral_constant<bool, true> {}; 1030 1031template <class _Tp> 1032_LIBCPP_INLINE_VAR constexpr bool is_abi_tag_v = is_abi_tag<_Tp>::value; 1033template <class _Tp> 1034_LIBCPP_INLINE_VAR constexpr bool is_simd_v = is_simd<_Tp>::value; 1035template <class _Tp> 1036_LIBCPP_INLINE_VAR constexpr bool is_simd_mask_v = is_simd_mask<_Tp>::value; 1037template <class _Tp> 1038_LIBCPP_INLINE_VAR constexpr bool is_simd_flag_type_v = 1039 is_simd_flag_type<_Tp>::value; 1040template <class _Tp, size_t _Np> 1041struct abi_for_size { 1042 using type = simd_abi::fixed_size<_Np>; 1043}; 1044template <class _Tp, size_t _Np> 1045using abi_for_size_t = typename abi_for_size<_Tp, _Np>::type; 1046 1047template <class _Tp, class _Abi = simd_abi::compatible<_Tp>> 1048struct simd_size; 1049 1050template <class _Tp, _StorageKind __kind, int _Np> 1051struct simd_size<_Tp, __simd_abi<__kind, _Np>> 1052 : std::integral_constant<size_t, _Np> { 1053 static_assert( 1054 std::is_arithmetic<_Tp>::value && 1055 !std::is_same<typename std::remove_const<_Tp>::type, bool>::value, 1056 "Element type should 
be vectorizable"); 1057}; 1058 1059// TODO: implement it. 1060template <class _Tp, class _Up = typename _Tp::value_type> 1061struct memory_alignment; 1062 1063template <class _Tp, class _Abi = simd_abi::compatible<_Tp>> 1064_LIBCPP_INLINE_VAR constexpr size_t simd_size_v = simd_size<_Tp, _Abi>::value; 1065 1066template <class _Tp, class _Up = typename _Tp::value_type> 1067_LIBCPP_INLINE_VAR constexpr size_t memory_alignment_v = 1068 memory_alignment<_Tp, _Up>::value; 1069 1070// class template simd [simd.class] 1071template <class _Tp> 1072using native_simd = simd<_Tp, simd_abi::native<_Tp>>; 1073template <class _Tp, int _Np> 1074using fixed_size_simd = simd<_Tp, simd_abi::fixed_size<_Np>>; 1075 1076// class template simd_mask [simd.mask.class] 1077template <class _Tp> 1078using native_simd_mask = simd_mask<_Tp, simd_abi::native<_Tp>>; 1079 1080template <class _Tp, int _Np> 1081using fixed_size_simd_mask = simd_mask<_Tp, simd_abi::fixed_size<_Np>>; 1082 1083// casts [simd.casts] 1084template <class _Tp> 1085struct __static_simd_cast_traits { 1086 template <class _Up, class _Abi> 1087 static simd<_Tp, _Abi> __apply(const simd<_Up, _Abi>& __v); 1088}; 1089 1090template <class _Tp, class _NewAbi> 1091struct __static_simd_cast_traits<simd<_Tp, _NewAbi>> { 1092 template <class _Up, class _Abi> 1093 static typename std::enable_if<simd<_Up, _Abi>::size() == 1094 simd<_Tp, _NewAbi>::size(), 1095 simd<_Tp, _NewAbi>>::type 1096 __apply(const simd<_Up, _Abi>& __v); 1097}; 1098 1099template <class _Tp> 1100struct __simd_cast_traits { 1101 template <class _Up, class _Abi> 1102 static typename std::enable_if< 1103 __is_non_narrowing_arithmetic_convertible<_Up, _Tp>(), 1104 simd<_Tp, _Abi>>::type 1105 __apply(const simd<_Up, _Abi>& __v); 1106}; 1107 1108template <class _Tp, class _NewAbi> 1109struct __simd_cast_traits<simd<_Tp, _NewAbi>> { 1110 template <class _Up, class _Abi> 1111 static typename std::enable_if< 1112 __is_non_narrowing_arithmetic_convertible<_Up, _Tp>() && 1113 
simd<_Up, _Abi>::size() == simd<_Tp, _NewAbi>::size(), 1114 simd<_Tp, _NewAbi>>::type 1115 __apply(const simd<_Up, _Abi>& __v); 1116}; 1117 1118template <class _Tp, class _Up, class _Abi> 1119auto simd_cast(const simd<_Up, _Abi>& __v) 1120 -> decltype(__simd_cast_traits<_Tp>::__apply(__v)) { 1121 return __simd_cast_traits<_Tp>::__apply(__v); 1122} 1123 1124template <class _Tp, class _Up, class _Abi> 1125auto static_simd_cast(const simd<_Up, _Abi>& __v) 1126 -> decltype(__static_simd_cast_traits<_Tp>::__apply(__v)) { 1127 return __static_simd_cast_traits<_Tp>::__apply(__v); 1128} 1129 1130template <class _Tp, class _Abi> 1131fixed_size_simd<_Tp, simd_size<_Tp, _Abi>::value> 1132to_fixed_size(const simd<_Tp, _Abi>&) noexcept; 1133 1134template <class _Tp, class _Abi> 1135fixed_size_simd_mask<_Tp, simd_size<_Tp, _Abi>::value> 1136to_fixed_size(const simd_mask<_Tp, _Abi>&) noexcept; 1137 1138template <class _Tp, size_t _Np> 1139native_simd<_Tp> to_native(const fixed_size_simd<_Tp, _Np>&) noexcept; 1140 1141template <class _Tp, size_t _Np> 1142native_simd_mask<_Tp> to_native(const fixed_size_simd_mask<_Tp, _Np>&) noexcept; 1143 1144template <class _Tp, size_t _Np> 1145simd<_Tp> to_compatible(const fixed_size_simd<_Tp, _Np>&) noexcept; 1146 1147template <class _Tp, size_t _Np> 1148simd_mask<_Tp> to_compatible(const fixed_size_simd_mask<_Tp, _Np>&) noexcept; 1149 1150template <size_t... __sizes, class _Tp, class _Abi> 1151tuple<simd<_Tp, abi_for_size_t<_Tp, __sizes>>...> split(const simd<_Tp, _Abi>&); 1152 1153template <size_t... 
__sizes, class _Tp, class _Abi> 1154tuple<simd_mask<_Tp, abi_for_size_t<_Tp, __sizes>>...> 1155split(const simd_mask<_Tp, _Abi>&); 1156 1157template <class _SimdType, class _Abi> 1158array<_SimdType, simd_size<typename _SimdType::value_type, _Abi>::value / 1159 _SimdType::size()> 1160split(const simd<typename _SimdType::value_type, _Abi>&); 1161 1162template <class _SimdType, class _Abi> 1163array<_SimdType, simd_size<typename _SimdType::value_type, _Abi>::value / 1164 _SimdType::size()> 1165split(const simd_mask<typename _SimdType::value_type, _Abi>&); 1166 1167template <class _Tp, class... _Abis> 1168simd<_Tp, abi_for_size_t<_Tp, __variadic_sum(simd_size<_Tp, _Abis>::value...)>> 1169concat(const simd<_Tp, _Abis>&...); 1170 1171template <class _Tp, class... _Abis> 1172simd_mask<_Tp, 1173 abi_for_size_t<_Tp, __variadic_sum(simd_size<_Tp, _Abis>::value...)>> 1174concat(const simd_mask<_Tp, _Abis>&...); 1175 1176// reductions [simd.mask.reductions] 1177template <class _Tp, class _Abi> 1178bool all_of(const simd_mask<_Tp, _Abi>&) noexcept; 1179template <class _Tp, class _Abi> 1180bool any_of(const simd_mask<_Tp, _Abi>&) noexcept; 1181template <class _Tp, class _Abi> 1182bool none_of(const simd_mask<_Tp, _Abi>&) noexcept; 1183template <class _Tp, class _Abi> 1184bool some_of(const simd_mask<_Tp, _Abi>&) noexcept; 1185template <class _Tp, class _Abi> 1186int popcount(const simd_mask<_Tp, _Abi>&) noexcept; 1187template <class _Tp, class _Abi> 1188int find_first_set(const simd_mask<_Tp, _Abi>&); 1189template <class _Tp, class _Abi> 1190int find_last_set(const simd_mask<_Tp, _Abi>&); 1191bool all_of(bool) noexcept; 1192bool any_of(bool) noexcept; 1193bool none_of(bool) noexcept; 1194bool some_of(bool) noexcept; 1195int popcount(bool) noexcept; 1196int find_first_set(bool) noexcept; 1197int find_last_set(bool) noexcept; 1198 1199// masked assignment [simd.whereexpr] 1200template <class _MaskType, class _Tp> 1201class const_where_expression; 1202template <class _MaskType, 
class _Tp> 1203class where_expression; 1204 1205// masked assignment [simd.mask.where] 1206template <class _Tp, class _Abi> 1207where_expression<simd_mask<_Tp, _Abi>, simd<_Tp, _Abi>> 1208where(const typename simd<_Tp, _Abi>::mask_type&, simd<_Tp, _Abi>&) noexcept; 1209 1210template <class _Tp, class _Abi> 1211const_where_expression<simd_mask<_Tp, _Abi>, const simd<_Tp, _Abi>> 1212where(const typename simd<_Tp, _Abi>::mask_type&, 1213 const simd<_Tp, _Abi>&) noexcept; 1214 1215template <class _Tp, class _Abi> 1216where_expression<simd_mask<_Tp, _Abi>, simd_mask<_Tp, _Abi>> 1217where(const typename __nodeduce<simd_mask<_Tp, _Abi>>::type&, 1218 simd_mask<_Tp, _Abi>&) noexcept; 1219 1220template <class _Tp, class _Abi> 1221const_where_expression<simd_mask<_Tp, _Abi>, const simd_mask<_Tp, _Abi>> 1222where(const typename __nodeduce<simd_mask<_Tp, _Abi>>::type&, 1223 const simd_mask<_Tp, _Abi>&) noexcept; 1224 1225template <class _Tp> 1226where_expression<bool, _Tp> where(bool, _Tp&) noexcept; 1227 1228template <class _Tp> 1229const_where_expression<bool, const _Tp> where(bool, const _Tp&) noexcept; 1230 1231// reductions [simd.reductions] 1232template <class _Tp, class _Abi, class _BinaryOp = std::plus<_Tp>> 1233_Tp reduce(const simd<_Tp, _Abi>&, _BinaryOp = _BinaryOp()); 1234 1235template <class _MaskType, class _SimdType, class _BinaryOp> 1236typename _SimdType::value_type 1237reduce(const const_where_expression<_MaskType, _SimdType>&, 1238 typename _SimdType::value_type neutral_element, _BinaryOp binary_op); 1239 1240template <class _MaskType, class _SimdType> 1241typename _SimdType::value_type 1242reduce(const const_where_expression<_MaskType, _SimdType>&, 1243 plus<typename _SimdType::value_type> binary_op = {}); 1244 1245template <class _MaskType, class _SimdType> 1246typename _SimdType::value_type 1247reduce(const const_where_expression<_MaskType, _SimdType>&, 1248 multiplies<typename _SimdType::value_type> binary_op); 1249 1250template <class _MaskType, class 
_SimdType> 1251typename _SimdType::value_type 1252reduce(const const_where_expression<_MaskType, _SimdType>&, 1253 bit_and<typename _SimdType::value_type> binary_op); 1254 1255template <class _MaskType, class _SimdType> 1256typename _SimdType::value_type 1257reduce(const const_where_expression<_MaskType, _SimdType>&, 1258 bit_or<typename _SimdType::value_type> binary_op); 1259 1260template <class _MaskType, class _SimdType> 1261typename _SimdType::value_type 1262reduce(const const_where_expression<_MaskType, _SimdType>&, 1263 bit_xor<typename _SimdType::value_type> binary_op); 1264 1265template <class _Tp, class _Abi> 1266_Tp hmin(const simd<_Tp, _Abi>&); 1267template <class _MaskType, class _SimdType> 1268typename _SimdType::value_type 1269hmin(const const_where_expression<_MaskType, _SimdType>&); 1270template <class _Tp, class _Abi> 1271_Tp hmax(const simd<_Tp, _Abi>&); 1272template <class _MaskType, class _SimdType> 1273typename _SimdType::value_type 1274hmax(const const_where_expression<_MaskType, _SimdType>&); 1275 1276// algorithms [simd.alg] 1277template <class _Tp, class _Abi> 1278simd<_Tp, _Abi> min(const simd<_Tp, _Abi>&, const simd<_Tp, _Abi>&) noexcept; 1279 1280template <class _Tp, class _Abi> 1281simd<_Tp, _Abi> max(const simd<_Tp, _Abi>&, const simd<_Tp, _Abi>&) noexcept; 1282 1283template <class _Tp, class _Abi> 1284std::pair<simd<_Tp, _Abi>, simd<_Tp, _Abi>> 1285minmax(const simd<_Tp, _Abi>&, const simd<_Tp, _Abi>&) noexcept; 1286 1287template <class _Tp, class _Abi> 1288simd<_Tp, _Abi> clamp(const simd<_Tp, _Abi>&, const simd<_Tp, _Abi>&, 1289 const simd<_Tp, _Abi>&); 1290 1291// [simd.whereexpr] 1292// TODO implement where expressions. 
1293template <class _MaskType, class _Tp> 1294class const_where_expression { 1295public: 1296 const_where_expression(const const_where_expression&) = delete; 1297 const_where_expression& operator=(const const_where_expression&) = delete; 1298 typename remove_const<_Tp>::type operator-() const&&; 1299 template <class _Up, class _Flags> 1300 void copy_to(_Up*, _Flags) const&&; 1301}; 1302 1303template <class _MaskType, class _Tp> 1304class where_expression : public const_where_expression<_MaskType, _Tp> { 1305public: 1306 where_expression(const where_expression&) = delete; 1307 where_expression& operator=(const where_expression&) = delete; 1308 template <class _Up> 1309 void operator=(_Up&&); 1310 template <class _Up> 1311 void operator+=(_Up&&); 1312 template <class _Up> 1313 void operator-=(_Up&&); 1314 template <class _Up> 1315 void operator*=(_Up&&); 1316 template <class _Up> 1317 void operator/=(_Up&&); 1318 template <class _Up> 1319 void operator%=(_Up&&); 1320 template <class _Up> 1321 void operator&=(_Up&&); 1322 template <class _Up> 1323 void operator|=(_Up&&); 1324 template <class _Up> 1325 void operator^=(_Up&&); 1326 template <class _Up> 1327 void operator<<=(_Up&&); 1328 template <class _Up> 1329 void operator>>=(_Up&&); 1330 void operator++(); 1331 void operator++(int); 1332 void operator--(); 1333 void operator--(int); 1334 template <class _Up, class _Flags> 1335 void copy_from(const _Up*, _Flags); 1336}; 1337 1338// [simd.class] 1339// TODO: implement simd 1340template <class _Tp, class _Abi> 1341class simd { 1342public: 1343 using value_type = _Tp; 1344 using reference = __simd_reference<_Tp, _Tp, _Abi>; 1345 using mask_type = simd_mask<_Tp, _Abi>; 1346 using abi_type = _Abi; 1347 1348 simd() = default; 1349 simd(const simd&) = default; 1350 simd& operator=(const simd&) = default; 1351 1352 static constexpr size_t size() noexcept { 1353 return simd_size<_Tp, _Abi>::value; 1354 } 1355 1356private: 1357 __simd_storage<_Tp, _Abi> __s_; 1358 1359 
template <class _Up> 1360 static constexpr bool __can_broadcast() { 1361 return (std::is_arithmetic<_Up>::value && 1362 __is_non_narrowing_arithmetic_convertible<_Up, _Tp>()) || 1363 (!std::is_arithmetic<_Up>::value && 1364 std::is_convertible<_Up, _Tp>::value) || 1365 std::is_same<typename std::remove_const<_Up>::type, int>::value || 1366 (std::is_same<typename std::remove_const<_Up>::type, 1367 unsigned int>::value && 1368 std::is_unsigned<_Tp>::value); 1369 } 1370 1371 template <class _Generator, size_t... __indicies> 1372 static constexpr decltype( 1373 std::forward_as_tuple(std::declval<_Generator>()( 1374 std::integral_constant<size_t, __indicies>())...), 1375 bool()) 1376 __can_generate(std::index_sequence<__indicies...>) { 1377 return !__variadic_sum<bool>( 1378 !__can_broadcast<decltype(std::declval<_Generator>()( 1379 std::integral_constant<size_t, __indicies>()))>()...); 1380 } 1381 1382 template <class _Generator> 1383 static bool __can_generate(...) { 1384 return false; 1385 } 1386 1387 template <class _Generator, size_t... 
__indicies> 1388 void __generator_init(_Generator&& __g, std::index_sequence<__indicies...>) { 1389 int __not_used[]{((*this)[__indicies] = 1390 __g(std::integral_constant<size_t, __indicies>()), 1391 0)...}; 1392 (void)__not_used; 1393 } 1394 1395public: 1396 // implicit type conversion constructor 1397 template <class _Up, 1398 class = typename std::enable_if< 1399 std::is_same<_Abi, simd_abi::fixed_size<size()>>::value && 1400 __is_non_narrowing_arithmetic_convertible<_Up, _Tp>()>::type> 1401 simd(const simd<_Up, simd_abi::fixed_size<size()>>& __v) { 1402 for (size_t __i = 0; __i < size(); __i++) { 1403 (*this)[__i] = static_cast<_Tp>(__v[__i]); 1404 } 1405 } 1406 1407 // implicit broadcast constructor 1408 template <class _Up, 1409 class = typename std::enable_if<__can_broadcast<_Up>()>::type> 1410 simd(_Up&& __rv) { 1411 auto __v = static_cast<_Tp>(__rv); 1412 for (size_t __i = 0; __i < size(); __i++) { 1413 (*this)[__i] = __v; 1414 } 1415 } 1416 1417 // generator constructor 1418 template <class _Generator, 1419 int = typename std::enable_if< 1420 __can_generate<_Generator>(std::make_index_sequence<size()>()), 1421 int>::type()> 1422 explicit simd(_Generator&& __g) { 1423 __generator_init(std::forward<_Generator>(__g), 1424 std::make_index_sequence<size()>()); 1425 } 1426 1427 // load constructor 1428 template < 1429 class _Up, class _Flags, 1430 class = typename std::enable_if<__vectorizable<_Up>()>::type, 1431 class = typename std::enable_if<is_simd_flag_type<_Flags>::value>::type> 1432 simd(const _Up* __buffer, _Flags) { 1433 // TODO: optimize for overaligned flags 1434 for (size_t __i = 0; __i < size(); __i++) { 1435 (*this)[__i] = static_cast<_Tp>(__buffer[__i]); 1436 } 1437 } 1438 1439 // loads [simd.load] 1440 template <class _Up, class _Flags> 1441 typename std::enable_if<__vectorizable<_Up>() && 1442 is_simd_flag_type<_Flags>::value>::type 1443 copy_from(const _Up* __buffer, _Flags) { 1444 *this = simd(__buffer, _Flags()); 1445 } 1446 1447 // stores 
[simd.store] 1448 template <class _Up, class _Flags> 1449 typename std::enable_if<__vectorizable<_Up>() && 1450 is_simd_flag_type<_Flags>::value>::type 1451 copy_to(_Up* __buffer, _Flags) const { 1452 // TODO: optimize for overaligned flags 1453 for (size_t __i = 0; __i < size(); __i++) { 1454 __buffer[__i] = static_cast<_Up>((*this)[__i]); 1455 } 1456 } 1457 1458 // scalar access [simd.subscr] 1459 reference operator[](size_t __i) { return reference(&__s_, __i); } 1460 1461 value_type operator[](size_t __i) const { return __s_.__get(__i); } 1462 1463 // unary operators [simd.unary] 1464 simd& operator++(); 1465 simd operator++(int); 1466 simd& operator--(); 1467 simd operator--(int); 1468 mask_type operator!() const; 1469 simd operator~() const; 1470 simd operator+() const; 1471 simd operator-() const; 1472 1473 // binary operators [simd.binary] 1474 friend simd operator+(const simd&, const simd&); 1475 friend simd operator-(const simd&, const simd&); 1476 friend simd operator*(const simd&, const simd&); 1477 friend simd operator/(const simd&, const simd&); 1478 friend simd operator%(const simd&, const simd&); 1479 friend simd operator&(const simd&, const simd&); 1480 friend simd operator|(const simd&, const simd&); 1481 friend simd operator^(const simd&, const simd&); 1482 friend simd operator<<(const simd&, const simd&); 1483 friend simd operator>>(const simd&, const simd&); 1484 friend simd operator<<(const simd&, int); 1485 friend simd operator>>(const simd&, int); 1486 1487 // compound assignment [simd.cassign] 1488 friend simd& operator+=(simd&, const simd&); 1489 friend simd& operator-=(simd&, const simd&); 1490 friend simd& operator*=(simd&, const simd&); 1491 friend simd& operator/=(simd&, const simd&); 1492 friend simd& operator%=(simd&, const simd&); 1493 1494 friend simd& operator&=(simd&, const simd&); 1495 friend simd& operator|=(simd&, const simd&); 1496 friend simd& operator^=(simd&, const simd&); 1497 friend simd& operator<<=(simd&, const simd&); 
1498 friend simd& operator>>=(simd&, const simd&); 1499 friend simd& operator<<=(simd&, int); 1500 friend simd& operator>>=(simd&, int); 1501 1502 // compares [simd.comparison] 1503 friend mask_type operator==(const simd&, const simd&); 1504 friend mask_type operator!=(const simd&, const simd&); 1505 friend mask_type operator>=(const simd&, const simd&); 1506 friend mask_type operator<=(const simd&, const simd&); 1507 friend mask_type operator>(const simd&, const simd&); 1508 friend mask_type operator<(const simd&, const simd&); 1509}; 1510 1511// [simd.mask.class] 1512template <class _Tp, class _Abi> 1513// TODO: implement simd_mask 1514class simd_mask { 1515public: 1516 using value_type = bool; 1517 // TODO: this is strawman implementation. Turn it into a proxy type. 1518 using reference = bool&; 1519 using simd_type = simd<_Tp, _Abi>; 1520 using abi_type = _Abi; 1521 static constexpr size_t size() noexcept; 1522 simd_mask() = default; 1523 1524 // broadcast constructor 1525 explicit simd_mask(value_type) noexcept; 1526 1527 // implicit type conversion constructor 1528 template <class _Up> 1529 simd_mask(const simd_mask<_Up, simd_abi::fixed_size<size()>>&) noexcept; 1530 1531 // load constructor 1532 template <class _Flags> 1533 simd_mask(const value_type*, _Flags); 1534 1535 // loads [simd.mask.copy] 1536 template <class _Flags> 1537 void copy_from(const value_type*, _Flags); 1538 template <class _Flags> 1539 void copy_to(value_type*, _Flags) const; 1540 1541 // scalar access [simd.mask.subscr] 1542 reference operator[](size_t); 1543 value_type operator[](size_t) const; 1544 1545 // unary operators [simd.mask.unary] 1546 simd_mask operator!() const noexcept; 1547 1548 // simd_mask binary operators [simd.mask.binary] 1549 friend simd_mask operator&&(const simd_mask&, const simd_mask&) noexcept; 1550 friend simd_mask operator||(const simd_mask&, const simd_mask&) noexcept; 1551 friend simd_mask operator&(const simd_mask&, const simd_mask&)noexcept; 1552 friend 
simd_mask operator|(const simd_mask&, const simd_mask&) noexcept; 1553 friend simd_mask operator^(const simd_mask&, const simd_mask&) noexcept; 1554 1555 // simd_mask compound assignment [simd.mask.cassign] 1556 friend simd_mask& operator&=(simd_mask&, const simd_mask&) noexcept; 1557 friend simd_mask& operator|=(simd_mask&, const simd_mask&) noexcept; 1558 friend simd_mask& operator^=(simd_mask&, const simd_mask&) noexcept; 1559 1560 // simd_mask compares [simd.mask.comparison] 1561 friend simd_mask operator==(const simd_mask&, const simd_mask&) noexcept; 1562 friend simd_mask operator!=(const simd_mask&, const simd_mask&) noexcept; 1563}; 1564 1565#endif // _LIBCPP_STD_VER >= 17 1566 1567_LIBCPP_END_NAMESPACE_EXPERIMENTAL_SIMD 1568 1569#endif /* _LIBCPP_EXPERIMENTAL_SIMD */ 1570