1// -*- C++ -*-
2//===----------------------------------------------------------------------===//
3//
4// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
5// See https://llvm.org/LICENSE.txt for license information.
6// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7//
8//===----------------------------------------------------------------------===//
9
10#ifndef _LIBCPP_EXPERIMENTAL_SIMD
11#define _LIBCPP_EXPERIMENTAL_SIMD
12
13/*
14    experimental/simd synopsis
15
16namespace std::experimental {
17
18inline namespace parallelism_v2 {
19
20namespace simd_abi {
21
22struct scalar {};
23template <int N> struct fixed_size {};
24template <typename T> inline constexpr int max_fixed_size = implementation-defined;
25template <typename T> using compatible = implementation-defined;
26template <typename T> using native = implementation-defined;
27
28} // simd_abi
29
30struct element_aligned_tag {};
31struct vector_aligned_tag {};
32template <size_t> struct overaligned_tag {};
33inline constexpr element_aligned_tag element_aligned{};
34inline constexpr vector_aligned_tag vector_aligned{};
35template <size_t N> inline constexpr overaligned_tag<N> overaligned{};
36
37// traits [simd.traits]
38template <class T> struct is_abi_tag;
39template <class T> inline constexpr bool is_abi_tag_v = is_abi_tag<T>::value;
40
41template <class T> struct is_simd;
42template <class T> inline constexpr bool is_simd_v = is_simd<T>::value;
43
44template <class T> struct is_simd_mask;
45template <class T> inline constexpr bool is_simd_mask_v = is_simd_mask<T>::value;
46
47template <class T> struct is_simd_flag_type;
48template <class T> inline constexpr bool is_simd_flag_type_v = is_simd_flag_type<T>::value;
49
50template <class T, size_t N> struct abi_for_size { using type = see below; };
51template <class T, size_t N> using abi_for_size_t = typename abi_for_size<T, N>::type;
52
53template <class T, class Abi = simd_abi::compatible<T>> struct simd_size;
54template <class T, class Abi = simd_abi::compatible<T>>
55inline constexpr size_t simd_size_v = simd_size<T, Abi>::value;
56
57template <class T, class U = typename T::value_type> struct memory_alignment;
58template <class T, class U = typename T::value_type>
59inline constexpr size_t memory_alignment_v = memory_alignment<T, U>::value;
60
61// class template simd [simd.class]
62template <class T, class Abi = simd_abi::compatible<T>> class simd;
63template <class T> using native_simd = simd<T, simd_abi::native<T>>;
64template <class T, int N> using fixed_size_simd = simd<T, simd_abi::fixed_size<N>>;
65
66// class template simd_mask [simd.mask.class]
67template <class T, class Abi = simd_abi::compatible<T>> class simd_mask;
68template <class T> using native_simd_mask = simd_mask<T, simd_abi::native<T>>;
69template <class T, int N> using fixed_size_simd_mask = simd_mask<T, simd_abi::fixed_size<N>>;
70
71// casts [simd.casts]
72template <class T, class U, class Abi> see below simd_cast(const simd<U, Abi>&);
73template <class T, class U, class Abi> see below static_simd_cast(const simd<U, Abi>&);
74
75template <class T, class Abi>
76fixed_size_simd<T, simd_size_v<T, Abi>> to_fixed_size(const simd<T, Abi>&) noexcept;
77template <class T, class Abi>
78fixed_size_simd_mask<T, simd_size_v<T, Abi>> to_fixed_size(const simd_mask<T, Abi>&) noexcept;
79template <class T, size_t N> native_simd<T> to_native(const fixed_size_simd<T, N>&) noexcept;
80template <class T, size_t N>
native_simd_mask<T> to_native(const fixed_size_simd_mask<T, N>&) noexcept;
82template <class T, size_t N> simd<T> to_compatible(const fixed_size_simd<T, N>&) noexcept;
83template <class T, size_t N> simd_mask<T> to_compatible(const fixed_size_simd_mask<T, N>&) noexcept;
84
template <size_t... Sizes, class T, class Abi>
tuple<simd<T, abi_for_size_t<T, Sizes>>...> split(const simd<T, Abi>&);
template <size_t... Sizes, class T, class Abi>
tuple<simd_mask<T, abi_for_size_t<T, Sizes>>...> split(const simd_mask<T, Abi>&);
89template <class V, class Abi>
90array<V, simd_size_v<typename V::value_type, Abi> / V::size()> split(
91const simd<typename V::value_type, Abi>&);
92template <class V, class Abi>
93array<V, simd_size_v<typename V::value_type, Abi> / V::size()> split(
94const simd_mask<typename V::value_type, Abi>&);
95
96template <class T, class... Abis>
97simd<T, abi_for_size_t<T, (simd_size_v<T, Abis> + ...)>> concat(const simd<T, Abis>&...);
98template <class T, class... Abis>
99simd_mask<T, abi_for_size_t<T, (simd_size_v<T, Abis> + ...)>> concat(const simd_mask<T, Abis>&...);
100
101// reductions [simd.mask.reductions]
102template <class T, class Abi> bool all_of(const simd_mask<T, Abi>&) noexcept;
103template <class T, class Abi> bool any_of(const simd_mask<T, Abi>&) noexcept;
104template <class T, class Abi> bool none_of(const simd_mask<T, Abi>&) noexcept;
105template <class T, class Abi> bool some_of(const simd_mask<T, Abi>&) noexcept;
106template <class T, class Abi> int popcount(const simd_mask<T, Abi>&) noexcept;
107template <class T, class Abi> int find_first_set(const simd_mask<T, Abi>&);
108template <class T, class Abi> int find_last_set(const simd_mask<T, Abi>&);
109
110bool all_of(see below) noexcept;
111bool any_of(see below) noexcept;
112bool none_of(see below) noexcept;
113bool some_of(see below) noexcept;
114int popcount(see below) noexcept;
115int find_first_set(see below) noexcept;
116int find_last_set(see below) noexcept;
117
118// masked assignment [simd.whereexpr]
119template <class M, class T> class const_where_expression;
120template <class M, class T> class where_expression;
121
122// masked assignment [simd.mask.where]
123template <class T> struct nodeduce { using type = T; }; // exposition only
124
125template <class T> using nodeduce_t = typename nodeduce<T>::type; // exposition only
126
127template <class T, class Abi>
128where_expression<simd_mask<T, Abi>, simd<T, Abi>>
129where(const typename simd<T, Abi>::mask_type&, simd<T, Abi>&) noexcept;
130
131template <class T, class Abi>
132const_where_expression<simd_mask<T, Abi>, const simd<T, Abi>>
133where(const typename simd<T, Abi>::mask_type&, const simd<T, Abi>&) noexcept;
134
135template <class T, class Abi>
136where_expression<simd_mask<T, Abi>, simd_mask<T, Abi>>
137where(const nodeduce_t<simd_mask<T, Abi>>&, simd_mask<T, Abi>&) noexcept;
138
139template <class T, class Abi>
140const_where_expression<simd_mask<T, Abi>, const simd_mask<T, Abi>>
141where(const nodeduce_t<simd_mask<T, Abi>>&, const simd_mask<T, Abi>&) noexcept;
142
143template <class T> where_expression<bool, T> where(see below k, T& d) noexcept;
144
145template <class T>
146const_where_expression<bool, const T> where(see below k, const T& d) noexcept;
147
148// reductions [simd.reductions]
149template <class T, class Abi, class BinaryOperation = std::plus<>>
150T reduce(const simd<T, Abi>&, BinaryOperation = BinaryOperation());
151
152template <class M, class V, class BinaryOperation>
153typename V::value_type reduce(const const_where_expression<M, V>& x,
154typename V::value_type neutral_element, BinaryOperation binary_op);
155
156template <class M, class V>
157typename V::value_type reduce(const const_where_expression<M, V>& x, plus<> binary_op = plus<>());
158
159template <class M, class V>
160typename V::value_type reduce(const const_where_expression<M, V>& x, multiplies<> binary_op);
161
162template <class M, class V>
163typename V::value_type reduce(const const_where_expression<M, V>& x, bit_and<> binary_op);
164
165template <class M, class V>
166typename V::value_type reduce(const const_where_expression<M, V>& x, bit_or<> binary_op);
167
168template <class M, class V>
169typename V::value_type reduce(const const_where_expression<M, V>& x, bit_xor<> binary_op);
170
template <class T, class Abi> T hmin(const simd<T, Abi>&);
template <class M, class V> typename V::value_type hmin(const const_where_expression<M, V>&);
template <class T, class Abi> T hmax(const simd<T, Abi>&);
template <class M, class V> typename V::value_type hmax(const const_where_expression<M, V>&);
175
176// algorithms [simd.alg]
177template <class T, class Abi> simd<T, Abi> min(const simd<T, Abi>&, const simd<T, Abi>&) noexcept;
178
179template <class T, class Abi> simd<T, Abi> max(const simd<T, Abi>&, const simd<T, Abi>&) noexcept;
180
181template <class T, class Abi>
182std::pair<simd<T, Abi>, simd<T, Abi>> minmax(const simd<T, Abi>&, const simd<T, Abi>&) noexcept;
183
184template <class T, class Abi>
185simd<T, Abi> clamp(const simd<T, Abi>& v, const simd<T, Abi>& lo, const simd<T, Abi>& hi);
186
187// [simd.whereexpr]
188template <class M, class T>
189class const_where_expression {
190  const M& mask; // exposition only
191  T& data; // exposition only
192public:
193  const_where_expression(const const_where_expression&) = delete;
194  const_where_expression& operator=(const const_where_expression&) = delete;
195  remove_const_t<T> operator-() const &&;
196  template <class U, class Flags> void copy_to(U* mem, Flags f) const &&;
197};
198
199template <class M, class T>
200class where_expression : public const_where_expression<M, T> {
201public:
202  where_expression(const where_expression&) = delete;
203  where_expression& operator=(const where_expression&) = delete;
204  template <class U> void operator=(U&& x);
205  template <class U> void operator+=(U&& x);
206  template <class U> void operator-=(U&& x);
207  template <class U> void operator*=(U&& x);
208  template <class U> void operator/=(U&& x);
209  template <class U> void operator%=(U&& x);
210  template <class U> void operator&=(U&& x);
211  template <class U> void operator|=(U&& x);
212  template <class U> void operator^=(U&& x);
213  template <class U> void operator<<=(U&& x);
214  template <class U> void operator>>=(U&& x);
215  void operator++();
216  void operator++(int);
217  void operator--();
218  void operator--(int);
219  template <class U, class Flags> void copy_from(const U* mem, Flags);
220};
221
222// [simd.class]
223template <class T, class Abi> class simd {
224public:
225  using value_type = T;
226  using reference = see below;
227  using mask_type = simd_mask<T, Abi>;
228
229  using abi_type = Abi;
230  static constexpr size_t size() noexcept;
231  simd() = default;
232
233  // implicit type conversion constructor
234  template <class U> simd(const simd<U, simd_abi::fixed_size<size()>>&);
235
236  // implicit broadcast constructor (see below for constraints)
237  template <class U> simd(U&& value);
238
239  // generator constructor (see below for constraints)
240  template <class G> explicit simd(G&& gen);
241
242  // load constructor
243  template <class U, class Flags> simd(const U* mem, Flags f);
244
245  // loads [simd.load]
246  template <class U, class Flags> void copy_from(const U* mem, Flags f);
247
248  // stores [simd.store]
249  template <class U, class Flags> void copy_to(U* mem, Flags f) const;
250
251  // scalar access [simd.subscr]
252  reference operator[](size_t);
253  value_type operator[](size_t) const;
254
255  // unary operators [simd.unary]
256  simd& operator++();
257  simd operator++(int);
258  simd& operator--();
259  simd operator--(int);
260  mask_type operator!() const;
261  simd operator~() const; // see below
262  simd operator+() const;
263  simd operator-() const;
264
265  // binary operators [simd.binary]
266  friend simd operator+ (const simd&, const simd&);
267  friend simd operator- (const simd&, const simd&);
268  friend simd operator* (const simd&, const simd&);
269  friend simd operator/ (const simd&, const simd&);
270  friend simd operator% (const simd&, const simd&);
271  friend simd operator& (const simd&, const simd&);
272  friend simd operator| (const simd&, const simd&);
273  friend simd operator^ (const simd&, const simd&);
274  friend simd operator<<(const simd&, const simd&);
275  friend simd operator>>(const simd&, const simd&);
276  friend simd operator<<(const simd&, int);
277  friend simd operator>>(const simd&, int);
278
279  // compound assignment [simd.cassign]
280  friend simd& operator+= (simd&, const simd&);
281  friend simd& operator-= (simd&, const simd&);
282  friend simd& operator*= (simd&, const simd&);
283  friend simd& operator/= (simd&, const simd&);
284  friend simd& operator%= (simd&, const simd&);
285
286  friend simd& operator&= (simd&, const simd&);
287  friend simd& operator|= (simd&, const simd&);
288  friend simd& operator^= (simd&, const simd&);
289  friend simd& operator<<=(simd&, const simd&);
290  friend simd& operator>>=(simd&, const simd&);
291  friend simd& operator<<=(simd&, int);
292  friend simd& operator>>=(simd&, int);
293
294  // compares [simd.comparison]
295  friend mask_type operator==(const simd&, const simd&);
296  friend mask_type operator!=(const simd&, const simd&);
297  friend mask_type operator>=(const simd&, const simd&);
298  friend mask_type operator<=(const simd&, const simd&);
299  friend mask_type operator> (const simd&, const simd&);
300  friend mask_type operator< (const simd&, const simd&);
301};
302
303// [simd.math]
304template <class Abi> using scharv = simd<signed char, Abi>; // exposition only
305template <class Abi> using shortv = simd<short, Abi>; // exposition only
306template <class Abi> using intv = simd<int, Abi>; // exposition only
307template <class Abi> using longv = simd<long int, Abi>; // exposition only
308template <class Abi> using llongv = simd<long long int, Abi>; // exposition only
309template <class Abi> using floatv = simd<float, Abi>; // exposition only
310template <class Abi> using doublev = simd<double, Abi>; // exposition only
311template <class Abi> using ldoublev = simd<long double, Abi>; // exposition only
312template <class T, class V> using samesize = fixed_size_simd<T, V::size()>; // exposition only
313
314template <class Abi> floatv<Abi> acos(floatv<Abi> x);
315template <class Abi> doublev<Abi> acos(doublev<Abi> x);
316template <class Abi> ldoublev<Abi> acos(ldoublev<Abi> x);
317
318template <class Abi> floatv<Abi> asin(floatv<Abi> x);
319template <class Abi> doublev<Abi> asin(doublev<Abi> x);
320template <class Abi> ldoublev<Abi> asin(ldoublev<Abi> x);
321
322template <class Abi> floatv<Abi> atan(floatv<Abi> x);
323template <class Abi> doublev<Abi> atan(doublev<Abi> x);
324template <class Abi> ldoublev<Abi> atan(ldoublev<Abi> x);
325
326template <class Abi> floatv<Abi> atan2(floatv<Abi> y, floatv<Abi> x);
327template <class Abi> doublev<Abi> atan2(doublev<Abi> y, doublev<Abi> x);
328template <class Abi> ldoublev<Abi> atan2(ldoublev<Abi> y, ldoublev<Abi> x);
329
330template <class Abi> floatv<Abi> cos(floatv<Abi> x);
331template <class Abi> doublev<Abi> cos(doublev<Abi> x);
332template <class Abi> ldoublev<Abi> cos(ldoublev<Abi> x);
333
334template <class Abi> floatv<Abi> sin(floatv<Abi> x);
335template <class Abi> doublev<Abi> sin(doublev<Abi> x);
336template <class Abi> ldoublev<Abi> sin(ldoublev<Abi> x);
337
338template <class Abi> floatv<Abi> tan(floatv<Abi> x);
339template <class Abi> doublev<Abi> tan(doublev<Abi> x);
340template <class Abi> ldoublev<Abi> tan(ldoublev<Abi> x);
341
342template <class Abi> floatv<Abi> acosh(floatv<Abi> x);
343template <class Abi> doublev<Abi> acosh(doublev<Abi> x);
344template <class Abi> ldoublev<Abi> acosh(ldoublev<Abi> x);
345
346template <class Abi> floatv<Abi> asinh(floatv<Abi> x);
347template <class Abi> doublev<Abi> asinh(doublev<Abi> x);
348template <class Abi> ldoublev<Abi> asinh(ldoublev<Abi> x);
349
350template <class Abi> floatv<Abi> atanh(floatv<Abi> x);
351template <class Abi> doublev<Abi> atanh(doublev<Abi> x);
352template <class Abi> ldoublev<Abi> atanh(ldoublev<Abi> x);
353
354template <class Abi> floatv<Abi> cosh(floatv<Abi> x);
355template <class Abi> doublev<Abi> cosh(doublev<Abi> x);
356template <class Abi> ldoublev<Abi> cosh(ldoublev<Abi> x);
357
358template <class Abi> floatv<Abi> sinh(floatv<Abi> x);
359template <class Abi> doublev<Abi> sinh(doublev<Abi> x);
360template <class Abi> ldoublev<Abi> sinh(ldoublev<Abi> x);
361
362template <class Abi> floatv<Abi> tanh(floatv<Abi> x);
363template <class Abi> doublev<Abi> tanh(doublev<Abi> x);
364template <class Abi> ldoublev<Abi> tanh(ldoublev<Abi> x);
365
366template <class Abi> floatv<Abi> exp(floatv<Abi> x);
367template <class Abi> doublev<Abi> exp(doublev<Abi> x);
368template <class Abi> ldoublev<Abi> exp(ldoublev<Abi> x);
369
370template <class Abi> floatv<Abi> exp2(floatv<Abi> x);
371template <class Abi> doublev<Abi> exp2(doublev<Abi> x);
372template <class Abi> ldoublev<Abi> exp2(ldoublev<Abi> x);
373
374template <class Abi> floatv<Abi> expm1(floatv<Abi> x);
375template <class Abi> doublev<Abi> expm1(doublev<Abi> x);
376template <class Abi> ldoublev<Abi> expm1(ldoublev<Abi> x);
377
378template <class Abi> floatv<Abi> frexp(floatv<Abi> value, samesize<int, floatv<Abi>>* exp);
379template <class Abi> doublev<Abi> frexp(doublev<Abi> value, samesize<int, doublev<Abi>>* exp);
380template <class Abi> ldoublev<Abi> frexp(ldoublev<Abi> value, samesize<int, ldoublev<Abi>>* exp);
381
382template <class Abi> samesize<int, floatv<Abi>> ilogb(floatv<Abi> x);
383template <class Abi> samesize<int, doublev<Abi>> ilogb(doublev<Abi> x);
384template <class Abi> samesize<int, ldoublev<Abi>> ilogb(ldoublev<Abi> x);
385
386template <class Abi> floatv<Abi> ldexp(floatv<Abi> x, samesize<int, floatv<Abi>> exp);
387template <class Abi> doublev<Abi> ldexp(doublev<Abi> x, samesize<int, doublev<Abi>> exp);
388template <class Abi> ldoublev<Abi> ldexp(ldoublev<Abi> x, samesize<int, ldoublev<Abi>> exp);
389
390template <class Abi> floatv<Abi> log(floatv<Abi> x);
391template <class Abi> doublev<Abi> log(doublev<Abi> x);
392template <class Abi> ldoublev<Abi> log(ldoublev<Abi> x);
393
394template <class Abi> floatv<Abi> log10(floatv<Abi> x);
395template <class Abi> doublev<Abi> log10(doublev<Abi> x);
396template <class Abi> ldoublev<Abi> log10(ldoublev<Abi> x);
397
398template <class Abi> floatv<Abi> log1p(floatv<Abi> x);
399template <class Abi> doublev<Abi> log1p(doublev<Abi> x);
400template <class Abi> ldoublev<Abi> log1p(ldoublev<Abi> x);
401
402template <class Abi> floatv<Abi> log2(floatv<Abi> x);
403template <class Abi> doublev<Abi> log2(doublev<Abi> x);
404template <class Abi> ldoublev<Abi> log2(ldoublev<Abi> x);
405
406template <class Abi> floatv<Abi> logb(floatv<Abi> x);
407template <class Abi> doublev<Abi> logb(doublev<Abi> x);
408template <class Abi> ldoublev<Abi> logb(ldoublev<Abi> x);
409
410template <class Abi> floatv<Abi> modf(floatv<Abi> value, floatv<Abi>* iptr);
411template <class Abi> doublev<Abi> modf(doublev<Abi> value, doublev<Abi>* iptr);
412template <class Abi> ldoublev<Abi> modf(ldoublev<Abi> value, ldoublev<Abi>* iptr);
413
414template <class Abi> floatv<Abi> scalbn(floatv<Abi> x, samesize<int, floatv<Abi>> n);
415template <class Abi> doublev<Abi> scalbn(doublev<Abi> x, samesize<int, doublev<Abi>> n);
416template <class Abi> ldoublev<Abi> scalbn(ldoublev<Abi> x, samesize<int, ldoublev<Abi>> n);
417template <class Abi> floatv<Abi> scalbln(floatv<Abi> x, samesize<long int, floatv<Abi>> n);
418template <class Abi> doublev<Abi> scalbln(doublev<Abi> x, samesize<long int, doublev<Abi>> n);
419template <class Abi> ldoublev<Abi> scalbln(ldoublev<Abi> x, samesize<long int, ldoublev<Abi>> n);
420
421template <class Abi> floatv<Abi> cbrt(floatv<Abi> x);
422template <class Abi> doublev<Abi> cbrt(doublev<Abi> x);
423template <class Abi> ldoublev<Abi> cbrt(ldoublev<Abi> x);
424
425template <class Abi> scharv<Abi> abs(scharv<Abi> j);
426template <class Abi> shortv<Abi> abs(shortv<Abi> j);
427template <class Abi> intv<Abi> abs(intv<Abi> j);
428template <class Abi> longv<Abi> abs(longv<Abi> j);
429template <class Abi> llongv<Abi> abs(llongv<Abi> j);
430template <class Abi> floatv<Abi> abs(floatv<Abi> j);
431template <class Abi> doublev<Abi> abs(doublev<Abi> j);
432template <class Abi> ldoublev<Abi> abs(ldoublev<Abi> j);
433
434template <class Abi> floatv<Abi> hypot(floatv<Abi> x, floatv<Abi> y);
435template <class Abi> doublev<Abi> hypot(doublev<Abi> x, doublev<Abi> y);
template <class Abi> ldoublev<Abi> hypot(ldoublev<Abi> x, ldoublev<Abi> y);
437template <class Abi> floatv<Abi> hypot(floatv<Abi> x, floatv<Abi> y, floatv<Abi> z);
438template <class Abi> doublev<Abi> hypot(doublev<Abi> x, doublev<Abi> y, doublev<Abi> z);
439template <class Abi> ldoublev<Abi> hypot(ldoublev<Abi> x, ldoublev<Abi> y, ldoublev<Abi> z);
440
441template <class Abi> floatv<Abi> pow(floatv<Abi> x, floatv<Abi> y);
442template <class Abi> doublev<Abi> pow(doublev<Abi> x, doublev<Abi> y);
443template <class Abi> ldoublev<Abi> pow(ldoublev<Abi> x, ldoublev<Abi> y);
444
445template <class Abi> floatv<Abi> sqrt(floatv<Abi> x);
446template <class Abi> doublev<Abi> sqrt(doublev<Abi> x);
447template <class Abi> ldoublev<Abi> sqrt(ldoublev<Abi> x);
448
449template <class Abi> floatv<Abi> erf(floatv<Abi> x);
450template <class Abi> doublev<Abi> erf(doublev<Abi> x);
451template <class Abi> ldoublev<Abi> erf(ldoublev<Abi> x);
452template <class Abi> floatv<Abi> erfc(floatv<Abi> x);
453template <class Abi> doublev<Abi> erfc(doublev<Abi> x);
454template <class Abi> ldoublev<Abi> erfc(ldoublev<Abi> x);
455
456template <class Abi> floatv<Abi> lgamma(floatv<Abi> x);
457template <class Abi> doublev<Abi> lgamma(doublev<Abi> x);
458template <class Abi> ldoublev<Abi> lgamma(ldoublev<Abi> x);
459
460template <class Abi> floatv<Abi> tgamma(floatv<Abi> x);
461template <class Abi> doublev<Abi> tgamma(doublev<Abi> x);
462template <class Abi> ldoublev<Abi> tgamma(ldoublev<Abi> x);
463
464template <class Abi> floatv<Abi> ceil(floatv<Abi> x);
465template <class Abi> doublev<Abi> ceil(doublev<Abi> x);
466template <class Abi> ldoublev<Abi> ceil(ldoublev<Abi> x);
467
468template <class Abi> floatv<Abi> floor(floatv<Abi> x);
469template <class Abi> doublev<Abi> floor(doublev<Abi> x);
470template <class Abi> ldoublev<Abi> floor(ldoublev<Abi> x);
471
472template <class Abi> floatv<Abi> nearbyint(floatv<Abi> x);
473template <class Abi> doublev<Abi> nearbyint(doublev<Abi> x);
474template <class Abi> ldoublev<Abi> nearbyint(ldoublev<Abi> x);
475
476template <class Abi> floatv<Abi> rint(floatv<Abi> x);
477template <class Abi> doublev<Abi> rint(doublev<Abi> x);
478template <class Abi> ldoublev<Abi> rint(ldoublev<Abi> x);
479
480template <class Abi> samesize<long int, floatv<Abi>> lrint(floatv<Abi> x);
481template <class Abi> samesize<long int, doublev<Abi>> lrint(doublev<Abi> x);
482template <class Abi> samesize<long int, ldoublev<Abi>> lrint(ldoublev<Abi> x);
483template <class Abi> samesize<long long int, floatv<Abi>> llrint(floatv<Abi> x);
484template <class Abi> samesize<long long int, doublev<Abi>> llrint(doublev<Abi> x);
485template <class Abi> samesize<long long int, ldoublev<Abi>> llrint(ldoublev<Abi> x);
486
487template <class Abi> floatv<Abi> round(floatv<Abi> x);
488template <class Abi> doublev<Abi> round(doublev<Abi> x);
489template <class Abi> ldoublev<Abi> round(ldoublev<Abi> x);
490template <class Abi> samesize<long int, floatv<Abi>> lround(floatv<Abi> x);
491template <class Abi> samesize<long int, doublev<Abi>> lround(doublev<Abi> x);
492template <class Abi> samesize<long int, ldoublev<Abi>> lround(ldoublev<Abi> x);
493template <class Abi> samesize<long long int, floatv<Abi>> llround(floatv<Abi> x);
494template <class Abi> samesize<long long int, doublev<Abi>> llround(doublev<Abi> x);
495template <class Abi> samesize<long long int, ldoublev<Abi>> llround(ldoublev<Abi> x);
496
497template <class Abi> floatv<Abi> trunc(floatv<Abi> x);
498template <class Abi> doublev<Abi> trunc(doublev<Abi> x);
499template <class Abi> ldoublev<Abi> trunc(ldoublev<Abi> x);
500
501template <class Abi> floatv<Abi> fmod(floatv<Abi> x, floatv<Abi> y);
502template <class Abi> doublev<Abi> fmod(doublev<Abi> x, doublev<Abi> y);
503template <class Abi> ldoublev<Abi> fmod(ldoublev<Abi> x, ldoublev<Abi> y);
504
505template <class Abi> floatv<Abi> remainder(floatv<Abi> x, floatv<Abi> y);
506template <class Abi> doublev<Abi> remainder(doublev<Abi> x, doublev<Abi> y);
507template <class Abi> ldoublev<Abi> remainder(ldoublev<Abi> x, ldoublev<Abi> y);
508
509template <class Abi> floatv<Abi> remquo(floatv<Abi> x, floatv<Abi> y, samesize<int, floatv<Abi>>* quo);
510template <class Abi> doublev<Abi> remquo(doublev<Abi> x, doublev<Abi> y, samesize<int, doublev<Abi>>* quo);
511template <class Abi> ldoublev<Abi> remquo(ldoublev<Abi> x, ldoublev<Abi> y, samesize<int, ldoublev<Abi>>* quo);
512
513template <class Abi> floatv<Abi> copysign(floatv<Abi> x, floatv<Abi> y);
514template <class Abi> doublev<Abi> copysign(doublev<Abi> x, doublev<Abi> y);
515template <class Abi> ldoublev<Abi> copysign(ldoublev<Abi> x, ldoublev<Abi> y);
516
517template <class Abi> doublev<Abi> nan(const char* tagp);
518template <class Abi> floatv<Abi> nanf(const char* tagp);
519template <class Abi> ldoublev<Abi> nanl(const char* tagp);
520
521template <class Abi> floatv<Abi> nextafter(floatv<Abi> x, floatv<Abi> y);
522template <class Abi> doublev<Abi> nextafter(doublev<Abi> x, doublev<Abi> y);
523template <class Abi> ldoublev<Abi> nextafter(ldoublev<Abi> x, ldoublev<Abi> y);
524
525template <class Abi> floatv<Abi> nexttoward(floatv<Abi> x, ldoublev<Abi> y);
526template <class Abi> doublev<Abi> nexttoward(doublev<Abi> x, ldoublev<Abi> y);
527template <class Abi> ldoublev<Abi> nexttoward(ldoublev<Abi> x, ldoublev<Abi> y);
528
529template <class Abi> floatv<Abi> fdim(floatv<Abi> x, floatv<Abi> y);
530template <class Abi> doublev<Abi> fdim(doublev<Abi> x, doublev<Abi> y);
531template <class Abi> ldoublev<Abi> fdim(ldoublev<Abi> x, ldoublev<Abi> y);
532
533template <class Abi> floatv<Abi> fmax(floatv<Abi> x, floatv<Abi> y);
534template <class Abi> doublev<Abi> fmax(doublev<Abi> x, doublev<Abi> y);
535template <class Abi> ldoublev<Abi> fmax(ldoublev<Abi> x, ldoublev<Abi> y);
536
537template <class Abi> floatv<Abi> fmin(floatv<Abi> x, floatv<Abi> y);
538template <class Abi> doublev<Abi> fmin(doublev<Abi> x, doublev<Abi> y);
539template <class Abi> ldoublev<Abi> fmin(ldoublev<Abi> x, ldoublev<Abi> y);
540
541template <class Abi> floatv<Abi> fma(floatv<Abi> x, floatv<Abi> y, floatv<Abi> z);
542template <class Abi> doublev<Abi> fma(doublev<Abi> x, doublev<Abi> y, doublev<Abi> z);
543template <class Abi> ldoublev<Abi> fma(ldoublev<Abi> x, ldoublev<Abi> y, ldoublev<Abi> z);
544
545template <class Abi> samesize<int, floatv<Abi>> fpclassify(floatv<Abi> x);
546template <class Abi> samesize<int, doublev<Abi>> fpclassify(doublev<Abi> x);
547template <class Abi> samesize<int, ldoublev<Abi>> fpclassify(ldoublev<Abi> x);
548
549template <class Abi> simd_mask<float, Abi> isfinite(floatv<Abi> x);
550template <class Abi> simd_mask<double, Abi> isfinite(doublev<Abi> x);
551template <class Abi> simd_mask<long double, Abi> isfinite(ldoublev<Abi> x);
552
553template <class Abi> simd_mask<float, Abi> isinf(floatv<Abi> x);
554template <class Abi> simd_mask<double, Abi> isinf(doublev<Abi> x);
555template <class Abi> simd_mask<long double, Abi> isinf(ldoublev<Abi> x);
556
557template <class Abi> simd_mask<float, Abi> isnan(floatv<Abi> x);
558template <class Abi> simd_mask<double, Abi> isnan(doublev<Abi> x);
559template <class Abi> simd_mask<long double, Abi> isnan(ldoublev<Abi> x);
560
561template <class Abi> simd_mask<float, Abi> isnormal(floatv<Abi> x);
562template <class Abi> simd_mask<double, Abi> isnormal(doublev<Abi> x);
563template <class Abi> simd_mask<long double, Abi> isnormal(ldoublev<Abi> x);
564
565template <class Abi> simd_mask<float, Abi> signbit(floatv<Abi> x);
566template <class Abi> simd_mask<double, Abi> signbit(doublev<Abi> x);
567template <class Abi> simd_mask<long double, Abi> signbit(ldoublev<Abi> x);
568
569template <class Abi> simd_mask<float, Abi> isgreater(floatv<Abi> x, floatv<Abi> y);
570template <class Abi> simd_mask<double, Abi> isgreater(doublev<Abi> x, doublev<Abi> y);
571template <class Abi> simd_mask<long double, Abi> isgreater(ldoublev<Abi> x, ldoublev<Abi> y);
572
573template <class Abi> simd_mask<float, Abi> isgreaterequal(floatv<Abi> x, floatv<Abi> y);
574template <class Abi> simd_mask<double, Abi> isgreaterequal(doublev<Abi> x, doublev<Abi> y);
575template <class Abi> simd_mask<long double, Abi> isgreaterequal(ldoublev<Abi> x, ldoublev<Abi> y);
576
577template <class Abi> simd_mask<float, Abi> isless(floatv<Abi> x, floatv<Abi> y);
578template <class Abi> simd_mask<double, Abi> isless(doublev<Abi> x, doublev<Abi> y);
579template <class Abi> simd_mask<long double, Abi> isless(ldoublev<Abi> x, ldoublev<Abi> y);
580
581template <class Abi> simd_mask<float, Abi> islessequal(floatv<Abi> x, floatv<Abi> y);
582template <class Abi> simd_mask<double, Abi> islessequal(doublev<Abi> x, doublev<Abi> y);
583template <class Abi> simd_mask<long double, Abi> islessequal(ldoublev<Abi> x, ldoublev<Abi> y);
584
585template <class Abi> simd_mask<float, Abi> islessgreater(floatv<Abi> x, floatv<Abi> y);
586template <class Abi> simd_mask<double, Abi> islessgreater(doublev<Abi> x, doublev<Abi> y);
587template <class Abi> simd_mask<long double, Abi> islessgreater(ldoublev<Abi> x, ldoublev<Abi> y);
588
589template <class Abi> simd_mask<float, Abi> isunordered(floatv<Abi> x, floatv<Abi> y);
590template <class Abi> simd_mask<double, Abi> isunordered(doublev<Abi> x, doublev<Abi> y);
591template <class Abi> simd_mask<long double, Abi> isunordered(ldoublev<Abi> x, ldoublev<Abi> y);
592
593template <class V> struct simd_div_t { V quot, rem; };
594template <class Abi> simd_div_t<scharv<Abi>> div(scharv<Abi> numer, scharv<Abi> denom);
595template <class Abi> simd_div_t<shortv<Abi>> div(shortv<Abi> numer, shortv<Abi> denom);
596template <class Abi> simd_div_t<intv<Abi>> div(intv<Abi> numer, intv<Abi> denom);
597template <class Abi> simd_div_t<longv<Abi>> div(longv<Abi> numer, longv<Abi> denom);
598template <class Abi> simd_div_t<llongv<Abi>> div(llongv<Abi> numer, llongv<Abi> denom);
599
600// [simd.mask.class]
601template <class T, class Abi>
602class simd_mask {
603public:
604  using value_type = bool;
605  using reference = see below;
606  using simd_type = simd<T, Abi>;
607  using abi_type = Abi;
608  static constexpr size_t size() noexcept;
609  simd_mask() = default;
610
611  // broadcast constructor
612  explicit simd_mask(value_type) noexcept;
613
614  // implicit type conversion constructor
615  template <class U> simd_mask(const simd_mask<U, simd_abi::fixed_size<size()>>&) noexcept;
616
617  // load constructor
618  template <class Flags> simd_mask(const value_type* mem, Flags);
619
620  // loads [simd.mask.copy]
621  template <class Flags> void copy_from(const value_type* mem, Flags);
622  template <class Flags> void copy_to(value_type* mem, Flags) const;
623
624  // scalar access [simd.mask.subscr]
625  reference operator[](size_t);
626  value_type operator[](size_t) const;
627
628  // unary operators [simd.mask.unary]
629  simd_mask operator!() const noexcept;
630
631  // simd_mask binary operators [simd.mask.binary]
632  friend simd_mask operator&&(const simd_mask&, const simd_mask&) noexcept;
633  friend simd_mask operator||(const simd_mask&, const simd_mask&) noexcept;
634  friend simd_mask operator& (const simd_mask&, const simd_mask&) noexcept;
635  friend simd_mask operator| (const simd_mask&, const simd_mask&) noexcept;
636  friend simd_mask operator^ (const simd_mask&, const simd_mask&) noexcept;
637
638  // simd_mask compound assignment [simd.mask.cassign]
639  friend simd_mask& operator&=(simd_mask&, const simd_mask&) noexcept;
640  friend simd_mask& operator|=(simd_mask&, const simd_mask&) noexcept;
641  friend simd_mask& operator^=(simd_mask&, const simd_mask&) noexcept;
642
643  // simd_mask compares [simd.mask.comparison]
644  friend simd_mask operator==(const simd_mask&, const simd_mask&) noexcept;
645  friend simd_mask operator!=(const simd_mask&, const simd_mask&) noexcept;
646};
647
648} // parallelism_v2
649} // std::experimental
650
651*/
652
653#include <__assert> // all public C++ headers provide the assertion handler
654#include <__functional/operations.h>
655#include <array>
656#include <cstddef>
657#include <experimental/__config>
658#include <tuple>
659
660#if !defined(_LIBCPP_HAS_NO_PRAGMA_SYSTEM_HEADER)
661#  pragma GCC system_header
662#endif
663
664_LIBCPP_PUSH_MACROS
665#include <__undef_macros>
666
667_LIBCPP_BEGIN_NAMESPACE_EXPERIMENTAL_SIMD
668
669#if _LIBCPP_STD_VER >= 17
670
// Selects which __simd_storage specialization a __simd_abi tag refers to.
enum class _StorageKind {
  _Scalar, // one element stored directly as a _Tp
  _Array,  // elements stored in a std::array
  _VecExt, // elements stored in a compiler vector-extension type
};
676
// Empty ABI tag type: pairs a storage kind with an element count. It is used
// purely as a template argument to pick specializations (storage, simd_size,
// is_abi_tag).
template <_StorageKind __kind, int _Np>
struct __simd_abi {};
679
// Primary template: empty. Element storage exists only in the partial
// specializations for specific __simd_abi tags.
template <class _Tp, class _Abi>
class __simd_storage {};
682
683template <class _Tp, int __num_element>
684class __simd_storage<_Tp, __simd_abi<_StorageKind::_Array, __num_element>> {
685  std::array<_Tp, __num_element> __storage_;
686
687  template <class, class>
688  friend struct simd;
689
690  template <class, class>
691  friend struct simd_mask;
692
693public:
694  _LIBCPP_HIDE_FROM_ABI _Tp __get(size_t __index) const noexcept { return __storage_[__index]; }
695  _LIBCPP_HIDE_FROM_ABI void __set(size_t __index, _Tp __val) noexcept {
696    __storage_[__index] = __val;
697  }
698};
699
700template <class _Tp>
701class __simd_storage<_Tp, __simd_abi<_StorageKind::_Scalar, 1>> {
702  _Tp __storage_;
703
704  template <class, class>
705  friend struct simd;
706
707  template <class, class>
708  friend struct simd_mask;
709
710public:
711  _LIBCPP_HIDE_FROM_ABI _Tp __get(size_t __index) const noexcept { return (&__storage_)[__index]; }
712  _LIBCPP_HIDE_FROM_ABI void __set(size_t __index, _Tp __val) noexcept {
713    (&__storage_)[__index] = __val;
714  }
715};
716
717#ifndef _LIBCPP_HAS_NO_VECTOR_EXTENSION
718
// Returns the largest power of two that is <= __val (and 0 for 0), by
// repeatedly clearing the lowest set bit until at most one bit remains.
_LIBCPP_HIDE_FROM_ABI constexpr size_t __floor_pow_of_2(size_t __val) {
  while ((__val & (__val - 1)) != 0) {
    __val &= __val - 1;
  }
  return __val;
}
723
724_LIBCPP_HIDE_FROM_ABI constexpr size_t __ceil_pow_of_2(size_t __val) {
725  return __val == 1 ? 1 : __floor_pow_of_2(__val - 1) << 1;
726}
727
// Maps an element type and a total size in bytes to a vector-extension type.
// On compilers that are not Clang-based, `type` is declared here with the
// byte size rounded by __ceil_pow_of_2. On Clang-based compilers this primary
// template has no `type` member.
template <class _Tp, size_t __bytes>
struct __vec_ext_traits {
#if !defined(_LIBCPP_COMPILER_CLANG_BASED)
  typedef _Tp type __attribute__((vector_size(__ceil_pow_of_2(__bytes))));
#endif
};
734
// Clang-based compilers: provide explicit __vec_ext_traits specializations,
// one per (element type, element count) pair for counts 1 through 32.
#if defined(_LIBCPP_COMPILER_CLANG_BASED)
// Specializes __vec_ext_traits for _NUM_ELEMENT elements of _TYPE; `type` is a
// vector of exactly sizeof(_TYPE) * _NUM_ELEMENT bytes (no rounding).
#define _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, _NUM_ELEMENT)                        \
  template <>                                                                  \
  struct __vec_ext_traits<_TYPE, sizeof(_TYPE) * _NUM_ELEMENT> {               \
    using type =                                                               \
        _TYPE __attribute__((vector_size(sizeof(_TYPE) * _NUM_ELEMENT)));      \
  }

// Expands _LIBCPP_SPECIALIZE_VEC_EXT for every element count from 1 to 32.
#define _LIBCPP_SPECIALIZE_VEC_EXT_32(_TYPE)                                   \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 1);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 2);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 3);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 4);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 5);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 6);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 7);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 8);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 9);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 10);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 11);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 12);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 13);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 14);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 15);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 16);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 17);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 18);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 19);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 20);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 21);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 22);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 23);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 24);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 25);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 26);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 27);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 28);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 29);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 30);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 31);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 32)

// Element types for which vector-extension storage is specialized.
_LIBCPP_SPECIALIZE_VEC_EXT_32(char);
_LIBCPP_SPECIALIZE_VEC_EXT_32(char16_t);
_LIBCPP_SPECIALIZE_VEC_EXT_32(char32_t);
_LIBCPP_SPECIALIZE_VEC_EXT_32(wchar_t);
_LIBCPP_SPECIALIZE_VEC_EXT_32(signed char);
_LIBCPP_SPECIALIZE_VEC_EXT_32(signed short);
_LIBCPP_SPECIALIZE_VEC_EXT_32(signed int);
_LIBCPP_SPECIALIZE_VEC_EXT_32(signed long);
_LIBCPP_SPECIALIZE_VEC_EXT_32(signed long long);
_LIBCPP_SPECIALIZE_VEC_EXT_32(unsigned char);
_LIBCPP_SPECIALIZE_VEC_EXT_32(unsigned short);
_LIBCPP_SPECIALIZE_VEC_EXT_32(unsigned int);
_LIBCPP_SPECIALIZE_VEC_EXT_32(unsigned long);
_LIBCPP_SPECIALIZE_VEC_EXT_32(unsigned long long);
_LIBCPP_SPECIALIZE_VEC_EXT_32(float);
_LIBCPP_SPECIALIZE_VEC_EXT_32(double);
_LIBCPP_SPECIALIZE_VEC_EXT_32(long double);

// The helper macros are local to this header; do not leak them.
#undef _LIBCPP_SPECIALIZE_VEC_EXT_32
#undef _LIBCPP_SPECIALIZE_VEC_EXT
#endif // _LIBCPP_COMPILER_CLANG_BASED
798
799template <class _Tp, int __num_element>
800class __simd_storage<_Tp, __simd_abi<_StorageKind::_VecExt, __num_element>> {
801  using _StorageType =
802      typename __vec_ext_traits<_Tp, sizeof(_Tp) * __num_element>::type;
803
804  _StorageType __storage_;
805
806  template <class, class>
807  friend struct simd;
808
809  template <class, class>
810  friend struct simd_mask;
811
812public:
813  _LIBCPP_HIDE_FROM_ABI _Tp __get(size_t __index) const noexcept { return __storage_[__index]; }
814  _LIBCPP_HIDE_FROM_ABI void __set(size_t __index, _Tp __val) noexcept {
815    __storage_[__index] = __val;
816  }
817};
818
819#endif // _LIBCPP_HAS_NO_VECTOR_EXTENSION
820
821template <class _Vp, class _Tp, class _Abi>
822class __simd_reference {
823  static_assert(std::is_same<_Vp, _Tp>::value, "");
824
825  template <class, class>
826  friend struct simd;
827
828  template <class, class>
829  friend struct simd_mask;
830
831  __simd_storage<_Tp, _Abi>* __ptr_;
832  size_t __index_;
833
834  _LIBCPP_HIDE_FROM_ABI __simd_reference(__simd_storage<_Tp, _Abi>* __ptr, size_t __index)
835      : __ptr_(__ptr), __index_(__index) {}
836
837  _LIBCPP_HIDE_FROM_ABI __simd_reference(const __simd_reference&) = default;
838
839public:
840  __simd_reference() = delete;
841  __simd_reference& operator=(const __simd_reference&) = delete;
842
843  _LIBCPP_HIDE_FROM_ABI operator _Vp() const { return __ptr_->__get(__index_); }
844
845  _LIBCPP_HIDE_FROM_ABI __simd_reference operator=(_Vp __value) && {
846    __ptr_->__set(__index_, __value);
847    return *this;
848  }
849
850  _LIBCPP_HIDE_FROM_ABI __simd_reference operator++() && {
851    return std::move(*this) = __ptr_->__get(__index_) + 1;
852  }
853
854  _LIBCPP_HIDE_FROM_ABI _Vp operator++(int) && {
855    auto __val = __ptr_->__get(__index_);
856    __ptr_->__set(__index_, __val + 1);
857    return __val;
858  }
859
860  _LIBCPP_HIDE_FROM_ABI __simd_reference operator--() && {
861    return std::move(*this) = __ptr_->__get(__index_) - 1;
862  }
863
864  _LIBCPP_HIDE_FROM_ABI _Vp operator--(int) && {
865    auto __val = __ptr_->__get(__index_);
866    __ptr_->__set(__index_, __val - 1);
867    return __val;
868  }
869
870  _LIBCPP_HIDE_FROM_ABI __simd_reference operator+=(_Vp __value) && {
871    return std::move(*this) = __ptr_->__get(__index_) + __value;
872  }
873
874  _LIBCPP_HIDE_FROM_ABI __simd_reference operator-=(_Vp __value) && {
875    return std::move(*this) = __ptr_->__get(__index_) - __value;
876  }
877
878  _LIBCPP_HIDE_FROM_ABI __simd_reference operator*=(_Vp __value) && {
879    return std::move(*this) = __ptr_->__get(__index_) * __value;
880  }
881
882  _LIBCPP_HIDE_FROM_ABI __simd_reference operator/=(_Vp __value) && {
883    return std::move(*this) = __ptr_->__get(__index_) / __value;
884  }
885
886  _LIBCPP_HIDE_FROM_ABI __simd_reference operator%=(_Vp __value) && {
887    return std::move(*this) = __ptr_->__get(__index_) % __value;
888  }
889
890  _LIBCPP_HIDE_FROM_ABI __simd_reference operator>>=(_Vp __value) && {
891    return std::move(*this) = __ptr_->__get(__index_) >> __value;
892  }
893
894  _LIBCPP_HIDE_FROM_ABI __simd_reference operator<<=(_Vp __value) && {
895    return std::move(*this) = __ptr_->__get(__index_) << __value;
896  }
897
898  _LIBCPP_HIDE_FROM_ABI __simd_reference operator&=(_Vp __value) && {
899    return std::move(*this) = __ptr_->__get(__index_) & __value;
900  }
901
902  _LIBCPP_HIDE_FROM_ABI __simd_reference operator|=(_Vp __value) && {
903    return std::move(*this) = __ptr_->__get(__index_) | __value;
904  }
905
906  _LIBCPP_HIDE_FROM_ABI __simd_reference operator^=(_Vp __value) && {
907    return std::move(*this) = __ptr_->__get(__index_) ^ __value;
908  }
909};
910
// Detection helper for "a _From can initialize a _To without narrowing".
// This overload only participates when the braced initialization
// _To{declval<_From>()} is well-formed; list-initialization rejects narrowing
// conversions, so a narrowing pair drops out and the variadic overload below
// is chosen instead.
template <class _To, class _From>
_LIBCPP_HIDE_FROM_ABI constexpr auto __is_non_narrowing_convertible_impl(_From)
    -> decltype(_To{std::declval<_From>()}, true) {
  return true;
}

// Fallback selected when the braced initialization above is ill-formed.
template <class _To>
_LIBCPP_HIDE_FROM_ABI constexpr auto __is_non_narrowing_convertible_impl(...) -> bool {
  return false;
}
921
922template <class _From, class _To>
923_LIBCPP_HIDE_FROM_ABI
924constexpr typename std::enable_if<std::is_arithmetic<_To>::value &&
925                                      std::is_arithmetic<_From>::value,
926                                  bool>::type
927__is_non_narrowing_arithmetic_convertible() {
928  return experimental::__is_non_narrowing_convertible_impl<_To>(_From{});
929}
930
931template <class _From, class _To>
932_LIBCPP_HIDE_FROM_ABI
933constexpr typename std::enable_if<!(std::is_arithmetic<_To>::value &&
934                                    std::is_arithmetic<_From>::value),
935                                  bool>::type
936__is_non_narrowing_arithmetic_convertible() {
937  return false;
938}
939
940template <class _Tp>
941_LIBCPP_HIDE_FROM_ABI constexpr _Tp __variadic_sum() {
942  return _Tp{};
943}
944
945template <class _Tp, class _Up, class... _Args>
946_LIBCPP_HIDE_FROM_ABI constexpr _Tp __variadic_sum(_Up __first, _Args... __rest) {
947  return static_cast<_Tp>(__first) + experimental::__variadic_sum<_Tp>(__rest...);
948}
949
// Identity wrapper: `typename __nodeduce<T>::type` is T, but naming a
// parameter type this way places T in a non-deduced context, so that
// parameter does not take part in template argument deduction.
template <class _Tp>
struct __nodeduce {
  using type = _Tp;
};
954
// True when _Tp may be used as a simd element type here: an arithmetic type
// that is not bool and carries no const or volatile qualifier.
template <class _Tp>
_LIBCPP_HIDE_FROM_ABI constexpr bool __vectorizable() {
  if (std::is_same<_Tp, bool>::value) {
    return false;
  }
  if (std::is_const<_Tp>::value || std::is_volatile<_Tp>::value) {
    return false;
  }
  return std::is_arithmetic<_Tp>::value;
}
960
961_LIBCPP_END_NAMESPACE_EXPERIMENTAL_SIMD
962_LIBCPP_BEGIN_NAMESPACE_EXPERIMENTAL_SIMD_ABI
963
// ABI tag for a single element (selects the _Scalar storage).
using scalar = __simd_abi<_StorageKind::_Scalar, 1>;

// ABI tag for exactly _Np elements (selects the _Array storage).
template <int _Np>
using fixed_size = __simd_abi<_StorageKind::_Array, _Np>;
968
// Upper bound on the element count supported for fixed_size with element
// type _Tp. Declared as `int`, as the synopsis at the top of this header
// specifies, which also matches the `int` count parameter of fixed_size.
template <class _Tp>
inline constexpr int max_fixed_size = 32;
971
// Default ABI for _Tp: a fixed_size tag whose element count is
// 16 / sizeof(_Tp) (integer division).
template <class _Tp>
using compatible = fixed_size<16 / sizeof(_Tp)>;
974
975#ifndef _LIBCPP_HAS_NO_VECTOR_EXTENSION
976template <class _Tp>
977using native = __simd_abi<_StorageKind::_VecExt,
978                          _LIBCPP_NATIVE_SIMD_WIDTH_IN_BYTES / sizeof(_Tp)>;
979#else
980template <class _Tp>
981using native =
982    fixed_size<_Tp, _LIBCPP_NATIVE_SIMD_WIDTH_IN_BYTES / sizeof(_Tp)>;
983#endif // _LIBCPP_HAS_NO_VECTOR_EXTENSION
984
985_LIBCPP_END_NAMESPACE_EXPERIMENTAL_SIMD_ABI
986_LIBCPP_BEGIN_NAMESPACE_EXPERIMENTAL_SIMD
987
// Forward declarations of the two main class templates. The ABI defaults to
// simd_abi::compatible<_Tp> when it is not given.
template <class _Tp, class _Abi = simd_abi::compatible<_Tp>>
class simd;
template <class _Tp, class _Abi = simd_abi::compatible<_Tp>>
class simd_mask;
992
// Empty flag types passed to the load/store functions, together with one
// constant instance of each. These are the types is_simd_flag_type accepts.
struct element_aligned_tag {};
struct vector_aligned_tag {};
template <size_t>
struct overaligned_tag {};
inline constexpr element_aligned_tag element_aligned{};
inline constexpr vector_aligned_tag vector_aligned{};
template <size_t _Np>
inline constexpr overaligned_tag<_Np> overaligned{};
1001
1002// traits [simd.traits]
1003template <class _Tp>
1004struct is_abi_tag : std::integral_constant<bool, false> {};
1005
1006template <_StorageKind __kind, int _Np>
1007struct is_abi_tag<__simd_abi<__kind, _Np>>
1008    : std::integral_constant<bool, true> {};
1009
1010template <class _Tp>
1011struct is_simd : std::integral_constant<bool, false> {};
1012
1013template <class _Tp, class _Abi>
1014struct is_simd<simd<_Tp, _Abi>> : std::integral_constant<bool, true> {};
1015
1016template <class _Tp>
1017struct is_simd_mask : std::integral_constant<bool, false> {};
1018
1019template <class _Tp, class _Abi>
1020struct is_simd_mask<simd_mask<_Tp, _Abi>> : std::integral_constant<bool, true> {
1021};
1022
1023template <class _Tp>
1024struct is_simd_flag_type : std::integral_constant<bool, false> {};
1025
1026template <>
1027struct is_simd_flag_type<element_aligned_tag>
1028    : std::integral_constant<bool, true> {};
1029
1030template <>
1031struct is_simd_flag_type<vector_aligned_tag>
1032    : std::integral_constant<bool, true> {};
1033
1034template <size_t _Align>
1035struct is_simd_flag_type<overaligned_tag<_Align>>
1036    : std::integral_constant<bool, true> {};
1037
// Variable-template shorthands for the ::value member of the traits above.
template <class _Tp>
inline constexpr bool is_abi_tag_v = is_abi_tag<_Tp>::value;
template <class _Tp>
inline constexpr bool is_simd_v = is_simd<_Tp>::value;
template <class _Tp>
inline constexpr bool is_simd_mask_v = is_simd_mask<_Tp>::value;
template <class _Tp>
inline constexpr bool is_simd_flag_type_v = is_simd_flag_type<_Tp>::value;
// abi_for_size<T, N>::type names the ABI tag to use for N elements of T.
// This implementation always yields simd_abi::fixed_size<N>; T is unused.
template <class _Tp, size_t _Np>
struct abi_for_size {
  using type = simd_abi::fixed_size<_Np>;
};
// Shorthand for abi_for_size<T, N>::type.
template <class _Tp, size_t _Np>
using abi_for_size_t = typename abi_for_size<_Tp, _Np>::type;
1052
// simd_size<T, Abi>: the number of elements of a simd<T, Abi>. Only the
// partial specialization for __simd_abi tags is defined; its value is the
// element count _Np carried by the tag.
template <class _Tp, class _Abi = simd_abi::compatible<_Tp>>
struct simd_size;

template <class _Tp, _StorageKind __kind, int _Np>
struct simd_size<_Tp, __simd_abi<__kind, _Np>>
    : std::integral_constant<size_t, _Np> {
  // Rejects non-arithmetic element types and bool (the bool comparison is
  // made after __remove_const_t is applied to _Tp).
  static_assert(
      std::is_arithmetic<_Tp>::value &&
          !std::is_same<__remove_const_t<_Tp>, bool>::value,
      "Element type should be vectorizable");
};
1064
// TODO: implement it.
// memory_alignment is only declared; no definition is provided here, so
// memory_alignment_v below cannot be instantiated yet.
template <class _Tp, class _Up = typename _Tp::value_type>
struct memory_alignment;

// Shorthand for simd_size<T, Abi>::value.
template <class _Tp, class _Abi = simd_abi::compatible<_Tp>>
inline constexpr size_t simd_size_v = simd_size<_Tp, _Abi>::value;

// Shorthand for memory_alignment<T, U>::value.
template <class _Tp, class _Up = typename _Tp::value_type>
inline constexpr size_t memory_alignment_v = memory_alignment<_Tp, _Up>::value;
1074
// class template simd [simd.class]
// Aliases for simd with the native ABI and with a fixed element count.
template <class _Tp>
using native_simd = simd<_Tp, simd_abi::native<_Tp>>;
template <class _Tp, int _Np>
using fixed_size_simd = simd<_Tp, simd_abi::fixed_size<_Np>>;

// class template simd_mask [simd.mask.class]
// Aliases for simd_mask with the native ABI and with a fixed element count.
template <class _Tp>
using native_simd_mask = simd_mask<_Tp, simd_abi::native<_Tp>>;

template <class _Tp, int _Np>
using fixed_size_simd_mask = simd_mask<_Tp, simd_abi::fixed_size<_Np>>;
1087
// casts [simd.casts]
// Return-type computation for static_simd_cast<_Tp>. __apply is declared
// but not defined in this section.
//
// Primary template (_Tp is an element type): the result keeps the source ABI
// and changes the element type to _Tp.
template <class _Tp>
struct __static_simd_cast_traits {
  template <class _Up, class _Abi>
  static simd<_Tp, _Abi> __apply(const simd<_Up, _Abi>& __v);
};

// Specialization for a simd target type: the result is that simd type, and
// __apply only participates when source and target have the same size().
template <class _Tp, class _NewAbi>
struct __static_simd_cast_traits<simd<_Tp, _NewAbi>> {
  template <class _Up, class _Abi>
  static typename std::enable_if<simd<_Up, _Abi>::size() ==
                                     simd<_Tp, _NewAbi>::size(),
                                 simd<_Tp, _NewAbi>>::type
  __apply(const simd<_Up, _Abi>& __v);
};
1103
// Return-type computation for simd_cast<_Tp>. Same shape as
// __static_simd_cast_traits, with the extra requirement that the element
// conversion _Up -> _Tp is a non-narrowing arithmetic conversion. __apply is
// declared but not defined in this section.
//
// Primary template (_Tp is an element type): the result keeps the source ABI.
template <class _Tp>
struct __simd_cast_traits {
  template <class _Up, class _Abi>
  static typename std::enable_if<
      __is_non_narrowing_arithmetic_convertible<_Up, _Tp>(),
      simd<_Tp, _Abi>>::type
  __apply(const simd<_Up, _Abi>& __v);
};

// Specialization for a simd target type: additionally requires that source
// and target have the same size().
template <class _Tp, class _NewAbi>
struct __simd_cast_traits<simd<_Tp, _NewAbi>> {
  template <class _Up, class _Abi>
  static typename std::enable_if<
      __is_non_narrowing_arithmetic_convertible<_Up, _Tp>() &&
          simd<_Up, _Abi>::size() == simd<_Tp, _NewAbi>::size(),
      simd<_Tp, _NewAbi>>::type
  __apply(const simd<_Up, _Abi>& __v);
};
1122
// simd_cast<_Tp>(v): forwards to __simd_cast_traits<_Tp>::__apply. The
// trailing return type repeats the call expression, so this overload is
// removed from overload resolution whenever __apply is not viable.
template <class _Tp, class _Up, class _Abi>
_LIBCPP_HIDE_FROM_ABI auto simd_cast(const simd<_Up, _Abi>& __v)
    -> decltype(__simd_cast_traits<_Tp>::__apply(__v)) {
  return __simd_cast_traits<_Tp>::__apply(__v);
}
1128
// static_simd_cast<_Tp>(v): forwards to
// __static_simd_cast_traits<_Tp>::__apply. The trailing return type repeats
// the call expression, so this overload is removed from overload resolution
// whenever __apply is not viable.
template <class _Tp, class _Up, class _Abi>
_LIBCPP_HIDE_FROM_ABI auto static_simd_cast(const simd<_Up, _Abi>& __v)
    -> decltype(__static_simd_cast_traits<_Tp>::__apply(__v)) {
  return __static_simd_cast_traits<_Tp>::__apply(__v);
}
1134
// to_fixed_size: declared for simd and simd_mask; the result uses the
// fixed_size ABI with the same element count as the argument
// (simd_size<_Tp, _Abi>::value). Declarations only in this section.
template <class _Tp, class _Abi>
fixed_size_simd<_Tp, simd_size<_Tp, _Abi>::value>
to_fixed_size(const simd<_Tp, _Abi>&) noexcept;

template <class _Tp, class _Abi>
fixed_size_simd_mask<_Tp, simd_size<_Tp, _Abi>::value>
to_fixed_size(const simd_mask<_Tp, _Abi>&) noexcept;
1142
1143template <class _Tp, size_t _Np>
1144native_simd<_Tp> to_native(const fixed_size_simd<_Tp, _Np>&) noexcept;
1145
1146template <class _Tp, size_t _Np>
1147native_simd_mask<_Tp> to_native(const fixed_size_simd_mask<_Tp, _Np>&) noexcept;
1148
1149template <class _Tp, size_t _Np>
1150simd<_Tp> to_compatible(const fixed_size_simd<_Tp, _Np>&) noexcept;
1151
1152template <class _Tp, size_t _Np>
1153simd_mask<_Tp> to_compatible(const fixed_size_simd_mask<_Tp, _Np>&) noexcept;
1154
// split: declarations only in this section.
//
// Explicit-sizes form: returns a tuple with one simd (or simd_mask) per
// entry of __sizes, each using abi_for_size_t for that size.
template <size_t... __sizes, class _Tp, class _Abi>
tuple<simd<_Tp, abi_for_size_t<_Tp, __sizes>>...> split(const simd<_Tp, _Abi>&);

template <size_t... __sizes, class _Tp, class _Abi>
tuple<simd_mask<_Tp, abi_for_size_t<_Tp, __sizes>>...>
split(const simd_mask<_Tp, _Abi>&);

// Target-type form: returns an array of _SimdType whose length is the
// argument's element count divided by _SimdType::size() (integer division).
template <class _SimdType, class _Abi>
array<_SimdType, simd_size<typename _SimdType::value_type, _Abi>::value /
                     _SimdType::size()>
split(const simd<typename _SimdType::value_type, _Abi>&);

template <class _SimdType, class _Abi>
array<_SimdType, simd_size<typename _SimdType::value_type, _Abi>::value /
                     _SimdType::size()>
split(const simd_mask<typename _SimdType::value_type, _Abi>&);
1171
1172template <class _Tp, class... _Abis>
1173simd<_Tp, abi_for_size_t<_Tp, experimental::__variadic_sum(simd_size<_Tp, _Abis>::value...)>>
1174concat(const simd<_Tp, _Abis>&...);
1175
1176template <class _Tp, class... _Abis>
1177simd_mask<_Tp,
1178          abi_for_size_t<_Tp, experimental::__variadic_sum(simd_size<_Tp, _Abis>::value...)>>
1179concat(const simd_mask<_Tp, _Abis>&...);
1180
// reductions [simd.mask.reductions]
// Declarations only in this section: each reduction is declared once for
// simd_mask arguments and once for a plain bool.
template <class _Tp, class _Abi>
bool all_of(const simd_mask<_Tp, _Abi>&) noexcept;
template <class _Tp, class _Abi>
bool any_of(const simd_mask<_Tp, _Abi>&) noexcept;
template <class _Tp, class _Abi>
bool none_of(const simd_mask<_Tp, _Abi>&) noexcept;
template <class _Tp, class _Abi>
bool some_of(const simd_mask<_Tp, _Abi>&) noexcept;
template <class _Tp, class _Abi>
int popcount(const simd_mask<_Tp, _Abi>&) noexcept;
// Unlike the overloads above, the two find_* mask overloads are not noexcept.
template <class _Tp, class _Abi>
int find_first_set(const simd_mask<_Tp, _Abi>&);
template <class _Tp, class _Abi>
int find_last_set(const simd_mask<_Tp, _Abi>&);
// Overloads taking a single bool.
bool all_of(bool) noexcept;
bool any_of(bool) noexcept;
bool none_of(bool) noexcept;
bool some_of(bool) noexcept;
int popcount(bool) noexcept;
int find_first_set(bool) noexcept;
int find_last_set(bool) noexcept;
1203
// masked assignment [simd.whereexpr]
// Forward declarations, needed by the where() and reduce() declarations that
// follow.
template <class _MaskType, class _Tp>
class const_where_expression;
template <class _MaskType, class _Tp>
class where_expression;
1209
// masked assignment [simd.mask.where]
// Declarations only in this section. Each where() pairs a mask with a value
// and returns a where_expression for a mutable value or a
// const_where_expression for a const one.

// simd value selected by its own mask_type.
template <class _Tp, class _Abi>
where_expression<simd_mask<_Tp, _Abi>, simd<_Tp, _Abi>>
where(const typename simd<_Tp, _Abi>::mask_type&, simd<_Tp, _Abi>&) noexcept;

template <class _Tp, class _Abi>
const_where_expression<simd_mask<_Tp, _Abi>, const simd<_Tp, _Abi>>
where(const typename simd<_Tp, _Abi>::mask_type&,
      const simd<_Tp, _Abi>&) noexcept;

// simd_mask value selected by a mask. The first parameter is written through
// __nodeduce, so _Tp and _Abi are deduced from the second argument only.
template <class _Tp, class _Abi>
where_expression<simd_mask<_Tp, _Abi>, simd_mask<_Tp, _Abi>>
where(const typename __nodeduce<simd_mask<_Tp, _Abi>>::type&,
      simd_mask<_Tp, _Abi>&) noexcept;

template <class _Tp, class _Abi>
const_where_expression<simd_mask<_Tp, _Abi>, const simd_mask<_Tp, _Abi>>
where(const typename __nodeduce<simd_mask<_Tp, _Abi>>::type&,
      const simd_mask<_Tp, _Abi>&) noexcept;

// Arbitrary value selected by a single bool.
template <class _Tp>
where_expression<bool, _Tp> where(bool, _Tp&) noexcept;

template <class _Tp>
const_where_expression<bool, const _Tp> where(bool, const _Tp&) noexcept;
1235
// reductions [simd.reductions]
// Declarations only in this section.

// Reduction over all elements of a simd; the operation defaults to
// std::plus<_Tp>.
template <class _Tp, class _Abi, class _BinaryOp = std::plus<_Tp>>
_Tp reduce(const simd<_Tp, _Abi>&, _BinaryOp = _BinaryOp());

// Masked reduction with a caller-supplied neutral element and operation.
template <class _MaskType, class _SimdType, class _BinaryOp>
typename _SimdType::value_type
reduce(const const_where_expression<_MaskType, _SimdType>&,
       typename _SimdType::value_type __neutral_element, _BinaryOp);

// Masked reductions for the standard function objects; these overloads take
// no neutral-element argument. plus is the default operation.
template <class _MaskType, class _SimdType>
typename _SimdType::value_type
reduce(const const_where_expression<_MaskType, _SimdType>&,
       plus<typename _SimdType::value_type> = {});

template <class _MaskType, class _SimdType>
typename _SimdType::value_type
reduce(const const_where_expression<_MaskType, _SimdType>&,
       multiplies<typename _SimdType::value_type>);

template <class _MaskType, class _SimdType>
typename _SimdType::value_type
reduce(const const_where_expression<_MaskType, _SimdType>&,
       bit_and<typename _SimdType::value_type>);

template <class _MaskType, class _SimdType>
typename _SimdType::value_type
reduce(const const_where_expression<_MaskType, _SimdType>&,
       bit_or<typename _SimdType::value_type>);

template <class _MaskType, class _SimdType>
typename _SimdType::value_type
reduce(const const_where_expression<_MaskType, _SimdType>&,
       bit_xor<typename _SimdType::value_type>);

// hmin / hmax, each declared for a whole simd and for a masked expression.
template <class _Tp, class _Abi>
_Tp hmin(const simd<_Tp, _Abi>&);
template <class _MaskType, class _SimdType>
typename _SimdType::value_type
hmin(const const_where_expression<_MaskType, _SimdType>&);
template <class _Tp, class _Abi>
_Tp hmax(const simd<_Tp, _Abi>&);
template <class _MaskType, class _SimdType>
typename _SimdType::value_type
hmax(const const_where_expression<_MaskType, _SimdType>&);
1280
// algorithms [simd.alg]
// Declarations only in this section. All operands and results share one simd
// type; clamp is the only one of the four that is not declared noexcept.
template <class _Tp, class _Abi>
simd<_Tp, _Abi> min(const simd<_Tp, _Abi>&, const simd<_Tp, _Abi>&) noexcept;

template <class _Tp, class _Abi>
simd<_Tp, _Abi> max(const simd<_Tp, _Abi>&, const simd<_Tp, _Abi>&) noexcept;

template <class _Tp, class _Abi>
std::pair<simd<_Tp, _Abi>, simd<_Tp, _Abi>>
minmax(const simd<_Tp, _Abi>&, const simd<_Tp, _Abi>&) noexcept;

template <class _Tp, class _Abi>
simd<_Tp, _Abi> clamp(const simd<_Tp, _Abi>&, const simd<_Tp, _Abi>&,
                      const simd<_Tp, _Abi>&);
1295
// [simd.whereexpr]
// TODO implement where expressions.
// Read-only masked view. This is an interface stub: it has no data members
// and its member functions are declared but not defined here. Copy
// construction and copy assignment are deleted, and the remaining operations
// are const&&-qualified, so they apply to temporaries only.
template <class _MaskType, class _Tp>
class const_where_expression {
public:
  const_where_expression(const const_where_expression&) = delete;
  const_where_expression& operator=(const const_where_expression&) = delete;
  // Result type is _Tp with const removed.
  __remove_const_t<_Tp> operator-() const&&;
  template <class _Up, class _Flags>
  void copy_to(_Up*, _Flags) const&&;
};
1307
// Mutable masked view: derives from const_where_expression and adds the
// assignment, compound-assignment, increment/decrement and copy_from
// operations. This is an interface stub: every member function is declared
// but not defined here, and all of them return void. Copy construction and
// copy assignment are deleted.
template <class _MaskType, class _Tp>
class where_expression : public const_where_expression<_MaskType, _Tp> {
public:
  where_expression(const where_expression&) = delete;
  where_expression& operator=(const where_expression&) = delete;
  // Assignment and compound assignment from an arbitrary operand type.
  template <class _Up>
  void operator=(_Up&&);
  template <class _Up>
  void operator+=(_Up&&);
  template <class _Up>
  void operator-=(_Up&&);
  template <class _Up>
  void operator*=(_Up&&);
  template <class _Up>
  void operator/=(_Up&&);
  template <class _Up>
  void operator%=(_Up&&);
  template <class _Up>
  void operator&=(_Up&&);
  template <class _Up>
  void operator|=(_Up&&);
  template <class _Up>
  void operator^=(_Up&&);
  template <class _Up>
  void operator<<=(_Up&&);
  template <class _Up>
  void operator>>=(_Up&&);
  // Prefix and postfix increment / decrement.
  void operator++();
  void operator++(int);
  void operator--();
  void operator--(int);
  // Load from memory, with a flag argument.
  template <class _Up, class _Flags>
  void copy_from(const _Up*, _Flags);
};
1342
1343// [simd.class]
1344// TODO: implement simd
1345template <class _Tp, class _Abi>
1346class simd {
1347public:
1348  using value_type = _Tp;
1349  using reference = __simd_reference<_Tp, _Tp, _Abi>;
1350  using mask_type = simd_mask<_Tp, _Abi>;
1351  using abi_type = _Abi;
1352
1353  _LIBCPP_HIDE_FROM_ABI simd() = default;
1354  _LIBCPP_HIDE_FROM_ABI simd(const simd&) = default;
1355  _LIBCPP_HIDE_FROM_ABI simd& operator=(const simd&) = default;
1356
1357  static _LIBCPP_HIDE_FROM_ABI constexpr size_t size() noexcept {
1358    return simd_size<_Tp, _Abi>::value;
1359  }
1360
1361private:
1362  __simd_storage<_Tp, _Abi> __s_;
1363
1364  template <class _Up>
1365  static _LIBCPP_HIDE_FROM_ABI constexpr bool __can_broadcast() {
1366    return (std::is_arithmetic<_Up>::value &&
1367            __is_non_narrowing_arithmetic_convertible<_Up, _Tp>()) ||
1368           (!std::is_arithmetic<_Up>::value &&
1369            std::is_convertible<_Up, _Tp>::value) ||
1370           std::is_same<__remove_const_t<_Up>, int>::value ||
1371           (std::is_same<__remove_const_t<_Up>,
1372                         unsigned int>::value &&
1373            std::is_unsigned<_Tp>::value);
1374  }
1375
1376  template <class _Generator, size_t... __indicies>
1377  static _LIBCPP_HIDE_FROM_ABI constexpr decltype(
1378      std::forward_as_tuple(std::declval<_Generator>()(
1379          std::integral_constant<size_t, __indicies>())...),
1380      bool())
1381  __can_generate(std::index_sequence<__indicies...>) {
1382    return !experimental::__variadic_sum<bool>(
1383        !__can_broadcast<decltype(std::declval<_Generator>()(
1384            std::integral_constant<size_t, __indicies>()))>()...);
1385  }
1386
1387  template <class _Generator>
1388  static _LIBCPP_HIDE_FROM_ABI bool __can_generate(...) {
1389    return false;
1390  }
1391
1392  template <class _Generator, size_t... __indicies>
1393  _LIBCPP_HIDE_FROM_ABI void __generator_init(_Generator&& __g, std::index_sequence<__indicies...>) {
1394    int __not_used[]{((*this)[__indicies] =
1395                          __g(std::integral_constant<size_t, __indicies>()),
1396                      0)...};
1397    (void)__not_used;
1398  }
1399
1400public:
1401  // implicit type conversion constructor
1402  template <class _Up,
1403            class = typename std::enable_if<
1404                std::is_same<_Abi, simd_abi::fixed_size<size()>>::value &&
1405                __is_non_narrowing_arithmetic_convertible<_Up, _Tp>()>::type>
1406  _LIBCPP_HIDE_FROM_ABI simd(const simd<_Up, simd_abi::fixed_size<size()>>& __v) {
1407    for (size_t __i = 0; __i < size(); __i++) {
1408      (*this)[__i] = static_cast<_Tp>(__v[__i]);
1409    }
1410  }
1411
1412  // implicit broadcast constructor
1413  template <class _Up,
1414            class = typename std::enable_if<__can_broadcast<_Up>()>::type>
1415  _LIBCPP_HIDE_FROM_ABI simd(_Up&& __rv) {
1416    auto __v = static_cast<_Tp>(__rv);
1417    for (size_t __i = 0; __i < size(); __i++) {
1418      (*this)[__i] = __v;
1419    }
1420  }
1421
1422  // generator constructor
1423  template <class _Generator,
1424            int = typename std::enable_if<
1425                __can_generate<_Generator>(std::make_index_sequence<size()>()),
1426                int>::type()>
1427  explicit _LIBCPP_HIDE_FROM_ABI simd(_Generator&& __g) {
1428    __generator_init(std::forward<_Generator>(__g),
1429                     std::make_index_sequence<size()>());
1430  }
1431
1432  // load constructor
1433  template <
1434      class _Up, class _Flags,
1435      class = typename std::enable_if<__vectorizable<_Up>()>::type,
1436      class = typename std::enable_if<is_simd_flag_type<_Flags>::value>::type>
1437  _LIBCPP_HIDE_FROM_ABI simd(const _Up* __buffer, _Flags) {
1438    // TODO: optimize for overaligned flags
1439    for (size_t __i = 0; __i < size(); __i++) {
1440      (*this)[__i] = static_cast<_Tp>(__buffer[__i]);
1441    }
1442  }
1443
1444  // loads [simd.load]
1445  template <class _Up, class _Flags>
1446  typename std::enable_if<__vectorizable<_Up>() &&
1447                          is_simd_flag_type<_Flags>::value>::type
1448  _LIBCPP_HIDE_FROM_ABI copy_from(const _Up* __buffer, _Flags) {
1449    *this = simd(__buffer, _Flags());
1450  }
1451
1452  // stores [simd.store]
1453  template <class _Up, class _Flags>
1454  typename std::enable_if<__vectorizable<_Up>() &&
1455                          is_simd_flag_type<_Flags>::value>::type
1456  _LIBCPP_HIDE_FROM_ABI copy_to(_Up* __buffer, _Flags) const {
1457    // TODO: optimize for overaligned flags
1458    for (size_t __i = 0; __i < size(); __i++) {
1459      __buffer[__i] = static_cast<_Up>((*this)[__i]);
1460    }
1461  }
1462
1463  // scalar access [simd.subscr]
1464  _LIBCPP_HIDE_FROM_ABI reference operator[](size_t __i) { return reference(&__s_, __i); }
1465
1466  _LIBCPP_HIDE_FROM_ABI value_type operator[](size_t __i) const { return __s_.__get(__i); }
1467
1468  // unary operators [simd.unary]
1469  simd& operator++();
1470  simd operator++(int);
1471  simd& operator--();
1472  simd operator--(int);
1473  mask_type operator!() const;
1474  simd operator~() const;
1475  simd operator+() const;
1476  simd operator-() const;
1477
#if 0
  // NOTE: everything from here to the matching #endif is excluded from
  // compilation by `#if 0`, so none of these friend operators are actually
  // declared for simd.
  // NOTE(review): presumably kept as a placeholder listing operators that are
  // still to be implemented -- confirm before relying on any of them.

  // binary operators [simd.binary]
  friend simd operator+(const simd&, const simd&);
  friend simd operator-(const simd&, const simd&);
  friend simd operator*(const simd&, const simd&);
  friend simd operator/(const simd&, const simd&);
  friend simd operator%(const simd&, const simd&);
  friend simd operator&(const simd&, const simd&);
  friend simd operator|(const simd&, const simd&);
  friend simd operator^(const simd&, const simd&);
  friend simd operator<<(const simd&, const simd&);
  friend simd operator>>(const simd&, const simd&);
  // Shift overloads taking a single int on the right-hand side.
  friend simd operator<<(const simd&, int);
  friend simd operator>>(const simd&, int);

  // compound assignment [simd.cassign]
  friend simd& operator+=(simd&, const simd&);
  friend simd& operator-=(simd&, const simd&);
  friend simd& operator*=(simd&, const simd&);
  friend simd& operator/=(simd&, const simd&);
  friend simd& operator%=(simd&, const simd&);

  friend simd& operator&=(simd&, const simd&);
  friend simd& operator|=(simd&, const simd&);
  friend simd& operator^=(simd&, const simd&);
  friend simd& operator<<=(simd&, const simd&);
  friend simd& operator>>=(simd&, const simd&);
  // Shift-assign overloads taking a single int on the right-hand side.
  friend simd& operator<<=(simd&, int);
  friend simd& operator>>=(simd&, int);

  // compares [simd.comparison]
  // Each comparison is declared to return mask_type rather than bool.
  friend mask_type operator==(const simd&, const simd&);
  friend mask_type operator!=(const simd&, const simd&);
  friend mask_type operator>=(const simd&, const simd&);
  friend mask_type operator<=(const simd&, const simd&);
  friend mask_type operator>(const simd&, const simd&);
  friend mask_type operator<(const simd&, const simd&);
#endif
1516};
1517
1518// [simd.mask.class]
// Mask class template paired with simd<_Tp, _Abi> (see simd_type below).
// Apart from the defaulted default constructor, every member in this class
// body is only declared; no definitions appear inside the class.
template <class _Tp, class _Abi>
// TODO: implement simd_mask
class simd_mask {
public:
  // Element type of the mask.
  using value_type = bool;
  // TODO: this is a strawman implementation. Turn it into a proxy type.
  using reference = bool&;
  // The simd specialization with the same element type and ABI tag.
  using simd_type = simd<_Tp, _Abi>;
  using abi_type = _Abi;
  // Number of elements; declared constexpr and noexcept, not defined here.
  static constexpr size_t size() noexcept;
  _LIBCPP_HIDE_FROM_ABI simd_mask() = default;

  // broadcast constructor
  // Explicit, so a bool does not implicitly convert to a simd_mask.
  explicit simd_mask(value_type) noexcept;

  // implicit type conversion constructor
  // Accepts a simd_mask over any element type _Up whose ABI tag is
  // simd_abi::fixed_size<size()>.
  template <class _Up>
  simd_mask(const simd_mask<_Up, simd_abi::fixed_size<size()>>&) noexcept;

  // load constructor
  // Takes a pointer to const bool plus a flag object of type _Flags.
  // Unlike the simd copy_from/copy_to members, _Flags is not constrained in
  // this declaration.
  template <class _Flags>
  simd_mask(const value_type*, _Flags);

  // loads [simd.mask.copy]
  template <class _Flags>
  void copy_from(const value_type*, _Flags);
  // Store counterpart of copy_from; const, so it does not modify the mask.
  template <class _Flags>
  void copy_to(value_type*, _Flags) const;

  // scalar access [simd.mask.subscr]
  // Non-const access returns `reference` (currently bool&); const access
  // returns the element by value.
  reference operator[](size_t);
  value_type operator[](size_t) const;

  // unary operators [simd.mask.unary]
  simd_mask operator!() const noexcept;

#if 0
  // NOTE: everything from here to the matching #endif is excluded from
  // compilation by `#if 0`, so none of these friend operators are actually
  // declared for simd_mask.

  // simd_mask binary operators [simd.mask.binary]
  friend simd_mask operator&&(const simd_mask&, const simd_mask&) noexcept;
  friend simd_mask operator||(const simd_mask&, const simd_mask&) noexcept;
  friend simd_mask operator&(const simd_mask&, const simd_mask&)noexcept;
  friend simd_mask operator|(const simd_mask&, const simd_mask&) noexcept;
  friend simd_mask operator^(const simd_mask&, const simd_mask&) noexcept;

  // simd_mask compound assignment [simd.mask.cassign]
  friend simd_mask& operator&=(simd_mask&, const simd_mask&) noexcept;
  friend simd_mask& operator|=(simd_mask&, const simd_mask&) noexcept;
  friend simd_mask& operator^=(simd_mask&, const simd_mask&) noexcept;

  // simd_mask compares [simd.mask.comparison]
  // Both comparisons are declared to return a simd_mask rather than bool.
  friend simd_mask operator==(const simd_mask&, const simd_mask&) noexcept;
  friend simd_mask operator!=(const simd_mask&, const simd_mask&) noexcept;
#endif
};
1573
1574#endif // _LIBCPP_STD_VER >= 17
1575
1576_LIBCPP_END_NAMESPACE_EXPERIMENTAL_SIMD
1577
1578_LIBCPP_POP_MACROS
1579
1580#if !defined(_LIBCPP_REMOVE_TRANSITIVE_INCLUDES) && _LIBCPP_STD_VER <= 20
1581#  include <algorithm>
1582#  include <functional>
1583#endif
1584
1585#endif /* _LIBCPP_EXPERIMENTAL_SIMD */
1586