blob: 4876ccb82d20756820494d4437aa0e2fe5da12bf [file] [log] [blame]
Tim Shen158e51b2018-04-23 21:54:06 +00001// -*- C++ -*-
2//===------------------------------- simd ---------------------------------===//
3//
4// The LLVM Compiler Infrastructure
5//
6// This file is dual licensed under the MIT and the University of Illinois Open
7// Source Licenses. See LICENSE.TXT for details.
8//
9//===----------------------------------------------------------------------===//
10#ifndef _LIBCPP_EXPERIMENTAL_SIMD
11#define _LIBCPP_EXPERIMENTAL_SIMD
12
13/*
14 experimental/simd synopsis
15
16namespace std::experimental {
17
18inline namespace parallelism_v2 {
19
20namespace simd_abi {
21
22struct scalar {};
23template <int N> struct fixed_size {};
24template <typename T> inline constexpr int max_fixed_size = implementation-defined;
25template <typename T> using compatible = implementation-defined;
26template <typename T> using native = implementation-defined;
27
28} // simd_abi
29
30struct element_aligned_tag {};
31struct vector_aligned_tag {};
32template <size_t> struct overaligned_tag {};
33inline constexpr element_aligned_tag element_aligned{};
34inline constexpr vector_aligned_tag vector_aligned{};
35template <size_t N> inline constexpr overaligned_tag<N> overaligned{};
36
37// traits [simd.traits]
38template <class T> struct is_abi_tag;
39template <class T> inline constexpr bool is_abi_tag_v = is_abi_tag<T>::value;
40
41template <class T> struct is_simd;
42template <class T> inline constexpr bool is_simd_v = is_simd<T>::value;
43
44template <class T> struct is_simd_mask;
45template <class T> inline constexpr bool is_simd_mask_v = is_simd_mask<T>::value;
46
47template <class T> struct is_simd_flag_type;
48template <class T> inline constexpr bool is_simd_flag_type_v = is_simd_flag_type<T>::value;
49
50template <class T, size_t N> struct abi_for_size { using type = see below; };
51template <class T, size_t N> using abi_for_size_t = typename abi_for_size<T, N>::type;
52
53template <class T, class Abi = simd_abi::compatible<T>> struct simd_size;
54template <class T, class Abi = simd_abi::compatible<T>>
55inline constexpr size_t simd_size_v = simd_size<T, Abi>::value;
56
57template <class T, class U = typename T::value_type> struct memory_alignment;
58template <class T, class U = typename T::value_type>
59inline constexpr size_t memory_alignment_v = memory_alignment<T, U>::value;
60
61// class template simd [simd.class]
62template <class T, class Abi = simd_abi::compatible<T>> class simd;
63template <class T> using native_simd = simd<T, simd_abi::native<T>>;
64template <class T, int N> using fixed_size_simd = simd<T, simd_abi::fixed_size<N>>;
65
66// class template simd_mask [simd.mask.class]
67template <class T, class Abi = simd_abi::compatible<T>> class simd_mask;
68template <class T> using native_simd_mask = simd_mask<T, simd_abi::native<T>>;
69template <class T, int N> using fixed_size_simd_mask = simd_mask<T, simd_abi::fixed_size<N>>;
70
71// casts [simd.casts]
72template <class T, class U, class Abi> see below simd_cast(const simd<U, Abi>&);
73template <class T, class U, class Abi> see below static_simd_cast(const simd<U, Abi>&);
74
75template <class T, class Abi>
76fixed_size_simd<T, simd_size_v<T, Abi>> to_fixed_size(const simd<T, Abi>&) noexcept;
77template <class T, class Abi>
78fixed_size_simd_mask<T, simd_size_v<T, Abi>> to_fixed_size(const simd_mask<T, Abi>&) noexcept;
79template <class T, size_t N> native_simd<T> to_native(const fixed_size_simd<T, N>&) noexcept;
80template <class T, size_t N>
native_simd_mask<T> to_native(const fixed_size_simd_mask<T, N>&) noexcept;
82template <class T, size_t N> simd<T> to_compatible(const fixed_size_simd<T, N>&) noexcept;
83template <class T, size_t N> simd_mask<T> to_compatible(const fixed_size_simd_mask<T, N>&) noexcept;
84
85template <size_t... Sizes, class T, class Abi>
tuple<simd<T, abi_for_size_t<T, Sizes>>...> split(const simd<T, Abi>&);
87template <size_t... Sizes, class T, class Abi>
tuple<simd_mask<T, abi_for_size_t<T, Sizes>>...> split(const simd_mask<T, Abi>&);
89template <class V, class Abi>
90array<V, simd_size_v<typename V::value_type, Abi> / V::size()> split(
91const simd<typename V::value_type, Abi>&);
92template <class V, class Abi>
93array<V, simd_size_v<typename V::value_type, Abi> / V::size()> split(
94const simd_mask<typename V::value_type, Abi>&);
95
96template <class T, class... Abis>
97simd<T, abi_for_size_t<T, (simd_size_v<T, Abis> + ...)>> concat(const simd<T, Abis>&...);
98template <class T, class... Abis>
99simd_mask<T, abi_for_size_t<T, (simd_size_v<T, Abis> + ...)>> concat(const simd_mask<T, Abis>&...);
100
101// reductions [simd.mask.reductions]
102template <class T, class Abi> bool all_of(const simd_mask<T, Abi>&) noexcept;
103template <class T, class Abi> bool any_of(const simd_mask<T, Abi>&) noexcept;
104template <class T, class Abi> bool none_of(const simd_mask<T, Abi>&) noexcept;
105template <class T, class Abi> bool some_of(const simd_mask<T, Abi>&) noexcept;
106template <class T, class Abi> int popcount(const simd_mask<T, Abi>&) noexcept;
107template <class T, class Abi> int find_first_set(const simd_mask<T, Abi>&);
108template <class T, class Abi> int find_last_set(const simd_mask<T, Abi>&);
109
110bool all_of(see below) noexcept;
111bool any_of(see below) noexcept;
112bool none_of(see below) noexcept;
113bool some_of(see below) noexcept;
114int popcount(see below) noexcept;
115int find_first_set(see below) noexcept;
116int find_last_set(see below) noexcept;
117
118// masked assignment [simd.whereexpr]
119template <class M, class T> class const_where_expression;
120template <class M, class T> class where_expression;
121
122// masked assignment [simd.mask.where]
123template <class T> struct nodeduce { using type = T; }; // exposition only
124
125template <class T> using nodeduce_t = typename nodeduce<T>::type; // exposition only
126
127template <class T, class Abi>
128where_expression<simd_mask<T, Abi>, simd<T, Abi>>
129where(const typename simd<T, Abi>::mask_type&, simd<T, Abi>&) noexcept;
130
131template <class T, class Abi>
132const_where_expression<simd_mask<T, Abi>, const simd<T, Abi>>
133where(const typename simd<T, Abi>::mask_type&, const simd<T, Abi>&) noexcept;
134
135template <class T, class Abi>
136where_expression<simd_mask<T, Abi>, simd_mask<T, Abi>>
137where(const nodeduce_t<simd_mask<T, Abi>>&, simd_mask<T, Abi>&) noexcept;
138
139template <class T, class Abi>
140const_where_expression<simd_mask<T, Abi>, const simd_mask<T, Abi>>
141where(const nodeduce_t<simd_mask<T, Abi>>&, const simd_mask<T, Abi>&) noexcept;
142
143template <class T> where_expression<bool, T> where(see below k, T& d) noexcept;
144
145template <class T>
146const_where_expression<bool, const T> where(see below k, const T& d) noexcept;
147
148// reductions [simd.reductions]
149template <class T, class Abi, class BinaryOperation = std::plus<>>
150T reduce(const simd<T, Abi>&, BinaryOperation = BinaryOperation());
151
152template <class M, class V, class BinaryOperation>
153typename V::value_type reduce(const const_where_expression<M, V>& x,
154typename V::value_type neutral_element, BinaryOperation binary_op);
155
156template <class M, class V>
157typename V::value_type reduce(const const_where_expression<M, V>& x, plus<> binary_op = plus<>());
158
159template <class M, class V>
160typename V::value_type reduce(const const_where_expression<M, V>& x, multiplies<> binary_op);
161
162template <class M, class V>
163typename V::value_type reduce(const const_where_expression<M, V>& x, bit_and<> binary_op);
164
165template <class M, class V>
166typename V::value_type reduce(const const_where_expression<M, V>& x, bit_or<> binary_op);
167
168template <class M, class V>
169typename V::value_type reduce(const const_where_expression<M, V>& x, bit_xor<> binary_op);
170
171template <class T, class Abi> T hmin(const simd<T, Abi>&);
template <class M, class V> typename V::value_type hmin(const const_where_expression<M, V>&);
173template <class T, class Abi> T hmax(const simd<T, Abi>&);
template <class M, class V> typename V::value_type hmax(const const_where_expression<M, V>&);
175
176// algorithms [simd.alg]
177template <class T, class Abi> simd<T, Abi> min(const simd<T, Abi>&, const simd<T, Abi>&) noexcept;
178
179template <class T, class Abi> simd<T, Abi> max(const simd<T, Abi>&, const simd<T, Abi>&) noexcept;
180
181template <class T, class Abi>
182std::pair<simd<T, Abi>, simd<T, Abi>> minmax(const simd<T, Abi>&, const simd<T, Abi>&) noexcept;
183
184template <class T, class Abi>
185simd<T, Abi> clamp(const simd<T, Abi>& v, const simd<T, Abi>& lo, const simd<T, Abi>& hi);
186
187// [simd.whereexpr]
188template <class M, class T>
189class const_where_expression {
190 const M& mask; // exposition only
191 T& data; // exposition only
192public:
193 const_where_expression(const const_where_expression&) = delete;
194 const_where_expression& operator=(const const_where_expression&) = delete;
195 remove_const_t<T> operator-() const &&;
196 template <class U, class Flags> void copy_to(U* mem, Flags f) const &&;
197};
198
199template <class M, class T>
200class where_expression : public const_where_expression<M, T> {
201public:
202 where_expression(const where_expression&) = delete;
203 where_expression& operator=(const where_expression&) = delete;
204 template <class U> void operator=(U&& x);
205 template <class U> void operator+=(U&& x);
206 template <class U> void operator-=(U&& x);
207 template <class U> void operator*=(U&& x);
208 template <class U> void operator/=(U&& x);
209 template <class U> void operator%=(U&& x);
210 template <class U> void operator&=(U&& x);
211 template <class U> void operator|=(U&& x);
212 template <class U> void operator^=(U&& x);
213 template <class U> void operator<<=(U&& x);
214 template <class U> void operator>>=(U&& x);
215 void operator++();
216 void operator++(int);
217 void operator--();
218 void operator--(int);
219 template <class U, class Flags> void copy_from(const U* mem, Flags);
220};
221
222// [simd.class]
223template <class T, class Abi> class simd {
224public:
225 using value_type = T;
226 using reference = see below;
227 using mask_type = simd_mask<T, Abi>;
228
229 using abi_type = Abi;
230 static constexpr size_t size() noexcept;
231 simd() = default;
232
233 // implicit type conversion constructor
234 template <class U> simd(const simd<U, simd_abi::fixed_size<size()>>&);
235
236 // implicit broadcast constructor (see below for constraints)
237 template <class U> simd(U&& value);
238
239 // generator constructor (see below for constraints)
240 template <class G> explicit simd(G&& gen);
241
242 // load constructor
243 template <class U, class Flags> simd(const U* mem, Flags f);
244
245 // loads [simd.load]
246 template <class U, class Flags> void copy_from(const U* mem, Flags f);
247
248 // stores [simd.store]
249 template <class U, class Flags> void copy_to(U* mem, Flags f) const;
250
251 // scalar access [simd.subscr]
252 reference operator[](size_t);
253 value_type operator[](size_t) const;
254
255 // unary operators [simd.unary]
256 simd& operator++();
257 simd operator++(int);
258 simd& operator--();
259 simd operator--(int);
260 mask_type operator!() const;
261 simd operator~() const; // see below
262 simd operator+() const;
263 simd operator-() const;
264
265 // binary operators [simd.binary]
266 friend simd operator+ (const simd&, const simd&);
267 friend simd operator- (const simd&, const simd&);
268 friend simd operator* (const simd&, const simd&);
269 friend simd operator/ (const simd&, const simd&);
270 friend simd operator% (const simd&, const simd&);
271 friend simd operator& (const simd&, const simd&);
272 friend simd operator| (const simd&, const simd&);
273 friend simd operator^ (const simd&, const simd&);
274 friend simd operator<<(const simd&, const simd&);
275 friend simd operator>>(const simd&, const simd&);
276 friend simd operator<<(const simd&, int);
277 friend simd operator>>(const simd&, int);
278
279 // compound assignment [simd.cassign]
280 friend simd& operator+= (simd&, const simd&);
281 friend simd& operator-= (simd&, const simd&);
282 friend simd& operator*= (simd&, const simd&);
283 friend simd& operator/= (simd&, const simd&);
284 friend simd& operator%= (simd&, const simd&);
285
286 friend simd& operator&= (simd&, const simd&);
287 friend simd& operator|= (simd&, const simd&);
288 friend simd& operator^= (simd&, const simd&);
289 friend simd& operator<<=(simd&, const simd&);
290 friend simd& operator>>=(simd&, const simd&);
291 friend simd& operator<<=(simd&, int);
292 friend simd& operator>>=(simd&, int);
293
294 // compares [simd.comparison]
295 friend mask_type operator==(const simd&, const simd&);
296 friend mask_type operator!=(const simd&, const simd&);
297 friend mask_type operator>=(const simd&, const simd&);
298 friend mask_type operator<=(const simd&, const simd&);
299 friend mask_type operator> (const simd&, const simd&);
300 friend mask_type operator< (const simd&, const simd&);
301};
302
303// [simd.math]
304template <class Abi> using scharv = simd<signed char, Abi>; // exposition only
305template <class Abi> using shortv = simd<short, Abi>; // exposition only
306template <class Abi> using intv = simd<int, Abi>; // exposition only
307template <class Abi> using longv = simd<long int, Abi>; // exposition only
308template <class Abi> using llongv = simd<long long int, Abi>; // exposition only
309template <class Abi> using floatv = simd<float, Abi>; // exposition only
310template <class Abi> using doublev = simd<double, Abi>; // exposition only
311template <class Abi> using ldoublev = simd<long double, Abi>; // exposition only
312template <class T, class V> using samesize = fixed_size_simd<T, V::size()>; // exposition only
313
314template <class Abi> floatv<Abi> acos(floatv<Abi> x);
315template <class Abi> doublev<Abi> acos(doublev<Abi> x);
316template <class Abi> ldoublev<Abi> acos(ldoublev<Abi> x);
317
318template <class Abi> floatv<Abi> asin(floatv<Abi> x);
319template <class Abi> doublev<Abi> asin(doublev<Abi> x);
320template <class Abi> ldoublev<Abi> asin(ldoublev<Abi> x);
321
322template <class Abi> floatv<Abi> atan(floatv<Abi> x);
323template <class Abi> doublev<Abi> atan(doublev<Abi> x);
324template <class Abi> ldoublev<Abi> atan(ldoublev<Abi> x);
325
326template <class Abi> floatv<Abi> atan2(floatv<Abi> y, floatv<Abi> x);
327template <class Abi> doublev<Abi> atan2(doublev<Abi> y, doublev<Abi> x);
328template <class Abi> ldoublev<Abi> atan2(ldoublev<Abi> y, ldoublev<Abi> x);
329
330template <class Abi> floatv<Abi> cos(floatv<Abi> x);
331template <class Abi> doublev<Abi> cos(doublev<Abi> x);
332template <class Abi> ldoublev<Abi> cos(ldoublev<Abi> x);
333
334template <class Abi> floatv<Abi> sin(floatv<Abi> x);
335template <class Abi> doublev<Abi> sin(doublev<Abi> x);
336template <class Abi> ldoublev<Abi> sin(ldoublev<Abi> x);
337
338template <class Abi> floatv<Abi> tan(floatv<Abi> x);
339template <class Abi> doublev<Abi> tan(doublev<Abi> x);
340template <class Abi> ldoublev<Abi> tan(ldoublev<Abi> x);
341
342template <class Abi> floatv<Abi> acosh(floatv<Abi> x);
343template <class Abi> doublev<Abi> acosh(doublev<Abi> x);
344template <class Abi> ldoublev<Abi> acosh(ldoublev<Abi> x);
345
346template <class Abi> floatv<Abi> asinh(floatv<Abi> x);
347template <class Abi> doublev<Abi> asinh(doublev<Abi> x);
348template <class Abi> ldoublev<Abi> asinh(ldoublev<Abi> x);
349
350template <class Abi> floatv<Abi> atanh(floatv<Abi> x);
351template <class Abi> doublev<Abi> atanh(doublev<Abi> x);
352template <class Abi> ldoublev<Abi> atanh(ldoublev<Abi> x);
353
354template <class Abi> floatv<Abi> cosh(floatv<Abi> x);
355template <class Abi> doublev<Abi> cosh(doublev<Abi> x);
356template <class Abi> ldoublev<Abi> cosh(ldoublev<Abi> x);
357
358template <class Abi> floatv<Abi> sinh(floatv<Abi> x);
359template <class Abi> doublev<Abi> sinh(doublev<Abi> x);
360template <class Abi> ldoublev<Abi> sinh(ldoublev<Abi> x);
361
362template <class Abi> floatv<Abi> tanh(floatv<Abi> x);
363template <class Abi> doublev<Abi> tanh(doublev<Abi> x);
364template <class Abi> ldoublev<Abi> tanh(ldoublev<Abi> x);
365
366template <class Abi> floatv<Abi> exp(floatv<Abi> x);
367template <class Abi> doublev<Abi> exp(doublev<Abi> x);
368template <class Abi> ldoublev<Abi> exp(ldoublev<Abi> x);
369
370template <class Abi> floatv<Abi> exp2(floatv<Abi> x);
371template <class Abi> doublev<Abi> exp2(doublev<Abi> x);
372template <class Abi> ldoublev<Abi> exp2(ldoublev<Abi> x);
373
374template <class Abi> floatv<Abi> expm1(floatv<Abi> x);
375template <class Abi> doublev<Abi> expm1(doublev<Abi> x);
376template <class Abi> ldoublev<Abi> expm1(ldoublev<Abi> x);
377
378template <class Abi> floatv<Abi> frexp(floatv<Abi> value, samesize<int, floatv<Abi>>* exp);
379template <class Abi> doublev<Abi> frexp(doublev<Abi> value, samesize<int, doublev<Abi>>* exp);
380template <class Abi> ldoublev<Abi> frexp(ldoublev<Abi> value, samesize<int, ldoublev<Abi>>* exp);
381
382template <class Abi> samesize<int, floatv<Abi>> ilogb(floatv<Abi> x);
383template <class Abi> samesize<int, doublev<Abi>> ilogb(doublev<Abi> x);
384template <class Abi> samesize<int, ldoublev<Abi>> ilogb(ldoublev<Abi> x);
385
386template <class Abi> floatv<Abi> ldexp(floatv<Abi> x, samesize<int, floatv<Abi>> exp);
387template <class Abi> doublev<Abi> ldexp(doublev<Abi> x, samesize<int, doublev<Abi>> exp);
388template <class Abi> ldoublev<Abi> ldexp(ldoublev<Abi> x, samesize<int, ldoublev<Abi>> exp);
389
390template <class Abi> floatv<Abi> log(floatv<Abi> x);
391template <class Abi> doublev<Abi> log(doublev<Abi> x);
392template <class Abi> ldoublev<Abi> log(ldoublev<Abi> x);
393
394template <class Abi> floatv<Abi> log10(floatv<Abi> x);
395template <class Abi> doublev<Abi> log10(doublev<Abi> x);
396template <class Abi> ldoublev<Abi> log10(ldoublev<Abi> x);
397
398template <class Abi> floatv<Abi> log1p(floatv<Abi> x);
399template <class Abi> doublev<Abi> log1p(doublev<Abi> x);
400template <class Abi> ldoublev<Abi> log1p(ldoublev<Abi> x);
401
402template <class Abi> floatv<Abi> log2(floatv<Abi> x);
403template <class Abi> doublev<Abi> log2(doublev<Abi> x);
404template <class Abi> ldoublev<Abi> log2(ldoublev<Abi> x);
405
406template <class Abi> floatv<Abi> logb(floatv<Abi> x);
407template <class Abi> doublev<Abi> logb(doublev<Abi> x);
408template <class Abi> ldoublev<Abi> logb(ldoublev<Abi> x);
409
410template <class Abi> floatv<Abi> modf(floatv<Abi> value, floatv<Abi>* iptr);
411template <class Abi> doublev<Abi> modf(doublev<Abi> value, doublev<Abi>* iptr);
412template <class Abi> ldoublev<Abi> modf(ldoublev<Abi> value, ldoublev<Abi>* iptr);
413
414template <class Abi> floatv<Abi> scalbn(floatv<Abi> x, samesize<int, floatv<Abi>> n);
415template <class Abi> doublev<Abi> scalbn(doublev<Abi> x, samesize<int, doublev<Abi>> n);
416template <class Abi> ldoublev<Abi> scalbn(ldoublev<Abi> x, samesize<int, ldoublev<Abi>> n);
417template <class Abi> floatv<Abi> scalbln(floatv<Abi> x, samesize<long int, floatv<Abi>> n);
418template <class Abi> doublev<Abi> scalbln(doublev<Abi> x, samesize<long int, doublev<Abi>> n);
419template <class Abi> ldoublev<Abi> scalbln(ldoublev<Abi> x, samesize<long int, ldoublev<Abi>> n);
420
421template <class Abi> floatv<Abi> cbrt(floatv<Abi> x);
422template <class Abi> doublev<Abi> cbrt(doublev<Abi> x);
423template <class Abi> ldoublev<Abi> cbrt(ldoublev<Abi> x);
424
425template <class Abi> scharv<Abi> abs(scharv<Abi> j);
426template <class Abi> shortv<Abi> abs(shortv<Abi> j);
427template <class Abi> intv<Abi> abs(intv<Abi> j);
428template <class Abi> longv<Abi> abs(longv<Abi> j);
429template <class Abi> llongv<Abi> abs(llongv<Abi> j);
430template <class Abi> floatv<Abi> abs(floatv<Abi> j);
431template <class Abi> doublev<Abi> abs(doublev<Abi> j);
432template <class Abi> ldoublev<Abi> abs(ldoublev<Abi> j);
433
434template <class Abi> floatv<Abi> hypot(floatv<Abi> x, floatv<Abi> y);
435template <class Abi> doublev<Abi> hypot(doublev<Abi> x, doublev<Abi> y);
template <class Abi> ldoublev<Abi> hypot(ldoublev<Abi> x, ldoublev<Abi> y);
437template <class Abi> floatv<Abi> hypot(floatv<Abi> x, floatv<Abi> y, floatv<Abi> z);
438template <class Abi> doublev<Abi> hypot(doublev<Abi> x, doublev<Abi> y, doublev<Abi> z);
439template <class Abi> ldoublev<Abi> hypot(ldoublev<Abi> x, ldoublev<Abi> y, ldoublev<Abi> z);
440
441template <class Abi> floatv<Abi> pow(floatv<Abi> x, floatv<Abi> y);
442template <class Abi> doublev<Abi> pow(doublev<Abi> x, doublev<Abi> y);
443template <class Abi> ldoublev<Abi> pow(ldoublev<Abi> x, ldoublev<Abi> y);
444
445template <class Abi> floatv<Abi> sqrt(floatv<Abi> x);
446template <class Abi> doublev<Abi> sqrt(doublev<Abi> x);
447template <class Abi> ldoublev<Abi> sqrt(ldoublev<Abi> x);
448
449template <class Abi> floatv<Abi> erf(floatv<Abi> x);
450template <class Abi> doublev<Abi> erf(doublev<Abi> x);
451template <class Abi> ldoublev<Abi> erf(ldoublev<Abi> x);
452template <class Abi> floatv<Abi> erfc(floatv<Abi> x);
453template <class Abi> doublev<Abi> erfc(doublev<Abi> x);
454template <class Abi> ldoublev<Abi> erfc(ldoublev<Abi> x);
455
456template <class Abi> floatv<Abi> lgamma(floatv<Abi> x);
457template <class Abi> doublev<Abi> lgamma(doublev<Abi> x);
458template <class Abi> ldoublev<Abi> lgamma(ldoublev<Abi> x);
459
460template <class Abi> floatv<Abi> tgamma(floatv<Abi> x);
461template <class Abi> doublev<Abi> tgamma(doublev<Abi> x);
462template <class Abi> ldoublev<Abi> tgamma(ldoublev<Abi> x);
463
464template <class Abi> floatv<Abi> ceil(floatv<Abi> x);
465template <class Abi> doublev<Abi> ceil(doublev<Abi> x);
466template <class Abi> ldoublev<Abi> ceil(ldoublev<Abi> x);
467
468template <class Abi> floatv<Abi> floor(floatv<Abi> x);
469template <class Abi> doublev<Abi> floor(doublev<Abi> x);
470template <class Abi> ldoublev<Abi> floor(ldoublev<Abi> x);
471
472template <class Abi> floatv<Abi> nearbyint(floatv<Abi> x);
473template <class Abi> doublev<Abi> nearbyint(doublev<Abi> x);
474template <class Abi> ldoublev<Abi> nearbyint(ldoublev<Abi> x);
475
476template <class Abi> floatv<Abi> rint(floatv<Abi> x);
477template <class Abi> doublev<Abi> rint(doublev<Abi> x);
478template <class Abi> ldoublev<Abi> rint(ldoublev<Abi> x);
479
480template <class Abi> samesize<long int, floatv<Abi>> lrint(floatv<Abi> x);
481template <class Abi> samesize<long int, doublev<Abi>> lrint(doublev<Abi> x);
482template <class Abi> samesize<long int, ldoublev<Abi>> lrint(ldoublev<Abi> x);
483template <class Abi> samesize<long long int, floatv<Abi>> llrint(floatv<Abi> x);
484template <class Abi> samesize<long long int, doublev<Abi>> llrint(doublev<Abi> x);
485template <class Abi> samesize<long long int, ldoublev<Abi>> llrint(ldoublev<Abi> x);
486
487template <class Abi> floatv<Abi> round(floatv<Abi> x);
488template <class Abi> doublev<Abi> round(doublev<Abi> x);
489template <class Abi> ldoublev<Abi> round(ldoublev<Abi> x);
490template <class Abi> samesize<long int, floatv<Abi>> lround(floatv<Abi> x);
491template <class Abi> samesize<long int, doublev<Abi>> lround(doublev<Abi> x);
492template <class Abi> samesize<long int, ldoublev<Abi>> lround(ldoublev<Abi> x);
493template <class Abi> samesize<long long int, floatv<Abi>> llround(floatv<Abi> x);
494template <class Abi> samesize<long long int, doublev<Abi>> llround(doublev<Abi> x);
495template <class Abi> samesize<long long int, ldoublev<Abi>> llround(ldoublev<Abi> x);
496
497template <class Abi> floatv<Abi> trunc(floatv<Abi> x);
498template <class Abi> doublev<Abi> trunc(doublev<Abi> x);
499template <class Abi> ldoublev<Abi> trunc(ldoublev<Abi> x);
500
501template <class Abi> floatv<Abi> fmod(floatv<Abi> x, floatv<Abi> y);
502template <class Abi> doublev<Abi> fmod(doublev<Abi> x, doublev<Abi> y);
503template <class Abi> ldoublev<Abi> fmod(ldoublev<Abi> x, ldoublev<Abi> y);
504
505template <class Abi> floatv<Abi> remainder(floatv<Abi> x, floatv<Abi> y);
506template <class Abi> doublev<Abi> remainder(doublev<Abi> x, doublev<Abi> y);
507template <class Abi> ldoublev<Abi> remainder(ldoublev<Abi> x, ldoublev<Abi> y);
508
509template <class Abi> floatv<Abi> remquo(floatv<Abi> x, floatv<Abi> y, samesize<int, floatv<Abi>>* quo);
510template <class Abi> doublev<Abi> remquo(doublev<Abi> x, doublev<Abi> y, samesize<int, doublev<Abi>>* quo);
511template <class Abi> ldoublev<Abi> remquo(ldoublev<Abi> x, ldoublev<Abi> y, samesize<int, ldoublev<Abi>>* quo);
512
513template <class Abi> floatv<Abi> copysign(floatv<Abi> x, floatv<Abi> y);
514template <class Abi> doublev<Abi> copysign(doublev<Abi> x, doublev<Abi> y);
515template <class Abi> ldoublev<Abi> copysign(ldoublev<Abi> x, ldoublev<Abi> y);
516
517template <class Abi> doublev<Abi> nan(const char* tagp);
518template <class Abi> floatv<Abi> nanf(const char* tagp);
519template <class Abi> ldoublev<Abi> nanl(const char* tagp);
520
521template <class Abi> floatv<Abi> nextafter(floatv<Abi> x, floatv<Abi> y);
522template <class Abi> doublev<Abi> nextafter(doublev<Abi> x, doublev<Abi> y);
523template <class Abi> ldoublev<Abi> nextafter(ldoublev<Abi> x, ldoublev<Abi> y);
524
525template <class Abi> floatv<Abi> nexttoward(floatv<Abi> x, ldoublev<Abi> y);
526template <class Abi> doublev<Abi> nexttoward(doublev<Abi> x, ldoublev<Abi> y);
527template <class Abi> ldoublev<Abi> nexttoward(ldoublev<Abi> x, ldoublev<Abi> y);
528
529template <class Abi> floatv<Abi> fdim(floatv<Abi> x, floatv<Abi> y);
530template <class Abi> doublev<Abi> fdim(doublev<Abi> x, doublev<Abi> y);
531template <class Abi> ldoublev<Abi> fdim(ldoublev<Abi> x, ldoublev<Abi> y);
532
533template <class Abi> floatv<Abi> fmax(floatv<Abi> x, floatv<Abi> y);
534template <class Abi> doublev<Abi> fmax(doublev<Abi> x, doublev<Abi> y);
535template <class Abi> ldoublev<Abi> fmax(ldoublev<Abi> x, ldoublev<Abi> y);
536
537template <class Abi> floatv<Abi> fmin(floatv<Abi> x, floatv<Abi> y);
538template <class Abi> doublev<Abi> fmin(doublev<Abi> x, doublev<Abi> y);
539template <class Abi> ldoublev<Abi> fmin(ldoublev<Abi> x, ldoublev<Abi> y);
540
541template <class Abi> floatv<Abi> fma(floatv<Abi> x, floatv<Abi> y, floatv<Abi> z);
542template <class Abi> doublev<Abi> fma(doublev<Abi> x, doublev<Abi> y, doublev<Abi> z);
543template <class Abi> ldoublev<Abi> fma(ldoublev<Abi> x, ldoublev<Abi> y, ldoublev<Abi> z);
544
545template <class Abi> samesize<int, floatv<Abi>> fpclassify(floatv<Abi> x);
546template <class Abi> samesize<int, doublev<Abi>> fpclassify(doublev<Abi> x);
547template <class Abi> samesize<int, ldoublev<Abi>> fpclassify(ldoublev<Abi> x);
548
549template <class Abi> simd_mask<float, Abi> isfinite(floatv<Abi> x);
550template <class Abi> simd_mask<double, Abi> isfinite(doublev<Abi> x);
551template <class Abi> simd_mask<long double, Abi> isfinite(ldoublev<Abi> x);
552
553template <class Abi> simd_mask<float, Abi> isinf(floatv<Abi> x);
554template <class Abi> simd_mask<double, Abi> isinf(doublev<Abi> x);
555template <class Abi> simd_mask<long double, Abi> isinf(ldoublev<Abi> x);
556
557template <class Abi> simd_mask<float, Abi> isnan(floatv<Abi> x);
558template <class Abi> simd_mask<double, Abi> isnan(doublev<Abi> x);
559template <class Abi> simd_mask<long double, Abi> isnan(ldoublev<Abi> x);
560
561template <class Abi> simd_mask<float, Abi> isnormal(floatv<Abi> x);
562template <class Abi> simd_mask<double, Abi> isnormal(doublev<Abi> x);
563template <class Abi> simd_mask<long double, Abi> isnormal(ldoublev<Abi> x);
564
565template <class Abi> simd_mask<float, Abi> signbit(floatv<Abi> x);
566template <class Abi> simd_mask<double, Abi> signbit(doublev<Abi> x);
567template <class Abi> simd_mask<long double, Abi> signbit(ldoublev<Abi> x);
568
569template <class Abi> simd_mask<float, Abi> isgreater(floatv<Abi> x, floatv<Abi> y);
570template <class Abi> simd_mask<double, Abi> isgreater(doublev<Abi> x, doublev<Abi> y);
571template <class Abi> simd_mask<long double, Abi> isgreater(ldoublev<Abi> x, ldoublev<Abi> y);
572
573template <class Abi> simd_mask<float, Abi> isgreaterequal(floatv<Abi> x, floatv<Abi> y);
574template <class Abi> simd_mask<double, Abi> isgreaterequal(doublev<Abi> x, doublev<Abi> y);
575template <class Abi> simd_mask<long double, Abi> isgreaterequal(ldoublev<Abi> x, ldoublev<Abi> y);
576
577template <class Abi> simd_mask<float, Abi> isless(floatv<Abi> x, floatv<Abi> y);
578template <class Abi> simd_mask<double, Abi> isless(doublev<Abi> x, doublev<Abi> y);
579template <class Abi> simd_mask<long double, Abi> isless(ldoublev<Abi> x, ldoublev<Abi> y);
580
581template <class Abi> simd_mask<float, Abi> islessequal(floatv<Abi> x, floatv<Abi> y);
582template <class Abi> simd_mask<double, Abi> islessequal(doublev<Abi> x, doublev<Abi> y);
583template <class Abi> simd_mask<long double, Abi> islessequal(ldoublev<Abi> x, ldoublev<Abi> y);
584
585template <class Abi> simd_mask<float, Abi> islessgreater(floatv<Abi> x, floatv<Abi> y);
586template <class Abi> simd_mask<double, Abi> islessgreater(doublev<Abi> x, doublev<Abi> y);
587template <class Abi> simd_mask<long double, Abi> islessgreater(ldoublev<Abi> x, ldoublev<Abi> y);
588
589template <class Abi> simd_mask<float, Abi> isunordered(floatv<Abi> x, floatv<Abi> y);
590template <class Abi> simd_mask<double, Abi> isunordered(doublev<Abi> x, doublev<Abi> y);
591template <class Abi> simd_mask<long double, Abi> isunordered(ldoublev<Abi> x, ldoublev<Abi> y);
592
593template <class V> struct simd_div_t { V quot, rem; };
594template <class Abi> simd_div_t<scharv<Abi>> div(scharv<Abi> numer, scharv<Abi> denom);
595template <class Abi> simd_div_t<shortv<Abi>> div(shortv<Abi> numer, shortv<Abi> denom);
596template <class Abi> simd_div_t<intv<Abi>> div(intv<Abi> numer, intv<Abi> denom);
597template <class Abi> simd_div_t<longv<Abi>> div(longv<Abi> numer, longv<Abi> denom);
598template <class Abi> simd_div_t<llongv<Abi>> div(llongv<Abi> numer, llongv<Abi> denom);
599
600// [simd.mask.class]
601template <class T, class Abi>
602class simd_mask {
603public:
604 using value_type = bool;
605 using reference = see below;
606 using simd_type = simd<T, Abi>;
607 using abi_type = Abi;
608 static constexpr size_t size() noexcept;
609 simd_mask() = default;
610
611 // broadcast constructor
612 explicit simd_mask(value_type) noexcept;
613
614 // implicit type conversion constructor
615 template <class U> simd_mask(const simd_mask<U, simd_abi::fixed_size<size()>>&) noexcept;
616
617 // load constructor
618 template <class Flags> simd_mask(const value_type* mem, Flags);
619
620 // loads [simd.mask.copy]
621 template <class Flags> void copy_from(const value_type* mem, Flags);
622 template <class Flags> void copy_to(value_type* mem, Flags) const;
623
624 // scalar access [simd.mask.subscr]
625 reference operator[](size_t);
626 value_type operator[](size_t) const;
627
628 // unary operators [simd.mask.unary]
629 simd_mask operator!() const noexcept;
630
631 // simd_mask binary operators [simd.mask.binary]
632 friend simd_mask operator&&(const simd_mask&, const simd_mask&) noexcept;
633 friend simd_mask operator||(const simd_mask&, const simd_mask&) noexcept;
634 friend simd_mask operator& (const simd_mask&, const simd_mask&) noexcept;
635 friend simd_mask operator| (const simd_mask&, const simd_mask&) noexcept;
636 friend simd_mask operator^ (const simd_mask&, const simd_mask&) noexcept;
637
638 // simd_mask compound assignment [simd.mask.cassign]
639 friend simd_mask& operator&=(simd_mask&, const simd_mask&) noexcept;
640 friend simd_mask& operator|=(simd_mask&, const simd_mask&) noexcept;
641 friend simd_mask& operator^=(simd_mask&, const simd_mask&) noexcept;
642
643 // simd_mask compares [simd.mask.comparison]
644 friend simd_mask operator==(const simd_mask&, const simd_mask&) noexcept;
645 friend simd_mask operator!=(const simd_mask&, const simd_mask&) noexcept;
646};
647
648} // parallelism_v2
649} // std::experimental
650
651*/
652
653#include <experimental/__config>
654#include <array>
655#include <cstddef>
656#include <functional>
657
658#if !defined(_LIBCPP_HAS_NO_PRAGMA_SYSTEM_HEADER)
659#pragma GCC system_header
660#endif
661
662_LIBCPP_BEGIN_NAMESPACE_EXPERIMENTAL_SIMD
663
// Identifies the storage strategy encoded in a __simd_abi tag.
enum class _StorageKind {
  _Scalar = 0, // tag used by simd_abi::scalar
  _Array = 1,  // tag used by simd_abi::fixed_size
};
668
669template <_StorageKind __kind, int _Np>
670struct __simd_abi {};
671
672template <class _Tp, class _Abi>
673struct __simd_storage_traits {};
674
675template <class _Tp, int __num_element>
676struct __simd_storage_traits<_Tp,
677 __simd_abi<_StorageKind::_Array, __num_element>> {
678 using type = std::array<_Tp, __num_element>;
679};
680
681template <class _Tp>
682struct __simd_storage_traits<_Tp, __simd_abi<_StorageKind::_Scalar, 1>> {
683 using type = _Tp;
684};
685
// Viable only when `_Dest{<value of type _Src>}` is well-formed, i.e. when
// list-initialization does not narrow. If the expression in the return type
// is ill-formed, this overload drops out of overload resolution.
template <class _Dest, class _Src>
constexpr auto __is_non_narrowing_convertible_impl(_Src)
    -> decltype(_Dest{std::declval<_Src>()}, true) {
  return true;
}

// Catch-all selected when the overload above is not viable.
template <class _Dest>
constexpr bool __is_non_narrowing_convertible_impl(...) {
  return false;
}
696
697template <class _From, class _To>
698constexpr typename std::enable_if<std::is_arithmetic<_To>::value &&
699 std::is_arithmetic<_From>::value,
700 bool>::type
701__is_non_narrowing_arithmetic_convertible() {
702 return __is_non_narrowing_convertible_impl<_To>(_From{});
703}
704
705template <class _From, class _To>
706constexpr typename std::enable_if<!(std::is_arithmetic<_To>::value &&
707 std::is_arithmetic<_From>::value),
708 bool>::type
709__is_non_narrowing_arithmetic_convertible() {
710 return false;
711}
712
// Recursion terminator: with no arguments the sum is a value-initialized
// _Result.
template <class _Result>
constexpr _Result __variadic_sum() {
  return _Result{};
}

// Adds all arguments after converting each one to _Result. _Result cannot be
// deduced and has to be supplied explicitly by the caller.
template <class _Result, class _Head, class... _Tail>
constexpr _Result __variadic_sum(_Head __head, _Tail... __tail) {
  return static_cast<_Result>(__head) + __variadic_sum<_Result>(__tail...);
}
722
723_LIBCPP_END_NAMESPACE_EXPERIMENTAL_SIMD
724_LIBCPP_BEGIN_NAMESPACE_EXPERIMENTAL_SIMD_ABI
725
726using scalar = __simd_abi<_StorageKind::_Scalar, 1>;
727
728template <int _Np>
729using fixed_size = __simd_abi<_StorageKind::_Array, _Np>;
730
731#if _LIBCPP_STD_VER > 14 && !defined(_LIBCPP_HAS_NO_VARIABLE_TEMPLATES)
732template <class _Tp>
733_LIBCPP_INLINE_VAR constexpr int max_fixed_size = 32;
734#endif
735template <class _Tp>
736using compatible = fixed_size<16 / sizeof(_Tp)>;
737template <class _Tp>
738using native = compatible<_Tp>;
739
740_LIBCPP_END_NAMESPACE_EXPERIMENTAL_SIMD_ABI
741_LIBCPP_BEGIN_NAMESPACE_EXPERIMENTAL_SIMD
742
743template <class _Tp, class _Abi = simd_abi::compatible<_Tp>>
744class simd;
745template <class _Tp, class _Abi = simd_abi::compatible<_Tp>>
746class simd_mask;
747
// Empty alignment tag types; these are the types for which
// is_simd_flag_type is specialized to true.
struct element_aligned_tag {
};

struct vector_aligned_tag {
};

template <size_t>
struct overaligned_tag {
};

#if _LIBCPP_STD_VER > 14
// Ready-made tag objects, available after C++14 only.
_LIBCPP_INLINE_VAR constexpr element_aligned_tag element_aligned{};
_LIBCPP_INLINE_VAR constexpr vector_aligned_tag vector_aligned{};
#if !defined(_LIBCPP_HAS_NO_VARIABLE_TEMPLATES)
template <size_t _Alignment>
_LIBCPP_INLINE_VAR constexpr overaligned_tag<_Alignment> overaligned{};
#endif
#endif
760
761// traits [simd.traits]
762template <class _Tp>
763struct is_abi_tag : std::integral_constant<bool, false> {};
764
765template <_StorageKind __kind, int _Np>
766struct is_abi_tag<__simd_abi<__kind, _Np>>
767 : std::integral_constant<bool, true> {};
768
769template <class _Tp>
770struct is_simd : std::integral_constant<bool, false> {};
771
772template <class _Tp, class _Abi>
773struct is_simd<simd<_Tp, _Abi>> : std::integral_constant<bool, true> {};
774
775template <class _Tp>
776struct is_simd_mask : std::integral_constant<bool, false> {};
777
778template <class _Tp, class _Abi>
779struct is_simd_mask<simd_mask<_Tp, _Abi>> : std::integral_constant<bool, true> {
780};
781
782template <class _Tp>
783struct is_simd_flag_type : std::integral_constant<bool, false> {};
784
785template <>
786struct is_simd_flag_type<element_aligned_tag>
787 : std::integral_constant<bool, true> {};
788
789template <>
790struct is_simd_flag_type<vector_aligned_tag>
791 : std::integral_constant<bool, true> {};
792
793template <size_t _Align>
794struct is_simd_flag_type<overaligned_tag<_Align>>
795 : std::integral_constant<bool, true> {};
796
#if _LIBCPP_STD_VER > 14 && !defined(_LIBCPP_HAS_NO_VARIABLE_TEMPLATES)
// Variable-template shorthands for the ::value member of each trait above.
template <class _Candidate>
_LIBCPP_INLINE_VAR constexpr bool is_abi_tag_v = is_abi_tag<_Candidate>::value;

template <class _Candidate>
_LIBCPP_INLINE_VAR constexpr bool is_simd_v = is_simd<_Candidate>::value;

template <class _Candidate>
_LIBCPP_INLINE_VAR constexpr bool is_simd_mask_v =
    is_simd_mask<_Candidate>::value;

template <class _Candidate>
_LIBCPP_INLINE_VAR constexpr bool is_simd_flag_type_v =
    is_simd_flag_type<_Candidate>::value;
#endif
808template <class _Tp, size_t _Np>
809struct abi_for_size {
810 using type = simd_abi::fixed_size<_Np>;
811};
812template <class _Tp, size_t _Np>
813using abi_for_size_t = typename abi_for_size<_Tp, _Np>::type;
814
815template <class _Tp, class _Abi = simd_abi::compatible<_Tp>>
816struct simd_size;
817
818template <class _Tp, _StorageKind __kind, int _Np>
819struct simd_size<_Tp, __simd_abi<__kind, _Np>>
820 : std::integral_constant<size_t, _Np> {
821 static_assert(
822 std::is_arithmetic<_Tp>::value &&
823 !std::is_same<typename std::remove_const<_Tp>::type, bool>::value,
824 "Element type should be vectorizable");
825};
826
// Declaration only; no definition appears in this part of the header.
template <class _Vp, class _Up = typename _Vp::value_type>
struct memory_alignment;

#if _LIBCPP_STD_VER > 14 && !defined(_LIBCPP_HAS_NO_VARIABLE_TEMPLATES)
// Variable-template shorthands for simd_size and memory_alignment.
template <class _Elem, class _AbiTag = simd_abi::compatible<_Elem>>
_LIBCPP_INLINE_VAR constexpr size_t simd_size_v =
    simd_size<_Elem, _AbiTag>::value;

template <class _Vp, class _Up = typename _Vp::value_type>
_LIBCPP_INLINE_VAR constexpr size_t memory_alignment_v =
    memory_alignment<_Vp, _Up>::value;
#endif
838
839// class template simd [simd.class]
840template <class _Tp>
841using native_simd = simd<_Tp, simd_abi::native<_Tp>>;
842template <class _Tp, int _Np>
843using fixed_size_simd = simd<_Tp, simd_abi::fixed_size<_Np>>;
844
845// class template simd_mask [simd.mask.class]
846template <class _Tp>
847using native_simd_mask = simd_mask<_Tp, simd_abi::native<_Tp>>;
848
849template <class _Tp, int _Np>
850using fixed_size_simd_mask = simd_mask<_Tp, simd_abi::fixed_size<_Np>>;
851
852// casts [simd.casts]
853template <class _Tp>
854struct __static_simd_cast_traits {
855 template <class _Up, class _Abi>
856 static simd<_Tp, _Abi> __apply(const simd<_Up, _Abi>& __v);
857};
858
859template <class _Tp, class _NewAbi>
860struct __static_simd_cast_traits<simd<_Tp, _NewAbi>> {
861 template <class _Up, class _Abi>
862 static typename std::enable_if<simd<_Up, _Abi>::size() ==
863 simd<_Tp, _NewAbi>::size(),
864 simd<_Tp, _NewAbi>>::type
865 __apply(const simd<_Up, _Abi>& __v);
866};
867
868template <class _Tp>
869struct __simd_cast_traits {
870 template <class _Up, class _Abi>
871 static typename std::enable_if<
872 __is_non_narrowing_arithmetic_convertible<_Up, _Tp>(),
873 simd<_Tp, _Abi>>::type
874 __apply(const simd<_Up, _Abi>& __v);
875};
876
877template <class _Tp, class _NewAbi>
878struct __simd_cast_traits<simd<_Tp, _NewAbi>> {
879 template <class _Up, class _Abi>
880 static typename std::enable_if<
881 __is_non_narrowing_arithmetic_convertible<_Up, _Tp>() &&
882 simd<_Up, _Abi>::size() == simd<_Tp, _NewAbi>::size(),
883 simd<_Tp, _NewAbi>>::type
884 __apply(const simd<_Up, _Abi>& __v);
885};
886
887template <class _Tp, class _Up, class _Abi>
888auto simd_cast(const simd<_Up, _Abi>& __v)
889 -> decltype(__simd_cast_traits<_Tp>::__apply(__v)) {
890 return __simd_cast_traits<_Tp>::__apply(__v);
891}
892
893template <class _Tp, class _Up, class _Abi>
894auto static_simd_cast(const simd<_Up, _Abi>& __v)
895 -> decltype(__static_simd_cast_traits<_Tp>::__apply(__v)) {
896 return __static_simd_cast_traits<_Tp>::__apply(__v);
897}
898
899template <class _Tp, class _Abi>
900fixed_size_simd<_Tp, simd_size<_Tp, _Abi>::value>
901to_fixed_size(const simd<_Tp, _Abi>&) noexcept;
902
903template <class _Tp, class _Abi>
904fixed_size_simd_mask<_Tp, simd_size<_Tp, _Abi>::value>
905to_fixed_size(const simd_mask<_Tp, _Abi>&) noexcept;
906
907template <class _Tp, size_t _Np>
908native_simd<_Tp> to_native(const fixed_size_simd<_Tp, _Np>&) noexcept;
909
910template <class _Tp, size_t _Np>
911native_simd_mask<_Tp> to_native(const fixed_size_simd_mask<_Tp, _Np>&) noexcept;
912
913template <class _Tp, size_t _Np>
914simd<_Tp> to_compatible(const fixed_size_simd<_Tp, _Np>&) noexcept;
915
916template <class _Tp, size_t _Np>
917simd_mask<_Tp> to_compatible(const fixed_size_simd_mask<_Tp, _Np>&) noexcept;
918
919template <size_t... __sizes, class _Tp, class _Abi>
920tuple<simd<_Tp, abi_for_size_t<_Tp, __sizes>>...> split(const simd<_Tp, _Abi>&);
921
922template <size_t... __sizes, class _Tp, class _Abi>
923tuple<simd_mask<_Tp, abi_for_size_t<_Tp, __sizes>>...>
924split(const simd_mask<_Tp, _Abi>&);
925
926template <class _SimdType, class _Abi>
927array<_SimdType, simd_size<typename _SimdType::value_type, _Abi>::value /
928 _SimdType::size()>
929split(const simd<typename _SimdType::value_type, _Abi>&);
930
931template <class _SimdType, class _Abi>
932array<_SimdType, simd_size<typename _SimdType::value_type, _Abi>::value /
933 _SimdType::size()>
934split(const simd_mask<typename _SimdType::value_type, _Abi>&);
935
936template <class _Tp, class... _Abis>
937simd<_Tp, abi_for_size_t<_Tp, __variadic_sum(simd_size<_Tp, _Abis>::value...)>>
938concat(const simd<_Tp, _Abis>&...);
939
940template <class _Tp, class... _Abis>
941simd_mask<_Tp,
942 abi_for_size_t<_Tp, __variadic_sum(simd_size<_Tp, _Abis>::value...)>>
943concat(const simd_mask<_Tp, _Abis>&...);
944
945// reductions [simd.mask.reductions]
946template <class _Tp, class _Abi>
947bool all_of(const simd_mask<_Tp, _Abi>&) noexcept;
948template <class _Tp, class _Abi>
949bool any_of(const simd_mask<_Tp, _Abi>&) noexcept;
950template <class _Tp, class _Abi>
951bool none_of(const simd_mask<_Tp, _Abi>&) noexcept;
952template <class _Tp, class _Abi>
953bool some_of(const simd_mask<_Tp, _Abi>&) noexcept;
954template <class _Tp, class _Abi>
955int popcount(const simd_mask<_Tp, _Abi>&) noexcept;
956template <class _Tp, class _Abi>
957int find_first_set(const simd_mask<_Tp, _Abi>&);
958template <class _Tp, class _Abi>
959int find_last_set(const simd_mask<_Tp, _Abi>&);
960bool all_of(bool) noexcept;
961bool any_of(bool) noexcept;
962bool none_of(bool) noexcept;
963bool some_of(bool) noexcept;
964int popcount(bool) noexcept;
965int find_first_set(bool) noexcept;
966int find_last_set(bool) noexcept;
967
968// masked assignment [simd.whereexpr]
// Forward declarations, needed because the where() and reduce() declarations
// below mention these types before the class definitions appear.
template <class _Mask, class _Value>
class const_where_expression;

template <class _Mask, class _Value>
class where_expression;
973
974// masked assignment [simd.mask.where]
// Identity metafunction. Writing a parameter as `typename __nodeduce<X>::type`
// keeps that parameter from taking part in template argument deduction.
template <class _Identity>
struct __nodeduce {
  typedef _Identity type;
};
979
980template <class _Tp, class _Abi>
981where_expression<simd_mask<_Tp, _Abi>, simd<_Tp, _Abi>>
982where(const typename simd<_Tp, _Abi>::mask_type&, simd<_Tp, _Abi>&) noexcept;
983
984template <class _Tp, class _Abi>
985const_where_expression<simd_mask<_Tp, _Abi>, const simd<_Tp, _Abi>>
986where(const typename simd<_Tp, _Abi>::mask_type&,
987 const simd<_Tp, _Abi>&) noexcept;
988
989template <class _Tp, class _Abi>
990where_expression<simd_mask<_Tp, _Abi>, simd_mask<_Tp, _Abi>>
991where(const typename __nodeduce<simd_mask<_Tp, _Abi>>::type&,
992 simd_mask<_Tp, _Abi>&) noexcept;
993
994template <class _Tp, class _Abi>
995const_where_expression<simd_mask<_Tp, _Abi>, const simd_mask<_Tp, _Abi>>
996where(const typename __nodeduce<simd_mask<_Tp, _Abi>>::type&,
997 const simd_mask<_Tp, _Abi>&) noexcept;
998
999template <class _Tp>
1000where_expression<bool, _Tp> where(bool, _Tp&) noexcept;
1001
1002template <class _Tp>
1003const_where_expression<bool, const _Tp> where(bool, const _Tp&) noexcept;
1004
1005// reductions [simd.reductions]
1006template <class _Tp, class _Abi, class _BinaryOp = std::plus<_Tp>>
1007_Tp reduce(const simd<_Tp, _Abi>&, _BinaryOp = _BinaryOp());
1008
1009template <class _MaskType, class _SimdType, class _BinaryOp>
1010typename _SimdType::value_type
1011reduce(const const_where_expression<_MaskType, _SimdType>&,
1012 typename _SimdType::value_type neutral_element, _BinaryOp binary_op);
1013
1014template <class _MaskType, class _SimdType>
1015typename _SimdType::value_type
1016reduce(const const_where_expression<_MaskType, _SimdType>&,
1017 plus<typename _SimdType::value_type> binary_op = {});
1018
1019template <class _MaskType, class _SimdType>
1020typename _SimdType::value_type
1021reduce(const const_where_expression<_MaskType, _SimdType>&,
1022 multiplies<typename _SimdType::value_type> binary_op);
1023
1024template <class _MaskType, class _SimdType>
1025typename _SimdType::value_type
1026reduce(const const_where_expression<_MaskType, _SimdType>&,
1027 bit_and<typename _SimdType::value_type> binary_op);
1028
1029template <class _MaskType, class _SimdType>
1030typename _SimdType::value_type
1031reduce(const const_where_expression<_MaskType, _SimdType>&,
1032 bit_or<typename _SimdType::value_type> binary_op);
1033
1034template <class _MaskType, class _SimdType>
1035typename _SimdType::value_type
1036reduce(const const_where_expression<_MaskType, _SimdType>&,
1037 bit_xor<typename _SimdType::value_type> binary_op);
1038
1039template <class _Tp, class _Abi>
1040_Tp hmin(const simd<_Tp, _Abi>&);
1041template <class _MaskType, class _SimdType>
1042typename _SimdType::value_type
1043hmin(const const_where_expression<_MaskType, _SimdType>&);
1044template <class _Tp, class _Abi>
1045_Tp hmax(const simd<_Tp, _Abi>&);
1046template <class _MaskType, class _SimdType>
1047typename _SimdType::value_type
1048hmax(const const_where_expression<_MaskType, _SimdType>&);
1049
1050// algorithms [simd.alg]
1051template <class _Tp, class _Abi>
1052simd<_Tp, _Abi> min(const simd<_Tp, _Abi>&, const simd<_Tp, _Abi>&) noexcept;
1053
1054template <class _Tp, class _Abi>
1055simd<_Tp, _Abi> max(const simd<_Tp, _Abi>&, const simd<_Tp, _Abi>&) noexcept;
1056
1057template <class _Tp, class _Abi>
1058std::pair<simd<_Tp, _Abi>, simd<_Tp, _Abi>>
1059minmax(const simd<_Tp, _Abi>&, const simd<_Tp, _Abi>&) noexcept;
1060
1061template <class _Tp, class _Abi>
1062simd<_Tp, _Abi> clamp(const simd<_Tp, _Abi>&, const simd<_Tp, _Abi>&,
1063 const simd<_Tp, _Abi>&);
1064
1065// [simd.whereexpr]
1066// TODO implement where expressions.
1067template <class _MaskType, class _Tp>
1068class const_where_expression {
1069public:
1070 const_where_expression(const const_where_expression&) = delete;
1071 const_where_expression& operator=(const const_where_expression&) = delete;
1072 typename remove_const<_Tp>::type operator-() const&&;
1073 template <class _Up, class _Flags>
1074 void copy_to(_Up*, _Flags) const&&;
1075};
1076
1077template <class _MaskType, class _Tp>
1078class where_expression : public const_where_expression<_MaskType, _Tp> {
1079public:
1080 where_expression(const where_expression&) = delete;
1081 where_expression& operator=(const where_expression&) = delete;
1082 template <class _Up>
1083 void operator=(_Up&&);
1084 template <class _Up>
1085 void operator+=(_Up&&);
1086 template <class _Up>
1087 void operator-=(_Up&&);
1088 template <class _Up>
1089 void operator*=(_Up&&);
1090 template <class _Up>
1091 void operator/=(_Up&&);
1092 template <class _Up>
1093 void operator%=(_Up&&);
1094 template <class _Up>
1095 void operator&=(_Up&&);
1096 template <class _Up>
1097 void operator|=(_Up&&);
1098 template <class _Up>
1099 void operator^=(_Up&&);
1100 template <class _Up>
1101 void operator<<=(_Up&&);
1102 template <class _Up>
1103 void operator>>=(_Up&&);
1104 void operator++();
1105 void operator++(int);
1106 void operator--();
1107 void operator--(int);
1108 template <class _Up, class _Flags>
1109 void copy_from(const _Up*, _Flags);
1110};
1111
1112// [simd.class]
1113// TODO: implement simd
1114template <class _Tp, class _Abi>
1115class simd {
1116private:
1117 template <class _Up>
1118 static constexpr bool __can_broadcast() {
1119 return (std::is_arithmetic<_Up>::value &&
1120 __is_non_narrowing_arithmetic_convertible<_Up, _Tp>()) ||
1121 (!std::is_arithmetic<_Up>::value &&
1122 std::is_convertible<_Up, _Tp>::value) ||
1123 std::is_same<typename std::remove_const<_Up>::type, int>::value ||
1124 (std::is_same<typename std::remove_const<_Up>::type,
1125 unsigned int>::value &&
1126 std::is_unsigned<_Tp>::value);
1127 }
1128
1129public:
1130 using value_type = _Tp;
1131 // TODO: this is strawman implementation. Turn it into a proxy type.
1132 using reference = _Tp&;
1133 using mask_type = simd_mask<_Tp, _Abi>;
1134
1135 using abi_type = _Abi;
1136
1137 static constexpr size_t size() noexcept {
1138 return simd_size<_Tp, _Abi>::value;
1139 }
1140
1141 simd() = default;
1142
1143 // implicit type conversion constructor
1144 template <class _Up,
1145 class = typename std::enable_if<
1146 std::is_same<_Abi, simd_abi::fixed_size<size()>>::value &&
1147 __is_non_narrowing_arithmetic_convertible<_Up, _Tp>()>::type>
1148 simd(const simd<_Up, simd_abi::fixed_size<size()>>&) {}
1149
1150 // implicit broadcast constructor
1151 template <class _Up,
1152 class = typename std::enable_if<__can_broadcast<_Up>()>::type>
1153 simd(_Up&&);
1154
1155 // generator constructor
1156 // TODO: for now only check for the index 0. This is because C++11 doesn't
1157 // have index_sequence, and it's hard to check for all indicies without using
1158 // index_sequence.
1159 template <class _Generator,
1160 int = decltype(simd(std::declval<_Generator>()(
1161 std::integral_constant<size_t, 0>())),
1162 int())()>
1163 explicit simd(_Generator&&);
1164
1165 // load constructor
1166 template <class _Up, class _Flags>
1167 simd(const _Up*, _Flags);
1168
1169 // loads [simd.load]
1170 template <class _Up, class _Flags>
1171 void copy_from(const _Up*, _Flags);
1172
1173 // stores [simd.store]
1174 template <class _Up, class _Flags>
1175 void copy_to(_Up*, _Flags) const;
1176
1177 // scalar access [simd.subscr]
1178 reference operator[](size_t);
1179 value_type operator[](size_t) const;
1180
1181 // unary operators [simd.unary]
1182 simd& operator++();
1183 simd operator++(int);
1184 simd& operator--();
1185 simd operator--(int);
1186 mask_type operator!() const;
1187 simd operator~() const;
1188 simd operator+() const;
1189 simd operator-() const;
1190
1191 // binary operators [simd.binary]
1192 friend simd operator+(const simd&, const simd&);
1193 friend simd operator-(const simd&, const simd&);
1194 friend simd operator*(const simd&, const simd&);
1195 friend simd operator/(const simd&, const simd&);
1196 friend simd operator%(const simd&, const simd&);
1197 friend simd operator&(const simd&, const simd&);
1198 friend simd operator|(const simd&, const simd&);
1199 friend simd operator^(const simd&, const simd&);
1200 friend simd operator<<(const simd&, const simd&);
1201 friend simd operator>>(const simd&, const simd&);
1202 friend simd operator<<(const simd&, int);
1203 friend simd operator>>(const simd&, int);
1204
1205 // compound assignment [simd.cassign]
1206 friend simd& operator+=(simd&, const simd&);
1207 friend simd& operator-=(simd&, const simd&);
1208 friend simd& operator*=(simd&, const simd&);
1209 friend simd& operator/=(simd&, const simd&);
1210 friend simd& operator%=(simd&, const simd&);
1211
1212 friend simd& operator&=(simd&, const simd&);
1213 friend simd& operator|=(simd&, const simd&);
1214 friend simd& operator^=(simd&, const simd&);
1215 friend simd& operator<<=(simd&, const simd&);
1216 friend simd& operator>>=(simd&, const simd&);
1217 friend simd& operator<<=(simd&, int);
1218 friend simd& operator>>=(simd&, int);
1219
1220 // compares [simd.comparison]
1221 friend mask_type operator==(const simd&, const simd&);
1222 friend mask_type operator!=(const simd&, const simd&);
1223 friend mask_type operator>=(const simd&, const simd&);
1224 friend mask_type operator<=(const simd&, const simd&);
1225 friend mask_type operator>(const simd&, const simd&);
1226 friend mask_type operator<(const simd&, const simd&);
1227};
1228
1229// [simd.mask.class]
1230template <class _Tp, class _Abi>
1231// TODO: implement simd_mask
1232class simd_mask {
1233public:
1234 using value_type = bool;
1235 // TODO: this is strawman implementation. Turn it into a proxy type.
1236 using reference = bool&;
1237 using simd_type = simd<_Tp, _Abi>;
1238 using abi_type = _Abi;
1239 static constexpr size_t size() noexcept;
1240 simd_mask() = default;
1241
1242 // broadcast constructor
1243 explicit simd_mask(value_type) noexcept;
1244
1245 // implicit type conversion constructor
1246 template <class _Up>
1247 simd_mask(const simd_mask<_Up, simd_abi::fixed_size<size()>>&) noexcept;
1248
1249 // load constructor
1250 template <class _Flags>
1251 simd_mask(const value_type*, _Flags);
1252
1253 // loads [simd.mask.copy]
1254 template <class _Flags>
1255 void copy_from(const value_type*, _Flags);
1256 template <class _Flags>
1257 void copy_to(value_type*, _Flags) const;
1258
1259 // scalar access [simd.mask.subscr]
1260 reference operator[](size_t);
1261 value_type operator[](size_t) const;
1262
1263 // unary operators [simd.mask.unary]
1264 simd_mask operator!() const noexcept;
1265
1266 // simd_mask binary operators [simd.mask.binary]
1267 friend simd_mask operator&&(const simd_mask&, const simd_mask&) noexcept;
1268 friend simd_mask operator||(const simd_mask&, const simd_mask&) noexcept;
1269 friend simd_mask operator&(const simd_mask&, const simd_mask&)noexcept;
1270 friend simd_mask operator|(const simd_mask&, const simd_mask&) noexcept;
1271 friend simd_mask operator^(const simd_mask&, const simd_mask&) noexcept;
1272
1273 // simd_mask compound assignment [simd.mask.cassign]
1274 friend simd_mask& operator&=(simd_mask&, const simd_mask&) noexcept;
1275 friend simd_mask& operator|=(simd_mask&, const simd_mask&) noexcept;
1276 friend simd_mask& operator^=(simd_mask&, const simd_mask&) noexcept;
1277
1278 // simd_mask compares [simd.mask.comparison]
1279 friend simd_mask operator==(const simd_mask&, const simd_mask&) noexcept;
1280 friend simd_mask operator!=(const simd_mask&, const simd_mask&) noexcept;
1281};
1282
1283_LIBCPP_END_NAMESPACE_EXPERIMENTAL_SIMD
1284
1285#endif /* _LIBCPP_EXPERIMENTAL_SIMD */